From daf40ecbede543144091cd4d450f95c4310102c6 Mon Sep 17 00:00:00 2001 From: Jim Jiang Date: Wed, 9 Oct 2024 04:45:32 +0000 Subject: [PATCH] delete commit --- scripts/nohup.out | 601210 ------------------------------------------- 1 file changed, 601210 deletions(-) delete mode 100644 scripts/nohup.out diff --git a/scripts/nohup.out b/scripts/nohup.out deleted file mode 100644 index 42db4af..0000000 --- a/scripts/nohup.out +++ /dev/null @@ -1,601210 +0,0 @@ -Start training for LSTM_PPO -Using cpu device -Wrapping the env with a `Monitor` wrapper -Wrapping the env in a DummyVecEnv. -Logging to /home/rstudio/logs/RecurrentPPO_4 ----------------------------- -| time/ | | -| fps | 289 | -| iterations | 1 | -| time_elapsed | 0 | -| total_timesteps | 128 | ----------------------------- --------------------------------------------- -| time/ | | -| fps | 24 | -| iterations | 2 | -| time_elapsed | 10 | -| total_timesteps | 256 | -| train/ | | -| approx_kl | 0.000113586895 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.0842 | -| learning_rate | 0.0003 | -| loss | 0.00259 | -| n_updates | 10 | -| policy_gradient_loss | -0.000681 | -| std | 1 | -| value_loss | 0.00829 | --------------------------------------------- ------------------------------------------- -| time/ | | -| fps | 26 | -| iterations | 3 | -| time_elapsed | 14 | -| total_timesteps | 384 | -| train/ | | -| approx_kl | 0.0002446049 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | -0.000644 | -| n_updates | 20 | -| policy_gradient_loss | -0.000305 | -| std | 1.01 | -| value_loss | 7.12e-05 | ------------------------------------------- ------------------------------------------- -| time/ | | -| fps | 27 | -| iterations | 4 | -| time_elapsed | 18 | -| total_timesteps | 512 | -| train/ | | -| approx_kl | 0.0011929246 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 30 | -| policy_gradient_loss | -0.0014 | -| std | 1.01 | -| value_loss | 2.95e-05 | ------------------------------------------- ------------------------------------------ -| time/ | | -| fps | 27 | -| iterations | 5 | -| time_elapsed | 22 | -| total_timesteps | 640 | -| train/ | | -| approx_kl | 0.001483202 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | 0.000413 | -| n_updates | 40 | -| policy_gradient_loss | 0.000255 | -| std | 1.01 | -| value_loss | 1.57e-05 | ------------------------------------------ ------------------------------------------ -| time/ | | -| fps | 28 | -| iterations | 6 | -| time_elapsed | 26 | -| total_timesteps | 768 | -| train/ | | -| approx_kl | 0.011552145 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.00472 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 50 | -| policy_gradient_loss | -0.00433 | -| std | 1.01 | -| value_loss | 1.15e-05 | ------------------------------------------ ------------------------------------------- -| time/ | | -| fps | 28 | -| iterations | 7 | -| time_elapsed | 31 | -| total_timesteps | 896 | -| train/ | | -| approx_kl | 0.0015612617 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.00968 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 60 | -| policy_gradient_loss | -0.00129 | -| std | 1.01 | -| value_loss | 1.18e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 29 | -| iterations | 8 | -| time_elapsed | 34 | -| total_timesteps | 1024 | -| train/ | | -| approx_kl | 0.012862865 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 70 | -| policy_gradient_loss | -0.00328 | -| std | 1.01 | -| value_loss | 1.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 27 | -| iterations | 9 | -| time_elapsed | 41 | -| total_timesteps | 1152 | -| train/ | | -| approx_kl | 0.035483662 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.136 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 80 | -| policy_gradient_loss | -0.00704 | -| std | 1.01 | -| value_loss | 0.0047 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 27 | -| iterations | 10 | -| time_elapsed | 46 | -| total_timesteps | 1280 | -| train/ | | -| approx_kl | 0.013930913 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 90 | -| policy_gradient_loss | -0.00258 | -| std | 1.01 | -| value_loss | 1.34e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 28 | -| iterations | 11 | -| time_elapsed | 50 | -| total_timesteps | 1408 | -| train/ | | -| approx_kl | 0.008416437 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -5.32 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 100 | -| policy_gradient_loss | -0.00111 | -| std | 1.02 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 28 | -| iterations | 12 | -| time_elapsed | 54 | -| total_timesteps | 1536 | -| train/ | | -| approx_kl | 0.012205945 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.783 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 110 | -| policy_gradient_loss | -0.0061 | -| std | 1.02 | -| value_loss | 2.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 28 | -| iterations | 13 | -| time_elapsed | 58 | -| total_timesteps | 1664 | -| train/ | | -| approx_kl | 0.008145172 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.00487 | -| learning_rate | 0.0003 | -| loss | -0.00737 | -| n_updates | 120 | -| policy_gradient_loss | -0.00289 | -| std | 1.02 | -| value_loss | 1.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 28 | -| iterations | 14 | -| time_elapsed | 62 | -| total_timesteps | 1792 | -| train/ | | -| approx_kl | 0.016046433 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 130 | -| policy_gradient_loss | -0.0047 | -| std | 1.02 | -| value_loss | 5.71e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 29 | -| iterations | 15 | -| time_elapsed | 65 | -| total_timesteps | 1920 | -| train/ | | -| approx_kl | 0.0066089467 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 140 | -| policy_gradient_loss | -0.00438 | -| std | 1.02 | -| value_loss | 3.25e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 29 | -| iterations | 16 | -| time_elapsed | 69 | -| total_timesteps | 2048 | -| train/ | | -| approx_kl | 0.011983199 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.07 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 150 | -| policy_gradient_loss | -0.00893 | -| std | 1.02 | -| value_loss | 1.59e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 17 | -| time_elapsed | 76 | -| total_timesteps | 2176 | -| train/ | | -| approx_kl | 0.00068130996 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.233 | -| learning_rate | 0.0003 | -| loss | 0.00232 | -| n_updates | 160 | -| policy_gradient_loss | 0.000851 | -| std | 1.02 | -| value_loss | 0.00244 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 18 | -| time_elapsed | 80 | -| total_timesteps | 2304 | -| train/ | | -| approx_kl | 0.0014098329 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -130 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 170 | -| policy_gradient_loss | -0.00608 | -| std | 1.02 | -| value_loss | 1.6e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 19 | -| time_elapsed | 84 | -| total_timesteps | 2432 | -| train/ | | -| approx_kl | 0.0033599092 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -163 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 180 | -| policy_gradient_loss | -0.00501 | -| std | 1.02 | -| value_loss | 7.06e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 20 | -| time_elapsed | 88 | -| total_timesteps | 2560 | -| train/ | | -| approx_kl | 0.00096970005 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -142 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 190 | -| policy_gradient_loss | -0.000733 | -| std | 1.01 | -| value_loss | 4.43e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 21 | -| time_elapsed | 92 | -| total_timesteps | 2688 | -| train/ | | -| approx_kl | 0.0010001645 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -37.5 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 200 | -| policy_gradient_loss | -0.00151 | -| std | 1.01 | -| value_loss | 2.89e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 22 | -| time_elapsed | 97 | -| total_timesteps | 2816 | -| train/ | | -| approx_kl | 0.00078976294 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 210 | -| policy_gradient_loss | -0.0014 | -| std | 1.01 | -| value_loss | 7.89e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 28 | -| iterations | 23 | -| time_elapsed | 102 | -| total_timesteps | 2944 | -| train/ | | -| approx_kl | 0.0005437271 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | 0.000723 | -| n_updates | 220 | -| policy_gradient_loss | 0.00049 | -| std | 1.01 | -| value_loss | 2.63e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 28 | -| iterations | 24 | -| time_elapsed | 106 | -| total_timesteps | 3072 | -| train/ | | -| approx_kl | 0.00016476912 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.0215 | -| learning_rate | 0.0003 | -| loss | -0.000771 | -| n_updates | 230 | -| policy_gradient_loss | -0.00034 | -| std | 1.01 | -| value_loss | 1.15e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 27 | -| iterations | 25 | -| time_elapsed | 114 | -| total_timesteps | 3200 | -| train/ | | -| approx_kl | 0.00037914794 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.164 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 240 | -| policy_gradient_loss | -0.00164 | -| std | 1.02 | -| value_loss | 0.0129 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 27 | -| iterations | 26 | -| time_elapsed | 119 | -| total_timesteps | 3328 | -| train/ | | -| approx_kl | 8.114753e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -126 | -| learning_rate | 0.0003 | -| loss | 0.000385 | -| n_updates | 250 | -| policy_gradient_loss | 0.000255 | -| std | 1.02 | -| value_loss | 4e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 28 | -| iterations | 27 | -| time_elapsed | 123 | -| total_timesteps | 3456 | -| train/ | | -| approx_kl | 1.7454382e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -133 | -| learning_rate | 0.0003 | -| loss | -0.000183 | -| n_updates | 260 | -| policy_gradient_loss | -5.21e-05 | -| std | 1.02 | -| value_loss | 1.17e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 28 | -| iterations | 28 | -| time_elapsed | 127 | -| total_timesteps | 3584 | -| train/ | | -| approx_kl | 7.751863e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -1.24e-05 | -| n_updates | 270 | -| policy_gradient_loss | 2.14e-05 | -| std | 1.02 | -| value_loss | 1.95e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 28 | -| iterations | 29 | -| time_elapsed | 131 | -| total_timesteps | 3712 | -| train/ | | -| approx_kl | 0.0001460677 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -9.91 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 280 | -| policy_gradient_loss | -0.000476 | -| std | 1.02 | -| value_loss | 9.16e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 28 | -| iterations | 30 | -| time_elapsed | 136 | -| total_timesteps | 3840 | -| train/ | | -| approx_kl | 0.0002108952 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.000215 | -| n_updates | 290 | -| policy_gradient_loss | -0.000124 | -| std | 1.02 | -| value_loss | 3.32e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 28 | -| iterations | 31 | -| time_elapsed | 140 | -| total_timesteps | 3968 | -| train/ | | -| approx_kl | 4.8140064e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | -0.000566 | -| n_updates | 300 | -| policy_gradient_loss | -0.00015 | -| std | 1.02 | -| value_loss | 8.82e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 28 | -| iterations | 32 | -| time_elapsed | 144 | -| total_timesteps | 4096 | -| train/ | | -| approx_kl | 4.5935158e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.00679 | -| learning_rate | 0.0003 | -| loss | -0.000377 | -| n_updates | 310 | -| policy_gradient_loss | -0.000207 | -| std | 1.03 | -| value_loss | 3.92e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 27 | -| iterations | 33 | -| time_elapsed | 151 | -| total_timesteps | 4224 | -| train/ | | -| approx_kl | 0.00020552194 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 320 | -| policy_gradient_loss | -0.000818 | -| std | 1.03 | -| value_loss | 0.000636 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 27 | -| iterations | 34 | -| time_elapsed | 156 | -| total_timesteps | 4352 | -| train/ | | -| approx_kl | 0.0003304975 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -74.8 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 330 | -| policy_gradient_loss | -0.00067 | -| std | 1.03 | -| value_loss | 4.5e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 27 | -| iterations | 35 | -| time_elapsed | 160 | -| total_timesteps | 4480 | -| train/ | | -| approx_kl | 0.00011760881 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -58 | -| learning_rate | 0.0003 | -| loss | -0.00047 | -| n_updates | 340 | -| policy_gradient_loss | -0.000237 | -| std | 1.03 | -| value_loss | 6.78e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 27 | -| iterations | 36 | -| time_elapsed | 164 | -| total_timesteps | 4608 | -| train/ | | -| approx_kl | 6.065704e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.55 | -| learning_rate | 0.0003 | -| loss | -0.000134 | -| n_updates | 350 | -| policy_gradient_loss | 2.21e-06 | -| std | 1.03 | -| value_loss | 9.3e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 28 | -| iterations | 37 | -| time_elapsed | 168 | -| total_timesteps | 4736 | -| train/ | | -| approx_kl | 3.1501986e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -3.73 | -| learning_rate | 0.0003 | -| loss | 4.74e-05 | -| n_updates | 360 | -| policy_gradient_loss | 3.6e-05 | -| std | 1.03 | -| value_loss | 2.76e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 28 | -| iterations | 38 | -| time_elapsed | 171 | -| total_timesteps | 4864 | -| train/ | | -| approx_kl | 2.4660956e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00784 | -| learning_rate | 0.0003 | -| loss | -0.000241 | -| n_updates | 370 | -| policy_gradient_loss | -0.000103 | -| std | 1.03 | -| value_loss | 1.43e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 28 | -| iterations | 39 | -| time_elapsed | 175 | -| total_timesteps | 4992 | -| train/ | | -| approx_kl | 1.3159122e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | 4.88e-06 | -| n_updates | 380 | -| policy_gradient_loss | 7.8e-06 | -| std | 1.04 | -| value_loss | 5.92e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 28 | -| iterations | 40 | -| time_elapsed | 179 | -| total_timesteps | 5120 | -| train/ | | -| approx_kl | 0.0004103179 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 390 | -| policy_gradient_loss | -0.00111 | -| std | 1.04 | -| value_loss | 5.38e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 27 | -| iterations | 41 | -| time_elapsed | 190 | -| total_timesteps | 5248 | -| train/ | | -| approx_kl | 0.0007283706 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.497 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 400 | -| policy_gradient_loss | -0.000369 | -| std | 1.03 | -| value_loss | 0.00209 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 27 | -| iterations | 42 | -| time_elapsed | 192 | -| total_timesteps | 5376 | -| train/ | | -| approx_kl | 0.0014841538 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -19 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 410 | -| policy_gradient_loss | -0.0016 | -| std | 1.03 | -| value_loss | 4.11e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 27 | -| iterations | 43 | -| time_elapsed | 196 | -| total_timesteps | 5504 | -| train/ | | -| approx_kl | 0.0007407884 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | 0.000327 | -| n_updates | 420 | -| policy_gradient_loss | 0.000289 | -| std | 1.03 | -| value_loss | 1.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 28 | -| iterations | 44 | -| time_elapsed | 200 | -| total_timesteps | 5632 | -| train/ | | -| approx_kl | 0.0036382102 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.95 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 430 | -| policy_gradient_loss | -0.00428 | -| std | 1.03 | -| value_loss | 9.34e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 28 | -| iterations | 45 | -| time_elapsed | 204 | -| total_timesteps | 5760 | -| train/ | | -| approx_kl | 0.00094752247 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.733 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 440 | -| policy_gradient_loss | 0.000978 | -| std | 1.03 | -| value_loss | 3.86e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 28 | -| iterations | 46 | -| time_elapsed | 208 | -| total_timesteps | 5888 | -| train/ | | -| approx_kl | 4.596077e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.42 | -| learning_rate | 0.0003 | -| loss | 3.05e-05 | -| n_updates | 450 | -| policy_gradient_loss | 3.99e-05 | -| std | 1.03 | -| value_loss | 3.98e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 28 | -| iterations | 47 | -| time_elapsed | 212 | -| total_timesteps | 6016 | -| train/ | | -| approx_kl | 0.0002101101 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 460 | -| policy_gradient_loss | -0.000511 | -| std | 1.03 | -| value_loss | 1.74e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 27 | -| iterations | 48 | -| time_elapsed | 221 | -| total_timesteps | 6144 | -| train/ | | -| approx_kl | 0.00021675229 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.479 | -| learning_rate | 0.0003 | -| loss | 0.00276 | -| n_updates | 470 | -| policy_gradient_loss | -0.000316 | -| std | 1.04 | -| value_loss | 0.00902 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 27 | -| iterations | 49 | -| time_elapsed | 226 | -| total_timesteps | 6272 | -| train/ | | -| approx_kl | 0.0024344032 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -59.4 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 480 | -| policy_gradient_loss | -0.00627 | -| std | 1.03 | -| value_loss | 0.00055 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 27 | -| iterations | 50 | -| time_elapsed | 230 | -| total_timesteps | 6400 | -| train/ | | -| approx_kl | 0.008396704 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.0094 | -| n_updates | 490 | -| policy_gradient_loss | -0.0048 | -| std | 1.03 | -| value_loss | 0.000537 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 27 | -| iterations | 51 | -| time_elapsed | 234 | -| total_timesteps | 6528 | -| train/ | | -| approx_kl | 0.006329242 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -5.13 | -| learning_rate | 0.0003 | -| loss | -0.000373 | -| n_updates | 500 | -| policy_gradient_loss | -0.000313 | -| std | 1.03 | -| value_loss | 0.000235 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 27 | -| iterations | 52 | -| time_elapsed | 238 | -| total_timesteps | 6656 | -| train/ | | -| approx_kl | 0.0015110415 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.67 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 510 | -| policy_gradient_loss | -0.00151 | -| std | 1.03 | -| value_loss | 0.00019 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 28 | -| iterations | 53 | -| time_elapsed | 241 | -| total_timesteps | 6784 | -| train/ | | -| approx_kl | 0.015062594 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 520 | -| policy_gradient_loss | -0.00844 | -| std | 1.03 | -| value_loss | 2.69e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 28 | -| iterations | 54 | -| time_elapsed | 245 | -| total_timesteps | 6912 | -| train/ | | -| approx_kl | 0.00010663783 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 530 | -| policy_gradient_loss | 0.000382 | -| std | 1.03 | -| value_loss | 4.83e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 28 | -| iterations | 55 | -| time_elapsed | 249 | -| total_timesteps | 7040 | -| train/ | | -| approx_kl | 0.0034327772 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | -0.00361 | -| n_updates | 540 | -| policy_gradient_loss | -0.00184 | -| std | 1.04 | -| value_loss | 3.13e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 27 | -| iterations | 56 | -| time_elapsed | 257 | -| total_timesteps | 7168 | -| train/ | | -| approx_kl | 0.00017237104 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | 0.00136 | -| n_updates | 550 | -| policy_gradient_loss | 0.000584 | -| std | 1.03 | -| value_loss | 0.00186 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 27 | -| iterations | 57 | -| time_elapsed | 261 | -| total_timesteps | 7296 | -| train/ | | -| approx_kl | 0.002334142 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -69.2 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 560 | -| policy_gradient_loss | -0.00153 | -| std | 1.03 | -| value_loss | 3.17e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 27 | -| iterations | 58 | -| time_elapsed | 265 | -| total_timesteps | 7424 | -| train/ | | -| approx_kl | 0.00088998023 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -47.7 | -| learning_rate | 0.0003 | -| loss | -0.000406 | -| n_updates | 570 | -| policy_gradient_loss | -0.000181 | -| std | 1.03 | -| value_loss | 1.49e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 28 | -| iterations | 59 | -| time_elapsed | 269 | -| total_timesteps | 7552 | -| train/ | | -| approx_kl | 0.00028054742 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -44.5 | -| learning_rate | 0.0003 | -| loss | -0.000501 | -| n_updates | 580 | -| policy_gradient_loss | -0.000224 | -| std | 1.03 | -| value_loss | 1.63e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 28 | -| iterations | 60 | -| time_elapsed | 271 | -| total_timesteps | 7680 | -| train/ | | -| approx_kl | 5.218666e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.52 | -| learning_rate | 0.0003 | -| loss | -0.000481 | -| n_updates | 590 | -| policy_gradient_loss | -0.000126 | -| std | 1.03 | -| value_loss | 1.28e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 28 | -| iterations | 61 | -| time_elapsed | 275 | -| total_timesteps | 7808 | -| train/ | | -| approx_kl | 0.0031361762 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.69 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 600 | -| policy_gradient_loss | -0.00325 | -| std | 1.03 | -| value_loss | 7.44e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 28 | -| iterations | 62 | -| time_elapsed | 280 | -| total_timesteps | 7936 | -| train/ | | -| approx_kl | 0.0006426731 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.846 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 610 | -| policy_gradient_loss | 0.00075 | -| std | 1.03 | -| value_loss | 7.86e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 28 | -| iterations | 63 | -| time_elapsed | 285 | -| total_timesteps | 8064 | -| train/ | | -| approx_kl | 0.0012498447 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 620 | -| policy_gradient_loss | -0.000894 | -| std | 1.04 | -| value_loss | 3.94e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 28 | -| iterations | 64 | -| time_elapsed | 292 | -| total_timesteps | 8192 | -| train/ | | -| approx_kl | 0.0010702871 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.814 | -| learning_rate | 0.0003 | -| loss | -2.49e-06 | -| n_updates | 630 | -| policy_gradient_loss | -0.000586 | -| std | 1.04 | -| value_loss | 0.00436 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 27 | -| iterations | 65 | -| time_elapsed | 297 | -| total_timesteps | 8320 | -| train/ | | -| approx_kl | 0.0028191889 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -95.5 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 640 | -| policy_gradient_loss | -0.00465 | -| std | 1.03 | -| value_loss | 0.000202 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 27 | -| iterations | 66 | -| time_elapsed | 302 | -| total_timesteps | 8448 | -| train/ | | -| approx_kl | 0.0023025507 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -117 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 650 | -| policy_gradient_loss | -0.00227 | -| std | 1.03 | -| value_loss | 1.41e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 28 | -| iterations | 67 | -| time_elapsed | 306 | -| total_timesteps | 8576 | -| train/ | | -| approx_kl | 0.00019716984 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -3.06 | -| learning_rate | 0.0003 | -| loss | 0.00086 | -| n_updates | 660 | -| policy_gradient_loss | 0.000559 | -| std | 1.03 | -| value_loss | 6.12e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 28 | -| iterations | 68 | -| time_elapsed | 310 | -| total_timesteps | 8704 | -| train/ | | -| approx_kl | 3.739493e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -3.18 | -| learning_rate | 0.0003 | -| loss | -0.000552 | -| n_updates | 670 | -| policy_gradient_loss | -0.00021 | -| std | 1.03 | -| value_loss | 1.35e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 28 | -| iterations | 69 | -| time_elapsed | 314 | -| total_timesteps | 8832 | -| train/ | | -| approx_kl | 0.00037989626 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00315 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 680 | -| policy_gradient_loss | -0.00153 | -| std | 1.04 | -| value_loss | 6.53e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 28 | -| iterations | 70 | -| time_elapsed | 318 | -| total_timesteps | 8960 | -| train/ | | -| approx_kl | 0.00085838046 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0876 | -| learning_rate | 0.0003 | -| loss | -0.00269 | -| n_updates | 690 | -| policy_gradient_loss | -0.0013 | -| std | 1.04 | -| value_loss | 3.73e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 71 | -| time_elapsed | 322 | -| total_timesteps | 9088 | -| train/ | | -| approx_kl | 0.0036855647 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.46 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 700 | -| policy_gradient_loss | -0.00586 | -| std | 1.04 | -| value_loss | 2.66e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 72 | -| time_elapsed | 328 | -| total_timesteps | 9216 | -| train/ | | -| approx_kl | 0.006764061 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.46 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 710 | -| policy_gradient_loss | -0.00364 | -| std | 1.04 | -| value_loss | 0.00125 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 73 | -| time_elapsed | 332 | -| total_timesteps | 9344 | -| train/ | | -| approx_kl | 0.0049943035 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.46 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 720 | -| policy_gradient_loss | -0.00202 | -| std | 1.04 | -| value_loss | 1.56e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 74 | -| time_elapsed | 336 | -| total_timesteps | 9472 | -| train/ | | -| approx_kl | 0.0009838603 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.46 | -| explained_variance | -109 | -| learning_rate | 0.0003 | -| loss | -0.00489 | -| n_updates | 730 | -| policy_gradient_loss | -0.000841 | -| std | 1.04 | -| value_loss | 4.28e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 75 | -| time_elapsed | 339 | -| total_timesteps | 9600 | -| train/ | | -| approx_kl | 0.001119629 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 740 | -| policy_gradient_loss | 0.000933 | -| std | 1.04 | -| value_loss | 6.46e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 76 | -| time_elapsed | 343 | -| total_timesteps | 9728 | -| train/ | | -| approx_kl | 0.0002458659 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | -0.000543 | -| n_updates | 750 | -| policy_gradient_loss | -0.000225 | -| std | 1.03 | -| value_loss | 1.41e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 77 | -| time_elapsed | 347 | -| total_timesteps | 9856 | -| train/ | | -| approx_kl | 0.0006223023 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.0178 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 760 | -| policy_gradient_loss | -0.000681 | -| std | 1.03 | -| value_loss | 8.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 28 | -| iterations | 78 | -| time_elapsed | 351 | -| total_timesteps | 9984 | -| train/ | | -| approx_kl | 0.0016925028 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00237 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 770 | -| policy_gradient_loss | -0.000631 | -| std | 1.03 | -| value_loss | 1.98e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 28 | -| iterations | 79 | -| time_elapsed | 355 | -| total_timesteps | 10112 | -| train/ | | -| approx_kl | 2.0859297e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.000208 | -| n_updates | 780 | -| policy_gradient_loss | 0.000265 | -| std | 1.04 | -| value_loss | 1.42e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 27 | -| iterations | 80 | -| time_elapsed | 366 | -| total_timesteps | 10240 | -| train/ | | -| approx_kl | 6.779097e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.66 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 790 | -| policy_gradient_loss | -6.41e-05 | -| std | 1.04 | -| value_loss | 0.00304 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 27 | -| iterations | 81 | -| time_elapsed | 370 | -| total_timesteps | 10368 | -| train/ | | -| approx_kl | 0.0029496327 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -44.4 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 800 | -| policy_gradient_loss | -0.00578 | -| std | 1.04 | -| value_loss | 1.74e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 28 | -| iterations | 82 | -| time_elapsed | 374 | -| total_timesteps | 10496 | -| train/ | | -| approx_kl | 0.003969173 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -88.3 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 810 | -| policy_gradient_loss | -0.0057 | -| std | 1.03 | -| value_loss | 6.29e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 28 | -| iterations | 83 | -| time_elapsed | 378 | -| total_timesteps | 10624 | -| train/ | | -| approx_kl | 0.00052866014 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -5.35 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 820 | -| policy_gradient_loss | 0.000763 | -| std | 1.03 | -| value_loss | 2.73e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 28 | -| iterations | 84 | -| time_elapsed | 381 | -| total_timesteps | 10752 | -| train/ | | -| approx_kl | 7.001683e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.000189 | -| n_updates | 830 | -| policy_gradient_loss | -2.28e-05 | -| std | 1.03 | -| value_loss | 9.7e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.801 | -| time/ | | -| fps | 28 | -| iterations | 85 | -| time_elapsed | 385 | -| total_timesteps | 10880 | -| train/ | | -| approx_kl | 0.00012378767 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00369 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 840 | -| policy_gradient_loss | -0.00067 | -| std | 1.03 | -| value_loss | 7.05e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 28 | -| iterations | 86 | -| time_elapsed | 390 | -| total_timesteps | 11008 | -| train/ | | -| approx_kl | 1.1320226e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00176 | -| learning_rate | 0.0003 | -| loss | -0.000123 | -| n_updates | 850 | -| policy_gradient_loss | 0.000406 | -| std | 1.03 | -| value_loss | 5.68e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 87 | -| time_elapsed | 400 | -| total_timesteps | 11136 | -| train/ | | -| approx_kl | 6.687315e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | 0.000503 | -| n_updates | 860 | -| policy_gradient_loss | 4.03e-05 | -| std | 1.03 | -| value_loss | 0.00123 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 88 | -| time_elapsed | 404 | -| total_timesteps | 11264 | -| train/ | | -| approx_kl | 0.00031878008 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.14 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 870 | -| policy_gradient_loss | -0.00161 | -| std | 1.03 | -| value_loss | 3.78e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 89 | -| time_elapsed | 409 | -| total_timesteps | 11392 | -| train/ | | -| approx_kl | 0.00020910194 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -176 | -| learning_rate | 0.0003 | -| loss | 0.000612 | -| n_updates | 880 | -| policy_gradient_loss | 0.000378 | -| std | 1.04 | -| value_loss | 3.98e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 90 | -| time_elapsed | 412 | -| total_timesteps | 11520 | -| train/ | | -| approx_kl | 1.559453e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -5.72 | -| learning_rate | 0.0003 | -| loss | -0.000308 | -| n_updates | 890 | -| policy_gradient_loss | -8.09e-05 | -| std | 1.04 | -| value_loss | 6.3e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 91 | -| time_elapsed | 417 | -| total_timesteps | 11648 | -| train/ | | -| approx_kl | 1.759082e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -3.44 | -| learning_rate | 0.0003 | -| loss | 2.81e-05 | -| n_updates | 900 | -| policy_gradient_loss | 2.7e-05 | -| std | 1.03 | -| value_loss | 2.86e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 92 | -| time_elapsed | 420 | -| total_timesteps | 11776 | -| train/ | | -| approx_kl | 0.00017342577 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 910 | -| policy_gradient_loss | -0.000864 | -| std | 1.03 | -| value_loss | 1.06e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 93 | -| time_elapsed | 425 | -| total_timesteps | 11904 | -| train/ | | -| approx_kl | 0.000342133 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.321 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 920 | -| policy_gradient_loss | -0.00154 | -| std | 1.03 | -| value_loss | 4.93e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 94 | -| time_elapsed | 430 | -| total_timesteps | 12032 | -| train/ | | -| approx_kl | 0.0005376688 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00831 | -| learning_rate | 0.0003 | -| loss | -0.00516 | -| n_updates | 930 | -| policy_gradient_loss | -0.00255 | -| std | 1.03 | -| value_loss | 1.83e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 95 | -| time_elapsed | 438 | -| total_timesteps | 12160 | -| train/ | | -| approx_kl | 0.000196598 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -1.23e-05 | -| n_updates | 940 | -| policy_gradient_loss | -0.000103 | -| std | 1.03 | -| value_loss | 0.000337 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 96 | -| time_elapsed | 443 | -| total_timesteps | 12288 | -| train/ | | -| approx_kl | 2.622325e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -137 | -| learning_rate | 0.0003 | -| loss | -8.46e-05 | -| n_updates | 950 | -| policy_gradient_loss | -4.28e-05 | -| std | 1.03 | -| value_loss | 2.15e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 97 | -| time_elapsed | 446 | -| total_timesteps | 12416 | -| train/ | | -| approx_kl | 4.665926e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -171 | -| learning_rate | 0.0003 | -| loss | -1.47e-05 | -| n_updates | 960 | -| policy_gradient_loss | 1.76e-05 | -| std | 1.03 | -| value_loss | 6.88e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 98 | -| time_elapsed | 450 | -| total_timesteps | 12544 | -| train/ | | -| approx_kl | 6.3995365e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -135 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 970 | -| policy_gradient_loss | -0.000662 | -| std | 1.03 | -| value_loss | 1.53e-09 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 99 | -| time_elapsed | 453 | -| total_timesteps | 12672 | -| train/ | | -| approx_kl | 0.000104510225 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -5.3 | -| learning_rate | 0.0003 | -| loss | -0.000947 | -| n_updates | 980 | -| policy_gradient_loss | -0.000481 | -| std | 1.03 | -| value_loss | 6.86e-11 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 100 | -| time_elapsed | 458 | -| total_timesteps | 12800 | -| train/ | | -| approx_kl | 8.257665e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -3.96 | -| learning_rate | 0.0003 | -| loss | -0.000958 | -| n_updates | 990 | -| policy_gradient_loss | -0.000479 | -| std | 1.03 | -| value_loss | 2.45e-11 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 27 | -| iterations | 101 | -| time_elapsed | 463 | -| total_timesteps | 12928 | -| train/ | | -| approx_kl | 1.9129366e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.00401 | -| learning_rate | 0.0003 | -| loss | -0.000848 | -| n_updates | 1000 | -| policy_gradient_loss | -0.000113 | -| std | 1.02 | -| value_loss | 6.66e-12 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 102 | -| time_elapsed | 466 | -| total_timesteps | 13056 | -| train/ | | -| approx_kl | 0.00015095994 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 1010 | -| policy_gradient_loss | -0.000673 | -| std | 1.02 | -| value_loss | 3.88e-12 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 103 | -| time_elapsed | 473 | -| total_timesteps | 13184 | -| train/ | | -| approx_kl | 0.00010137679 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 1020 | -| policy_gradient_loss | -0.000511 | -| std | 1.02 | -| value_loss | 0.000132 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 104 | -| time_elapsed | 478 | -| total_timesteps | 13312 | -| train/ | | -| approx_kl | 8.272426e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 1030 | -| policy_gradient_loss | -0.00114 | -| std | 1.02 | -| value_loss | 1.84e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 105 | -| time_elapsed | 483 | -| total_timesteps | 13440 | -| train/ | | -| approx_kl | 8.682348e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -6.35 | -| learning_rate | 0.0003 | -| loss | -0.000785 | -| n_updates | 1040 | -| policy_gradient_loss | -0.000416 | -| std | 1.03 | -| value_loss | 5.29e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 106 | -| time_elapsed | 488 | -| total_timesteps | 13568 | -| train/ | | -| approx_kl | 1.0043848e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.21 | -| learning_rate | 0.0003 | -| loss | 0.000112 | -| n_updates | 1050 | -| policy_gradient_loss | 6.94e-05 | -| std | 1.03 | -| value_loss | 8.43e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 107 | -| time_elapsed | 493 | -| total_timesteps | 13696 | -| train/ | | -| approx_kl | 4.810281e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00502 | -| learning_rate | 0.0003 | -| loss | -0.00038 | -| n_updates | 1060 | -| policy_gradient_loss | -0.000152 | -| std | 1.03 | -| value_loss | 4.04e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 108 | -| time_elapsed | 497 | -| total_timesteps | 13824 | -| train/ | | -| approx_kl | 3.3783726e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -3.65e-05 | -| n_updates | 1070 | -| policy_gradient_loss | -1.94e-05 | -| std | 1.03 | -| value_loss | 1.84e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.732 | -| time/ | | -| fps | 27 | -| iterations | 109 | -| time_elapsed | 501 | -| total_timesteps | 13952 | -| train/ | | -| approx_kl | 5.9492886e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.000357 | -| n_updates | 1080 | -| policy_gradient_loss | -0.000112 | -| std | 1.03 | -| value_loss | 1.36e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 110 | -| time_elapsed | 506 | -| total_timesteps | 14080 | -| train/ | | -| approx_kl | 1.6735867e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.000244 | -| n_updates | 1090 | -| policy_gradient_loss | -9.09e-05 | -| std | 1.03 | -| value_loss | 8.75e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 111 | -| time_elapsed | 513 | -| total_timesteps | 14208 | -| train/ | | -| approx_kl | 3.3517834e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 1100 | -| policy_gradient_loss | -0.000464 | -| std | 1.03 | -| value_loss | 0.000184 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 112 | -| time_elapsed | 517 | -| total_timesteps | 14336 | -| train/ | | -| approx_kl | 1.0444783e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -157 | -| learning_rate | 0.0003 | -| loss | -6.69e-05 | -| n_updates | 1110 | -| policy_gradient_loss | 0.000119 | -| std | 1.03 | -| value_loss | 1.33e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 113 | -| time_elapsed | 521 | -| total_timesteps | 14464 | -| train/ | | -| approx_kl | 1.1869241e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -134 | -| learning_rate | 0.0003 | -| loss | -6.04e-06 | -| n_updates | 1120 | -| policy_gradient_loss | -1.36e-06 | -| std | 1.02 | -| value_loss | 3.71e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 114 | -| time_elapsed | 526 | -| total_timesteps | 14592 | -| train/ | | -| approx_kl | 1.3690442e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -72.7 | -| learning_rate | 0.0003 | -| loss | -8.89e-05 | -| n_updates | 1130 | -| policy_gradient_loss | -1.86e-05 | -| std | 1.02 | -| value_loss | 1.94e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 115 | -| time_elapsed | 530 | -| total_timesteps | 14720 | -| train/ | | -| approx_kl | 1.6756356e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00031 | -| n_updates | 1140 | -| policy_gradient_loss | -0.000144 | -| std | 1.03 | -| value_loss | 4.14e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 116 | -| time_elapsed | 533 | -| total_timesteps | 14848 | -| train/ | | -| approx_kl | 2.7478673e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.000675 | -| n_updates | 1150 | -| policy_gradient_loss | -0.000315 | -| std | 1.03 | -| value_loss | 1.14e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.705 | -| time/ | | -| fps | 27 | -| iterations | 117 | -| time_elapsed | 538 | -| total_timesteps | 14976 | -| train/ | | -| approx_kl | 1.1648983e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | -0.000261 | -| n_updates | 1160 | -| policy_gradient_loss | 9.35e-06 | -| std | 1.03 | -| value_loss | 5.06e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 118 | -| time_elapsed | 542 | -| total_timesteps | 15104 | -| train/ | | -| approx_kl | 2.4842564e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 1170 | -| policy_gradient_loss | -0.000149 | -| std | 1.03 | -| value_loss | 2.09e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 119 | -| time_elapsed | 551 | -| total_timesteps | 15232 | -| train/ | | -| approx_kl | 1.6195234e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.475 | -| learning_rate | 0.0003 | -| loss | 0.00431 | -| n_updates | 1180 | -| policy_gradient_loss | -0.000182 | -| std | 1.03 | -| value_loss | 0.0108 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 120 | -| time_elapsed | 556 | -| total_timesteps | 15360 | -| train/ | | -| approx_kl | 1.5571248e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -139 | -| learning_rate | 0.0003 | -| loss | -0.000151 | -| n_updates | 1190 | -| policy_gradient_loss | -0.000106 | -| std | 1.02 | -| value_loss | 0.000196 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 121 | -| time_elapsed | 560 | -| total_timesteps | 15488 | -| train/ | | -| approx_kl | 2.5692862e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -121 | -| learning_rate | 0.0003 | -| loss | -0.000647 | -| n_updates | 1200 | -| policy_gradient_loss | -0.000316 | -| std | 1.02 | -| value_loss | 8.48e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 122 | -| time_elapsed | 565 | -| total_timesteps | 15616 | -| train/ | | -| approx_kl | 3.549829e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.967 | -| learning_rate | 0.0003 | -| loss | -0.000798 | -| n_updates | 1210 | -| policy_gradient_loss | -0.000358 | -| std | 1.02 | -| value_loss | 4.45e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 123 | -| time_elapsed | 569 | -| total_timesteps | 15744 | -| train/ | | -| approx_kl | 2.7008355e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 1220 | -| policy_gradient_loss | 5.45e-05 | -| std | 1.02 | -| value_loss | 3.92e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 27 | -| iterations | 124 | -| time_elapsed | 574 | -| total_timesteps | 15872 | -| train/ | | -| approx_kl | 1.8274412e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 1230 | -| policy_gradient_loss | -0.000488 | -| std | 1.03 | -| value_loss | 2.7e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 125 | -| time_elapsed | 579 | -| total_timesteps | 16000 | -| train/ | | -| approx_kl | 7.550232e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | -2.49e-05 | -| n_updates | 1240 | -| policy_gradient_loss | 8.14e-07 | -| std | 1.03 | -| value_loss | 1.09e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 126 | -| time_elapsed | 583 | -| total_timesteps | 16128 | -| train/ | | -| approx_kl | 1.5916303e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00342 | -| learning_rate | 0.0003 | -| loss | -0.000266 | -| n_updates | 1250 | -| policy_gradient_loss | -4.86e-05 | -| std | 1.03 | -| value_loss | 1.28e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 127 | -| time_elapsed | 595 | -| total_timesteps | 16256 | -| train/ | | -| approx_kl | 2.2457913e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.597 | -| learning_rate | 0.0003 | -| loss | 0.00456 | -| n_updates | 1260 | -| policy_gradient_loss | -0.000178 | -| std | 1.03 | -| value_loss | 0.0116 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 128 | -| time_elapsed | 600 | -| total_timesteps | 16384 | -| train/ | | -| approx_kl | 1.5957281e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -162 | -| learning_rate | 0.0003 | -| loss | -0.000232 | -| n_updates | 1270 | -| policy_gradient_loss | -0.000165 | -| std | 1.03 | -| value_loss | 0.000173 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 129 | -| time_elapsed | 604 | -| total_timesteps | 16512 | -| train/ | | -| approx_kl | 3.1804666e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | -0.000564 | -| n_updates | 1280 | -| policy_gradient_loss | -0.000112 | -| std | 1.03 | -| value_loss | 8.62e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 130 | -| time_elapsed | 610 | -| total_timesteps | 16640 | -| train/ | | -| approx_kl | 6.8983063e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -81.2 | -| learning_rate | 0.0003 | -| loss | -7.71e-05 | -| n_updates | 1290 | -| policy_gradient_loss | 2.7e-05 | -| std | 1.03 | -| value_loss | 1.3e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 131 | -| time_elapsed | 615 | -| total_timesteps | 16768 | -| train/ | | -| approx_kl | 3.7094578e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -8.05 | -| learning_rate | 0.0003 | -| loss | 1.65e-05 | -| n_updates | 1300 | -| policy_gradient_loss | 2.82e-05 | -| std | 1.03 | -| value_loss | 2.74e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.73 | -| time/ | | -| fps | 27 | -| iterations | 132 | -| time_elapsed | 619 | -| total_timesteps | 16896 | -| train/ | | -| approx_kl | 2.5087036e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.000853 | -| n_updates | 1310 | -| policy_gradient_loss | -0.000358 | -| std | 1.03 | -| value_loss | 4.09e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 133 | -| time_elapsed | 624 | -| total_timesteps | 17024 | -| train/ | | -| approx_kl | 2.4563633e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | 0.000153 | -| n_updates | 1320 | -| policy_gradient_loss | 0.000154 | -| std | 1.03 | -| value_loss | 6.95e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 134 | -| time_elapsed | 634 | -| total_timesteps | 17152 | -| train/ | | -| approx_kl | 4.940666e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.724 | -| learning_rate | 0.0003 | -| loss | 0.00279 | -| n_updates | 1330 | -| policy_gradient_loss | 1.82e-05 | -| std | 1.03 | -| value_loss | 0.006 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 135 | -| time_elapsed | 638 | -| total_timesteps | 17280 | -| train/ | | -| approx_kl | 2.3548491e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -138 | -| learning_rate | 0.0003 | -| loss | -8.61e-05 | -| n_updates | 1340 | -| policy_gradient_loss | -4.01e-05 | -| std | 1.03 | -| value_loss | 7.09e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 136 | -| time_elapsed | 642 | -| total_timesteps | 17408 | -| train/ | | -| approx_kl | 1.936825e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.000895 | -| n_updates | 1350 | -| policy_gradient_loss | -0.000398 | -| std | 1.03 | -| value_loss | 3.17e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 137 | -| time_elapsed | 646 | -| total_timesteps | 17536 | -| train/ | | -| approx_kl | 3.784895e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -34.5 | -| learning_rate | 0.0003 | -| loss | 0.000102 | -| n_updates | 1360 | -| policy_gradient_loss | 0.000111 | -| std | 1.03 | -| value_loss | 1.69e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 138 | -| time_elapsed | 650 | -| total_timesteps | 17664 | -| train/ | | -| approx_kl | 6.679911e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.000395 | -| n_updates | 1370 | -| policy_gradient_loss | -0.000185 | -| std | 1.03 | -| value_loss | 1.47e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 139 | -| time_elapsed | 655 | -| total_timesteps | 17792 | -| train/ | | -| approx_kl | 1.846999e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | -0.00048 | -| n_updates | 1380 | -| policy_gradient_loss | -0.000226 | -| std | 1.03 | -| value_loss | 1.79e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 27 | -| iterations | 140 | -| time_elapsed | 660 | -| total_timesteps | 17920 | -| train/ | | -| approx_kl | 1.3788231e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -22.6 | -| learning_rate | 0.0003 | -| loss | -0.000277 | -| n_updates | 1390 | -| policy_gradient_loss | 1.03e-05 | -| std | 1.03 | -| value_loss | 1.17e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 141 | -| time_elapsed | 663 | -| total_timesteps | 18048 | -| train/ | | -| approx_kl | 6.072689e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.68 | -| learning_rate | 0.0003 | -| loss | 4.23e-05 | -| n_updates | 1400 | -| policy_gradient_loss | 5.32e-05 | -| std | 1.03 | -| value_loss | 3.32e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 142 | -| time_elapsed | 670 | -| total_timesteps | 18176 | -| train/ | | -| approx_kl | 3.2386743e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 1410 | -| policy_gradient_loss | -0.000918 | -| std | 1.03 | -| value_loss | 0.0018 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 143 | -| time_elapsed | 675 | -| total_timesteps | 18304 | -| train/ | | -| approx_kl | 7.3032454e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -330 | -| learning_rate | 0.0003 | -| loss | -0.00038 | -| n_updates | 1420 | -| policy_gradient_loss | -0.000192 | -| std | 1.03 | -| value_loss | 1.72e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 144 | -| time_elapsed | 679 | -| total_timesteps | 18432 | -| train/ | | -| approx_kl | 2.5542453e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -795 | -| learning_rate | 0.0003 | -| loss | -0.000141 | -| n_updates | 1430 | -| policy_gradient_loss | -7.35e-05 | -| std | 1.03 | -| value_loss | 6.46e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 145 | -| time_elapsed | 683 | -| total_timesteps | 18560 | -| train/ | | -| approx_kl | 3.0526426e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | -0.000856 | -| n_updates | 1440 | -| policy_gradient_loss | -0.000377 | -| std | 1.03 | -| value_loss | 3.29e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 146 | -| time_elapsed | 687 | -| total_timesteps | 18688 | -| train/ | | -| approx_kl | 0.00015797513 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -93.3 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 1450 | -| policy_gradient_loss | -0.00117 | -| std | 1.02 | -| value_loss | 5.56e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 147 | -| time_elapsed | 691 | -| total_timesteps | 18816 | -| train/ | | -| approx_kl | 0.0010570735 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -251 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 1460 | -| policy_gradient_loss | -0.0014 | -| std | 1.02 | -| value_loss | 4.88e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 27 | -| iterations | 148 | -| time_elapsed | 695 | -| total_timesteps | 18944 | -| train/ | | -| approx_kl | 5.6251884e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -3.67 | -| learning_rate | 0.0003 | -| loss | -0.000722 | -| n_updates | 1470 | -| policy_gradient_loss | 0.000129 | -| std | 1.02 | -| value_loss | 9.05e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 149 | -| time_elapsed | 700 | -| total_timesteps | 19072 | -| train/ | | -| approx_kl | 0.00041744765 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -40 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 1480 | -| policy_gradient_loss | -0.00209 | -| std | 1.01 | -| value_loss | 6.72e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 150 | -| time_elapsed | 707 | -| total_timesteps | 19200 | -| train/ | | -| approx_kl | 0.0004228372 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 1490 | -| policy_gradient_loss | -0.00118 | -| std | 1 | -| value_loss | 0.00199 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 151 | -| time_elapsed | 711 | -| total_timesteps | 19328 | -| train/ | | -| approx_kl | 2.536457e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -161 | -| learning_rate | 0.0003 | -| loss | 0.000438 | -| n_updates | 1500 | -| policy_gradient_loss | 0.000434 | -| std | 1 | -| value_loss | 1.32e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 152 | -| time_elapsed | 715 | -| total_timesteps | 19456 | -| train/ | | -| approx_kl | 7.669441e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -121 | -| learning_rate | 0.0003 | -| loss | 3.88e-06 | -| n_updates | 1510 | -| policy_gradient_loss | 1.72e-05 | -| std | 1 | -| value_loss | 2.41e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 153 | -| time_elapsed | 718 | -| total_timesteps | 19584 | -| train/ | | -| approx_kl | 0.00015115831 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -61.9 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 1520 | -| policy_gradient_loss | -0.0011 | -| std | 1 | -| value_loss | 8.71e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 154 | -| time_elapsed | 721 | -| total_timesteps | 19712 | -| train/ | | -| approx_kl | 6.240327e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -371 | -| learning_rate | 0.0003 | -| loss | -0.000433 | -| n_updates | 1530 | -| policy_gradient_loss | 0.000331 | -| std | 0.999 | -| value_loss | 3.81e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 155 | -| time_elapsed | 726 | -| total_timesteps | 19840 | -| train/ | | -| approx_kl | 1.5312806e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -8.85 | -| learning_rate | 0.0003 | -| loss | 0.000338 | -| n_updates | 1540 | -| policy_gradient_loss | 0.00031 | -| std | 0.998 | -| value_loss | 1.74e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 27 | -| iterations | 156 | -| time_elapsed | 729 | -| total_timesteps | 19968 | -| train/ | | -| approx_kl | 6.7907386e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -66.9 | -| learning_rate | 0.0003 | -| loss | -0.000314 | -| n_updates | 1550 | -| policy_gradient_loss | -6.17e-05 | -| std | 0.998 | -| value_loss | 8.01e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 157 | -| time_elapsed | 732 | -| total_timesteps | 20096 | -| train/ | | -| approx_kl | 8.152053e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.0897 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 1560 | -| policy_gradient_loss | -0.000666 | -| std | 1 | -| value_loss | 3e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 158 | -| time_elapsed | 742 | -| total_timesteps | 20224 | -| train/ | | -| approx_kl | 5.8513135e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.000385 | -| n_updates | 1570 | -| policy_gradient_loss | -0.000534 | -| std | 1 | -| value_loss | 0.00131 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 159 | -| time_elapsed | 746 | -| total_timesteps | 20352 | -| train/ | | -| approx_kl | 5.190028e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 1580 | -| policy_gradient_loss | -0.000654 | -| std | 1 | -| value_loss | 4.88e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 160 | -| time_elapsed | 750 | -| total_timesteps | 20480 | -| train/ | | -| approx_kl | 2.1134969e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | -0.000475 | -| n_updates | 1590 | -| policy_gradient_loss | -0.000253 | -| std | 1 | -| value_loss | 1.15e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 161 | -| time_elapsed | 753 | -| total_timesteps | 20608 | -| train/ | | -| approx_kl | 7.881783e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | -5.92e-05 | -| n_updates | 1600 | -| policy_gradient_loss | -3.49e-05 | -| std | 0.999 | -| value_loss | 8.37e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 162 | -| time_elapsed | 757 | -| total_timesteps | 20736 | -| train/ | | -| approx_kl | 1.1641532e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 7.7e-06 | -| n_updates | 1610 | -| policy_gradient_loss | 1.97e-05 | -| std | 0.999 | -| value_loss | 4.33e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 163 | -| time_elapsed | 761 | -| total_timesteps | 20864 | -| train/ | | -| approx_kl | 3.9287843e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.00961 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 1620 | -| policy_gradient_loss | -0.000916 | -| std | 1 | -| value_loss | 8.65e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 27 | -| iterations | 164 | -| time_elapsed | 764 | -| total_timesteps | 20992 | -| train/ | | -| approx_kl | 4.9234834e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.00596 | -| learning_rate | 0.0003 | -| loss | -0.000282 | -| n_updates | 1630 | -| policy_gradient_loss | -0.000111 | -| std | 1.01 | -| value_loss | 1.15e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 165 | -| time_elapsed | 769 | -| total_timesteps | 21120 | -| train/ | | -| approx_kl | 1.3033394e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.000749 | -| n_updates | 1640 | -| policy_gradient_loss | -0.000265 | -| std | 1.01 | -| value_loss | 1.6e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 166 | -| time_elapsed | 780 | -| total_timesteps | 21248 | -| train/ | | -| approx_kl | 4.232861e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.605 | -| learning_rate | 0.0003 | -| loss | 0.000161 | -| n_updates | 1650 | -| policy_gradient_loss | 9.16e-05 | -| std | 1.01 | -| value_loss | 0.000988 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 167 | -| time_elapsed | 785 | -| total_timesteps | 21376 | -| train/ | | -| approx_kl | 2.2750814e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -295 | -| learning_rate | 0.0003 | -| loss | -0.000426 | -| n_updates | 1660 | -| policy_gradient_loss | -0.000213 | -| std | 1.01 | -| value_loss | 3.01e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 168 | -| time_elapsed | 790 | -| total_timesteps | 21504 | -| train/ | | -| approx_kl | 3.0759256e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -247 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 1670 | -| policy_gradient_loss | -0.000285 | -| std | 1 | -| value_loss | 4.11e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 169 | -| time_elapsed | 795 | -| total_timesteps | 21632 | -| train/ | | -| approx_kl | 7.691793e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | -0.000629 | -| n_updates | 1680 | -| policy_gradient_loss | -0.000149 | -| std | 1 | -| value_loss | 1.13e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 170 | -| time_elapsed | 800 | -| total_timesteps | 21760 | -| train/ | | -| approx_kl | 3.6400743e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -3.98 | -| learning_rate | 0.0003 | -| loss | 0.000127 | -| n_updates | 1690 | -| policy_gradient_loss | 0.000104 | -| std | 1 | -| value_loss | 9.86e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 27 | -| iterations | 171 | -| time_elapsed | 805 | -| total_timesteps | 21888 | -| train/ | | -| approx_kl | 1.9700266e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.00847 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 1700 | -| policy_gradient_loss | -0.000413 | -| std | 0.999 | -| value_loss | 9.57e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 172 | -| time_elapsed | 810 | -| total_timesteps | 22016 | -| train/ | | -| approx_kl | 4.9415976e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -3.6e-05 | -| n_updates | 1710 | -| policy_gradient_loss | 7.21e-05 | -| std | 0.997 | -| value_loss | 9.59e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 173 | -| time_elapsed | 819 | -| total_timesteps | 22144 | -| train/ | | -| approx_kl | 9.3271956e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | 0.000303 | -| n_updates | 1720 | -| policy_gradient_loss | 2.61e-05 | -| std | 0.996 | -| value_loss | 0.000762 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 174 | -| time_elapsed | 823 | -| total_timesteps | 22272 | -| train/ | | -| approx_kl | 1.3148878e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -388 | -| learning_rate | 0.0003 | -| loss | -0.000541 | -| n_updates | 1730 | -| policy_gradient_loss | -0.000253 | -| std | 0.997 | -| value_loss | 5.94e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 175 | -| time_elapsed | 828 | -| total_timesteps | 22400 | -| train/ | | -| approx_kl | 1.8524006e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -457 | -| learning_rate | 0.0003 | -| loss | 0.000105 | -| n_updates | 1740 | -| policy_gradient_loss | 8.47e-05 | -| std | 0.996 | -| value_loss | 9.51e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 176 | -| time_elapsed | 832 | -| total_timesteps | 22528 | -| train/ | | -| approx_kl | 1.7588027e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 1750 | -| policy_gradient_loss | -0.000519 | -| std | 0.997 | -| value_loss | 3.3e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 177 | -| time_elapsed | 836 | -| total_timesteps | 22656 | -| train/ | | -| approx_kl | 1.9766856e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -20.4 | -| learning_rate | 0.0003 | -| loss | 1.3e-05 | -| n_updates | 1760 | -| policy_gradient_loss | 4.15e-05 | -| std | 0.997 | -| value_loss | 1.24e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 178 | -| time_elapsed | 839 | -| total_timesteps | 22784 | -| train/ | | -| approx_kl | 2.8992072e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.497 | -| learning_rate | 0.0003 | -| loss | -0.000168 | -| n_updates | 1770 | -| policy_gradient_loss | -2.89e-05 | -| std | 0.999 | -| value_loss | 3.32e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 27 | -| iterations | 179 | -| time_elapsed | 844 | -| total_timesteps | 22912 | -| train/ | | -| approx_kl | 6.5012835e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 1780 | -| policy_gradient_loss | -0.000852 | -| std | 1 | -| value_loss | 1.67e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 180 | -| time_elapsed | 848 | -| total_timesteps | 23040 | -| train/ | | -| approx_kl | 7.532025e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.000715 | -| n_updates | 1790 | -| policy_gradient_loss | -0.000372 | -| std | 1 | -| value_loss | 6.34e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 181 | -| time_elapsed | 856 | -| total_timesteps | 23168 | -| train/ | | -| approx_kl | 0.00011726795 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.328 | -| learning_rate | 0.0003 | -| loss | 0.00109 | -| n_updates | 1800 | -| policy_gradient_loss | -0.000851 | -| std | 1.01 | -| value_loss | 0.00616 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 182 | -| time_elapsed | 861 | -| total_timesteps | 23296 | -| train/ | | -| approx_kl | 4.6792906e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.797 | -| learning_rate | 0.0003 | -| loss | 0.000258 | -| n_updates | 1810 | -| policy_gradient_loss | 0.00017 | -| std | 1.01 | -| value_loss | 0.000101 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 183 | -| time_elapsed | 865 | -| total_timesteps | 23424 | -| train/ | | -| approx_kl | 6.7850575e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 1820 | -| policy_gradient_loss | -0.000224 | -| std | 1.01 | -| value_loss | 3.63e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 184 | -| time_elapsed | 868 | -| total_timesteps | 23552 | -| train/ | | -| approx_kl | 0.00033481838 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 1830 | -| policy_gradient_loss | -0.000591 | -| std | 1.01 | -| value_loss | 1.45e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 185 | -| time_elapsed | 872 | -| total_timesteps | 23680 | -| train/ | | -| approx_kl | 0.0069561955 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -4.72e-05 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 1840 | -| policy_gradient_loss | -0.00556 | -| std | 1.01 | -| value_loss | 8.12e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 186 | -| time_elapsed | 874 | -| total_timesteps | 23808 | -| train/ | | -| approx_kl | 0.00046759844 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.00385 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 1850 | -| policy_gradient_loss | 0.000901 | -| std | 1.01 | -| value_loss | 6.36e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 27 | -| iterations | 187 | -| time_elapsed | 879 | -| total_timesteps | 23936 | -| train/ | | -| approx_kl | 0.0012384476 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.00525 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 1860 | -| policy_gradient_loss | 0.00119 | -| std | 1 | -| value_loss | 5.71e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 188 | -| time_elapsed | 884 | -| total_timesteps | 24064 | -| train/ | | -| approx_kl | 0.00038927468 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.00701 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 1870 | -| policy_gradient_loss | -0.00089 | -| std | 1 | -| value_loss | 5.28e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 189 | -| time_elapsed | 891 | -| total_timesteps | 24192 | -| train/ | | -| approx_kl | 0.00048638182 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.674 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 1880 | -| policy_gradient_loss | -0.00138 | -| std | 1.01 | -| value_loss | 0.00357 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 190 | -| time_elapsed | 896 | -| total_timesteps | 24320 | -| train/ | | -| approx_kl | 0.00015090406 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.000228 | -| n_updates | 1890 | -| policy_gradient_loss | -0.00012 | -| std | 1.01 | -| value_loss | 5.79e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 191 | -| time_elapsed | 900 | -| total_timesteps | 24448 | -| train/ | | -| approx_kl | 1.5123747e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.554 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 1900 | -| policy_gradient_loss | -0.000198 | -| std | 1.01 | -| value_loss | 6.49e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 192 | -| time_elapsed | 904 | -| total_timesteps | 24576 | -| train/ | | -| approx_kl | 1.2070406e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0042 | -| learning_rate | 0.0003 | -| loss | 0.000305 | -| n_updates | 1910 | -| policy_gradient_loss | 0.000234 | -| std | 1.01 | -| value_loss | 7.95e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 193 | -| time_elapsed | 905 | -| total_timesteps | 24704 | -| train/ | | -| approx_kl | 6.506266e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.000632 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 1920 | -| policy_gradient_loss | -0.0005 | -| std | 1.01 | -| value_loss | 7.69e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 194 | -| time_elapsed | 909 | -| total_timesteps | 24832 | -| train/ | | -| approx_kl | 0.00021674205 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 1930 | -| policy_gradient_loss | -0.00154 | -| std | 1.01 | -| value_loss | 5.75e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 27 | -| iterations | 195 | -| time_elapsed | 912 | -| total_timesteps | 24960 | -| train/ | | -| approx_kl | 3.2137614e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | 0.000446 | -| n_updates | 1940 | -| policy_gradient_loss | 0.000333 | -| std | 1.01 | -| value_loss | 3.38e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 196 | -| time_elapsed | 920 | -| total_timesteps | 25088 | -| train/ | | -| approx_kl | 2.8009526e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -2.82 | -| learning_rate | 0.0003 | -| loss | -0.000158 | -| n_updates | 1950 | -| policy_gradient_loss | -4.17e-05 | -| std | 1.01 | -| value_loss | 1.55e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 197 | -| time_elapsed | 929 | -| total_timesteps | 25216 | -| train/ | | -| approx_kl | 4.5318156e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.553 | -| learning_rate | 0.0003 | -| loss | 9.13e-05 | -| n_updates | 1960 | -| policy_gradient_loss | -0.00013 | -| std | 1.01 | -| value_loss | 0.00158 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 198 | -| time_elapsed | 934 | -| total_timesteps | 25344 | -| train/ | | -| approx_kl | 4.45405e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -399 | -| learning_rate | 0.0003 | -| loss | -8.2e-05 | -| n_updates | 1970 | -| policy_gradient_loss | -8.03e-06 | -| std | 1 | -| value_loss | 2.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 199 | -| time_elapsed | 938 | -| total_timesteps | 25472 | -| train/ | | -| approx_kl | 6.83791e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -534 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 1980 | -| policy_gradient_loss | -0.000859 | -| std | 1 | -| value_loss | 4.47e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 200 | -| time_elapsed | 943 | -| total_timesteps | 25600 | -| train/ | | -| approx_kl | 6.6850334e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -3.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.000164 | -| n_updates | 1990 | -| policy_gradient_loss | -7.78e-05 | -| std | 1.01 | -| value_loss | 3.48e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 201 | -| time_elapsed | 947 | -| total_timesteps | 25728 | -| train/ | | -| approx_kl | 1.1706725e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -138 | -| learning_rate | 0.0003 | -| loss | -3.42e-05 | -| n_updates | 2000 | -| policy_gradient_loss | -4.45e-06 | -| std | 1.01 | -| value_loss | 9.76e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 202 | -| time_elapsed | 951 | -| total_timesteps | 25856 | -| train/ | | -| approx_kl | 7.0810784e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -32 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 2010 | -| policy_gradient_loss | -0.000983 | -| std | 1 | -| value_loss | 5.62e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 203 | -| time_elapsed | 955 | -| total_timesteps | 25984 | -| train/ | | -| approx_kl | 3.9784238e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.485 | -| learning_rate | 0.0003 | -| loss | -6.21e-05 | -| n_updates | 2020 | -| policy_gradient_loss | -3.45e-05 | -| std | 1 | -| value_loss | 6.49e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 204 | -| time_elapsed | 958 | -| total_timesteps | 26112 | -| train/ | | -| approx_kl | 2.8107781e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.000929 | -| n_updates | 2030 | -| policy_gradient_loss | -0.000443 | -| std | 0.997 | -| value_loss | 3.95e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 205 | -| time_elapsed | 969 | -| total_timesteps | 26240 | -| train/ | | -| approx_kl | 1.546694e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.56 | -| learning_rate | 0.0003 | -| loss | 0.00363 | -| n_updates | 2040 | -| policy_gradient_loss | -8.22e-05 | -| std | 0.996 | -| value_loss | 0.00964 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 206 | -| time_elapsed | 972 | -| total_timesteps | 26368 | -| train/ | | -| approx_kl | 3.289245e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -289 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 2050 | -| policy_gradient_loss | -0.000591 | -| std | 0.993 | -| value_loss | 0.000221 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 207 | -| time_elapsed | 976 | -| total_timesteps | 26496 | -| train/ | | -| approx_kl | 2.6495196e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -195 | -| learning_rate | 0.0003 | -| loss | -0.000182 | -| n_updates | 2060 | -| policy_gradient_loss | -8.11e-05 | -| std | 0.993 | -| value_loss | 4.22e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 208 | -| time_elapsed | 979 | -| total_timesteps | 26624 | -| train/ | | -| approx_kl | 8.814968e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -21 | -| learning_rate | 0.0003 | -| loss | -7.92e-05 | -| n_updates | 2070 | -| policy_gradient_loss | 3.14e-05 | -| std | 0.992 | -| value_loss | 4.99e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 209 | -| time_elapsed | 983 | -| total_timesteps | 26752 | -| train/ | | -| approx_kl | 1.8447638e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.000406 | -| n_updates | 2080 | -| policy_gradient_loss | -0.000196 | -| std | 0.99 | -| value_loss | 9.1e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.806 | -| time/ | | -| fps | 27 | -| iterations | 210 | -| time_elapsed | 988 | -| total_timesteps | 26880 | -| train/ | | -| approx_kl | 2.3199245e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 8.17e-05 | -| n_updates | 2090 | -| policy_gradient_loss | 5.35e-05 | -| std | 0.989 | -| value_loss | 3.38e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 211 | -| time_elapsed | 992 | -| total_timesteps | 27008 | -| train/ | | -| approx_kl | 1.7697457e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 2100 | -| policy_gradient_loss | -0.000483 | -| std | 0.989 | -| value_loss | 2.37e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 212 | -| time_elapsed | 1004 | -| total_timesteps | 27136 | -| train/ | | -| approx_kl | 1.952611e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -8.9 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 2110 | -| policy_gradient_loss | -0.000167 | -| std | 0.99 | -| value_loss | 0.0048 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 213 | -| time_elapsed | 1009 | -| total_timesteps | 27264 | -| train/ | | -| approx_kl | 2.37301e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -322 | -| learning_rate | 0.0003 | -| loss | 0.000144 | -| n_updates | 2120 | -| policy_gradient_loss | 4.97e-05 | -| std | 0.991 | -| value_loss | 0.000125 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 214 | -| time_elapsed | 1013 | -| total_timesteps | 27392 | -| train/ | | -| approx_kl | 7.576309e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -219 | -| learning_rate | 0.0003 | -| loss | -4.61e-05 | -| n_updates | 2130 | -| policy_gradient_loss | -1.91e-05 | -| std | 0.992 | -| value_loss | 1.81e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 215 | -| time_elapsed | 1017 | -| total_timesteps | 27520 | -| train/ | | -| approx_kl | 3.8417056e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.000294 | -| n_updates | 2140 | -| policy_gradient_loss | -0.000105 | -| std | 0.994 | -| value_loss | 6.18e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 216 | -| time_elapsed | 1021 | -| total_timesteps | 27648 | -| train/ | | -| approx_kl | 7.737428e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.000418 | -| n_updates | 2150 | -| policy_gradient_loss | -0.000166 | -| std | 0.996 | -| value_loss | 2.06e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 217 | -| time_elapsed | 1024 | -| total_timesteps | 27776 | -| train/ | | -| approx_kl | 1.0333955e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.00667 | -| learning_rate | 0.0003 | -| loss | -0.000277 | -| n_updates | 2160 | -| policy_gradient_loss | -0.000143 | -| std | 0.999 | -| value_loss | 1.52e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 27 | -| iterations | 218 | -| time_elapsed | 1028 | -| total_timesteps | 27904 | -| train/ | | -| approx_kl | 5.954411e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.00805 | -| learning_rate | 0.0003 | -| loss | -0.000182 | -| n_updates | 2170 | -| policy_gradient_loss | -8.83e-05 | -| std | 1 | -| value_loss | 1.02e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 219 | -| time_elapsed | 1031 | -| total_timesteps | 28032 | -| train/ | | -| approx_kl | 2.877554e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.00966 | -| learning_rate | 0.0003 | -| loss | -0.000828 | -| n_updates | 2180 | -| policy_gradient_loss | -0.00037 | -| std | 1 | -| value_loss | 7.23e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 220 | -| time_elapsed | 1039 | -| total_timesteps | 28160 | -| train/ | | -| approx_kl | 1.312606e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.668 | -| learning_rate | 0.0003 | -| loss | 0.00207 | -| n_updates | 2190 | -| policy_gradient_loss | 6.94e-05 | -| std | 1 | -| value_loss | 0.00464 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 221 | -| time_elapsed | 1043 | -| total_timesteps | 28288 | -| train/ | | -| approx_kl | 1.414679e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -414 | -| learning_rate | 0.0003 | -| loss | -6.72e-06 | -| n_updates | 2200 | -| policy_gradient_loss | -8.58e-06 | -| std | 1 | -| value_loss | 4.76e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 222 | -| time_elapsed | 1048 | -| total_timesteps | 28416 | -| train/ | | -| approx_kl | 7.412629e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -202 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 2210 | -| policy_gradient_loss | -0.000792 | -| std | 1 | -| value_loss | 1.48e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 223 | -| time_elapsed | 1053 | -| total_timesteps | 28544 | -| train/ | | -| approx_kl | 0.00012322841 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.000963 | -| n_updates | 2220 | -| policy_gradient_loss | -0.00047 | -| std | 0.997 | -| value_loss | 1.02e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 224 | -| time_elapsed | 1057 | -| total_timesteps | 28672 | -| train/ | | -| approx_kl | 2.0746142e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | -0.000359 | -| n_updates | 2230 | -| policy_gradient_loss | -0.00018 | -| std | 0.993 | -| value_loss | 6e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 225 | -| time_elapsed | 1062 | -| total_timesteps | 28800 | -| train/ | | -| approx_kl | 9.254087e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0966 | -| learning_rate | 0.0003 | -| loss | -0.000228 | -| n_updates | 2240 | -| policy_gradient_loss | -0.000101 | -| std | 0.991 | -| value_loss | 8.47e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 27 | -| iterations | 226 | -| time_elapsed | 1065 | -| total_timesteps | 28928 | -| train/ | | -| approx_kl | 8.230098e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | -0.000289 | -| n_updates | 2250 | -| policy_gradient_loss | -6.27e-05 | -| std | 0.99 | -| value_loss | 6.39e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 227 | -| time_elapsed | 1070 | -| total_timesteps | 29056 | -| train/ | | -| approx_kl | 7.098727e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0937 | -| learning_rate | 0.0003 | -| loss | -0.000318 | -| n_updates | 2260 | -| policy_gradient_loss | -0.000152 | -| std | 0.989 | -| value_loss | 3.13e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 228 | -| time_elapsed | 1078 | -| total_timesteps | 29184 | -| train/ | | -| approx_kl | 9.846687e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -9.02 | -| learning_rate | 0.0003 | -| loss | 0.000566 | -| n_updates | 2270 | -| policy_gradient_loss | -0.000261 | -| std | 0.99 | -| value_loss | 0.0031 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 229 | -| time_elapsed | 1083 | -| total_timesteps | 29312 | -| train/ | | -| approx_kl | 0.000109059736 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -460 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 2280 | -| policy_gradient_loss | -0.00052 | -| std | 0.99 | -| value_loss | 4.42e-05 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 230 | -| time_elapsed | 1086 | -| total_timesteps | 29440 | -| train/ | | -| approx_kl | 0.00013327785 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -652 | -| learning_rate | 0.0003 | -| loss | 4.66e-05 | -| n_updates | 2290 | -| policy_gradient_loss | 4.74e-05 | -| std | 0.989 | -| value_loss | 8.52e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 231 | -| time_elapsed | 1089 | -| total_timesteps | 29568 | -| train/ | | -| approx_kl | 4.07123e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -578 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 2300 | -| policy_gradient_loss | -0.000462 | -| std | 0.99 | -| value_loss | 9.67e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 232 | -| time_elapsed | 1093 | -| total_timesteps | 29696 | -| train/ | | -| approx_kl | 8.306606e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -16.4 | -| learning_rate | 0.0003 | -| loss | 2.89e-05 | -| n_updates | 2310 | -| policy_gradient_loss | 0.000138 | -| std | 0.99 | -| value_loss | 3.09e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 233 | -| time_elapsed | 1098 | -| total_timesteps | 29824 | -| train/ | | -| approx_kl | 0.00032600528 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -8.25 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 2320 | -| policy_gradient_loss | -0.00299 | -| std | 0.985 | -| value_loss | 9.29e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 27 | -| iterations | 234 | -| time_elapsed | 1103 | -| total_timesteps | 29952 | -| train/ | | -| approx_kl | 0.00027817255 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.589 | -| learning_rate | 0.0003 | -| loss | -0.000983 | -| n_updates | 2330 | -| policy_gradient_loss | -0.000538 | -| std | 0.983 | -| value_loss | 2.28e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 27 | -| iterations | 235 | -| time_elapsed | 1107 | -| total_timesteps | 30080 | -| train/ | | -| approx_kl | 8.454546e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.000294 | -| n_updates | 2340 | -| policy_gradient_loss | 0.00023 | -| std | 0.982 | -| value_loss | 1.41e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 27 | -| iterations | 236 | -| time_elapsed | 1116 | -| total_timesteps | 30208 | -| train/ | | -| approx_kl | 3.1727366e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.399 | -| learning_rate | 0.0003 | -| loss | 0.00743 | -| n_updates | 2350 | -| policy_gradient_loss | -0.000432 | -| std | 0.981 | -| value_loss | 0.0195 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 26 | -| iterations | 237 | -| time_elapsed | 1124 | -| total_timesteps | 30336 | -| train/ | | -| approx_kl | 1.0705553e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -69.2 | -| learning_rate | 0.0003 | -| loss | 0.000453 | -| n_updates | 2360 | -| policy_gradient_loss | 0.000204 | -| std | 0.981 | -| value_loss | 0.000515 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 26 | -| iterations | 238 | -| time_elapsed | 1132 | -| total_timesteps | 30464 | -| train/ | | -| approx_kl | 6.7194924e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -215 | -| learning_rate | 0.0003 | -| loss | 2.81e-05 | -| n_updates | 2370 | -| policy_gradient_loss | 2.8e-05 | -| std | 0.981 | -| value_loss | 0.00027 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 26 | -| iterations | 239 | -| time_elapsed | 1141 | -| total_timesteps | 30592 | -| train/ | | -| approx_kl | 2.1964777e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.000554 | -| n_updates | 2380 | -| policy_gradient_loss | -0.000226 | -| std | 0.981 | -| value_loss | 9.93e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 26 | -| iterations | 240 | -| time_elapsed | 1152 | -| total_timesteps | 30720 | -| train/ | | -| approx_kl | 1.2817327e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.000129 | -| n_updates | 2390 | -| policy_gradient_loss | -3.78e-05 | -| std | 0.979 | -| value_loss | 3.66e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 26 | -| iterations | 241 | -| time_elapsed | 1161 | -| total_timesteps | 30848 | -| train/ | | -| approx_kl | 2.9948074e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.00765 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 2400 | -| policy_gradient_loss | -0.000509 | -| std | 0.976 | -| value_loss | 1.12e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 26 | -| iterations | 242 | -| time_elapsed | 1169 | -| total_timesteps | 30976 | -| train/ | | -| approx_kl | 0.00081540504 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | -0.0093 | -| n_updates | 2410 | -| policy_gradient_loss | -0.00373 | -| std | 0.975 | -| value_loss | 4e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 26 | -| iterations | 243 | -| time_elapsed | 1174 | -| total_timesteps | 31104 | -| train/ | | -| approx_kl | 0.0058117453 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.00443 | -| learning_rate | 0.0003 | -| loss | -0.00882 | -| n_updates | 2420 | -| policy_gradient_loss | -0.00407 | -| std | 0.975 | -| value_loss | 4.08e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 26 | -| iterations | 244 | -| time_elapsed | 1196 | -| total_timesteps | 31232 | -| train/ | | -| approx_kl | 0.024499005 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.735 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 2430 | -| policy_gradient_loss | -0.00567 | -| std | 0.974 | -| value_loss | 0.00412 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 26 | -| iterations | 245 | -| time_elapsed | 1205 | -| total_timesteps | 31360 | -| train/ | | -| approx_kl | 0.0012726244 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | 0.000973 | -| n_updates | 2440 | -| policy_gradient_loss | 0.000785 | -| std | 0.974 | -| value_loss | 0.000122 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 25 | -| iterations | 246 | -| time_elapsed | 1214 | -| total_timesteps | 31488 | -| train/ | | -| approx_kl | 0.026607504 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -119 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 2450 | -| policy_gradient_loss | -0.00726 | -| std | 0.975 | -| value_loss | 2.16e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 25 | -| iterations | 247 | -| time_elapsed | 1225 | -| total_timesteps | 31616 | -| train/ | | -| approx_kl | 2.8877985e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -282 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 2460 | -| policy_gradient_loss | 0.000493 | -| std | 0.977 | -| value_loss | 8.52e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 25 | -| iterations | 248 | -| time_elapsed | 1233 | -| total_timesteps | 31744 | -| train/ | | -| approx_kl | 0.0005604159 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -56.2 | -| learning_rate | 0.0003 | -| loss | 0.00089 | -| n_updates | 2470 | -| policy_gradient_loss | 0.000631 | -| std | 0.977 | -| value_loss | 3.97e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 25 | -| iterations | 249 | -| time_elapsed | 1239 | -| total_timesteps | 31872 | -| train/ | | -| approx_kl | 0.0007869792 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -33.6 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 2480 | -| policy_gradient_loss | -0.000737 | -| std | 0.977 | -| value_loss | 2.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 250 | -| time_elapsed | 1246 | -| total_timesteps | 32000 | -| train/ | | -| approx_kl | 0.004332003 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -4.31 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 2490 | -| policy_gradient_loss | -0.00344 | -| std | 0.977 | -| value_loss | 1.51e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 251 | -| time_elapsed | 1253 | -| total_timesteps | 32128 | -| train/ | | -| approx_kl | 0.0013022888 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | -0.000641 | -| n_updates | 2500 | -| policy_gradient_loss | -0.000363 | -| std | 0.977 | -| value_loss | 9.82e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 252 | -| time_elapsed | 1276 | -| total_timesteps | 32256 | -| train/ | | -| approx_kl | 9.677233e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 2510 | -| policy_gradient_loss | -1.12e-05 | -| std | 0.976 | -| value_loss | 0.00334 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 253 | -| time_elapsed | 1286 | -| total_timesteps | 32384 | -| train/ | | -| approx_kl | 7.450348e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -148 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 2520 | -| policy_gradient_loss | -0.000209 | -| std | 0.976 | -| value_loss | 0.000191 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 254 | -| time_elapsed | 1294 | -| total_timesteps | 32512 | -| train/ | | -| approx_kl | 5.5134296e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -257 | -| learning_rate | 0.0003 | -| loss | -7.19e-05 | -| n_updates | 2530 | -| policy_gradient_loss | 6.64e-05 | -| std | 0.976 | -| value_loss | 8.29e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 255 | -| time_elapsed | 1299 | -| total_timesteps | 32640 | -| train/ | | -| approx_kl | 5.637575e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -53.9 | -| learning_rate | 0.0003 | -| loss | -0.000809 | -| n_updates | 2540 | -| policy_gradient_loss | -0.000246 | -| std | 0.975 | -| value_loss | 5.57e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 256 | -| time_elapsed | 1308 | -| total_timesteps | 32768 | -| train/ | | -| approx_kl | 0.00045676576 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 2550 | -| policy_gradient_loss | -0.00134 | -| std | 0.973 | -| value_loss | 4.25e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 25 | -| iterations | 257 | -| time_elapsed | 1314 | -| total_timesteps | 32896 | -| train/ | | -| approx_kl | 0.00033646822 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -3.83 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 2560 | -| policy_gradient_loss | -0.000745 | -| std | 0.972 | -| value_loss | 4.45e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 258 | -| time_elapsed | 1325 | -| total_timesteps | 33024 | -| train/ | | -| approx_kl | 0.0002092882 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -85.7 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 2570 | -| policy_gradient_loss | -0.000563 | -| std | 0.973 | -| value_loss | 8.02e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 259 | -| time_elapsed | 1343 | -| total_timesteps | 33152 | -| train/ | | -| approx_kl | 4.705973e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -4.86 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 2580 | -| policy_gradient_loss | 2.16e-05 | -| std | 0.975 | -| value_loss | 0.0092 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 260 | -| time_elapsed | 1354 | -| total_timesteps | 33280 | -| train/ | | -| approx_kl | 6.1155297e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -217 | -| learning_rate | 0.0003 | -| loss | -0.000172 | -| n_updates | 2590 | -| policy_gradient_loss | -5.48e-05 | -| std | 0.976 | -| value_loss | 0.000437 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 261 | -| time_elapsed | 1364 | -| total_timesteps | 33408 | -| train/ | | -| approx_kl | 7.336913e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -319 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 2600 | -| policy_gradient_loss | -0.00027 | -| std | 0.976 | -| value_loss | 2.75e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 262 | -| time_elapsed | 1374 | -| total_timesteps | 33536 | -| train/ | | -| approx_kl | 5.847914e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | 0.000102 | -| n_updates | 2610 | -| policy_gradient_loss | 0.000102 | -| std | 0.974 | -| value_loss | 1.58e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 263 | -| time_elapsed | 1382 | -| total_timesteps | 33664 | -| train/ | | -| approx_kl | 3.0898023e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.000403 | -| n_updates | 2620 | -| policy_gradient_loss | -0.000145 | -| std | 0.973 | -| value_loss | 7.06e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 264 | -| time_elapsed | 1390 | -| total_timesteps | 33792 | -| train/ | | -| approx_kl | 9.4281975e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 2630 | -| policy_gradient_loss | -0.000491 | -| std | 0.975 | -| value_loss | 1.4e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 24 | -| iterations | 265 | -| time_elapsed | 1399 | -| total_timesteps | 33920 | -| train/ | | -| approx_kl | 0.00038398942 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 2640 | -| policy_gradient_loss | -0.00128 | -| std | 0.977 | -| value_loss | 6.43e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 24 | -| iterations | 266 | -| time_elapsed | 1405 | -| total_timesteps | 34048 | -| train/ | | -| approx_kl | 0.00033268332 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.000259 | -| n_updates | 2650 | -| policy_gradient_loss | -0.000105 | -| std | 0.976 | -| value_loss | 1.12e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 24 | -| iterations | 267 | -| time_elapsed | 1421 | -| total_timesteps | 34176 | -| train/ | | -| approx_kl | 0.00013541104 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.888 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 2660 | -| policy_gradient_loss | -0.00153 | -| std | 0.972 | -| value_loss | 0.00145 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 268 | -| time_elapsed | 1429 | -| total_timesteps | 34304 | -| train/ | | -| approx_kl | 0.000510524 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -71 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 2670 | -| policy_gradient_loss | -0.00114 | -| std | 0.967 | -| value_loss | 6.6e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 269 | -| time_elapsed | 1440 | -| total_timesteps | 34432 | -| train/ | | -| approx_kl | 0.00027049333 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -85.4 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 2680 | -| policy_gradient_loss | -0.000824 | -| std | 0.964 | -| value_loss | 2.44e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 270 | -| time_elapsed | 1448 | -| total_timesteps | 34560 | -| train/ | | -| approx_kl | 8.017896e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | -0.000958 | -| n_updates | 2690 | -| policy_gradient_loss | -0.000491 | -| std | 0.961 | -| value_loss | 2e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 271 | -| time_elapsed | 1454 | -| total_timesteps | 34688 | -| train/ | | -| approx_kl | 5.4575503e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.642 | -| learning_rate | 0.0003 | -| loss | 5.86e-05 | -| n_updates | 2700 | -| policy_gradient_loss | 0.000156 | -| std | 0.96 | -| value_loss | 4.11e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 272 | -| time_elapsed | 1458 | -| total_timesteps | 34816 | -| train/ | | -| approx_kl | 3.0240044e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | 6.04e-05 | -| n_updates | 2710 | -| policy_gradient_loss | 5.41e-05 | -| std | 0.96 | -| value_loss | 1.79e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 273 | -| time_elapsed | 1462 | -| total_timesteps | 34944 | -| train/ | | -| approx_kl | 0.00013529463 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 2720 | -| policy_gradient_loss | -0.00126 | -| std | 0.959 | -| value_loss | 9.06e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 274 | -| time_elapsed | 1466 | -| total_timesteps | 35072 | -| train/ | | -| approx_kl | 0.00016384851 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.000403 | -| n_updates | 2730 | -| policy_gradient_loss | -0.000188 | -| std | 0.959 | -| value_loss | 4.63e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 275 | -| time_elapsed | 1473 | -| total_timesteps | 35200 | -| train/ | | -| approx_kl | 3.8580038e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.583 | -| learning_rate | 0.0003 | -| loss | 0.0038 | -| n_updates | 2740 | -| policy_gradient_loss | 2.36e-05 | -| std | 0.96 | -| value_loss | 0.00843 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 276 | -| time_elapsed | 1478 | -| total_timesteps | 35328 | -| train/ | | -| approx_kl | 1.3969839e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -34.4 | -| learning_rate | 0.0003 | -| loss | 1.63e-05 | -| n_updates | 2750 | -| policy_gradient_loss | 6.39e-06 | -| std | 0.96 | -| value_loss | 4.86e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 277 | -| time_elapsed | 1483 | -| total_timesteps | 35456 | -| train/ | | -| approx_kl | 0.00010472117 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -98.8 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 2760 | -| policy_gradient_loss | -0.000749 | -| std | 0.96 | -| value_loss | 2.24e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 278 | -| time_elapsed | 1488 | -| total_timesteps | 35584 | -| train/ | | -| approx_kl | 5.5448152e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -1.88 | -| learning_rate | 0.0003 | -| loss | 7.21e-05 | -| n_updates | 2770 | -| policy_gradient_loss | 4.55e-05 | -| std | 0.96 | -| value_loss | 2.73e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 279 | -| time_elapsed | 1493 | -| total_timesteps | 35712 | -| train/ | | -| approx_kl | 7.2335824e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -5.66e-05 | -| n_updates | 2780 | -| policy_gradient_loss | -2.77e-05 | -| std | 0.959 | -| value_loss | 5.06e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 280 | -| time_elapsed | 1497 | -| total_timesteps | 35840 | -| train/ | | -| approx_kl | 8.8335946e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.00467 | -| learning_rate | 0.0003 | -| loss | -4.03e-05 | -| n_updates | 2790 | -| policy_gradient_loss | -1.48e-06 | -| std | 0.959 | -| value_loss | 3.33e-07 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 281 | -| time_elapsed | 1502 | -| total_timesteps | 35968 | -| train/ | | -| approx_kl | 0.000103960745 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 2800 | -| policy_gradient_loss | -0.000834 | -| std | 0.958 | -| value_loss | 1.92e-07 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 282 | -| time_elapsed | 1506 | -| total_timesteps | 36096 | -| train/ | | -| approx_kl | 6.8512745e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.00659 | -| learning_rate | 0.0003 | -| loss | 0.000193 | -| n_updates | 2810 | -| policy_gradient_loss | 0.000114 | -| std | 0.957 | -| value_loss | 1.43e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 283 | -| time_elapsed | 1514 | -| total_timesteps | 36224 | -| train/ | | -| approx_kl | 6.659888e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.523 | -| learning_rate | 0.0003 | -| loss | 0.00717 | -| n_updates | 2820 | -| policy_gradient_loss | -0.000457 | -| std | 0.956 | -| value_loss | 0.0205 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 284 | -| time_elapsed | 1518 | -| total_timesteps | 36352 | -| train/ | | -| approx_kl | 4.8175454e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -174 | -| learning_rate | 0.0003 | -| loss | 0.000418 | -| n_updates | 2830 | -| policy_gradient_loss | -4.88e-06 | -| std | 0.956 | -| value_loss | 0.000725 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 285 | -| time_elapsed | 1521 | -| total_timesteps | 36480 | -| train/ | | -| approx_kl | 0.00037551904 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -127 | -| learning_rate | 0.0003 | -| loss | -0.00611 | -| n_updates | 2840 | -| policy_gradient_loss | -0.00235 | -| std | 0.955 | -| value_loss | 0.000223 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 286 | -| time_elapsed | 1527 | -| total_timesteps | 36608 | -| train/ | | -| approx_kl | 8.1382226e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -95.1 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 2850 | -| policy_gradient_loss | 0.000898 | -| std | 0.953 | -| value_loss | 2.81e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 287 | -| time_elapsed | 1531 | -| total_timesteps | 36736 | -| train/ | | -| approx_kl | 3.2484531e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -25.1 | -| learning_rate | 0.0003 | -| loss | -0.000227 | -| n_updates | 2860 | -| policy_gradient_loss | -7.33e-05 | -| std | 0.952 | -| value_loss | 5.53e-07 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 24 | -| iterations | 288 | -| time_elapsed | 1534 | -| total_timesteps | 36864 | -| train/ | | -| approx_kl | 1.46133825e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -26.1 | -| learning_rate | 0.0003 | -| loss | -0.000592 | -| n_updates | 2870 | -| policy_gradient_loss | -0.000129 | -| std | 0.952 | -| value_loss | 6.33e-07 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 24 | -| iterations | 289 | -| time_elapsed | 1537 | -| total_timesteps | 36992 | -| train/ | | -| approx_kl | 5.5134296e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.711 | -| learning_rate | 0.0003 | -| loss | 1.16e-05 | -| n_updates | 2880 | -| policy_gradient_loss | 0.000133 | -| std | 0.953 | -| value_loss | 1.52e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 24 | -| iterations | 290 | -| time_elapsed | 1541 | -| total_timesteps | 37120 | -| train/ | | -| approx_kl | 1.9127969e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.79 | -| learning_rate | 0.0003 | -| loss | -0.000169 | -| n_updates | 2890 | -| policy_gradient_loss | -6.63e-05 | -| std | 0.955 | -| value_loss | 1e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 24 | -| iterations | 291 | -| time_elapsed | 1551 | -| total_timesteps | 37248 | -| train/ | | -| approx_kl | 2.7720816e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 2900 | -| policy_gradient_loss | -3.68e-05 | -| std | 0.954 | -| value_loss | 0.00595 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 24 | -| iterations | 292 | -| time_elapsed | 1555 | -| total_timesteps | 37376 | -| train/ | | -| approx_kl | 1.7898623e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -64.6 | -| learning_rate | 0.0003 | -| loss | -0.000789 | -| n_updates | 2910 | -| policy_gradient_loss | -0.000385 | -| std | 0.951 | -| value_loss | 0.00011 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 24 | -| iterations | 293 | -| time_elapsed | 1560 | -| total_timesteps | 37504 | -| train/ | | -| approx_kl | 3.6688056e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -13.3 | -| learning_rate | 0.0003 | -| loss | -0.000776 | -| n_updates | 2920 | -| policy_gradient_loss | -0.000366 | -| std | 0.949 | -| value_loss | 2.28e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 24 | -| iterations | 294 | -| time_elapsed | 1564 | -| total_timesteps | 37632 | -| train/ | | -| approx_kl | 3.589131e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -30.9 | -| learning_rate | 0.0003 | -| loss | -0.000544 | -| n_updates | 2930 | -| policy_gradient_loss | -0.000274 | -| std | 0.948 | -| value_loss | 2.06e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 24 | -| iterations | 295 | -| time_elapsed | 1567 | -| total_timesteps | 37760 | -| train/ | | -| approx_kl | 9.936281e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -4.29 | -| learning_rate | 0.0003 | -| loss | 4.82e-05 | -| n_updates | 2940 | -| policy_gradient_loss | 3.53e-05 | -| std | 0.949 | -| value_loss | 3.75e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 296 | -| time_elapsed | 1592 | -| total_timesteps | 37888 | -| train/ | | -| approx_kl | 1.7541461e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.721 | -| learning_rate | 0.0003 | -| loss | -9.5e-05 | -| n_updates | 2950 | -| policy_gradient_loss | -3.01e-05 | -| std | 0.949 | -| value_loss | 6.57e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 297 | -| time_elapsed | 1633 | -| total_timesteps | 38016 | -| train/ | | -| approx_kl | 1.648441e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.948 | -| learning_rate | 0.0003 | -| loss | -3.38e-05 | -| n_updates | 2960 | -| policy_gradient_loss | 1.16e-05 | -| std | 0.949 | -| value_loss | 1.02e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 22 | -| iterations | 298 | -| time_elapsed | 1714 | -| total_timesteps | 38144 | -| train/ | | -| approx_kl | 2.2848137e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.387 | -| learning_rate | 0.0003 | -| loss | 0.00068 | -| n_updates | 2970 | -| policy_gradient_loss | -0.000241 | -| std | 0.949 | -| value_loss | 0.00461 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 299 | -| time_elapsed | 1746 | -| total_timesteps | 38272 | -| train/ | | -| approx_kl | 1.0609161e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -127 | -| learning_rate | 0.0003 | -| loss | 0.000164 | -| n_updates | 2980 | -| policy_gradient_loss | 3.17e-05 | -| std | 0.949 | -| value_loss | 0.000285 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 300 | -| time_elapsed | 1797 | -| total_timesteps | 38400 | -| train/ | | -| approx_kl | 4.132092e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -67 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 2990 | -| policy_gradient_loss | -0.000513 | -| std | 0.95 | -| value_loss | 9.99e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 301 | -| time_elapsed | 1831 | -| total_timesteps | 38528 | -| train/ | | -| approx_kl | 5.634036e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -3.39e-06 | -| n_updates | 3000 | -| policy_gradient_loss | 0.000188 | -| std | 0.948 | -| value_loss | 2.29e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 20 | -| iterations | 302 | -| time_elapsed | 1848 | -| total_timesteps | 38656 | -| train/ | | -| approx_kl | 1.2754463e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.949 | -| learning_rate | 0.0003 | -| loss | 9.5e-05 | -| n_updates | 3010 | -| policy_gradient_loss | 9.34e-05 | -| std | 0.947 | -| value_loss | 5.85e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 20 | -| iterations | 303 | -| time_elapsed | 1872 | -| total_timesteps | 38784 | -| train/ | | -| approx_kl | 8.9327805e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0807 | -| learning_rate | 0.0003 | -| loss | -0.000877 | -| n_updates | 3020 | -| policy_gradient_loss | -0.000336 | -| std | 0.95 | -| value_loss | 4.63e-07 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 20 | -| iterations | 304 | -| time_elapsed | 1907 | -| total_timesteps | 38912 | -| train/ | | -| approx_kl | 1.09467655e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.000411 | -| n_updates | 3030 | -| policy_gradient_loss | -0.000212 | -| std | 0.954 | -| value_loss | 3.84e-07 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 20 | -| iterations | 305 | -| time_elapsed | 1942 | -| total_timesteps | 39040 | -| train/ | | -| approx_kl | 1.9250438e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.00963 | -| learning_rate | 0.0003 | -| loss | 1.85e-05 | -| n_updates | 3040 | -| policy_gradient_loss | 2.87e-05 | -| std | 0.955 | -| value_loss | 3.27e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 19 | -| iterations | 306 | -| time_elapsed | 2005 | -| total_timesteps | 39168 | -| train/ | | -| approx_kl | 7.3420815e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 3050 | -| policy_gradient_loss | -0.000138 | -| std | 0.957 | -| value_loss | 0.00333 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 19 | -| iterations | 307 | -| time_elapsed | 2029 | -| total_timesteps | 39296 | -| train/ | | -| approx_kl | 5.640881e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -153 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 3060 | -| policy_gradient_loss | -0.000795 | -| std | 0.959 | -| value_loss | 4.8e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 19 | -| iterations | 308 | -| time_elapsed | 2065 | -| total_timesteps | 39424 | -| train/ | | -| approx_kl | 2.7073082e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -131 | -| learning_rate | 0.0003 | -| loss | 0.000322 | -| n_updates | 3070 | -| policy_gradient_loss | 0.000201 | -| std | 0.96 | -| value_loss | 1.01e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 18 | -| iterations | 309 | -| time_elapsed | 2096 | -| total_timesteps | 39552 | -| train/ | | -| approx_kl | 1.1078082e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -14.4 | -| learning_rate | 0.0003 | -| loss | -0.00012 | -| n_updates | 3080 | -| policy_gradient_loss | -4.62e-05 | -| std | 0.959 | -| value_loss | 1.1e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 18 | -| iterations | 310 | -| time_elapsed | 2126 | -| total_timesteps | 39680 | -| train/ | | -| approx_kl | 3.2277312e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.514 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 3090 | -| policy_gradient_loss | -0.000531 | -| std | 0.958 | -| value_loss | 3.33e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 18 | -| iterations | 311 | -| time_elapsed | 2163 | -| total_timesteps | 39808 | -| train/ | | -| approx_kl | 4.0514395e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0099 | -| learning_rate | 0.0003 | -| loss | -0.000404 | -| n_updates | 3100 | -| policy_gradient_loss | -0.000214 | -| std | 0.956 | -| value_loss | 1.86e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 18 | -| iterations | 312 | -| time_elapsed | 2198 | -| total_timesteps | 39936 | -| train/ | | -| approx_kl | 2.4164096e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.00396 | -| learning_rate | 0.0003 | -| loss | -0.000587 | -| n_updates | 3110 | -| policy_gradient_loss | -0.000263 | -| std | 0.957 | -| value_loss | 5.63e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 17 | -| iterations | 313 | -| time_elapsed | 2241 | -| total_timesteps | 40064 | -| train/ | | -| approx_kl | 2.2025313e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | -0.000618 | -| n_updates | 3120 | -| policy_gradient_loss | -0.000299 | -| std | 0.96 | -| value_loss | 3.63e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 17 | -| iterations | 314 | -| time_elapsed | 2308 | -| total_timesteps | 40192 | -| train/ | | -| approx_kl | 4.620757e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.612 | -| learning_rate | 0.0003 | -| loss | -0.000631 | -| n_updates | 3130 | -| policy_gradient_loss | -0.00064 | -| std | 0.961 | -| value_loss | 0.00184 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 17 | -| iterations | 315 | -| time_elapsed | 2330 | -| total_timesteps | 40320 | -| train/ | | -| approx_kl | 1.7064158e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -184 | -| learning_rate | 0.0003 | -| loss | -5.81e-05 | -| n_updates | 3140 | -| policy_gradient_loss | -3.45e-05 | -| std | 0.962 | -| value_loss | 6.93e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 17 | -| iterations | 316 | -| time_elapsed | 2355 | -| total_timesteps | 40448 | -| train/ | | -| approx_kl | 6.596092e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -261 | -| learning_rate | 0.0003 | -| loss | -0.000713 | -| n_updates | 3150 | -| policy_gradient_loss | -0.000217 | -| std | 0.963 | -| value_loss | 2.05e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 17 | -| iterations | 317 | -| time_elapsed | 2378 | -| total_timesteps | 40576 | -| train/ | | -| approx_kl | 1.049228e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -193 | -| learning_rate | 0.0003 | -| loss | 0.000122 | -| n_updates | 3160 | -| policy_gradient_loss | 9.84e-05 | -| std | 0.963 | -| value_loss | 7.17e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 318 | -| time_elapsed | 2412 | -| total_timesteps | 40704 | -| train/ | | -| approx_kl | 1.191441e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.000597 | -| n_updates | 3170 | -| policy_gradient_loss | -0.000216 | -| std | 0.963 | -| value_loss | 7.2e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 319 | -| time_elapsed | 2446 | -| total_timesteps | 40832 | -| train/ | | -| approx_kl | 3.9557926e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.463 | -| learning_rate | 0.0003 | -| loss | -2.13e-05 | -| n_updates | 3180 | -| policy_gradient_loss | 1.96e-05 | -| std | 0.964 | -| value_loss | 2.31e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 320 | -| time_elapsed | 2478 | -| total_timesteps | 40960 | -| train/ | | -| approx_kl | 1.2437813e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -2.13e-05 | -| n_updates | 3190 | -| policy_gradient_loss | -4.54e-06 | -| std | 0.965 | -| value_loss | 1.08e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 16 | -| iterations | 321 | -| time_elapsed | 2508 | -| total_timesteps | 41088 | -| train/ | | -| approx_kl | 1.409091e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -7.15e-05 | -| n_updates | 3200 | -| policy_gradient_loss | -2.75e-05 | -| std | 0.965 | -| value_loss | 6.35e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 16 | -| iterations | 322 | -| time_elapsed | 2571 | -| total_timesteps | 41216 | -| train/ | | -| approx_kl | 3.981404e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.313 | -| learning_rate | 0.0003 | -| loss | 0.000242 | -| n_updates | 3210 | -| policy_gradient_loss | -8.84e-06 | -| std | 0.965 | -| value_loss | 0.000729 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 15 | -| iterations | 323 | -| time_elapsed | 2594 | -| total_timesteps | 41344 | -| train/ | | -| approx_kl | 8.7730587e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -41.6 | -| learning_rate | 0.0003 | -| loss | -1.1e-05 | -| n_updates | 3220 | -| policy_gradient_loss | 9.44e-06 | -| std | 0.965 | -| value_loss | 3.28e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 15 | -| iterations | 324 | -| time_elapsed | 2618 | -| total_timesteps | 41472 | -| train/ | | -| approx_kl | 1.5124679e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -41.3 | -| learning_rate | 0.0003 | -| loss | -0.00011 | -| n_updates | 3230 | -| policy_gradient_loss | -5.24e-05 | -| std | 0.964 | -| value_loss | 1.26e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 15 | -| iterations | 325 | -| time_elapsed | 2651 | -| total_timesteps | 41600 | -| train/ | | -| approx_kl | 5.1436946e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -6.7 | -| learning_rate | 0.0003 | -| loss | -0.000272 | -| n_updates | 3240 | -| policy_gradient_loss | -0.000115 | -| std | 0.963 | -| value_loss | 1.85e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 15 | -| iterations | 326 | -| time_elapsed | 2678 | -| total_timesteps | 41728 | -| train/ | | -| approx_kl | 2.4954788e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 3250 | -| policy_gradient_loss | -0.000416 | -| std | 0.963 | -| value_loss | 5.28e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 15 | -| iterations | 327 | -| time_elapsed | 2703 | -| total_timesteps | 41856 | -| train/ | | -| approx_kl | 5.6716148e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 3260 | -| policy_gradient_loss | -0.000812 | -| std | 0.964 | -| value_loss | 2.25e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 15 | -| iterations | 328 | -| time_elapsed | 2729 | -| total_timesteps | 41984 | -| train/ | | -| approx_kl | 2.1902379e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | -5.65e-05 | -| n_updates | 3270 | -| policy_gradient_loss | 1.88e-05 | -| std | 0.967 | -| value_loss | 1.1e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 15 | -| iterations | 329 | -| time_elapsed | 2743 | -| total_timesteps | 42112 | -| train/ | | -| approx_kl | 9.963289e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | -0.000282 | -| n_updates | 3280 | -| policy_gradient_loss | -0.00014 | -| std | 0.97 | -| value_loss | 5.5e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 14 | -| iterations | 330 | -| time_elapsed | 2818 | -| total_timesteps | 42240 | -| train/ | | -| approx_kl | 2.654735e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.766 | -| learning_rate | 0.0003 | -| loss | 0.000687 | -| n_updates | 3290 | -| policy_gradient_loss | -4.04e-05 | -| std | 0.972 | -| value_loss | 0.00172 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 14 | -| iterations | 331 | -| time_elapsed | 2848 | -| total_timesteps | 42368 | -| train/ | | -| approx_kl | 8.186791e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -14.6 | -| learning_rate | 0.0003 | -| loss | -0.000183 | -| n_updates | 3300 | -| policy_gradient_loss | -8.8e-05 | -| std | 0.972 | -| value_loss | 9.73e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 14 | -| iterations | 332 | -| time_elapsed | 2884 | -| total_timesteps | 42496 | -| train/ | | -| approx_kl | 1.7848797e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -19.1 | -| learning_rate | 0.0003 | -| loss | -1.86e-05 | -| n_updates | 3310 | -| policy_gradient_loss | -4.72e-06 | -| std | 0.973 | -| value_loss | 4.27e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 14 | -| iterations | 333 | -| time_elapsed | 2923 | -| total_timesteps | 42624 | -| train/ | | -| approx_kl | 7.9195015e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -3.29 | -| learning_rate | 0.0003 | -| loss | -0.000386 | -| n_updates | 3320 | -| policy_gradient_loss | -0.000158 | -| std | 0.975 | -| value_loss | 3.31e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 14 | -| iterations | 334 | -| time_elapsed | 2960 | -| total_timesteps | 42752 | -| train/ | | -| approx_kl | 3.283331e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.000371 | -| n_updates | 3330 | -| policy_gradient_loss | -0.000161 | -| std | 0.975 | -| value_loss | 2.2e-07 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 14 | -| iterations | 335 | -| time_elapsed | 2990 | -| total_timesteps | 42880 | -| train/ | | -| approx_kl | 0.000110466965 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 3340 | -| policy_gradient_loss | -0.000417 | -| std | 0.977 | -| value_loss | 6.33e-08 | --------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 14 | -| iterations | 336 | -| time_elapsed | 3018 | -| total_timesteps | 43008 | -| train/ | | -| approx_kl | 0.000113833696 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | -0.000736 | -| n_updates | 3350 | -| policy_gradient_loss | -0.000367 | -| std | 0.981 | -| value_loss | 5.04e-08 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 337 | -| time_elapsed | 3092 | -| total_timesteps | 43136 | -| train/ | | -| approx_kl | 2.7373899e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.606 | -| learning_rate | 0.0003 | -| loss | 0.00397 | -| n_updates | 3360 | -| policy_gradient_loss | 4.66e-05 | -| std | 0.983 | -| value_loss | 0.00903 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 338 | -| time_elapsed | 3131 | -| total_timesteps | 43264 | -| train/ | | -| approx_kl | 0.0009104037 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -97.4 | -| learning_rate | 0.0003 | -| loss | -0.00627 | -| n_updates | 3370 | -| policy_gradient_loss | -0.00281 | -| std | 0.982 | -| value_loss | 7.86e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 339 | -| time_elapsed | 3176 | -| total_timesteps | 43392 | -| train/ | | -| approx_kl | 0.00017556595 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 3380 | -| policy_gradient_loss | -0.0021 | -| std | 0.98 | -| value_loss | 2.1e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 340 | -| time_elapsed | 3213 | -| total_timesteps | 43520 | -| train/ | | -| approx_kl | 1.9673724e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.000865 | -| n_updates | 3390 | -| policy_gradient_loss | -0.000169 | -| std | 0.978 | -| value_loss | 6.56e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 341 | -| time_elapsed | 3250 | -| total_timesteps | 43648 | -| train/ | | -| approx_kl | 4.9513765e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | 0.000274 | -| n_updates | 3400 | -| policy_gradient_loss | 0.000297 | -| std | 0.979 | -| value_loss | 4.77e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 342 | -| time_elapsed | 3300 | -| total_timesteps | 43776 | -| train/ | | -| approx_kl | 4.9799215e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | -0.000761 | -| n_updates | 3410 | -| policy_gradient_loss | -0.000368 | -| std | 0.979 | -| value_loss | 3.8e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 13 | -| iterations | 343 | -| time_elapsed | 3329 | -| total_timesteps | 43904 | -| train/ | | -| approx_kl | 4.7769397e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.000769 | -| n_updates | 3420 | -| policy_gradient_loss | -0.00038 | -| std | 0.979 | -| value_loss | 3.89e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 13 | -| iterations | 344 | -| time_elapsed | 3358 | -| total_timesteps | 44032 | -| train/ | | -| approx_kl | 7.424969e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.0057 | -| learning_rate | 0.0003 | -| loss | -0.000322 | -| n_updates | 3430 | -| policy_gradient_loss | -6.99e-05 | -| std | 0.976 | -| value_loss | 3.95e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 345 | -| time_elapsed | 3455 | -| total_timesteps | 44160 | -| train/ | | -| approx_kl | 8.1765465e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | 0.000237 | -| n_updates | 3440 | -| policy_gradient_loss | 1.24e-05 | -| std | 0.976 | -| value_loss | 0.000791 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 346 | -| time_elapsed | 3484 | -| total_timesteps | 44288 | -| train/ | | -| approx_kl | 8.0280006e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | 3.3e-05 | -| n_updates | 3450 | -| policy_gradient_loss | 2.34e-05 | -| std | 0.976 | -| value_loss | 1.36e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 347 | -| time_elapsed | 3511 | -| total_timesteps | 44416 | -| train/ | | -| approx_kl | 1.2065284e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -47.7 | -| learning_rate | 0.0003 | -| loss | -4.48e-05 | -| n_updates | 3460 | -| policy_gradient_loss | -2.01e-05 | -| std | 0.975 | -| value_loss | 2.66e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 348 | -| time_elapsed | 3555 | -| total_timesteps | 44544 | -| train/ | | -| approx_kl | 4.102476e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0818 | -| learning_rate | 0.0003 | -| loss | -0.000228 | -| n_updates | 3470 | -| policy_gradient_loss | -0.000103 | -| std | 0.974 | -| value_loss | 2e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 349 | -| time_elapsed | 3599 | -| total_timesteps | 44672 | -| train/ | | -| approx_kl | 1.5015714e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.407 | -| learning_rate | 0.0003 | -| loss | -0.00043 | -| n_updates | 3480 | -| policy_gradient_loss | -0.000204 | -| std | 0.972 | -| value_loss | 1.75e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 350 | -| time_elapsed | 3635 | -| total_timesteps | 44800 | -| train/ | | -| approx_kl | 3.4894794e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 3490 | -| policy_gradient_loss | -0.000419 | -| std | 0.972 | -| value_loss | 1.14e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 12 | -| iterations | 351 | -| time_elapsed | 3675 | -| total_timesteps | 44928 | -| train/ | | -| approx_kl | 2.7712435e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.00154 | -| learning_rate | 0.0003 | -| loss | 6.48e-05 | -| n_updates | 3500 | -| policy_gradient_loss | 4.6e-05 | -| std | 0.973 | -| value_loss | 8.17e-08 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 12 | -| iterations | 352 | -| time_elapsed | 3712 | -| total_timesteps | 45056 | -| train/ | | -| approx_kl | 1.44978985e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.000101 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 3510 | -| policy_gradient_loss | -0.000252 | -| std | 0.97 | -| value_loss | 6.01e-08 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 12 | -| iterations | 353 | -| time_elapsed | 3762 | -| total_timesteps | 45184 | -| train/ | | -| approx_kl | 1.5932135e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | 0.00144 | -| n_updates | 3520 | -| policy_gradient_loss | -0.000219 | -| std | 0.967 | -| value_loss | 0.00441 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 11 | -| iterations | 354 | -| time_elapsed | 3787 | -| total_timesteps | 45312 | -| train/ | | -| approx_kl | 2.3658853e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -140 | -| learning_rate | 0.0003 | -| loss | -0.000941 | -| n_updates | 3530 | -| policy_gradient_loss | -0.000337 | -| std | 0.965 | -| value_loss | 8.31e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 11 | -| iterations | 355 | -| time_elapsed | 3816 | -| total_timesteps | 45440 | -| train/ | | -| approx_kl | 8.418318e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 3540 | -| policy_gradient_loss | -0.000525 | -| std | 0.962 | -| value_loss | 2.84e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 11 | -| iterations | 356 | -| time_elapsed | 3860 | -| total_timesteps | 45568 | -| train/ | | -| approx_kl | 9.6804e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | -0.000198 | -| n_updates | 3550 | -| policy_gradient_loss | -8.87e-05 | -| std | 0.962 | -| value_loss | 2.45e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 11 | -| iterations | 357 | -| time_elapsed | 3895 | -| total_timesteps | 45696 | -| train/ | | -| approx_kl | 9.8713674e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.000625 | -| n_updates | 3560 | -| policy_gradient_loss | -0.000262 | -| std | 0.961 | -| value_loss | 1.2e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 11 | -| iterations | 358 | -| time_elapsed | 3912 | -| total_timesteps | 45824 | -| train/ | | -| approx_kl | 2.4816487e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.00142 | -| learning_rate | 0.0003 | -| loss | 2.04e-05 | -| n_updates | 3570 | -| policy_gradient_loss | 1.34e-05 | -| std | 0.959 | -| value_loss | 1.19e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 11 | -| iterations | 359 | -| time_elapsed | 3952 | -| total_timesteps | 45952 | -| train/ | | -| approx_kl | 0.00066755246 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.0063 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 3580 | -| policy_gradient_loss | -0.000785 | -| std | 0.958 | -| value_loss | 5.96e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 360 | -| time_elapsed | 4000 | -| total_timesteps | 46080 | -| train/ | | -| approx_kl | 0.0070292614 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 3590 | -| policy_gradient_loss | -0.00216 | -| std | 0.958 | -| value_loss | 2.3e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 361 | -| time_elapsed | 4059 | -| total_timesteps | 46208 | -| train/ | | -| approx_kl | 9.994069e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.0958 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 3600 | -| policy_gradient_loss | 0.000148 | -| std | 0.96 | -| value_loss | 0.0039 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 362 | -| time_elapsed | 4079 | -| total_timesteps | 46336 | -| train/ | | -| approx_kl | 4.924927e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -150 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 3610 | -| policy_gradient_loss | -0.000266 | -| std | 0.96 | -| value_loss | 8.02e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 363 | -| time_elapsed | 4112 | -| total_timesteps | 46464 | -| train/ | | -| approx_kl | 7.4726995e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -195 | -| learning_rate | 0.0003 | -| loss | -0.000515 | -| n_updates | 3620 | -| policy_gradient_loss | -0.000202 | -| std | 0.958 | -| value_loss | 1.26e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 364 | -| time_elapsed | 4167 | -| total_timesteps | 46592 | -| train/ | | -| approx_kl | 2.2173394e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -26.6 | -| learning_rate | 0.0003 | -| loss | -0.000231 | -| n_updates | 3630 | -| policy_gradient_loss | -5.39e-05 | -| std | 0.955 | -| value_loss | 2.31e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 365 | -| time_elapsed | 4198 | -| total_timesteps | 46720 | -| train/ | | -| approx_kl | 0.0010996065 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -36.3 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 3640 | -| policy_gradient_loss | -0.00106 | -| std | 0.951 | -| value_loss | 2.99e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 11 | -| iterations | 366 | -| time_elapsed | 4243 | -| total_timesteps | 46848 | -| train/ | | -| approx_kl | 0.008424021 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 3650 | -| policy_gradient_loss | -0.00773 | -| std | 0.948 | -| value_loss | 3.1e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 10 | -| iterations | 367 | -| time_elapsed | 4275 | -| total_timesteps | 46976 | -| train/ | | -| approx_kl | 0.0003448287 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.000606 | -| n_updates | 3660 | -| policy_gradient_loss | 0.000411 | -| std | 0.949 | -| value_loss | 1.93e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 368 | -| time_elapsed | 4315 | -| total_timesteps | 47104 | -| train/ | | -| approx_kl | 8.1841834e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0826 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 3670 | -| policy_gradient_loss | -0.000748 | -| std | 0.95 | -| value_loss | 1.29e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 369 | -| time_elapsed | 4375 | -| total_timesteps | 47232 | -| train/ | | -| approx_kl | 1.5296973e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | 0.000539 | -| n_updates | 3680 | -| policy_gradient_loss | 0.000275 | -| std | 0.95 | -| value_loss | 0.000736 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 370 | -| time_elapsed | 4413 | -| total_timesteps | 47360 | -| train/ | | -| approx_kl | 2.9620249e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -235 | -| learning_rate | 0.0003 | -| loss | -0.000379 | -| n_updates | 3690 | -| policy_gradient_loss | -0.00018 | -| std | 0.95 | -| value_loss | 1.28e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 371 | -| time_elapsed | 4445 | -| total_timesteps | 47488 | -| train/ | | -| approx_kl | 9.338837e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -97.8 | -| learning_rate | 0.0003 | -| loss | -0.000278 | -| n_updates | 3700 | -| policy_gradient_loss | -0.000131 | -| std | 0.952 | -| value_loss | 2.52e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 372 | -| time_elapsed | 4485 | -| total_timesteps | 47616 | -| train/ | | -| approx_kl | 3.3965334e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | -0.000266 | -| n_updates | 3710 | -| policy_gradient_loss | -0.000103 | -| std | 0.955 | -| value_loss | 6.54e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 373 | -| time_elapsed | 4521 | -| total_timesteps | 47744 | -| train/ | | -| approx_kl | 1.6691629e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.429 | -| learning_rate | 0.0003 | -| loss | -0.000305 | -| n_updates | 3720 | -| policy_gradient_loss | -0.000145 | -| std | 0.955 | -| value_loss | 3.4e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 10 | -| iterations | 374 | -| time_elapsed | 4547 | -| total_timesteps | 47872 | -| train/ | | -| approx_kl | 1.2903474e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.000473 | -| learning_rate | 0.0003 | -| loss | 3.19e-05 | -| n_updates | 3730 | -| policy_gradient_loss | 4.86e-05 | -| std | 0.955 | -| value_loss | 2.41e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 375 | -| time_elapsed | 4591 | -| total_timesteps | 48000 | -| train/ | | -| approx_kl | 2.0532869e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.00159 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 3740 | -| policy_gradient_loss | -0.00057 | -| std | 0.958 | -| value_loss | 1.92e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 376 | -| time_elapsed | 4621 | -| total_timesteps | 48128 | -| train/ | | -| approx_kl | 2.8314535e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.000935 | -| learning_rate | 0.0003 | -| loss | -0.0004 | -| n_updates | 3750 | -| policy_gradient_loss | -0.000211 | -| std | 0.962 | -| value_loss | 9.8e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 377 | -| time_elapsed | 4690 | -| total_timesteps | 48256 | -| train/ | | -| approx_kl | 4.890375e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | 0.000573 | -| n_updates | 3760 | -| policy_gradient_loss | 6.07e-05 | -| std | 0.963 | -| value_loss | 0.000992 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 378 | -| time_elapsed | 4727 | -| total_timesteps | 48384 | -| train/ | | -| approx_kl | 1.4686957e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -196 | -| learning_rate | 0.0003 | -| loss | -0.000176 | -| n_updates | 3770 | -| policy_gradient_loss | -6.82e-05 | -| std | 0.964 | -| value_loss | 3.3e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 379 | -| time_elapsed | 4760 | -| total_timesteps | 48512 | -| train/ | | -| approx_kl | 1.9486994e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -179 | -| learning_rate | 0.0003 | -| loss | -0.000859 | -| n_updates | 3780 | -| policy_gradient_loss | -0.000312 | -| std | 0.964 | -| value_loss | 6.84e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 380 | -| time_elapsed | 4810 | -| total_timesteps | 48640 | -| train/ | | -| approx_kl | 8.1397593e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -4.2 | -| learning_rate | 0.0003 | -| loss | 0.000162 | -| n_updates | 3790 | -| policy_gradient_loss | 0.000186 | -| std | 0.963 | -| value_loss | 3.29e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 381 | -| time_elapsed | 4845 | -| total_timesteps | 48768 | -| train/ | | -| approx_kl | 2.7938746e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 3800 | -| policy_gradient_loss | -0.000478 | -| std | 0.963 | -| value_loss | 3.42e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 10 | -| iterations | 382 | -| time_elapsed | 4881 | -| total_timesteps | 48896 | -| train/ | | -| approx_kl | 3.8643833e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.000282 | -| n_updates | 3810 | -| policy_gradient_loss | -0.000148 | -| std | 0.963 | -| value_loss | 1.14e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 383 | -| time_elapsed | 4912 | -| total_timesteps | 49024 | -| train/ | | -| approx_kl | 1.498498e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | -0.000198 | -| n_updates | 3820 | -| policy_gradient_loss | 3.21e-06 | -| std | 0.963 | -| value_loss | 1.04e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 384 | -| time_elapsed | 4972 | -| total_timesteps | 49152 | -| train/ | | -| approx_kl | 2.164999e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | 0.000915 | -| n_updates | 3830 | -| policy_gradient_loss | -0.000142 | -| std | 0.963 | -| value_loss | 0.00252 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 385 | -| time_elapsed | 5007 | -| total_timesteps | 49280 | -| train/ | | -| approx_kl | 2.5606249e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -182 | -| learning_rate | 0.0003 | -| loss | -0.000711 | -| n_updates | 3840 | -| policy_gradient_loss | -0.000333 | -| std | 0.966 | -| value_loss | 8.4e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 386 | -| time_elapsed | 5039 | -| total_timesteps | 49408 | -| train/ | | -| approx_kl | 3.8901344e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -176 | -| learning_rate | 0.0003 | -| loss | -7.82e-05 | -| n_updates | 3850 | -| policy_gradient_loss | -1.65e-05 | -| std | 0.968 | -| value_loss | 1.43e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 387 | -| time_elapsed | 5071 | -| total_timesteps | 49536 | -| train/ | | -| approx_kl | 3.7658028e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -23.9 | -| learning_rate | 0.0003 | -| loss | -0.000384 | -| n_updates | 3860 | -| policy_gradient_loss | -0.000178 | -| std | 0.971 | -| value_loss | 1.04e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 388 | -| time_elapsed | 5105 | -| total_timesteps | 49664 | -| train/ | | -| approx_kl | 3.2819808e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -33.8 | -| learning_rate | 0.0003 | -| loss | -0.000172 | -| n_updates | 3870 | -| policy_gradient_loss | -8.97e-05 | -| std | 0.974 | -| value_loss | 3.78e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 389 | -| time_elapsed | 5148 | -| total_timesteps | 49792 | -| train/ | | -| approx_kl | 3.5609119e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -2.43 | -| learning_rate | 0.0003 | -| loss | -0.000202 | -| n_updates | 3880 | -| policy_gradient_loss | -0.000101 | -| std | 0.976 | -| value_loss | 4.66e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 9 | -| iterations | 390 | -| time_elapsed | 5210 | -| total_timesteps | 49920 | -| train/ | | -| approx_kl | 3.5022385e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00016 | -| n_updates | 3890 | -| policy_gradient_loss | -7.36e-05 | -| std | 0.977 | -| value_loss | 3.15e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 9 | -| iterations | 391 | -| time_elapsed | 5286 | -| total_timesteps | 50048 | -| train/ | | -| approx_kl | 1.0008924e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | -0.000267 | -| n_updates | 3900 | -| policy_gradient_loss | -0.00012 | -| std | 0.978 | -| value_loss | 2.42e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 9 | -| iterations | 392 | -| time_elapsed | 5441 | -| total_timesteps | 50176 | -| train/ | | -| approx_kl | 3.4621917e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | 0.000154 | -| n_updates | 3910 | -| policy_gradient_loss | -1.84e-05 | -| std | 0.979 | -| value_loss | 0.000596 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 9 | -| iterations | 393 | -| time_elapsed | 5530 | -| total_timesteps | 50304 | -| train/ | | -| approx_kl | 2.5740359e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -286 | -| learning_rate | 0.0003 | -| loss | -0.000995 | -| n_updates | 3920 | -| policy_gradient_loss | -0.000437 | -| std | 0.982 | -| value_loss | 6e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 8 | -| iterations | 394 | -| time_elapsed | 5616 | -| total_timesteps | 50432 | -| train/ | | -| approx_kl | 4.3502077e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -264 | -| learning_rate | 0.0003 | -| loss | 0.000186 | -| n_updates | 3930 | -| policy_gradient_loss | 0.000122 | -| std | 0.983 | -| value_loss | 1.38e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 8 | -| iterations | 395 | -| time_elapsed | 5715 | -| total_timesteps | 50560 | -| train/ | | -| approx_kl | 5.662441e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -288 | -| learning_rate | 0.0003 | -| loss | -6.39e-05 | -| n_updates | 3940 | -| policy_gradient_loss | -2.36e-05 | -| std | 0.982 | -| value_loss | 3.83e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 8 | -| iterations | 396 | -| time_elapsed | 5808 | -| total_timesteps | 50688 | -| train/ | | -| approx_kl | 3.357418e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -32 | -| learning_rate | 0.0003 | -| loss | -2.23e-07 | -| n_updates | 3950 | -| policy_gradient_loss | 7.71e-06 | -| std | 0.982 | -| value_loss | 7.27e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 8 | -| iterations | 397 | -| time_elapsed | 5895 | -| total_timesteps | 50816 | -| train/ | | -| approx_kl | 4.02797e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -79.4 | -| learning_rate | 0.0003 | -| loss | -5.91e-05 | -| n_updates | 3960 | -| policy_gradient_loss | -1.45e-05 | -| std | 0.982 | -| value_loss | 1.53e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 8 | -| iterations | 398 | -| time_elapsed | 5971 | -| total_timesteps | 50944 | -| train/ | | -| approx_kl | 1.9511208e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.638 | -| learning_rate | 0.0003 | -| loss | -0.000108 | -| n_updates | 3970 | -| policy_gradient_loss | -5.3e-05 | -| std | 0.982 | -| value_loss | 3.51e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 399 | -| time_elapsed | 6053 | -| total_timesteps | 51072 | -| train/ | | -| approx_kl | 2.9234216e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.673 | -| learning_rate | 0.0003 | -| loss | -8.29e-05 | -| n_updates | 3980 | -| policy_gradient_loss | -3.65e-05 | -| std | 0.982 | -| value_loss | 7.46e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 400 | -| time_elapsed | 6127 | -| total_timesteps | 51200 | -| train/ | | -| approx_kl | 2.213288e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.844 | -| learning_rate | 0.0003 | -| loss | -8.05e-05 | -| n_updates | 3990 | -| policy_gradient_loss | -0.000125 | -| std | 0.983 | -| value_loss | 0.000682 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 401 | -| time_elapsed | 6163 | -| total_timesteps | 51328 | -| train/ | | -| approx_kl | 1.4408957e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.000295 | -| n_updates | 4000 | -| policy_gradient_loss | -0.000151 | -| std | 0.985 | -| value_loss | 2.62e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 402 | -| time_elapsed | 6192 | -| total_timesteps | 51456 | -| train/ | | -| approx_kl | 1.5214551e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 4010 | -| policy_gradient_loss | -0.000271 | -| std | 0.986 | -| value_loss | 1.2e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 403 | -| time_elapsed | 6224 | -| total_timesteps | 51584 | -| train/ | | -| approx_kl | 1.0607764e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -2.36 | -| learning_rate | 0.0003 | -| loss | -9.79e-05 | -| n_updates | 4020 | -| policy_gradient_loss | -4.97e-05 | -| std | 0.987 | -| value_loss | 2.97e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 404 | -| time_elapsed | 6265 | -| total_timesteps | 51712 | -| train/ | | -| approx_kl | 1.937151e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | 1.8e-05 | -| n_updates | 4030 | -| policy_gradient_loss | 1.23e-05 | -| std | 0.987 | -| value_loss | 1.6e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 405 | -| time_elapsed | 6297 | -| total_timesteps | 51840 | -| train/ | | -| approx_kl | 7.0780516e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | -7.83e-07 | -| n_updates | 4040 | -| policy_gradient_loss | 2.73e-07 | -| std | 0.987 | -| value_loss | 9.74e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 8 | -| iterations | 406 | -| time_elapsed | 6336 | -| total_timesteps | 51968 | -| train/ | | -| approx_kl | 2.6253983e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.00708 | -| learning_rate | 0.0003 | -| loss | -9.66e-05 | -| n_updates | 4050 | -| policy_gradient_loss | -4.04e-05 | -| std | 0.987 | -| value_loss | 6.92e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 8 | -| iterations | 407 | -| time_elapsed | 6369 | -| total_timesteps | 52096 | -| train/ | | -| approx_kl | 2.2997148e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 4060 | -| policy_gradient_loss | -0.000556 | -| std | 0.983 | -| value_loss | 4.78e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 8 | -| iterations | 408 | -| time_elapsed | 6451 | -| total_timesteps | 52224 | -| train/ | | -| approx_kl | 1.2077391e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | 0.000654 | -| n_updates | 4070 | -| policy_gradient_loss | 5.31e-05 | -| std | 0.98 | -| value_loss | 0.00139 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 8 | -| iterations | 409 | -| time_elapsed | 6484 | -| total_timesteps | 52352 | -| train/ | | -| approx_kl | 7.323455e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -151 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 4080 | -| policy_gradient_loss | -0.000157 | -| std | 0.979 | -| value_loss | 1.3e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 8 | -| iterations | 410 | -| time_elapsed | 6516 | -| total_timesteps | 52480 | -| train/ | | -| approx_kl | 1.6625505e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -167 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 4090 | -| policy_gradient_loss | -0.000467 | -| std | 0.979 | -| value_loss | 3.83e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 8 | -| iterations | 411 | -| time_elapsed | 6549 | -| total_timesteps | 52608 | -| train/ | | -| approx_kl | 2.3840927e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -23.8 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 4100 | -| policy_gradient_loss | -0.000121 | -| std | 0.979 | -| value_loss | 6.34e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 8 | -| iterations | 412 | -| time_elapsed | 6580 | -| total_timesteps | 52736 | -| train/ | | -| approx_kl | 1.2079254e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.696 | -| learning_rate | 0.0003 | -| loss | -0.000159 | -| n_updates | 4110 | -| policy_gradient_loss | -8.5e-06 | -| std | 0.98 | -| value_loss | 1.08e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 7 | -| iterations | 413 | -| time_elapsed | 6614 | -| total_timesteps | 52864 | -| train/ | | -| approx_kl | 2.0700507e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.00796 | -| learning_rate | 0.0003 | -| loss | -0.000781 | -| n_updates | 4120 | -| policy_gradient_loss | -0.000384 | -| std | 0.981 | -| value_loss | 5.73e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 7 | -| iterations | 414 | -| time_elapsed | 6630 | -| total_timesteps | 52992 | -| train/ | | -| approx_kl | 2.9900111e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | -6.88e-05 | -| n_updates | 4130 | -| policy_gradient_loss | -1.3e-05 | -| std | 0.983 | -| value_loss | 1.02e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 415 | -| time_elapsed | 6657 | -| total_timesteps | 53120 | -| train/ | | -| approx_kl | 3.1506643e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 4140 | -| policy_gradient_loss | -6.03e-05 | -| std | 0.984 | -| value_loss | 8.03e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 416 | -| time_elapsed | 6743 | -| total_timesteps | 53248 | -| train/ | | -| approx_kl | 2.301298e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.505 | -| learning_rate | 0.0003 | -| loss | 0.00388 | -| n_updates | 4150 | -| policy_gradient_loss | -0.000192 | -| std | 0.986 | -| value_loss | 0.00925 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 417 | -| time_elapsed | 6776 | -| total_timesteps | 53376 | -| train/ | | -| approx_kl | 3.3010729e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -18.3 | -| learning_rate | 0.0003 | -| loss | -0.000144 | -| n_updates | 4160 | -| policy_gradient_loss | -7.73e-05 | -| std | 0.988 | -| value_loss | 1.72e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 418 | -| time_elapsed | 6823 | -| total_timesteps | 53504 | -| train/ | | -| approx_kl | 9.0058893e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -25.8 | -| learning_rate | 0.0003 | -| loss | 1.24e-05 | -| n_updates | 4170 | -| policy_gradient_loss | 1.03e-05 | -| std | 0.989 | -| value_loss | 7.64e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 419 | -| time_elapsed | 6861 | -| total_timesteps | 53632 | -| train/ | | -| approx_kl | 6.5471977e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.936 | -| learning_rate | 0.0003 | -| loss | -6.24e-05 | -| n_updates | 4180 | -| policy_gradient_loss | -2.12e-05 | -| std | 0.99 | -| value_loss | 1.02e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 420 | -| time_elapsed | 6895 | -| total_timesteps | 53760 | -| train/ | | -| approx_kl | 2.7101487e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.0046 | -| learning_rate | 0.0003 | -| loss | -2.11e-05 | -| n_updates | 4190 | -| policy_gradient_loss | 2.61e-06 | -| std | 0.991 | -| value_loss | 6.34e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 7 | -| iterations | 421 | -| time_elapsed | 6933 | -| total_timesteps | 53888 | -| train/ | | -| approx_kl | 1.3471581e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | -0.000161 | -| n_updates | 4200 | -| policy_gradient_loss | -6.34e-05 | -| std | 0.992 | -| value_loss | 4.95e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 422 | -| time_elapsed | 6963 | -| total_timesteps | 54016 | -| train/ | | -| approx_kl | 4.391186e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00185 | -| learning_rate | 0.0003 | -| loss | 3.87e-05 | -| n_updates | 4210 | -| policy_gradient_loss | 2.85e-05 | -| std | 0.993 | -| value_loss | 4e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 423 | -| time_elapsed | 7029 | -| total_timesteps | 54144 | -| train/ | | -| approx_kl | 1.2147706e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | 0.000551 | -| n_updates | 4220 | -| policy_gradient_loss | -0.000299 | -| std | 0.993 | -| value_loss | 0.00274 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 424 | -| time_elapsed | 7063 | -| total_timesteps | 54272 | -| train/ | | -| approx_kl | 6.123446e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -2.88 | -| learning_rate | 0.0003 | -| loss | 1.72e-05 | -| n_updates | 4230 | -| policy_gradient_loss | 6.74e-05 | -| std | 0.992 | -| value_loss | 2.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 425 | -| time_elapsed | 7101 | -| total_timesteps | 54400 | -| train/ | | -| approx_kl | 2.596993e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -2.08 | -| learning_rate | 0.0003 | -| loss | -2.19e-05 | -| n_updates | 4240 | -| policy_gradient_loss | 1.45e-05 | -| std | 0.992 | -| value_loss | 2.54e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 426 | -| time_elapsed | 7129 | -| total_timesteps | 54528 | -| train/ | | -| approx_kl | 4.976522e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | -0.000143 | -| n_updates | 4250 | -| policy_gradient_loss | -6.94e-05 | -| std | 0.993 | -| value_loss | 8.17e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 427 | -| time_elapsed | 7160 | -| total_timesteps | 54656 | -| train/ | | -| approx_kl | 1.9292347e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.00725 | -| learning_rate | 0.0003 | -| loss | 2e-06 | -| n_updates | 4260 | -| policy_gradient_loss | 2.32e-06 | -| std | 0.994 | -| value_loss | 5.75e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 428 | -| time_elapsed | 7194 | -| total_timesteps | 54784 | -| train/ | | -| approx_kl | 1.5599653e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00749 | -| learning_rate | 0.0003 | -| loss | -3.16e-06 | -| n_updates | 4270 | -| policy_gradient_loss | -1.73e-06 | -| std | 0.994 | -| value_loss | 4.66e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 7 | -| iterations | 429 | -| time_elapsed | 7235 | -| total_timesteps | 54912 | -| train/ | | -| approx_kl | 8.092262e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00594 | -| learning_rate | 0.0003 | -| loss | -0.000778 | -| n_updates | 4280 | -| policy_gradient_loss | -0.000315 | -| std | 0.998 | -| value_loss | 3.96e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 430 | -| time_elapsed | 7276 | -| total_timesteps | 55040 | -| train/ | | -| approx_kl | 1.5146565e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.00422 | -| learning_rate | 0.0003 | -| loss | -0.000209 | -| n_updates | 4290 | -| policy_gradient_loss | -0.000112 | -| std | 1 | -| value_loss | 3.41e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 431 | -| time_elapsed | 7347 | -| total_timesteps | 55168 | -| train/ | | -| approx_kl | 3.729947e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -4.15e-05 | -| n_updates | 4300 | -| policy_gradient_loss | -5.9e-05 | -| std | 1 | -| value_loss | 0.000151 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 432 | -| time_elapsed | 7383 | -| total_timesteps | 55296 | -| train/ | | -| approx_kl | 7.174909e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -7.83 | -| learning_rate | 0.0003 | -| loss | -0.000549 | -| n_updates | 4310 | -| policy_gradient_loss | -0.000247 | -| std | 1.01 | -| value_loss | 1.52e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 433 | -| time_elapsed | 7411 | -| total_timesteps | 55424 | -| train/ | | -| approx_kl | 4.65801e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -4.73 | -| learning_rate | 0.0003 | -| loss | -1.69e-05 | -| n_updates | 4320 | -| policy_gradient_loss | -2.95e-06 | -| std | 1.01 | -| value_loss | 3.93e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 434 | -| time_elapsed | 7440 | -| total_timesteps | 55552 | -| train/ | | -| approx_kl | 2.840301e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.00435 | -| learning_rate | 0.0003 | -| loss | -0.000996 | -| n_updates | 4330 | -| policy_gradient_loss | -0.000412 | -| std | 1.01 | -| value_loss | 1.45e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 435 | -| time_elapsed | 7479 | -| total_timesteps | 55680 | -| train/ | | -| approx_kl | 3.55253e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.000279 | -| n_updates | 4340 | -| policy_gradient_loss | 7.98e-05 | -| std | 1.01 | -| value_loss | 1.14e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 436 | -| time_elapsed | 7519 | -| total_timesteps | 55808 | -| train/ | | -| approx_kl | 3.7593767e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.00152 | -| learning_rate | 0.0003 | -| loss | -0.000784 | -| n_updates | 4350 | -| policy_gradient_loss | -0.0004 | -| std | 1.01 | -| value_loss | 9.62e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 7 | -| iterations | 437 | -| time_elapsed | 7547 | -| total_timesteps | 55936 | -| train/ | | -| approx_kl | 9.5954165e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.00514 | -| learning_rate | 0.0003 | -| loss | -0.000558 | -| n_updates | 4360 | -| policy_gradient_loss | -0.000216 | -| std | 1.02 | -| value_loss | 8.45e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 438 | -| time_elapsed | 7585 | -| total_timesteps | 56064 | -| train/ | | -| approx_kl | 9.384472e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.00451 | -| learning_rate | 0.0003 | -| loss | -0.000682 | -| n_updates | 4370 | -| policy_gradient_loss | -0.000244 | -| std | 1.02 | -| value_loss | 7.56e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 439 | -| time_elapsed | 7646 | -| total_timesteps | 56192 | -| train/ | | -| approx_kl | 2.5266781e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | 0.000194 | -| n_updates | 4380 | -| policy_gradient_loss | -0.000159 | -| std | 1.02 | -| value_loss | 0.00129 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 440 | -| time_elapsed | 7685 | -| total_timesteps | 56320 | -| train/ | | -| approx_kl | 1.03376806e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -451 | -| learning_rate | 0.0003 | -| loss | 3.02e-05 | -| n_updates | 4390 | -| policy_gradient_loss | 6.75e-05 | -| std | 1.02 | -| value_loss | 1.38e-05 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 441 | -| time_elapsed | 7724 | -| total_timesteps | 56448 | -| train/ | | -| approx_kl | 1.9326806e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -514 | -| learning_rate | 0.0003 | -| loss | -0.000584 | -| n_updates | 4400 | -| policy_gradient_loss | -0.000276 | -| std | 1.02 | -| value_loss | 3.03e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 442 | -| time_elapsed | 7758 | -| total_timesteps | 56576 | -| train/ | | -| approx_kl | 7.673167e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -39.2 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 4410 | -| policy_gradient_loss | -0.000326 | -| std | 1.02 | -| value_loss | 6.91e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 443 | -| time_elapsed | 7786 | -| total_timesteps | 56704 | -| train/ | | -| approx_kl | 2.751546e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.482 | -| learning_rate | 0.0003 | -| loss | -0.000835 | -| n_updates | 4420 | -| policy_gradient_loss | -0.000257 | -| std | 1.03 | -| value_loss | 1.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 444 | -| time_elapsed | 7816 | -| total_timesteps | 56832 | -| train/ | | -| approx_kl | 3.034342e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 4430 | -| policy_gradient_loss | -0.000564 | -| std | 1.03 | -| value_loss | 5.32e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 7 | -| iterations | 445 | -| time_elapsed | 7840 | -| total_timesteps | 56960 | -| train/ | | -| approx_kl | 3.1297095e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0829 | -| learning_rate | 0.0003 | -| loss | 0.000136 | -| n_updates | 4440 | -| policy_gradient_loss | 8.54e-05 | -| std | 1.03 | -| value_loss | 2.52e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 446 | -| time_elapsed | 7866 | -| total_timesteps | 57088 | -| train/ | | -| approx_kl | 1.3960525e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00583 | -| learning_rate | 0.0003 | -| loss | -0.000181 | -| n_updates | 4450 | -| policy_gradient_loss | -6.11e-05 | -| std | 1.03 | -| value_loss | 1.58e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 447 | -| time_elapsed | 7932 | -| total_timesteps | 57216 | -| train/ | | -| approx_kl | 2.8000213e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.625 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 4460 | -| policy_gradient_loss | -4.72e-05 | -| std | 1.03 | -| value_loss | 0.0068 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 448 | -| time_elapsed | 7972 | -| total_timesteps | 57344 | -| train/ | | -| approx_kl | 9.7882e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -401 | -| learning_rate | 0.0003 | -| loss | 9.7e-06 | -| n_updates | 4470 | -| policy_gradient_loss | -2.13e-05 | -| std | 1.03 | -| value_loss | 7.2e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 449 | -| time_elapsed | 8011 | -| total_timesteps | 57472 | -| train/ | | -| approx_kl | 3.0733645e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -472 | -| learning_rate | 0.0003 | -| loss | -1.47e-05 | -| n_updates | 4480 | -| policy_gradient_loss | 2.69e-06 | -| std | 1.03 | -| value_loss | 2.66e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 450 | -| time_elapsed | 8045 | -| total_timesteps | 57600 | -| train/ | | -| approx_kl | 1.240056e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.392 | -| learning_rate | 0.0003 | -| loss | -0.000134 | -| n_updates | 4490 | -| policy_gradient_loss | -6.27e-05 | -| std | 1.03 | -| value_loss | 3.6e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 451 | -| time_elapsed | 8084 | -| total_timesteps | 57728 | -| train/ | | -| approx_kl | 1.1450611e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -1.53e-05 | -| n_updates | 4500 | -| policy_gradient_loss | -3.39e-06 | -| std | 1.03 | -| value_loss | 4.52e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 452 | -| time_elapsed | 8118 | -| total_timesteps | 57856 | -| train/ | | -| approx_kl | 1.3196841e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0896 | -| learning_rate | 0.0003 | -| loss | -0.000156 | -| n_updates | 4510 | -| policy_gradient_loss | -5.58e-05 | -| std | 1.03 | -| value_loss | 6.23e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 7 | -| iterations | 453 | -| time_elapsed | 8147 | -| total_timesteps | 57984 | -| train/ | | -| approx_kl | 2.2300053e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00589 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 4520 | -| policy_gradient_loss | -0.000613 | -| std | 1.03 | -| value_loss | 5.8e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 7 | -| iterations | 454 | -| time_elapsed | 8184 | -| total_timesteps | 58112 | -| train/ | | -| approx_kl | 6.992975e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | -0.000676 | -| n_updates | 4530 | -| policy_gradient_loss | -0.000333 | -| std | 1.03 | -| value_loss | 3.06e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 7 | -| iterations | 455 | -| time_elapsed | 8281 | -| total_timesteps | 58240 | -| train/ | | -| approx_kl | 0.00013265433 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.634 | -| learning_rate | 0.0003 | -| loss | -0.001 | -| n_updates | 4540 | -| policy_gradient_loss | -0.000637 | -| std | 1.03 | -| value_loss | 0.00109 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 7 | -| iterations | 456 | -| time_elapsed | 8313 | -| total_timesteps | 58368 | -| train/ | | -| approx_kl | 0.00036686053 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -272 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 4550 | -| policy_gradient_loss | -0.000576 | -| std | 1.03 | -| value_loss | 1.41e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 7 | -| iterations | 457 | -| time_elapsed | 8340 | -| total_timesteps | 58496 | -| train/ | | -| approx_kl | 6.297883e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -170 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 4560 | -| policy_gradient_loss | -0.000101 | -| std | 1.03 | -| value_loss | 2.62e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 6 | -| iterations | 458 | -| time_elapsed | 8385 | -| total_timesteps | 58624 | -| train/ | | -| approx_kl | 0.00010128878 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.405 | -| learning_rate | 0.0003 | -| loss | 0.000208 | -| n_updates | 4570 | -| policy_gradient_loss | 0.000142 | -| std | 1.03 | -| value_loss | 1.07e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 6 | -| iterations | 459 | -| time_elapsed | 8423 | -| total_timesteps | 58752 | -| train/ | | -| approx_kl | 8.775294e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.57 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 4580 | -| policy_gradient_loss | -0.000579 | -| std | 1.03 | -| value_loss | 5.88e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 6 | -| iterations | 460 | -| time_elapsed | 8462 | -| total_timesteps | 58880 | -| train/ | | -| approx_kl | 0.00010161521 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00441 | -| learning_rate | 0.0003 | -| loss | -0.000837 | -| n_updates | 4590 | -| policy_gradient_loss | -0.000432 | -| std | 1.03 | -| value_loss | 4.21e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 461 | -| time_elapsed | 8503 | -| total_timesteps | 59008 | -| train/ | | -| approx_kl | 6.948132e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.000538 | -| learning_rate | 0.0003 | -| loss | -3.32e-05 | -| n_updates | 4600 | -| policy_gradient_loss | 6.51e-05 | -| std | 1.03 | -| value_loss | 3.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 462 | -| time_elapsed | 8605 | -| total_timesteps | 59136 | -| train/ | | -| approx_kl | 7.93254e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | 0.000342 | -| n_updates | 4610 | -| policy_gradient_loss | -0.000247 | -| std | 1.03 | -| value_loss | 0.00207 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 463 | -| time_elapsed | 8631 | -| total_timesteps | 59264 | -| train/ | | -| approx_kl | 0.00011238549 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.918 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 4620 | -| policy_gradient_loss | -0.000541 | -| std | 1.02 | -| value_loss | 1.87e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 464 | -| time_elapsed | 8661 | -| total_timesteps | 59392 | -| train/ | | -| approx_kl | 2.8386712e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -223 | -| learning_rate | 0.0003 | -| loss | 8.82e-05 | -| n_updates | 4630 | -| policy_gradient_loss | 0.000218 | -| std | 1.02 | -| value_loss | 6.34e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 465 | -| time_elapsed | 8703 | -| total_timesteps | 59520 | -| train/ | | -| approx_kl | 0.00039475085 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | -0.0051 | -| n_updates | 4640 | -| policy_gradient_loss | -0.00152 | -| std | 1.02 | -| value_loss | 8.55e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 466 | -| time_elapsed | 8735 | -| total_timesteps | 59648 | -| train/ | | -| approx_kl | 0.00040073693 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -22.4 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 4650 | -| policy_gradient_loss | 0.00117 | -| std | 1.02 | -| value_loss | 1.17e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 467 | -| time_elapsed | 8770 | -| total_timesteps | 59776 | -| train/ | | -| approx_kl | 0.0010557403 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.283 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 4660 | -| policy_gradient_loss | -0.00115 | -| std | 1.02 | -| value_loss | 2.51e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 468 | -| time_elapsed | 8800 | -| total_timesteps | 59904 | -| train/ | | -| approx_kl | 0.0006564446 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | -0.00519 | -| n_updates | 4670 | -| policy_gradient_loss | -0.00286 | -| std | 1.02 | -| value_loss | 8.29e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 469 | -| time_elapsed | 8841 | -| total_timesteps | 60032 | -| train/ | | -| approx_kl | 4.462758e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.0119 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 4680 | -| policy_gradient_loss | -0.000647 | -| std | 1.02 | -| value_loss | 3.79e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 470 | -| time_elapsed | 8918 | -| total_timesteps | 60160 | -| train/ | | -| approx_kl | 7.902738e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | 0.000788 | -| n_updates | 4690 | -| policy_gradient_loss | -1.57e-05 | -| std | 1.02 | -| value_loss | 0.00239 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 471 | -| time_elapsed | 8963 | -| total_timesteps | 60288 | -| train/ | | -| approx_kl | 3.7867576e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -220 | -| learning_rate | 0.0003 | -| loss | -8.97e-05 | -| n_updates | 4700 | -| policy_gradient_loss | -5.42e-05 | -| std | 1.02 | -| value_loss | 4.72e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 472 | -| time_elapsed | 8996 | -| total_timesteps | 60416 | -| train/ | | -| approx_kl | 7.2238036e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -199 | -| learning_rate | 0.0003 | -| loss | -0.000274 | -| n_updates | 4710 | -| policy_gradient_loss | -8.41e-05 | -| std | 1.02 | -| value_loss | 9.17e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 473 | -| time_elapsed | 9031 | -| total_timesteps | 60544 | -| train/ | | -| approx_kl | 1.8002465e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -6.43 | -| learning_rate | 0.0003 | -| loss | 7.14e-05 | -| n_updates | 4720 | -| policy_gradient_loss | 6.98e-05 | -| std | 1.02 | -| value_loss | 1.83e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 474 | -| time_elapsed | 9062 | -| total_timesteps | 60672 | -| train/ | | -| approx_kl | 6.977003e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.713 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 4730 | -| policy_gradient_loss | -0.000188 | -| std | 1.02 | -| value_loss | 4.34e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 475 | -| time_elapsed | 9101 | -| total_timesteps | 60800 | -| train/ | | -| approx_kl | 4.8726797e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0595 | -| learning_rate | 0.0003 | -| loss | -7.37e-05 | -| n_updates | 4740 | -| policy_gradient_loss | 4.43e-06 | -| std | 1.02 | -| value_loss | 2.93e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 6 | -| iterations | 476 | -| time_elapsed | 9135 | -| total_timesteps | 60928 | -| train/ | | -| approx_kl | 1.7951708e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.000146 | -| learning_rate | 0.0003 | -| loss | -0.000607 | -| n_updates | 4750 | -| policy_gradient_loss | -0.000275 | -| std | 1.02 | -| value_loss | 2.26e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 477 | -| time_elapsed | 9159 | -| total_timesteps | 61056 | -| train/ | | -| approx_kl | 6.8610534e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.00956 | -| learning_rate | 0.0003 | -| loss | -0.000135 | -| n_updates | 4760 | -| policy_gradient_loss | 1.43e-05 | -| std | 1.02 | -| value_loss | 1.71e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 478 | -| time_elapsed | 9216 | -| total_timesteps | 61184 | -| train/ | | -| approx_kl | 3.006775e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.772 | -| learning_rate | 0.0003 | -| loss | 0.000525 | -| n_updates | 4770 | -| policy_gradient_loss | -2.29e-05 | -| std | 1.02 | -| value_loss | 0.00127 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 479 | -| time_elapsed | 9238 | -| total_timesteps | 61312 | -| train/ | | -| approx_kl | 3.4128316e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -5.11 | -| learning_rate | 0.0003 | -| loss | -0.000121 | -| n_updates | 4780 | -| policy_gradient_loss | -6.15e-05 | -| std | 1.02 | -| value_loss | 7.47e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 480 | -| time_elapsed | 9272 | -| total_timesteps | 61440 | -| train/ | | -| approx_kl | 8.77725e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -0.000426 | -| n_updates | 4790 | -| policy_gradient_loss | -0.00018 | -| std | 1.01 | -| value_loss | 7.74e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 481 | -| time_elapsed | 9312 | -| total_timesteps | 61568 | -| train/ | | -| approx_kl | 1.0610558e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.000845 | -| n_updates | 4800 | -| policy_gradient_loss | -0.000251 | -| std | 1.01 | -| value_loss | 4.37e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 482 | -| time_elapsed | 9345 | -| total_timesteps | 61696 | -| train/ | | -| approx_kl | 1.9783154e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 4810 | -| policy_gradient_loss | -0.000314 | -| std | 1.01 | -| value_loss | 3.18e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 483 | -| time_elapsed | 9372 | -| total_timesteps | 61824 | -| train/ | | -| approx_kl | 2.658926e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.000111 | -| n_updates | 4820 | -| policy_gradient_loss | 4.67e-05 | -| std | 1.01 | -| value_loss | 2.48e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 6 | -| iterations | 484 | -| time_elapsed | 9413 | -| total_timesteps | 61952 | -| train/ | | -| approx_kl | 8.935574e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | -0.000229 | -| n_updates | 4830 | -| policy_gradient_loss | -0.000106 | -| std | 1.01 | -| value_loss | 1.96e-08 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 485 | -| time_elapsed | 9453 | -| total_timesteps | 62080 | -| train/ | | -| approx_kl | 1.13854185e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.00296 | -| learning_rate | 0.0003 | -| loss | -0.000383 | -| n_updates | 4840 | -| policy_gradient_loss | -0.000174 | -| std | 1.01 | -| value_loss | 1.57e-08 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 486 | -| time_elapsed | 9518 | -| total_timesteps | 62208 | -| train/ | | -| approx_kl | 3.5641715e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.727 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 4850 | -| policy_gradient_loss | 4.22e-05 | -| std | 1.01 | -| value_loss | 0.0036 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 487 | -| time_elapsed | 9557 | -| total_timesteps | 62336 | -| train/ | | -| approx_kl | 9.820797e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -417 | -| learning_rate | 0.0003 | -| loss | -6.98e-07 | -| n_updates | 4860 | -| policy_gradient_loss | -4.27e-06 | -| std | 1.01 | -| value_loss | 6.05e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 488 | -| time_elapsed | 9580 | -| total_timesteps | 62464 | -| train/ | | -| approx_kl | 1.876615e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -119 | -| learning_rate | 0.0003 | -| loss | -0.000649 | -| n_updates | 4870 | -| policy_gradient_loss | -0.0003 | -| std | 1.01 | -| value_loss | 1.63e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 489 | -| time_elapsed | 9612 | -| total_timesteps | 62592 | -| train/ | | -| approx_kl | 6.172806e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -6.65e-05 | -| n_updates | 4880 | -| policy_gradient_loss | -3.66e-05 | -| std | 1.02 | -| value_loss | 1.51e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 490 | -| time_elapsed | 9639 | -| total_timesteps | 62720 | -| train/ | | -| approx_kl | 5.3364784e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -3.32 | -| learning_rate | 0.0003 | -| loss | -2.64e-06 | -| n_updates | 4890 | -| policy_gradient_loss | 2.71e-06 | -| std | 1.02 | -| value_loss | 7.86e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 491 | -| time_elapsed | 9676 | -| total_timesteps | 62848 | -| train/ | | -| approx_kl | 3.467314e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | -0.00042 | -| n_updates | 4900 | -| policy_gradient_loss | -0.000168 | -| std | 1.02 | -| value_loss | 2.76e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 6 | -| iterations | 492 | -| time_elapsed | 9699 | -| total_timesteps | 62976 | -| train/ | | -| approx_kl | 3.3481047e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.00457 | -| learning_rate | 0.0003 | -| loss | -0.000124 | -| n_updates | 4910 | -| policy_gradient_loss | -2.08e-05 | -| std | 1.02 | -| value_loss | 1.33e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 493 | -| time_elapsed | 9735 | -| total_timesteps | 63104 | -| train/ | | -| approx_kl | 5.5972487e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.000405 | -| n_updates | 4920 | -| policy_gradient_loss | -0.000195 | -| std | 1.02 | -| value_loss | 7.19e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 494 | -| time_elapsed | 9823 | -| total_timesteps | 63232 | -| train/ | | -| approx_kl | 1.9441359e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.714 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 4930 | -| policy_gradient_loss | 1.8e-05 | -| std | 1.02 | -| value_loss | 0.00698 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 495 | -| time_elapsed | 9862 | -| total_timesteps | 63360 | -| train/ | | -| approx_kl | 1.9622967e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -344 | -| learning_rate | 0.0003 | -| loss | -8.47e-05 | -| n_updates | 4940 | -| policy_gradient_loss | -9.62e-05 | -| std | 1.02 | -| value_loss | 0.000214 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 496 | -| time_elapsed | 9887 | -| total_timesteps | 63488 | -| train/ | | -| approx_kl | 1.34296715e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -319 | -| learning_rate | 0.0003 | -| loss | -0.000524 | -| n_updates | 4950 | -| policy_gradient_loss | -0.000243 | -| std | 1.03 | -| value_loss | 4.62e-05 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 497 | -| time_elapsed | 9922 | -| total_timesteps | 63616 | -| train/ | | -| approx_kl | 2.000481e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -99.8 | -| learning_rate | 0.0003 | -| loss | 8.59e-05 | -| n_updates | 4960 | -| policy_gradient_loss | 5.32e-05 | -| std | 1.03 | -| value_loss | 1.53e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 498 | -| time_elapsed | 9944 | -| total_timesteps | 63744 | -| train/ | | -| approx_kl | 6.280374e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.000349 | -| n_updates | 4970 | -| policy_gradient_loss | -0.000141 | -| std | 1.03 | -| value_loss | 1.7e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 6 | -| iterations | 499 | -| time_elapsed | 9967 | -| total_timesteps | 63872 | -| train/ | | -| approx_kl | 6.791204e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -4.97 | -| learning_rate | 0.0003 | -| loss | -0.000455 | -| n_updates | 4980 | -| policy_gradient_loss | -0.000223 | -| std | 1.03 | -| value_loss | 7.26e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 500 | -| time_elapsed | 9997 | -| total_timesteps | 64000 | -| train/ | | -| approx_kl | 1.3788231e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.966 | -| learning_rate | 0.0003 | -| loss | -0.000158 | -| n_updates | 4990 | -| policy_gradient_loss | -6.18e-06 | -| std | 1.03 | -| value_loss | 4.11e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 501 | -| time_elapsed | 10029 | -| total_timesteps | 64128 | -| train/ | | -| approx_kl | 3.168825e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.000453 | -| learning_rate | 0.0003 | -| loss | -6.92e-05 | -| n_updates | 5000 | -| policy_gradient_loss | -3.84e-05 | -| std | 1.03 | -| value_loss | 8.94e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 502 | -| time_elapsed | 10092 | -| total_timesteps | 64256 | -| train/ | | -| approx_kl | 1.9841827e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.743 | -| learning_rate | 0.0003 | -| loss | 0.00375 | -| n_updates | 5010 | -| policy_gradient_loss | -5e-05 | -| std | 1.03 | -| value_loss | 0.00903 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 503 | -| time_elapsed | 10127 | -| total_timesteps | 64384 | -| train/ | | -| approx_kl | 1.010485e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | 0.000222 | -| n_updates | 5020 | -| policy_gradient_loss | -2.92e-05 | -| std | 1.02 | -| value_loss | 0.00201 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 504 | -| time_elapsed | 10161 | -| total_timesteps | 64512 | -| train/ | | -| approx_kl | 4.976522e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.000228 | -| n_updates | 5030 | -| policy_gradient_loss | -0.000134 | -| std | 1.03 | -| value_loss | 0.000755 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 505 | -| time_elapsed | 10198 | -| total_timesteps | 64640 | -| train/ | | -| approx_kl | 5.435664e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -45.4 | -| learning_rate | 0.0003 | -| loss | 0.000108 | -| n_updates | 5040 | -| policy_gradient_loss | -6.33e-05 | -| std | 1.03 | -| value_loss | 0.000501 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 506 | -| time_elapsed | 10238 | -| total_timesteps | 64768 | -| train/ | | -| approx_kl | 1.5036203e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.71 | -| learning_rate | 0.0003 | -| loss | -4.13e-05 | -| n_updates | 5050 | -| policy_gradient_loss | -8.95e-06 | -| std | 1.03 | -| value_loss | 1.27e-05 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 6 | -| iterations | 507 | -| time_elapsed | 10271 | -| total_timesteps | 64896 | -| train/ | | -| approx_kl | 1.21071935e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -6.88 | -| learning_rate | 0.0003 | -| loss | -0.000976 | -| n_updates | 5060 | -| policy_gradient_loss | -0.000384 | -| std | 1.03 | -| value_loss | 1.37e-06 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 508 | -| time_elapsed | 10303 | -| total_timesteps | 65024 | -| train/ | | -| approx_kl | 2.1015294e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.684 | -| learning_rate | 0.0003 | -| loss | 0.000132 | -| n_updates | 5070 | -| policy_gradient_loss | 0.000106 | -| std | 1.03 | -| value_loss | 1.33e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 509 | -| time_elapsed | 10395 | -| total_timesteps | 65152 | -| train/ | | -| approx_kl | 5.2154064e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.01 | -| learning_rate | 0.0003 | -| loss | 0.00287 | -| n_updates | 5080 | -| policy_gradient_loss | 1.07e-05 | -| std | 1.03 | -| value_loss | 0.00913 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 510 | -| time_elapsed | 10430 | -| total_timesteps | 65280 | -| train/ | | -| approx_kl | 1.3178214e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -225 | -| learning_rate | 0.0003 | -| loss | -6.19e-05 | -| n_updates | 5090 | -| policy_gradient_loss | -8.08e-05 | -| std | 1.03 | -| value_loss | 0.000254 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 511 | -| time_elapsed | 10463 | -| total_timesteps | 65408 | -| train/ | | -| approx_kl | 7.01705e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -259 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 5100 | -| policy_gradient_loss | -0.000211 | -| std | 1.02 | -| value_loss | 2.83e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 512 | -| time_elapsed | 10509 | -| total_timesteps | 65536 | -| train/ | | -| approx_kl | 1.2374949e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.000969 | -| n_updates | 5110 | -| policy_gradient_loss | -0.000419 | -| std | 1.03 | -| value_loss | 7.95e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 513 | -| time_elapsed | 10535 | -| total_timesteps | 65664 | -| train/ | | -| approx_kl | 1.422409e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.000299 | -| n_updates | 5120 | -| policy_gradient_loss | -0.000142 | -| std | 1.03 | -| value_loss | 1.27e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 514 | -| time_elapsed | 10568 | -| total_timesteps | 65792 | -| train/ | | -| approx_kl | 4.3986365e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.000217 | -| n_updates | 5130 | -| policy_gradient_loss | -6.99e-05 | -| std | 1.02 | -| value_loss | 3.14e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 6 | -| iterations | 515 | -| time_elapsed | 10615 | -| total_timesteps | 65920 | -| train/ | | -| approx_kl | 1.3341196e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | -0.00097 | -| n_updates | 5140 | -| policy_gradient_loss | -0.000434 | -| std | 1.02 | -| value_loss | 1.24e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 516 | -| time_elapsed | 10652 | -| total_timesteps | 66048 | -| train/ | | -| approx_kl | 1.2755394e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.000179 | -| n_updates | 5150 | -| policy_gradient_loss | -7.63e-05 | -| std | 1.02 | -| value_loss | 6.43e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 517 | -| time_elapsed | 10717 | -| total_timesteps | 66176 | -| train/ | | -| approx_kl | 4.741829e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -2.68 | -| learning_rate | 0.0003 | -| loss | 0.00098 | -| n_updates | 5160 | -| policy_gradient_loss | -0.000164 | -| std | 1.02 | -| value_loss | 0.00332 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 518 | -| time_elapsed | 10755 | -| total_timesteps | 66304 | -| train/ | | -| approx_kl | 3.3542514e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -88.7 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 5170 | -| policy_gradient_loss | -0.000922 | -| std | 1.02 | -| value_loss | 2.43e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 519 | -| time_elapsed | 10790 | -| total_timesteps | 66432 | -| train/ | | -| approx_kl | 1.20271e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -60 | -| learning_rate | 0.0003 | -| loss | 0.000115 | -| n_updates | 5180 | -| policy_gradient_loss | 9.56e-05 | -| std | 1.03 | -| value_loss | 7.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 520 | -| time_elapsed | 10824 | -| total_timesteps | 66560 | -| train/ | | -| approx_kl | 7.934403e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -3.51 | -| learning_rate | 0.0003 | -| loss | -0.000719 | -| n_updates | 5190 | -| policy_gradient_loss | -0.000292 | -| std | 1.03 | -| value_loss | 7.71e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 521 | -| time_elapsed | 10851 | -| total_timesteps | 66688 | -| train/ | | -| approx_kl | 1.1881813e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 5200 | -| policy_gradient_loss | -0.000195 | -| std | 1.03 | -| value_loss | 5.33e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 522 | -| time_elapsed | 10882 | -| total_timesteps | 66816 | -| train/ | | -| approx_kl | 6.4703636e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.000151 | -| n_updates | 5210 | -| policy_gradient_loss | -4.71e-05 | -| std | 1.03 | -| value_loss | 4.62e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 6 | -| iterations | 523 | -| time_elapsed | 10913 | -| total_timesteps | 66944 | -| train/ | | -| approx_kl | 0.00023950916 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 5220 | -| policy_gradient_loss | -0.00235 | -| std | 1.03 | -| value_loss | 3.47e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 524 | -| time_elapsed | 10946 | -| total_timesteps | 67072 | -| train/ | | -| approx_kl | 0.0010438845 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | -0.000178 | -| n_updates | 5230 | -| policy_gradient_loss | -7.01e-05 | -| std | 1.03 | -| value_loss | 2.34e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 525 | -| time_elapsed | 11008 | -| total_timesteps | 67200 | -| train/ | | -| approx_kl | 0.00039466657 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.7 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 5240 | -| policy_gradient_loss | -0.00142 | -| std | 1.03 | -| value_loss | 0.00215 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 526 | -| time_elapsed | 11021 | -| total_timesteps | 67328 | -| train/ | | -| approx_kl | 0.00036130566 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.000858 | -| n_updates | 5250 | -| policy_gradient_loss | -0.000504 | -| std | 1.03 | -| value_loss | 4.92e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 527 | -| time_elapsed | 11050 | -| total_timesteps | 67456 | -| train/ | | -| approx_kl | 4.227599e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -13.6 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 5260 | -| policy_gradient_loss | -0.000671 | -| std | 1.03 | -| value_loss | 2.11e-07 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 528 | -| time_elapsed | 11084 | -| total_timesteps | 67584 | -| train/ | | -| approx_kl | 1.09523535e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.000145 | -| n_updates | 5270 | -| policy_gradient_loss | 9.82e-05 | -| std | 1.03 | -| value_loss | 7.77e-08 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 529 | -| time_elapsed | 11116 | -| total_timesteps | 67712 | -| train/ | | -| approx_kl | 5.482696e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 5280 | -| policy_gradient_loss | -8.9e-05 | -| std | 1.03 | -| value_loss | 5.48e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 530 | -| time_elapsed | 11137 | -| total_timesteps | 67840 | -| train/ | | -| approx_kl | 1.4780089e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | -6.76e-05 | -| n_updates | 5290 | -| policy_gradient_loss | -4.48e-06 | -| std | 1.03 | -| value_loss | 3.61e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 6 | -| iterations | 531 | -| time_elapsed | 11173 | -| total_timesteps | 67968 | -| train/ | | -| approx_kl | 1.9122846e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.000791 | -| n_updates | 5300 | -| policy_gradient_loss | -0.000336 | -| std | 1.03 | -| value_loss | 2.16e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 6 | -| iterations | 532 | -| time_elapsed | 11211 | -| total_timesteps | 68096 | -| train/ | | -| approx_kl | 4.6035275e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0702 | -| learning_rate | 0.0003 | -| loss | 4.87e-05 | -| n_updates | 5310 | -| policy_gradient_loss | 0.000118 | -| std | 1.03 | -| value_loss | 1.2e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 6 | -| iterations | 533 | -| time_elapsed | 11296 | -| total_timesteps | 68224 | -| train/ | | -| approx_kl | 4.0880404e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.627 | -| learning_rate | 0.0003 | -| loss | 5.23e-05 | -| n_updates | 5320 | -| policy_gradient_loss | -0.000106 | -| std | 1.03 | -| value_loss | 0.000664 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 6 | -| iterations | 534 | -| time_elapsed | 11338 | -| total_timesteps | 68352 | -| train/ | | -| approx_kl | 5.5879354e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -284 | -| learning_rate | 0.0003 | -| loss | 5.18e-06 | -| n_updates | 5330 | -| policy_gradient_loss | 3.51e-05 | -| std | 1.04 | -| value_loss | 1.63e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 6 | -| iterations | 535 | -| time_elapsed | 11370 | -| total_timesteps | 68480 | -| train/ | | -| approx_kl | 3.054738e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -279 | -| learning_rate | 0.0003 | -| loss | -4.72e-05 | -| n_updates | 5340 | -| policy_gradient_loss | -6.01e-06 | -| std | 1.03 | -| value_loss | 5.24e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 6 | -| iterations | 536 | -| time_elapsed | 11409 | -| total_timesteps | 68608 | -| train/ | | -| approx_kl | 1.6386621e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -51.3 | -| learning_rate | 0.0003 | -| loss | -0.000129 | -| n_updates | 5350 | -| policy_gradient_loss | -5.93e-05 | -| std | 1.03 | -| value_loss | 2.5e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 6 | -| iterations | 537 | -| time_elapsed | 11446 | -| total_timesteps | 68736 | -| train/ | | -| approx_kl | 1.127366e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | -7.74e-06 | -| n_updates | 5360 | -| policy_gradient_loss | -3.91e-06 | -| std | 1.03 | -| value_loss | 3.92e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 5 | -| iterations | 538 | -| time_elapsed | 11480 | -| total_timesteps | 68864 | -| train/ | | -| approx_kl | 3.518071e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -0.000265 | -| n_updates | 5370 | -| policy_gradient_loss | -0.000107 | -| std | 1.03 | -| value_loss | 2.58e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 5 | -| iterations | 539 | -| time_elapsed | 11510 | -| total_timesteps | 68992 | -| train/ | | -| approx_kl | 1.2059696e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.000417 | -| n_updates | 5380 | -| policy_gradient_loss | -0.000124 | -| std | 1.03 | -| value_loss | 1.69e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 540 | -| time_elapsed | 11542 | -| total_timesteps | 69120 | -| train/ | | -| approx_kl | 8.7637454e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | 6.31e-05 | -| n_updates | 5390 | -| policy_gradient_loss | 9.16e-05 | -| std | 1.03 | -| value_loss | 1.05e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 541 | -| time_elapsed | 11638 | -| total_timesteps | 69248 | -| train/ | | -| approx_kl | 4.0368177e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.597 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 5400 | -| policy_gradient_loss | -0.000102 | -| std | 1.03 | -| value_loss | 0.00619 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 542 | -| time_elapsed | 11660 | -| total_timesteps | 69376 | -| train/ | | -| approx_kl | 6.52764e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -49.2 | -| learning_rate | 0.0003 | -| loss | -4.41e-05 | -| n_updates | 5410 | -| policy_gradient_loss | -2.79e-05 | -| std | 1.03 | -| value_loss | 2.89e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 543 | -| time_elapsed | 11690 | -| total_timesteps | 69504 | -| train/ | | -| approx_kl | 8.577481e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -31.1 | -| learning_rate | 0.0003 | -| loss | -7.08e-05 | -| n_updates | 5420 | -| policy_gradient_loss | -1.54e-05 | -| std | 1.03 | -| value_loss | 7.58e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 544 | -| time_elapsed | 11717 | -| total_timesteps | 69632 | -| train/ | | -| approx_kl | 3.2456592e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.78 | -| learning_rate | 0.0003 | -| loss | 8.06e-06 | -| n_updates | 5430 | -| policy_gradient_loss | 1.33e-05 | -| std | 1.03 | -| value_loss | 1.58e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 545 | -| time_elapsed | 11752 | -| total_timesteps | 69760 | -| train/ | | -| approx_kl | 4.596077e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -9.11e-05 | -| n_updates | 5440 | -| policy_gradient_loss | -2.57e-05 | -| std | 1.03 | -| value_loss | 7.13e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 5 | -| iterations | 546 | -| time_elapsed | 11789 | -| total_timesteps | 69888 | -| train/ | | -| approx_kl | 5.988404e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | -0.000121 | -| n_updates | 5450 | -| policy_gradient_loss | -1.89e-05 | -| std | 1.03 | -| value_loss | 3.32e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 547 | -| time_elapsed | 11830 | -| total_timesteps | 70016 | -| train/ | | -| approx_kl | 1.3839453e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | -2.69e-05 | -| n_updates | 5460 | -| policy_gradient_loss | 7.15e-06 | -| std | 1.03 | -| value_loss | 1.62e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 548 | -| time_elapsed | 11906 | -| total_timesteps | 70144 | -| train/ | | -| approx_kl | 8.896925e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | 0.000245 | -| n_updates | 5470 | -| policy_gradient_loss | -0.000328 | -| std | 1.03 | -| value_loss | 0.00233 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 549 | -| time_elapsed | 11936 | -| total_timesteps | 70272 | -| train/ | | -| approx_kl | 4.492188e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -137 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 5480 | -| policy_gradient_loss | -0.000467 | -| std | 1.02 | -| value_loss | 1.21e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 550 | -| time_elapsed | 11965 | -| total_timesteps | 70400 | -| train/ | | -| approx_kl | 4.4612214e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -74.4 | -| learning_rate | 0.0003 | -| loss | -2.44e-05 | -| n_updates | 5490 | -| policy_gradient_loss | -5.42e-06 | -| std | 1.02 | -| value_loss | 3.25e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 551 | -| time_elapsed | 12006 | -| total_timesteps | 70528 | -| train/ | | -| approx_kl | 8.940697e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -5.26 | -| learning_rate | 0.0003 | -| loss | -1.1e-05 | -| n_updates | 5500 | -| policy_gradient_loss | 1.07e-05 | -| std | 1.02 | -| value_loss | 3.24e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 552 | -| time_elapsed | 12046 | -| total_timesteps | 70656 | -| train/ | | -| approx_kl | 3.4212135e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.233 | -| learning_rate | 0.0003 | -| loss | -2.2e-05 | -| n_updates | 5510 | -| policy_gradient_loss | -9.31e-06 | -| std | 1.02 | -| value_loss | 1.92e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 553 | -| time_elapsed | 12074 | -| total_timesteps | 70784 | -| train/ | | -| approx_kl | 2.2093765e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | -0.000529 | -| n_updates | 5520 | -| policy_gradient_loss | -0.000235 | -| std | 1.02 | -| value_loss | 1.62e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 5 | -| iterations | 554 | -| time_elapsed | 12114 | -| total_timesteps | 70912 | -| train/ | | -| approx_kl | 4.4011977e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.000991 | -| n_updates | 5530 | -| policy_gradient_loss | -0.000497 | -| std | 1.02 | -| value_loss | 1.23e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 555 | -| time_elapsed | 12155 | -| total_timesteps | 71040 | -| train/ | | -| approx_kl | 2.998393e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.000135 | -| n_updates | 5540 | -| policy_gradient_loss | 0.000121 | -| std | 1.02 | -| value_loss | 8.54e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 556 | -| time_elapsed | 12231 | -| total_timesteps | 71168 | -| train/ | | -| approx_kl | 3.501773e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.682 | -| learning_rate | 0.0003 | -| loss | 0.00209 | -| n_updates | 5550 | -| policy_gradient_loss | 2.56e-06 | -| std | 1.02 | -| value_loss | 0.00445 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 557 | -| time_elapsed | 12272 | -| total_timesteps | 71296 | -| train/ | | -| approx_kl | 1.9327272e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -287 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 5560 | -| policy_gradient_loss | -0.00044 | -| std | 1.02 | -| value_loss | 4.45e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 558 | -| time_elapsed | 12296 | -| total_timesteps | 71424 | -| train/ | | -| approx_kl | 5.847588e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -305 | -| learning_rate | 0.0003 | -| loss | -0.000172 | -| n_updates | 5570 | -| policy_gradient_loss | -7.59e-05 | -| std | 1.02 | -| value_loss | 1.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 559 | -| time_elapsed | 12333 | -| total_timesteps | 71552 | -| train/ | | -| approx_kl | 9.355601e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -40.8 | -| learning_rate | 0.0003 | -| loss | -0.000405 | -| n_updates | 5580 | -| policy_gradient_loss | -7.24e-05 | -| std | 1.02 | -| value_loss | 5.32e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 560 | -| time_elapsed | 12364 | -| total_timesteps | 71680 | -| train/ | | -| approx_kl | 5.106069e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 5590 | -| policy_gradient_loss | -0.00061 | -| std | 1.02 | -| value_loss | 7.56e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 561 | -| time_elapsed | 12395 | -| total_timesteps | 71808 | -| train/ | | -| approx_kl | 1.4277175e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | 0.000158 | -| n_updates | 5600 | -| policy_gradient_loss | 0.000128 | -| std | 1.02 | -| value_loss | 5.37e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 5 | -| iterations | 562 | -| time_elapsed | 12433 | -| total_timesteps | 71936 | -| train/ | | -| approx_kl | 6.07688e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.00011 | -| n_updates | 5610 | -| policy_gradient_loss | -2.81e-05 | -| std | 1.02 | -| value_loss | 2.76e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 563 | -| time_elapsed | 12462 | -| total_timesteps | 72064 | -| train/ | | -| approx_kl | 5.040318e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0743 | -| learning_rate | 0.0003 | -| loss | -0.000181 | -| n_updates | 5620 | -| policy_gradient_loss | -8.76e-05 | -| std | 1.02 | -| value_loss | 1.36e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 564 | -| time_elapsed | 12518 | -| total_timesteps | 72192 | -| train/ | | -| approx_kl | 5.2964315e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.653 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 5630 | -| policy_gradient_loss | -7.76e-05 | -| std | 1.02 | -| value_loss | 0.00452 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 565 | -| time_elapsed | 12546 | -| total_timesteps | 72320 | -| train/ | | -| approx_kl | 4.3315813e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -3.28 | -| learning_rate | 0.0003 | -| loss | -0.000426 | -| n_updates | 5640 | -| policy_gradient_loss | -0.00017 | -| std | 1.02 | -| value_loss | 6.12e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 566 | -| time_elapsed | 12574 | -| total_timesteps | 72448 | -| train/ | | -| approx_kl | 9.085983e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.739 | -| learning_rate | 0.0003 | -| loss | -0.000384 | -| n_updates | 5650 | -| policy_gradient_loss | -0.000195 | -| std | 1.03 | -| value_loss | 2.27e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 567 | -| time_elapsed | 12605 | -| total_timesteps | 72576 | -| train/ | | -| approx_kl | 3.2493845e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | 6.36e-05 | -| n_updates | 5660 | -| policy_gradient_loss | 3.97e-05 | -| std | 1.03 | -| value_loss | 6.78e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 568 | -| time_elapsed | 12633 | -| total_timesteps | 72704 | -| train/ | | -| approx_kl | 3.1106174e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -2.78e-05 | -| n_updates | 5670 | -| policy_gradient_loss | -1.01e-05 | -| std | 1.03 | -| value_loss | 3.88e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 569 | -| time_elapsed | 12673 | -| total_timesteps | 72832 | -| train/ | | -| approx_kl | 4.1718595e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | -0.000206 | -| n_updates | 5680 | -| policy_gradient_loss | -8.92e-05 | -| std | 1.03 | -| value_loss | 1.93e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 5 | -| iterations | 570 | -| time_elapsed | 12710 | -| total_timesteps | 72960 | -| train/ | | -| approx_kl | 3.3648685e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | -3.14e-05 | -| n_updates | 5690 | -| policy_gradient_loss | -6.67e-06 | -| std | 1.03 | -| value_loss | 1.03e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 571 | -| time_elapsed | 12744 | -| total_timesteps | 73088 | -| train/ | | -| approx_kl | 1.3029203e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.000101 | -| n_updates | 5700 | -| policy_gradient_loss | -2.06e-05 | -| std | 1.03 | -| value_loss | 5.51e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 572 | -| time_elapsed | 12817 | -| total_timesteps | 73216 | -| train/ | | -| approx_kl | 2.657529e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | 0.000353 | -| n_updates | 5710 | -| policy_gradient_loss | -0.000105 | -| std | 1.03 | -| value_loss | 0.00148 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 573 | -| time_elapsed | 12856 | -| total_timesteps | 73344 | -| train/ | | -| approx_kl | 1.017563e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 5720 | -| policy_gradient_loss | -6.43e-05 | -| std | 1.03 | -| value_loss | 1.56e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 574 | -| time_elapsed | 12892 | -| total_timesteps | 73472 | -| train/ | | -| approx_kl | 8.839648e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -16.6 | -| learning_rate | 0.0003 | -| loss | -0.00054 | -| n_updates | 5730 | -| policy_gradient_loss | -0.0002 | -| std | 1.03 | -| value_loss | 7.36e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 575 | -| time_elapsed | 12923 | -| total_timesteps | 73600 | -| train/ | | -| approx_kl | 7.012859e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -1.76 | -| learning_rate | 0.0003 | -| loss | 8.09e-05 | -| n_updates | 5740 | -| policy_gradient_loss | 0.000106 | -| std | 1.02 | -| value_loss | 8.44e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 576 | -| time_elapsed | 12973 | -| total_timesteps | 73728 | -| train/ | | -| approx_kl | 6.129965e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.000497 | -| n_updates | 5750 | -| policy_gradient_loss | -0.000147 | -| std | 1.02 | -| value_loss | 4.12e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 577 | -| time_elapsed | 13013 | -| total_timesteps | 73856 | -| train/ | | -| approx_kl | 1.226645e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 5760 | -| policy_gradient_loss | -0.000236 | -| std | 1.02 | -| value_loss | 2.03e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 5 | -| iterations | 578 | -| time_elapsed | 13055 | -| total_timesteps | 73984 | -| train/ | | -| approx_kl | 8.749776e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | -0.000389 | -| n_updates | 5770 | -| policy_gradient_loss | -0.000143 | -| std | 1.02 | -| value_loss | 1.11e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 579 | -| time_elapsed | 13087 | -| total_timesteps | 74112 | -| train/ | | -| approx_kl | 5.7253055e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 2.04e-05 | -| n_updates | 5780 | -| policy_gradient_loss | 1.31e-05 | -| std | 1.02 | -| value_loss | 6e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 580 | -| time_elapsed | 13161 | -| total_timesteps | 74240 | -| train/ | | -| approx_kl | 3.6493875e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | 0.467 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 5790 | -| policy_gradient_loss | -0.000115 | -| std | 1.02 | -| value_loss | 0.0264 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 581 | -| time_elapsed | 13187 | -| total_timesteps | 74368 | -| train/ | | -| approx_kl | 1.7643906e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -20.5 | -| learning_rate | 0.0003 | -| loss | 0.000155 | -| n_updates | 5800 | -| policy_gradient_loss | -2.72e-05 | -| std | 1.03 | -| value_loss | 0.000291 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 582 | -| time_elapsed | 13225 | -| total_timesteps | 74496 | -| train/ | | -| approx_kl | 3.461726e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -33 | -| learning_rate | 0.0003 | -| loss | -0.000167 | -| n_updates | 5810 | -| policy_gradient_loss | -8.98e-05 | -| std | 1.03 | -| value_loss | 9.61e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 583 | -| time_elapsed | 13260 | -| total_timesteps | 74624 | -| train/ | | -| approx_kl | 2.8219074e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -8.51e-05 | -| n_updates | 5820 | -| policy_gradient_loss | -2.72e-05 | -| std | 1.03 | -| value_loss | 1.42e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 584 | -| time_elapsed | 13296 | -| total_timesteps | 74752 | -| train/ | | -| approx_kl | 3.9068982e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.335 | -| learning_rate | 0.0003 | -| loss | 2.44e-05 | -| n_updates | 5830 | -| policy_gradient_loss | 1.93e-05 | -| std | 1.03 | -| value_loss | 2.08e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 5 | -| iterations | 585 | -| time_elapsed | 13328 | -| total_timesteps | 74880 | -| train/ | | -| approx_kl | 2.225954e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | -0.000741 | -| n_updates | 5840 | -| policy_gradient_loss | -0.000291 | -| std | 1.03 | -| value_loss | 2.75e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 586 | -| time_elapsed | 13359 | -| total_timesteps | 75008 | -| train/ | | -| approx_kl | 0.00013374165 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.0975 | -| learning_rate | 0.0003 | -| loss | -0.000681 | -| n_updates | 5850 | -| policy_gradient_loss | -0.000325 | -| std | 1.03 | -| value_loss | 2.64e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 587 | -| time_elapsed | 13433 | -| total_timesteps | 75136 | -| train/ | | -| approx_kl | 2.2374094e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.614 | -| learning_rate | 0.0003 | -| loss | 0.00187 | -| n_updates | 5860 | -| policy_gradient_loss | -0.000234 | -| std | 1.03 | -| value_loss | 0.00633 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 588 | -| time_elapsed | 13467 | -| total_timesteps | 75264 | -| train/ | | -| approx_kl | 0.0001684674 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -20.3 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 5870 | -| policy_gradient_loss | -0.000584 | -| std | 1.03 | -| value_loss | 6.91e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 589 | -| time_elapsed | 13506 | -| total_timesteps | 75392 | -| train/ | | -| approx_kl | 2.1356158e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -50.2 | -| learning_rate | 0.0003 | -| loss | -0.00055 | -| n_updates | 5880 | -| policy_gradient_loss | -0.000303 | -| std | 1.03 | -| value_loss | 9.1e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 590 | -| time_elapsed | 13532 | -| total_timesteps | 75520 | -| train/ | | -| approx_kl | 4.271511e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | -1.21e-05 | -| n_updates | 5890 | -| policy_gradient_loss | 5.1e-06 | -| std | 1.03 | -| value_loss | 9.52e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 591 | -| time_elapsed | 13562 | -| total_timesteps | 75648 | -| train/ | | -| approx_kl | 4.991889e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.608 | -| learning_rate | 0.0003 | -| loss | -0.000188 | -| n_updates | 5900 | -| policy_gradient_loss | -6.96e-05 | -| std | 1.03 | -| value_loss | 7.65e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 592 | -| time_elapsed | 13590 | -| total_timesteps | 75776 | -| train/ | | -| approx_kl | 3.5542063e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.00958 | -| learning_rate | 0.0003 | -| loss | -0.00096 | -| n_updates | 5910 | -| policy_gradient_loss | -0.000392 | -| std | 1.03 | -| value_loss | 5.08e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 5 | -| iterations | 593 | -| time_elapsed | 13612 | -| total_timesteps | 75904 | -| train/ | | -| approx_kl | 1.0067597e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00869 | -| learning_rate | 0.0003 | -| loss | 0.000181 | -| n_updates | 5920 | -| policy_gradient_loss | 0.000166 | -| std | 1.03 | -| value_loss | 3.81e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 594 | -| time_elapsed | 13645 | -| total_timesteps | 76032 | -| train/ | | -| approx_kl | 5.7614874e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.000536 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 5930 | -| policy_gradient_loss | -0.000744 | -| std | 1.03 | -| value_loss | 2.91e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 595 | -| time_elapsed | 13725 | -| total_timesteps | 76160 | -| train/ | | -| approx_kl | 1.3621058e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.48 | -| learning_rate | 0.0003 | -| loss | 0.00999 | -| n_updates | 5940 | -| policy_gradient_loss | -8.04e-05 | -| std | 1.03 | -| value_loss | 0.0222 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 596 | -| time_elapsed | 13758 | -| total_timesteps | 76288 | -| train/ | | -| approx_kl | 1.5459955e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -84.5 | -| learning_rate | 0.0003 | -| loss | -0.000112 | -| n_updates | 5950 | -| policy_gradient_loss | -4.8e-05 | -| std | 1.03 | -| value_loss | 0.000282 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 597 | -| time_elapsed | 13793 | -| total_timesteps | 76416 | -| train/ | | -| approx_kl | 1.6392209e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -64.8 | -| learning_rate | 0.0003 | -| loss | -0.000439 | -| n_updates | 5960 | -| policy_gradient_loss | -0.000218 | -| std | 1.03 | -| value_loss | 7.62e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 598 | -| time_elapsed | 13814 | -| total_timesteps | 76544 | -| train/ | | -| approx_kl | 6.938353e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -5.97 | -| learning_rate | 0.0003 | -| loss | 7.19e-05 | -| n_updates | 5970 | -| policy_gradient_loss | 8.18e-05 | -| std | 1.03 | -| value_loss | 8.26e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 599 | -| time_elapsed | 13839 | -| total_timesteps | 76672 | -| train/ | | -| approx_kl | 6.012153e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -3.86 | -| learning_rate | 0.0003 | -| loss | -0.000262 | -| n_updates | 5980 | -| policy_gradient_loss | -0.000127 | -| std | 1.03 | -| value_loss | 4.53e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 600 | -| time_elapsed | 13867 | -| total_timesteps | 76800 | -| train/ | | -| approx_kl | 4.4191256e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 2.15e-05 | -| n_updates | 5990 | -| policy_gradient_loss | 3.7e-05 | -| std | 1.03 | -| value_loss | 1.14e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 5 | -| iterations | 601 | -| time_elapsed | 13903 | -| total_timesteps | 76928 | -| train/ | | -| approx_kl | 2.2337772e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | 0.00479 | -| learning_rate | 0.0003 | -| loss | -0.000103 | -| n_updates | 6000 | -| policy_gradient_loss | -4.98e-05 | -| std | 1.03 | -| value_loss | 6.09e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 602 | -| time_elapsed | 13930 | -| total_timesteps | 77056 | -| train/ | | -| approx_kl | 3.7364662e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.45 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | -0.000144 | -| n_updates | 6010 | -| policy_gradient_loss | -6.71e-05 | -| std | 1.03 | -| value_loss | 3.11e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 603 | -| time_elapsed | 14001 | -| total_timesteps | 77184 | -| train/ | | -| approx_kl | 3.4614466e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -0.648 | -| learning_rate | 0.0003 | -| loss | 0.000612 | -| n_updates | 6020 | -| policy_gradient_loss | -0.000504 | -| std | 1.02 | -| value_loss | 0.00552 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 604 | -| time_elapsed | 14030 | -| total_timesteps | 77312 | -| train/ | | -| approx_kl | 3.4861732e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -183 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 6030 | -| policy_gradient_loss | -0.000132 | -| std | 1.02 | -| value_loss | 0.000145 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 605 | -| time_elapsed | 14065 | -| total_timesteps | 77440 | -| train/ | | -| approx_kl | 6.2477775e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -228 | -| learning_rate | 0.0003 | -| loss | -0.000195 | -| n_updates | 6040 | -| policy_gradient_loss | -8.96e-05 | -| std | 1.02 | -| value_loss | 1.71e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 606 | -| time_elapsed | 14105 | -| total_timesteps | 77568 | -| train/ | | -| approx_kl | 4.619127e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.44 | -| explained_variance | -2.72 | -| learning_rate | 0.0003 | -| loss | -0.000531 | -| n_updates | 6050 | -| policy_gradient_loss | -0.000224 | -| std | 1.02 | -| value_loss | 5.53e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 607 | -| time_elapsed | 14126 | -| total_timesteps | 77696 | -| train/ | | -| approx_kl | 1.5140511e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -185 | -| learning_rate | 0.0003 | -| loss | -0.000929 | -| n_updates | 6060 | -| policy_gradient_loss | -0.00037 | -| std | 1.01 | -| value_loss | 6.19e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 608 | -| time_elapsed | 14151 | -| total_timesteps | 77824 | -| train/ | | -| approx_kl | 5.0254166e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -118 | -| learning_rate | 0.0003 | -| loss | 0.000178 | -| n_updates | 6070 | -| policy_gradient_loss | 0.000127 | -| std | 1.01 | -| value_loss | 2.68e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 5 | -| iterations | 609 | -| time_elapsed | 14179 | -| total_timesteps | 77952 | -| train/ | | -| approx_kl | 6.8442896e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -5.3 | -| learning_rate | 0.0003 | -| loss | -0.000272 | -| n_updates | 6080 | -| policy_gradient_loss | -0.00011 | -| std | 1.01 | -| value_loss | 5.9e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 610 | -| time_elapsed | 14216 | -| total_timesteps | 78080 | -| train/ | | -| approx_kl | 5.6692865e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.000895 | -| n_updates | 6090 | -| policy_gradient_loss | -0.000397 | -| std | 1.01 | -| value_loss | 2.73e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 611 | -| time_elapsed | 14277 | -| total_timesteps | 78208 | -| train/ | | -| approx_kl | 0.0006265552 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.628 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 6100 | -| policy_gradient_loss | -0.00185 | -| std | 1.01 | -| value_loss | 0.00759 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 612 | -| time_elapsed | 14312 | -| total_timesteps | 78336 | -| train/ | | -| approx_kl | 0.0008172598 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -14.6 | -| learning_rate | 0.0003 | -| loss | 0.000334 | -| n_updates | 6110 | -| policy_gradient_loss | 0.000234 | -| std | 1.01 | -| value_loss | 1.23e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 613 | -| time_elapsed | 14357 | -| total_timesteps | 78464 | -| train/ | | -| approx_kl | 0.0016334718 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -4.75 | -| learning_rate | 0.0003 | -| loss | -0.00746 | -| n_updates | 6120 | -| policy_gradient_loss | -0.00318 | -| std | 1.01 | -| value_loss | 3.78e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 614 | -| time_elapsed | 14392 | -| total_timesteps | 78592 | -| train/ | | -| approx_kl | 0.00024407823 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | 0.000831 | -| n_updates | 6130 | -| policy_gradient_loss | 0.000556 | -| std | 1.01 | -| value_loss | 1.21e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 615 | -| time_elapsed | 14423 | -| total_timesteps | 78720 | -| train/ | | -| approx_kl | 3.8521364e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.000748 | -| n_updates | 6140 | -| policy_gradient_loss | -0.000325 | -| std | 1.01 | -| value_loss | 7.88e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 616 | -| time_elapsed | 14442 | -| total_timesteps | 78848 | -| train/ | | -| approx_kl | 9.4641e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | 8.31e-05 | -| n_updates | 6150 | -| policy_gradient_loss | 9.47e-05 | -| std | 1.01 | -| value_loss | 4.31e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 5 | -| iterations | 617 | -| time_elapsed | 14477 | -| total_timesteps | 78976 | -| train/ | | -| approx_kl | 6.5501314e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.00902 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 6160 | -| policy_gradient_loss | -0.00056 | -| std | 1.01 | -| value_loss | 3.03e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 618 | -| time_elapsed | 14499 | -| total_timesteps | 79104 | -| train/ | | -| approx_kl | 5.6219287e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.000314 | -| n_updates | 6170 | -| policy_gradient_loss | 0.000349 | -| std | 1.01 | -| value_loss | 2.01e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 619 | -| time_elapsed | 14573 | -| total_timesteps | 79232 | -| train/ | | -| approx_kl | 3.401842e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | 0.516 | -| learning_rate | 0.0003 | -| loss | 0.000736 | -| n_updates | 6180 | -| policy_gradient_loss | -0.000106 | -| std | 1.01 | -| value_loss | 0.00224 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 620 | -| time_elapsed | 14608 | -| total_timesteps | 79360 | -| train/ | | -| approx_kl | 3.7983991e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -204 | -| learning_rate | 0.0003 | -| loss | -3.52e-06 | -| n_updates | 6190 | -| policy_gradient_loss | 1.63e-05 | -| std | 1.01 | -| value_loss | 2.08e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 621 | -| time_elapsed | 14635 | -| total_timesteps | 79488 | -| train/ | | -| approx_kl | 5.6098215e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -217 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 6200 | -| policy_gradient_loss | -0.000121 | -| std | 1.01 | -| value_loss | 5.14e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 622 | -| time_elapsed | 14666 | -| total_timesteps | 79616 | -| train/ | | -| approx_kl | 3.3383258e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.43 | -| explained_variance | -25.1 | -| learning_rate | 0.0003 | -| loss | -0.000202 | -| n_updates | 6210 | -| policy_gradient_loss | -9.73e-05 | -| std | 1.01 | -| value_loss | 4.98e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 623 | -| time_elapsed | 14690 | -| total_timesteps | 79744 | -| train/ | | -| approx_kl | 3.221305e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 6220 | -| policy_gradient_loss | -0.000717 | -| std | 1 | -| value_loss | 1.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 5 | -| iterations | 624 | -| time_elapsed | 14720 | -| total_timesteps | 79872 | -| train/ | | -| approx_kl | 4.629977e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 6230 | -| policy_gradient_loss | -0.00018 | -| std | 0.998 | -| value_loss | 6.53e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 625 | -| time_elapsed | 14750 | -| total_timesteps | 80000 | -| train/ | | -| approx_kl | 6.848015e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.0087 | -| learning_rate | 0.0003 | -| loss | 5.68e-05 | -| n_updates | 6240 | -| policy_gradient_loss | 0.000144 | -| std | 0.996 | -| value_loss | 1.68e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 626 | -| time_elapsed | 14781 | -| total_timesteps | 80128 | -| train/ | | -| approx_kl | 2.7745496e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00536 | -| learning_rate | 0.0003 | -| loss | -0.000684 | -| n_updates | 6250 | -| policy_gradient_loss | -0.000165 | -| std | 0.996 | -| value_loss | 2.1e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 627 | -| time_elapsed | 14869 | -| total_timesteps | 80256 | -| train/ | | -| approx_kl | 0.00017097034 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.804 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 6260 | -| policy_gradient_loss | -0.000124 | -| std | 0.995 | -| value_loss | 0.00328 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 628 | -| time_elapsed | 14895 | -| total_timesteps | 80384 | -| train/ | | -| approx_kl | 0.00026943116 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -400 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 6270 | -| policy_gradient_loss | -0.00175 | -| std | 0.991 | -| value_loss | 1.59e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 629 | -| time_elapsed | 14932 | -| total_timesteps | 80512 | -| train/ | | -| approx_kl | 0.00010381173 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -355 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 6280 | -| policy_gradient_loss | -0.000158 | -| std | 0.987 | -| value_loss | 4.15e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 630 | -| time_elapsed | 14971 | -| total_timesteps | 80640 | -| train/ | | -| approx_kl | 5.335547e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -4.94 | -| learning_rate | 0.0003 | -| loss | 4e-05 | -| n_updates | 6290 | -| policy_gradient_loss | 3.93e-05 | -| std | 0.987 | -| value_loss | 2.43e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 631 | -| time_elapsed | 15003 | -| total_timesteps | 80768 | -| train/ | | -| approx_kl | 1.5849713e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -8.39 | -| learning_rate | 0.0003 | -| loss | -0.000679 | -| n_updates | 6300 | -| policy_gradient_loss | -0.000292 | -| std | 0.989 | -| value_loss | 3.18e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 632 | -| time_elapsed | 15031 | -| total_timesteps | 80896 | -| train/ | | -| approx_kl | 5.4528937e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.492 | -| learning_rate | 0.0003 | -| loss | -0.00012 | -| n_updates | 6310 | -| policy_gradient_loss | 8.13e-05 | -| std | 0.988 | -| value_loss | 9.32e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 633 | -| time_elapsed | 15058 | -| total_timesteps | 81024 | -| train/ | | -| approx_kl | 3.6587007e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0037 | -| learning_rate | 0.0003 | -| loss | 6.3e-05 | -| n_updates | 6320 | -| policy_gradient_loss | 4.16e-05 | -| std | 0.987 | -| value_loss | 5.89e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 634 | -| time_elapsed | 15121 | -| total_timesteps | 81152 | -| train/ | | -| approx_kl | 1.788605e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.857 | -| learning_rate | 0.0003 | -| loss | 0.000813 | -| n_updates | 6330 | -| policy_gradient_loss | -4.47e-05 | -| std | 0.987 | -| value_loss | 0.00197 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 635 | -| time_elapsed | 15186 | -| total_timesteps | 81280 | -| train/ | | -| approx_kl | 9.9428e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.284 | -| learning_rate | 0.0003 | -| loss | -0.000525 | -| n_updates | 6340 | -| policy_gradient_loss | -0.000244 | -| std | 0.985 | -| value_loss | 7.3e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 636 | -| time_elapsed | 15235 | -| total_timesteps | 81408 | -| train/ | | -| approx_kl | 7.100869e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -72.5 | -| learning_rate | 0.0003 | -| loss | 9.04e-05 | -| n_updates | 6350 | -| policy_gradient_loss | 6.01e-05 | -| std | 0.984 | -| value_loss | 8.44e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 637 | -| time_elapsed | 15297 | -| total_timesteps | 81536 | -| train/ | | -| approx_kl | 3.2663345e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -5 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 6360 | -| policy_gradient_loss | -0.000438 | -| std | 0.987 | -| value_loss | 8.21e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 638 | -| time_elapsed | 15352 | -| total_timesteps | 81664 | -| train/ | | -| approx_kl | 0.00018481398 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 6370 | -| policy_gradient_loss | -0.000468 | -| std | 0.988 | -| value_loss | 3.1e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 639 | -| time_elapsed | 15379 | -| total_timesteps | 81792 | -| train/ | | -| approx_kl | 2.2714958e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 3.46e-05 | -| n_updates | 6380 | -| policy_gradient_loss | 0.000182 | -| std | 0.99 | -| value_loss | 2.35e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 640 | -| time_elapsed | 15436 | -| total_timesteps | 81920 | -| train/ | | -| approx_kl | 3.195973e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.00262 | -| learning_rate | 0.0003 | -| loss | 1.39e-05 | -| n_updates | 6390 | -| policy_gradient_loss | 1.51e-05 | -| std | 0.99 | -| value_loss | 2.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 641 | -| time_elapsed | 15476 | -| total_timesteps | 82048 | -| train/ | | -| approx_kl | 0.0003711125 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00253 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 6400 | -| policy_gradient_loss | -0.0012 | -| std | 0.991 | -| value_loss | 1.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 642 | -| time_elapsed | 15577 | -| total_timesteps | 82176 | -| train/ | | -| approx_kl | 0.015430723 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.745 | -| learning_rate | 0.0003 | -| loss | -0.004 | -| n_updates | 6410 | -| policy_gradient_loss | -0.0042 | -| std | 0.991 | -| value_loss | 0.00741 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 643 | -| time_elapsed | 15624 | -| total_timesteps | 82304 | -| train/ | | -| approx_kl | 0.0017130133 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -100 | -| learning_rate | 0.0003 | -| loss | -0.00537 | -| n_updates | 6420 | -| policy_gradient_loss | -0.0013 | -| std | 0.989 | -| value_loss | 5.66e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 644 | -| time_elapsed | 15670 | -| total_timesteps | 82432 | -| train/ | | -| approx_kl | 0.002380786 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -178 | -| learning_rate | 0.0003 | -| loss | -0.000115 | -| n_updates | 6430 | -| policy_gradient_loss | 2.84e-05 | -| std | 0.989 | -| value_loss | 1.6e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 645 | -| time_elapsed | 15730 | -| total_timesteps | 82560 | -| train/ | | -| approx_kl | 0.0011123368 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -43.6 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 6440 | -| policy_gradient_loss | -0.00092 | -| std | 0.99 | -| value_loss | 7.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 646 | -| time_elapsed | 15767 | -| total_timesteps | 82688 | -| train/ | | -| approx_kl | 0.001952522 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -28.8 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 6450 | -| policy_gradient_loss | -0.00238 | -| std | 0.99 | -| value_loss | 2.01e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 647 | -| time_elapsed | 15807 | -| total_timesteps | 82816 | -| train/ | | -| approx_kl | 0.0019557257 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -3.78 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 6460 | -| policy_gradient_loss | -0.00125 | -| std | 0.99 | -| value_loss | 2.6e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 648 | -| time_elapsed | 15878 | -| total_timesteps | 82944 | -| train/ | | -| approx_kl | 0.0019354527 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.565 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 6470 | -| policy_gradient_loss | -0.00481 | -| std | 0.988 | -| value_loss | 1.12e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 649 | -| time_elapsed | 15916 | -| total_timesteps | 83072 | -| train/ | | -| approx_kl | 0.00011779461 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.625 | -| learning_rate | 0.0003 | -| loss | 0.000341 | -| n_updates | 6480 | -| policy_gradient_loss | 0.000241 | -| std | 0.988 | -| value_loss | 6.45e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 650 | -| time_elapsed | 16027 | -| total_timesteps | 83200 | -| train/ | | -| approx_kl | 2.5009736e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.832 | -| learning_rate | 0.0003 | -| loss | -0.000149 | -| n_updates | 6490 | -| policy_gradient_loss | -0.000397 | -| std | 0.986 | -| value_loss | 0.00233 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 651 | -| time_elapsed | 16080 | -| total_timesteps | 83328 | -| train/ | | -| approx_kl | 0.0033977642 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -35.4 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 6500 | -| policy_gradient_loss | -0.00459 | -| std | 0.987 | -| value_loss | 2.65e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 652 | -| time_elapsed | 16160 | -| total_timesteps | 83456 | -| train/ | | -| approx_kl | 0.009718621 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -5.21 | -| learning_rate | 0.0003 | -| loss | 0.000126 | -| n_updates | 6510 | -| policy_gradient_loss | -0.000509 | -| std | 0.988 | -| value_loss | 3.2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 653 | -| time_elapsed | 16189 | -| total_timesteps | 83584 | -| train/ | | -| approx_kl | 0.01529472 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.564 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 6520 | -| policy_gradient_loss | -0.0138 | -| std | 0.986 | -| value_loss | 3.47e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 654 | -| time_elapsed | 16230 | -| total_timesteps | 83712 | -| train/ | | -| approx_kl | 0.00023608236 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 6530 | -| policy_gradient_loss | 0.001 | -| std | 0.985 | -| value_loss | 4.42e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 655 | -| time_elapsed | 16266 | -| total_timesteps | 83840 | -| train/ | | -| approx_kl | 5.6773424e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.00612 | -| learning_rate | 0.0003 | -| loss | -0.000125 | -| n_updates | 6540 | -| policy_gradient_loss | -5.65e-05 | -| std | 0.983 | -| value_loss | 4.74e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 5 | -| iterations | 656 | -| time_elapsed | 16300 | -| total_timesteps | 83968 | -| train/ | | -| approx_kl | 8.368865e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.000444 | -| n_updates | 6550 | -| policy_gradient_loss | -0.00012 | -| std | 0.984 | -| value_loss | 4.23e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 657 | -| time_elapsed | 16337 | -| total_timesteps | 84096 | -| train/ | | -| approx_kl | 8.2138926e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0913 | -| learning_rate | 0.0003 | -| loss | -0.00069 | -| n_updates | 6560 | -| policy_gradient_loss | -0.00033 | -| std | 0.985 | -| value_loss | 3.22e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 658 | -| time_elapsed | 16415 | -| total_timesteps | 84224 | -| train/ | | -| approx_kl | 8.462928e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.000296 | -| n_updates | 6570 | -| policy_gradient_loss | 7.74e-06 | -| std | 0.985 | -| value_loss | 0.000351 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 659 | -| time_elapsed | 16441 | -| total_timesteps | 84352 | -| train/ | | -| approx_kl | 6.691553e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -213 | -| learning_rate | 0.0003 | -| loss | -0.000414 | -| n_updates | 6580 | -| policy_gradient_loss | -0.000225 | -| std | 0.984 | -| value_loss | 9.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 660 | -| time_elapsed | 16474 | -| total_timesteps | 84480 | -| train/ | | -| approx_kl | 2.565328e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -177 | -| learning_rate | 0.0003 | -| loss | -0.000464 | -| n_updates | 6590 | -| policy_gradient_loss | -9.57e-05 | -| std | 0.986 | -| value_loss | 1.79e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 661 | -| time_elapsed | 16510 | -| total_timesteps | 84608 | -| train/ | | -| approx_kl | 9.790063e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.000327 | -| n_updates | 6600 | -| policy_gradient_loss | -0.000161 | -| std | 0.99 | -| value_loss | 3.98e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 662 | -| time_elapsed | 16555 | -| total_timesteps | 84736 | -| train/ | | -| approx_kl | 1.8074643e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -7.4 | -| learning_rate | 0.0003 | -| loss | -0.000623 | -| n_updates | 6610 | -| policy_gradient_loss | -0.000292 | -| std | 0.993 | -| value_loss | 1.41e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 663 | -| time_elapsed | 16587 | -| total_timesteps | 84864 | -| train/ | | -| approx_kl | 2.4372712e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00636 | -| learning_rate | 0.0003 | -| loss | 8.14e-05 | -| n_updates | 6620 | -| policy_gradient_loss | 6.28e-05 | -| std | 0.995 | -| value_loss | 5.15e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 5 | -| iterations | 664 | -| time_elapsed | 16630 | -| total_timesteps | 84992 | -| train/ | | -| approx_kl | 1.3659708e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.000485 | -| n_updates | 6630 | -| policy_gradient_loss | -0.000186 | -| std | 0.993 | -| value_loss | 2.39e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 665 | -| time_elapsed | 16670 | -| total_timesteps | 85120 | -| train/ | | -| approx_kl | 1.8198509e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.00376 | -| learning_rate | 0.0003 | -| loss | -6.16e-05 | -| n_updates | 6640 | -| policy_gradient_loss | -2.44e-05 | -| std | 0.992 | -| value_loss | 1.36e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 666 | -| time_elapsed | 16744 | -| total_timesteps | 85248 | -| train/ | | -| approx_kl | 6.8405643e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 6650 | -| policy_gradient_loss | 2.22e-05 | -| std | 0.992 | -| value_loss | 0.00414 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 667 | -| time_elapsed | 16782 | -| total_timesteps | 85376 | -| train/ | | -| approx_kl | 4.4884626e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -302 | -| learning_rate | 0.0003 | -| loss | -0.000937 | -| n_updates | 6660 | -| policy_gradient_loss | -0.000336 | -| std | 0.993 | -| value_loss | 2.08e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 668 | -| time_elapsed | 16818 | -| total_timesteps | 85504 | -| train/ | | -| approx_kl | 2.4037436e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -322 | -| learning_rate | 0.0003 | -| loss | -6.25e-05 | -| n_updates | 6670 | -| policy_gradient_loss | 0.000139 | -| std | 0.994 | -| value_loss | 1.7e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 669 | -| time_elapsed | 16858 | -| total_timesteps | 85632 | -| train/ | | -| approx_kl | 9.844685e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 6680 | -| policy_gradient_loss | -0.000558 | -| std | 0.994 | -| value_loss | 3.42e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 670 | -| time_elapsed | 16885 | -| total_timesteps | 85760 | -| train/ | | -| approx_kl | 9.536743e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -70.9 | -| learning_rate | 0.0003 | -| loss | 0.000145 | -| n_updates | 6690 | -| policy_gradient_loss | 0.00014 | -| std | 0.993 | -| value_loss | 2.98e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 5 | -| iterations | 671 | -| time_elapsed | 16919 | -| total_timesteps | 85888 | -| train/ | | -| approx_kl | 2.5518239e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -44.7 | -| learning_rate | 0.0003 | -| loss | -6.32e-05 | -| n_updates | 6700 | -| policy_gradient_loss | 5.78e-06 | -| std | 0.993 | -| value_loss | 5.4e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 672 | -| time_elapsed | 16951 | -| total_timesteps | 86016 | -| train/ | | -| approx_kl | 1.5473925e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -2.25 | -| learning_rate | 0.0003 | -| loss | -2.95e-05 | -| n_updates | 6710 | -| policy_gradient_loss | -1.28e-05 | -| std | 0.995 | -| value_loss | 8.65e-10 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 673 | -| time_elapsed | 17020 | -| total_timesteps | 86144 | -| train/ | | -| approx_kl | 1.17812306e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | 0.000936 | -| n_updates | 6720 | -| policy_gradient_loss | -6.15e-06 | -| std | 0.994 | -| value_loss | 0.0023 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 674 | -| time_elapsed | 17041 | -| total_timesteps | 86272 | -| train/ | | -| approx_kl | 8.109957e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -111 | -| learning_rate | 0.0003 | -| loss | -0.000472 | -| n_updates | 6730 | -| policy_gradient_loss | -0.000191 | -| std | 0.994 | -| value_loss | 3.7e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 675 | -| time_elapsed | 17074 | -| total_timesteps | 86400 | -| train/ | | -| approx_kl | 7.737894e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -34.8 | -| learning_rate | 0.0003 | -| loss | 5.11e-05 | -| n_updates | 6740 | -| policy_gradient_loss | 4.54e-05 | -| std | 0.994 | -| value_loss | 4.26e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 676 | -| time_elapsed | 17112 | -| total_timesteps | 86528 | -| train/ | | -| approx_kl | 4.151836e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -1.54 | -| learning_rate | 0.0003 | -| loss | -0.000299 | -| n_updates | 6750 | -| policy_gradient_loss | -9.54e-05 | -| std | 0.994 | -| value_loss | 9.49e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 677 | -| time_elapsed | 17146 | -| total_timesteps | 86656 | -| train/ | | -| approx_kl | 1.2060162e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.349 | -| learning_rate | 0.0003 | -| loss | -0.000203 | -| n_updates | 6760 | -| policy_gradient_loss | -0.000104 | -| std | 0.992 | -| value_loss | 1.02e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 678 | -| time_elapsed | 17175 | -| total_timesteps | 86784 | -| train/ | | -| approx_kl | 4.60539e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 6770 | -| policy_gradient_loss | -6.05e-05 | -| std | 0.99 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 5 | -| iterations | 679 | -| time_elapsed | 17201 | -| total_timesteps | 86912 | -| train/ | | -| approx_kl | 8.498784e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | -0.000499 | -| n_updates | 6780 | -| policy_gradient_loss | -0.000163 | -| std | 0.991 | -| value_loss | 1.21e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 680 | -| time_elapsed | 17236 | -| total_timesteps | 87040 | -| train/ | | -| approx_kl | 7.157214e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 6790 | -| policy_gradient_loss | -4.08e-05 | -| std | 0.993 | -| value_loss | 1.1e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 681 | -| time_elapsed | 17294 | -| total_timesteps | 87168 | -| train/ | | -| approx_kl | 1.5007332e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | 0.703 | -| learning_rate | 0.0003 | -| loss | 0.000156 | -| n_updates | 6800 | -| policy_gradient_loss | -0.000215 | -| std | 0.996 | -| value_loss | 0.00156 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 682 | -| time_elapsed | 17340 | -| total_timesteps | 87296 | -| train/ | | -| approx_kl | 4.2514876e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -346 | -| learning_rate | 0.0003 | -| loss | 1.5e-05 | -| n_updates | 6810 | -| policy_gradient_loss | 2.19e-05 | -| std | 0.997 | -| value_loss | 2.69e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 683 | -| time_elapsed | 17378 | -| total_timesteps | 87424 | -| train/ | | -| approx_kl | 1.2847595e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -286 | -| learning_rate | 0.0003 | -| loss | -0.000132 | -| n_updates | 6820 | -| policy_gradient_loss | -2.46e-05 | -| std | 0.997 | -| value_loss | 4.25e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 684 | -| time_elapsed | 17406 | -| total_timesteps | 87552 | -| train/ | | -| approx_kl | 3.8486905e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.42 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 6830 | -| policy_gradient_loss | -0.000101 | -| std | 0.995 | -| value_loss | 4.89e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 685 | -| time_elapsed | 17436 | -| total_timesteps | 87680 | -| train/ | | -| approx_kl | 5.276408e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -5.49 | -| learning_rate | 0.0003 | -| loss | -6.24e-05 | -| n_updates | 6840 | -| policy_gradient_loss | -3.4e-05 | -| std | 0.992 | -| value_loss | 2.89e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 686 | -| time_elapsed | 17471 | -| total_timesteps | 87808 | -| train/ | | -| approx_kl | 4.413817e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 6850 | -| policy_gradient_loss | -0.000721 | -| std | 0.99 | -| value_loss | 1.23e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 5 | -| iterations | 687 | -| time_elapsed | 17509 | -| total_timesteps | 87936 | -| train/ | | -| approx_kl | 0.00015345728 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 6860 | -| policy_gradient_loss | -0.000586 | -| std | 0.988 | -| value_loss | 9.3e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 5 | -| iterations | 688 | -| time_elapsed | 17537 | -| total_timesteps | 88064 | -| train/ | | -| approx_kl | 1.7468352e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.000303 | -| n_updates | 6870 | -| policy_gradient_loss | 0.000227 | -| std | 0.987 | -| value_loss | 6.63e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 5 | -| iterations | 689 | -| time_elapsed | 17582 | -| total_timesteps | 88192 | -| train/ | | -| approx_kl | 8.161645e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 6880 | -| policy_gradient_loss | -0.000147 | -| std | 0.987 | -| value_loss | 0.00445 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 5 | -| iterations | 690 | -| time_elapsed | 17619 | -| total_timesteps | 88320 | -| train/ | | -| approx_kl | 6.457325e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.41 | -| explained_variance | -324 | -| learning_rate | 0.0003 | -| loss | -0.000422 | -| n_updates | 6890 | -| policy_gradient_loss | -0.000212 | -| std | 0.986 | -| value_loss | 5.01e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 5 | -| iterations | 691 | -| time_elapsed | 17655 | -| total_timesteps | 88448 | -| train/ | | -| approx_kl | 3.281515e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -522 | -| learning_rate | 0.0003 | -| loss | -0.000149 | -| n_updates | 6900 | -| policy_gradient_loss | -1.95e-05 | -| std | 0.984 | -| value_loss | 1.13e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 5 | -| iterations | 692 | -| time_elapsed | 17699 | -| total_timesteps | 88576 | -| train/ | | -| approx_kl | 2.031913e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -54.7 | -| learning_rate | 0.0003 | -| loss | -0.000562 | -| n_updates | 6910 | -| policy_gradient_loss | -0.000207 | -| std | 0.981 | -| value_loss | 5.09e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 5 | -| iterations | 693 | -| time_elapsed | 17733 | -| total_timesteps | 88704 | -| train/ | | -| approx_kl | 2.5993213e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | -0.000493 | -| n_updates | 6920 | -| policy_gradient_loss | -0.000114 | -| std | 0.979 | -| value_loss | 5.1e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 4 | -| iterations | 694 | -| time_elapsed | 17768 | -| total_timesteps | 88832 | -| train/ | | -| approx_kl | 0.0003863559 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 6930 | -| policy_gradient_loss | -0.00166 | -| std | 0.979 | -| value_loss | 5.36e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 4 | -| iterations | 695 | -| time_elapsed | 17801 | -| total_timesteps | 88960 | -| train/ | | -| approx_kl | 0.00025705202 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.0115 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 6940 | -| policy_gradient_loss | -0.00137 | -| std | 0.982 | -| value_loss | 2.33e-09 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 696 | -| time_elapsed | 17842 | -| total_timesteps | 89088 | -| train/ | | -| approx_kl | 0.000105711166 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.000859 | -| n_updates | 6950 | -| policy_gradient_loss | -0.00044 | -| std | 0.984 | -| value_loss | 1.33e-09 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 697 | -| time_elapsed | 17911 | -| total_timesteps | 89216 | -| train/ | | -| approx_kl | 2.3099128e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.856 | -| learning_rate | 0.0003 | -| loss | 0.000623 | -| n_updates | 6960 | -| policy_gradient_loss | 8.87e-05 | -| std | 0.984 | -| value_loss | 0.00109 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 698 | -| time_elapsed | 17945 | -| total_timesteps | 89344 | -| train/ | | -| approx_kl | 5.8021396e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -36.1 | -| learning_rate | 0.0003 | -| loss | -1.49e-05 | -| n_updates | 6970 | -| policy_gradient_loss | -1.4e-07 | -| std | 0.984 | -| value_loss | 4.85e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 699 | -| time_elapsed | 17979 | -| total_timesteps | 89472 | -| train/ | | -| approx_kl | 0.00014722953 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -53.5 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 6980 | -| policy_gradient_loss | -0.000789 | -| std | 0.984 | -| value_loss | 2.2e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 700 | -| time_elapsed | 18012 | -| total_timesteps | 89600 | -| train/ | | -| approx_kl | 0.0013699774 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -5.2 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 6990 | -| policy_gradient_loss | -0.000876 | -| std | 0.984 | -| value_loss | 1.39e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 701 | -| time_elapsed | 18052 | -| total_timesteps | 89728 | -| train/ | | -| approx_kl | 0.014366113 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 7000 | -| policy_gradient_loss | -0.00329 | -| std | 0.984 | -| value_loss | 8.58e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 702 | -| time_elapsed | 18080 | -| total_timesteps | 89856 | -| train/ | | -| approx_kl | 0.01273169 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.000803 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 7010 | -| policy_gradient_loss | -0.00801 | -| std | 0.983 | -| value_loss | 1.92e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 703 | -| time_elapsed | 18117 | -| total_timesteps | 89984 | -| train/ | | -| approx_kl | 6.1746687e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.000161 | -| n_updates | 7020 | -| policy_gradient_loss | 0.00113 | -| std | 0.983 | -| value_loss | 1.88e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 704 | -| time_elapsed | 18153 | -| total_timesteps | 90112 | -| train/ | | -| approx_kl | 0.001960929 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 7030 | -| policy_gradient_loss | -0.00129 | -| std | 0.983 | -| value_loss | 6.23e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 705 | -| time_elapsed | 18251 | -| total_timesteps | 90240 | -| train/ | | -| approx_kl | 0.000357138 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.861 | -| learning_rate | 0.0003 | -| loss | 0.000847 | -| n_updates | 7040 | -| policy_gradient_loss | 0.000413 | -| std | 0.984 | -| value_loss | 0.000755 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 706 | -| time_elapsed | 18285 | -| total_timesteps | 90368 | -| train/ | | -| approx_kl | 0.005212423 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -4.9 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 7050 | -| policy_gradient_loss | -0.00855 | -| std | 0.984 | -| value_loss | 3.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 707 | -| time_elapsed | 18321 | -| total_timesteps | 90496 | -| train/ | | -| approx_kl | 0.0007183566 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 7060 | -| policy_gradient_loss | -0.000801 | -| std | 0.983 | -| value_loss | 2.19e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 708 | -| time_elapsed | 18349 | -| total_timesteps | 90624 | -| train/ | | -| approx_kl | 1.3494864e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.94 | -| learning_rate | 0.0003 | -| loss | -0.000244 | -| n_updates | 7070 | -| policy_gradient_loss | 0.000183 | -| std | 0.983 | -| value_loss | 4e-08 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 709 | -| time_elapsed | 18378 | -| total_timesteps | 90752 | -| train/ | | -| approx_kl | 0.000110337045 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0588 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 7080 | -| policy_gradient_loss | -0.000804 | -| std | 0.985 | -| value_loss | 2.35e-08 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 710 | -| time_elapsed | 18402 | -| total_timesteps | 90880 | -| train/ | | -| approx_kl | 3.7439167e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.000171 | -| n_updates | 7090 | -| policy_gradient_loss | 0.000247 | -| std | 0.984 | -| value_loss | 1.14e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 711 | -| time_elapsed | 18430 | -| total_timesteps | 91008 | -| train/ | | -| approx_kl | 0.00014693383 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 7100 | -| policy_gradient_loss | -0.00121 | -| std | 0.983 | -| value_loss | 7.5e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 712 | -| time_elapsed | 18519 | -| total_timesteps | 91136 | -| train/ | | -| approx_kl | 4.2991713e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | 0.000145 | -| n_updates | 7110 | -| policy_gradient_loss | -0.000221 | -| std | 0.983 | -| value_loss | 0.00125 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 713 | -| time_elapsed | 18561 | -| total_timesteps | 91264 | -| train/ | | -| approx_kl | 1.7328653e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.914 | -| learning_rate | 0.0003 | -| loss | -0.000503 | -| n_updates | 7120 | -| policy_gradient_loss | -0.000256 | -| std | 0.985 | -| value_loss | 9.52e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 714 | -| time_elapsed | 18603 | -| total_timesteps | 91392 | -| train/ | | -| approx_kl | 1.8337741e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | 0.000113 | -| n_updates | 7130 | -| policy_gradient_loss | 8.8e-05 | -| std | 0.985 | -| value_loss | 2.65e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 715 | -| time_elapsed | 18648 | -| total_timesteps | 91520 | -| train/ | | -| approx_kl | 2.8042123e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.651 | -| learning_rate | 0.0003 | -| loss | -0.000125 | -| n_updates | 7140 | -| policy_gradient_loss | -5.58e-05 | -| std | 0.984 | -| value_loss | 4.44e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 716 | -| time_elapsed | 18685 | -| total_timesteps | 91648 | -| train/ | | -| approx_kl | 8.408446e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.000678 | -| learning_rate | 0.0003 | -| loss | -0.000549 | -| n_updates | 7150 | -| policy_gradient_loss | -0.000191 | -| std | 0.983 | -| value_loss | 2.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 717 | -| time_elapsed | 18703 | -| total_timesteps | 91776 | -| train/ | | -| approx_kl | 3.3043325e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.000338 | -| learning_rate | 0.0003 | -| loss | 1.54e-05 | -| n_updates | 7160 | -| policy_gradient_loss | 5.2e-05 | -| std | 0.981 | -| value_loss | 1.63e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 718 | -| time_elapsed | 18738 | -| total_timesteps | 91904 | -| train/ | | -| approx_kl | 4.8181973e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.000161 | -| n_updates | 7170 | -| policy_gradient_loss | -6.5e-05 | -| std | 0.981 | -| value_loss | 1.08e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 719 | -| time_elapsed | 18776 | -| total_timesteps | 92032 | -| train/ | | -| approx_kl | 3.0347146e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -2.12e-05 | -| n_updates | 7180 | -| policy_gradient_loss | -1.09e-05 | -| std | 0.981 | -| value_loss | 7.12e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 720 | -| time_elapsed | 18847 | -| total_timesteps | 92160 | -| train/ | | -| approx_kl | 5.3872354e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.000132 | -| n_updates | 7190 | -| policy_gradient_loss | -0.000115 | -| std | 0.983 | -| value_loss | 0.000418 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 721 | -| time_elapsed | 18886 | -| total_timesteps | 92288 | -| train/ | | -| approx_kl | 4.237052e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -310 | -| learning_rate | 0.0003 | -| loss | -8.73e-05 | -| n_updates | 7200 | -| policy_gradient_loss | -2.71e-05 | -| std | 0.982 | -| value_loss | 3.69e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 722 | -| time_elapsed | 18920 | -| total_timesteps | 92416 | -| train/ | | -| approx_kl | 8.688308e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -199 | -| learning_rate | 0.0003 | -| loss | -0.000371 | -| n_updates | 7210 | -| policy_gradient_loss | -0.000175 | -| std | 0.98 | -| value_loss | 1.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 723 | -| time_elapsed | 18950 | -| total_timesteps | 92544 | -| train/ | | -| approx_kl | 4.396774e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -61.7 | -| learning_rate | 0.0003 | -| loss | -0.000101 | -| n_updates | 7220 | -| policy_gradient_loss | -4.4e-05 | -| std | 0.979 | -| value_loss | 1.99e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 724 | -| time_elapsed | 18976 | -| total_timesteps | 92672 | -| train/ | | -| approx_kl | 7.2419643e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00022 | -| n_updates | 7230 | -| policy_gradient_loss | -0.000103 | -| std | 0.979 | -| value_loss | 7.38e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 725 | -| time_elapsed | 19022 | -| total_timesteps | 92800 | -| train/ | | -| approx_kl | 3.4105033e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.4 | -| explained_variance | -0.085 | -| learning_rate | 0.0003 | -| loss | -0.000401 | -| n_updates | 7240 | -| policy_gradient_loss | -9.79e-05 | -| std | 0.978 | -| value_loss | 3.26e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 4 | -| iterations | 726 | -| time_elapsed | 19061 | -| total_timesteps | 92928 | -| train/ | | -| approx_kl | 2.392428e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.000667 | -| n_updates | 7250 | -| policy_gradient_loss | -0.000318 | -| std | 0.974 | -| value_loss | 1.23e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 727 | -| time_elapsed | 19103 | -| total_timesteps | 93056 | -| train/ | | -| approx_kl | 1.456961e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 7260 | -| policy_gradient_loss | -0.00059 | -| std | 0.969 | -| value_loss | 5.63e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 728 | -| time_elapsed | 19155 | -| total_timesteps | 93184 | -| train/ | | -| approx_kl | 1.7473474e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.46 | -| learning_rate | 0.0003 | -| loss | -0.000928 | -| n_updates | 7270 | -| policy_gradient_loss | -0.000647 | -| std | 0.964 | -| value_loss | 0.00104 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 729 | -| time_elapsed | 19185 | -| total_timesteps | 93312 | -| train/ | | -| approx_kl | 4.895963e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -529 | -| learning_rate | 0.0003 | -| loss | 0.000175 | -| n_updates | 7280 | -| policy_gradient_loss | 0.000113 | -| std | 0.961 | -| value_loss | 3.83e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 730 | -| time_elapsed | 19219 | -| total_timesteps | 93440 | -| train/ | | -| approx_kl | 4.7106296e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -789 | -| learning_rate | 0.0003 | -| loss | -0.000298 | -| n_updates | 7290 | -| policy_gradient_loss | -0.000133 | -| std | 0.959 | -| value_loss | 1.06e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 731 | -| time_elapsed | 19254 | -| total_timesteps | 93568 | -| train/ | | -| approx_kl | 3.923662e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -783 | -| learning_rate | 0.0003 | -| loss | -9.18e-05 | -| n_updates | 7300 | -| policy_gradient_loss | -2.95e-05 | -| std | 0.957 | -| value_loss | 3.4e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 732 | -| time_elapsed | 19294 | -| total_timesteps | 93696 | -| train/ | | -| approx_kl | 2.5485642e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -9.7 | -| learning_rate | 0.0003 | -| loss | -0.000317 | -| n_updates | 7310 | -| policy_gradient_loss | -0.000107 | -| std | 0.955 | -| value_loss | 2.84e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 733 | -| time_elapsed | 19324 | -| total_timesteps | 93824 | -| train/ | | -| approx_kl | 1.1883676e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -13.7 | -| learning_rate | 0.0003 | -| loss | -8.9e-06 | -| n_updates | 7320 | -| policy_gradient_loss | 2.79e-05 | -| std | 0.954 | -| value_loss | 9.76e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 734 | -| time_elapsed | 19364 | -| total_timesteps | 93952 | -| train/ | | -| approx_kl | 2.5746878e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.815 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 7330 | -| policy_gradient_loss | -0.000678 | -| std | 0.95 | -| value_loss | 2.24e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 735 | -| time_elapsed | 19389 | -| total_timesteps | 94080 | -| train/ | | -| approx_kl | 1.1513941e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.00413 | -| learning_rate | 0.0003 | -| loss | 0.000337 | -| n_updates | 7340 | -| policy_gradient_loss | 0.000219 | -| std | 0.947 | -| value_loss | 9.71e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 736 | -| time_elapsed | 19451 | -| total_timesteps | 94208 | -| train/ | | -| approx_kl | 1.0598451e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | 0.678 | -| learning_rate | 0.0003 | -| loss | 0.00224 | -| n_updates | 7350 | -| policy_gradient_loss | -2.73e-05 | -| std | 0.946 | -| value_loss | 0.00519 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 737 | -| time_elapsed | 19486 | -| total_timesteps | 94336 | -| train/ | | -| approx_kl | 4.486181e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -455 | -| learning_rate | 0.0003 | -| loss | -0.000308 | -| n_updates | 7360 | -| policy_gradient_loss | -0.000135 | -| std | 0.946 | -| value_loss | 2.14e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 738 | -| time_elapsed | 19518 | -| total_timesteps | 94464 | -| train/ | | -| approx_kl | 6.204471e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -584 | -| learning_rate | 0.0003 | -| loss | -4.19e-05 | -| n_updates | 7370 | -| policy_gradient_loss | -1.42e-05 | -| std | 0.947 | -| value_loss | 6.52e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 739 | -| time_elapsed | 19555 | -| total_timesteps | 94592 | -| train/ | | -| approx_kl | 6.4182095e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -36.6 | -| learning_rate | 0.0003 | -| loss | -0.000237 | -| n_updates | 7380 | -| policy_gradient_loss | -0.000112 | -| std | 0.948 | -| value_loss | 5.28e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 740 | -| time_elapsed | 19564 | -| total_timesteps | 94720 | -| train/ | | -| approx_kl | 8.000061e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | 1.11e-05 | -| n_updates | 7390 | -| policy_gradient_loss | 2.89e-05 | -| std | 0.948 | -| value_loss | 2.16e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 741 | -| time_elapsed | 19568 | -| total_timesteps | 94848 | -| train/ | | -| approx_kl | 8.5588545e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.893 | -| learning_rate | 0.0003 | -| loss | -3.16e-05 | -| n_updates | 7400 | -| policy_gradient_loss | -1.64e-05 | -| std | 0.947 | -| value_loss | 4.63e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 4 | -| iterations | 742 | -| time_elapsed | 19572 | -| total_timesteps | 94976 | -| train/ | | -| approx_kl | 3.8901344e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 7410 | -| policy_gradient_loss | -0.000105 | -| std | 0.948 | -| value_loss | 3.7e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 743 | -| time_elapsed | 19577 | -| total_timesteps | 95104 | -| train/ | | -| approx_kl | 3.2470562e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | -4.12e-06 | -| n_updates | 7420 | -| policy_gradient_loss | 1.82e-05 | -| std | 0.947 | -| value_loss | 2.98e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 744 | -| time_elapsed | 19596 | -| total_timesteps | 95232 | -| train/ | | -| approx_kl | 7.743947e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | 0.000141 | -| n_updates | 7430 | -| policy_gradient_loss | -2.46e-05 | -| std | 0.947 | -| value_loss | 0.000511 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 745 | -| time_elapsed | 19619 | -| total_timesteps | 95360 | -| train/ | | -| approx_kl | 1.3625249e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -96.3 | -| learning_rate | 0.0003 | -| loss | 7.78e-06 | -| n_updates | 7440 | -| policy_gradient_loss | 5.71e-06 | -| std | 0.947 | -| value_loss | 5.83e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 746 | -| time_elapsed | 19661 | -| total_timesteps | 95488 | -| train/ | | -| approx_kl | 1.8691644e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -79.9 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 7450 | -| policy_gradient_loss | -0.000846 | -| std | 0.951 | -| value_loss | 1e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 747 | -| time_elapsed | 19695 | -| total_timesteps | 95616 | -| train/ | | -| approx_kl | 1.7394777e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.000317 | -| n_updates | 7460 | -| policy_gradient_loss | 0.000175 | -| std | 0.95 | -| value_loss | 7.86e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 748 | -| time_elapsed | 19732 | -| total_timesteps | 95744 | -| train/ | | -| approx_kl | 4.829839e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.708 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 7470 | -| policy_gradient_loss | -0.000596 | -| std | 0.946 | -| value_loss | 5.49e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 4 | -| iterations | 749 | -| time_elapsed | 19769 | -| total_timesteps | 95872 | -| train/ | | -| approx_kl | 1.1912081e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.0909 | -| learning_rate | 0.0003 | -| loss | 0.000146 | -| n_updates | 7480 | -| policy_gradient_loss | 0.000109 | -| std | 0.943 | -| value_loss | 3.74e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 750 | -| time_elapsed | 19814 | -| total_timesteps | 96000 | -| train/ | | -| approx_kl | 6.4773485e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 2.64e-05 | -| n_updates | 7490 | -| policy_gradient_loss | 1.66e-05 | -| std | 0.943 | -| value_loss | 2.86e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 751 | -| time_elapsed | 19852 | -| total_timesteps | 96128 | -| train/ | | -| approx_kl | 1.1575408e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | 0.000487 | -| learning_rate | 0.0003 | -| loss | -0.000467 | -| n_updates | 7500 | -| policy_gradient_loss | -0.000177 | -| std | 0.943 | -| value_loss | 1.52e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 752 | -| time_elapsed | 19941 | -| total_timesteps | 96256 | -| train/ | | -| approx_kl | 0.00013305759 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | 0.1 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 7510 | -| policy_gradient_loss | -0.000874 | -| std | 0.943 | -| value_loss | 0.00164 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 753 | -| time_elapsed | 19977 | -| total_timesteps | 96384 | -| train/ | | -| approx_kl | 2.4480745e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -723 | -| learning_rate | 0.0003 | -| loss | 0.000386 | -| n_updates | 7520 | -| policy_gradient_loss | 0.000312 | -| std | 0.942 | -| value_loss | 1.33e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 754 | -| time_elapsed | 20018 | -| total_timesteps | 96512 | -| train/ | | -| approx_kl | 1.1797063e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -789 | -| learning_rate | 0.0003 | -| loss | -0.000157 | -| n_updates | 7530 | -| policy_gradient_loss | -7.66e-05 | -| std | 0.941 | -| value_loss | 3.15e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 755 | -| time_elapsed | 20055 | -| total_timesteps | 96640 | -| train/ | | -| approx_kl | 1.125969e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -64.8 | -| learning_rate | 0.0003 | -| loss | 1.85e-05 | -| n_updates | 7540 | -| policy_gradient_loss | 1.46e-05 | -| std | 0.94 | -| value_loss | 1.08e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 756 | -| time_elapsed | 20089 | -| total_timesteps | 96768 | -| train/ | | -| approx_kl | 0.00014337385 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -8.45 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 7550 | -| policy_gradient_loss | -0.000693 | -| std | 0.94 | -| value_loss | 3.76e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 4 | -| iterations | 757 | -| time_elapsed | 20120 | -| total_timesteps | 96896 | -| train/ | | -| approx_kl | 0.0050864406 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.963 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 7560 | -| policy_gradient_loss | -0.00692 | -| std | 0.94 | -| value_loss | 1.34e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 758 | -| time_elapsed | 20167 | -| total_timesteps | 97024 | -| train/ | | -| approx_kl | 0.002276755 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.342 | -| learning_rate | 0.0003 | -| loss | 0.00341 | -| n_updates | 7570 | -| policy_gradient_loss | 0.00297 | -| std | 0.94 | -| value_loss | 6.14e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 759 | -| time_elapsed | 20256 | -| total_timesteps | 97152 | -| train/ | | -| approx_kl | 0.014120027 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 7580 | -| policy_gradient_loss | -0.00671 | -| std | 0.941 | -| value_loss | 0.000546 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 760 | -| time_elapsed | 20287 | -| total_timesteps | 97280 | -| train/ | | -| approx_kl | 0.03196679 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -56.3 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 7590 | -| policy_gradient_loss | -0.00482 | -| std | 0.941 | -| value_loss | 8.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 761 | -| time_elapsed | 20321 | -| total_timesteps | 97408 | -| train/ | | -| approx_kl | 0.04009181 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -60.6 | -| learning_rate | 0.0003 | -| loss | -0.00882 | -| n_updates | 7600 | -| policy_gradient_loss | -0.00727 | -| std | 0.941 | -| value_loss | 2.63e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 762 | -| time_elapsed | 20355 | -| total_timesteps | 97536 | -| train/ | | -| approx_kl | 0.0077680596 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -4.65 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 7610 | -| policy_gradient_loss | -0.00361 | -| std | 0.941 | -| value_loss | 4.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 763 | -| time_elapsed | 20388 | -| total_timesteps | 97664 | -| train/ | | -| approx_kl | 0.0023443042 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | 0.0066 | -| learning_rate | 0.0003 | -| loss | -0.0072 | -| n_updates | 7620 | -| policy_gradient_loss | -0.00502 | -| std | 0.942 | -| value_loss | 1.21e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 764 | -| time_elapsed | 20421 | -| total_timesteps | 97792 | -| train/ | | -| approx_kl | 0.009808054 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.000211 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 7630 | -| policy_gradient_loss | -0.00465 | -| std | 0.943 | -| value_loss | 8.44e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 4 | -| iterations | 765 | -| time_elapsed | 20451 | -| total_timesteps | 97920 | -| train/ | | -| approx_kl | 0.00055787805 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.0042 | -| learning_rate | 0.0003 | -| loss | 0.000322 | -| n_updates | 7640 | -| policy_gradient_loss | 0.000971 | -| std | 0.945 | -| value_loss | 2.61e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 766 | -| time_elapsed | 20477 | -| total_timesteps | 98048 | -| train/ | | -| approx_kl | 0.031884804 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | -0.00907 | -| n_updates | 7650 | -| policy_gradient_loss | -0.00768 | -| std | 0.948 | -| value_loss | 2.06e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 767 | -| time_elapsed | 20537 | -| total_timesteps | 98176 | -| train/ | | -| approx_kl | 0.040895913 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 7660 | -| policy_gradient_loss | -0.0101 | -| std | 0.949 | -| value_loss | 0.000432 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 768 | -| time_elapsed | 20565 | -| total_timesteps | 98304 | -| train/ | | -| approx_kl | 0.0002919049 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -28.8 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 7670 | -| policy_gradient_loss | -0.00237 | -| std | 0.949 | -| value_loss | 2.15e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 769 | -| time_elapsed | 20600 | -| total_timesteps | 98432 | -| train/ | | -| approx_kl | 0.00022959616 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -40.6 | -| learning_rate | 0.0003 | -| loss | 8.4e-05 | -| n_updates | 7680 | -| policy_gradient_loss | 0.000845 | -| std | 0.951 | -| value_loss | 6.96e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 770 | -| time_elapsed | 20634 | -| total_timesteps | 98560 | -| train/ | | -| approx_kl | 0.021297693 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -3.03 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 7690 | -| policy_gradient_loss | -0.00472 | -| std | 0.953 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 771 | -| time_elapsed | 20665 | -| total_timesteps | 98688 | -| train/ | | -| approx_kl | 0.005597742 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | -0.000691 | -| n_updates | 7700 | -| policy_gradient_loss | -0.000797 | -| std | 0.953 | -| value_loss | 2.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 772 | -| time_elapsed | 20698 | -| total_timesteps | 98816 | -| train/ | | -| approx_kl | 0.0065651536 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.00784 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 7710 | -| policy_gradient_loss | -0.00157 | -| std | 0.954 | -| value_loss | 2.09e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 4 | -| iterations | 773 | -| time_elapsed | 20703 | -| total_timesteps | 98944 | -| train/ | | -| approx_kl | 0.017492048 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 7720 | -| policy_gradient_loss | -0.0039 | -| std | 0.954 | -| value_loss | 7.43e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 774 | -| time_elapsed | 20708 | -| total_timesteps | 99072 | -| train/ | | -| approx_kl | 0.017210877 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 7730 | -| policy_gradient_loss | -0.00685 | -| std | 0.954 | -| value_loss | 5.67e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 775 | -| time_elapsed | 20715 | -| total_timesteps | 99200 | -| train/ | | -| approx_kl | 0.0035990877 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | -0.0088 | -| n_updates | 7740 | -| policy_gradient_loss | -0.00246 | -| std | 0.955 | -| value_loss | 0.00115 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 776 | -| time_elapsed | 20719 | -| total_timesteps | 99328 | -| train/ | | -| approx_kl | 0.014886876 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -50.2 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 7750 | -| policy_gradient_loss | -0.00311 | -| std | 0.955 | -| value_loss | 5.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 777 | -| time_elapsed | 20722 | -| total_timesteps | 99456 | -| train/ | | -| approx_kl | 0.024663161 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -70 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 7760 | -| policy_gradient_loss | -0.00272 | -| std | 0.955 | -| value_loss | 2.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 778 | -| time_elapsed | 20725 | -| total_timesteps | 99584 | -| train/ | | -| approx_kl | 0.012641545 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -8.83 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 7770 | -| policy_gradient_loss | -0.00338 | -| std | 0.955 | -| value_loss | 1.75e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 779 | -| time_elapsed | 20728 | -| total_timesteps | 99712 | -| train/ | | -| approx_kl | 1.6810372e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 7780 | -| policy_gradient_loss | 6.4e-05 | -| std | 0.957 | -| value_loss | 4.74e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 780 | -| time_elapsed | 20731 | -| total_timesteps | 99840 | -| train/ | | -| approx_kl | 0.006977315 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.00617 | -| n_updates | 7790 | -| policy_gradient_loss | -0.00245 | -| std | 0.962 | -| value_loss | 2.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 4 | -| iterations | 781 | -| time_elapsed | 20736 | -| total_timesteps | 99968 | -| train/ | | -| approx_kl | 0.025870366 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 7800 | -| policy_gradient_loss | -0.00672 | -| std | 0.966 | -| value_loss | 1.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 782 | -| time_elapsed | 20740 | -| total_timesteps | 100096 | -| train/ | | -| approx_kl | 0.008633696 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.0066 | -| n_updates | 7810 | -| policy_gradient_loss | -0.00329 | -| std | 0.968 | -| value_loss | 6.19e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 783 | -| time_elapsed | 20748 | -| total_timesteps | 100224 | -| train/ | | -| approx_kl | 0.0061270515 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.578 | -| learning_rate | 0.0003 | -| loss | -4.97e-05 | -| n_updates | 7820 | -| policy_gradient_loss | -0.00158 | -| std | 0.968 | -| value_loss | 0.00612 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 784 | -| time_elapsed | 20752 | -| total_timesteps | 100352 | -| train/ | | -| approx_kl | 0.000515284 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -313 | -| learning_rate | 0.0003 | -| loss | 0.000588 | -| n_updates | 7830 | -| policy_gradient_loss | 0.000432 | -| std | 0.969 | -| value_loss | 2.09e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 785 | -| time_elapsed | 20755 | -| total_timesteps | 100480 | -| train/ | | -| approx_kl | 0.0013423283 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -699 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 7840 | -| policy_gradient_loss | -0.00103 | -| std | 0.97 | -| value_loss | 7.79e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 786 | -| time_elapsed | 20759 | -| total_timesteps | 100608 | -| train/ | | -| approx_kl | 0.0025701718 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -74.1 | -| learning_rate | 0.0003 | -| loss | -0.000408 | -| n_updates | 7850 | -| policy_gradient_loss | -0.000241 | -| std | 0.971 | -| value_loss | 2.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 787 | -| time_elapsed | 20763 | -| total_timesteps | 100736 | -| train/ | | -| approx_kl | 0.005298307 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 7860 | -| policy_gradient_loss | -0.00249 | -| std | 0.97 | -| value_loss | 1.57e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 788 | -| time_elapsed | 20767 | -| total_timesteps | 100864 | -| train/ | | -| approx_kl | 0.00072269933 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 7870 | -| policy_gradient_loss | 8.34e-05 | -| std | 0.969 | -| value_loss | 6.53e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 4 | -| iterations | 789 | -| time_elapsed | 20771 | -| total_timesteps | 100992 | -| train/ | | -| approx_kl | 0.0008929949 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 7880 | -| policy_gradient_loss | 0.001 | -| std | 0.968 | -| value_loss | 2.7e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 790 | -| time_elapsed | 20774 | -| total_timesteps | 101120 | -| train/ | | -| approx_kl | 0.016432479 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 7890 | -| policy_gradient_loss | -0.0096 | -| std | 0.969 | -| value_loss | 2.51e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 791 | -| time_elapsed | 20785 | -| total_timesteps | 101248 | -| train/ | | -| approx_kl | 0.00534099 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -4.57 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 7900 | -| policy_gradient_loss | -0.00119 | -| std | 0.97 | -| value_loss | 0.00191 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 792 | -| time_elapsed | 20789 | -| total_timesteps | 101376 | -| train/ | | -| approx_kl | 0.02693698 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -380 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 7910 | -| policy_gradient_loss | -0.0123 | -| std | 0.971 | -| value_loss | 1.87e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 793 | -| time_elapsed | 20793 | -| total_timesteps | 101504 | -| train/ | | -| approx_kl | 0.001037241 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -898 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 7920 | -| policy_gradient_loss | 0.000272 | -| std | 0.972 | -| value_loss | 4.3e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 794 | -| time_elapsed | 20798 | -| total_timesteps | 101632 | -| train/ | | -| approx_kl | 6.635254e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -301 | -| learning_rate | 0.0003 | -| loss | -0.000727 | -| n_updates | 7930 | -| policy_gradient_loss | 0.00109 | -| std | 0.972 | -| value_loss | 1.45e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 795 | -| time_elapsed | 20802 | -| total_timesteps | 101760 | -| train/ | | -| approx_kl | 0.017183457 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 7940 | -| policy_gradient_loss | -0.0037 | -| std | 0.969 | -| value_loss | 1.37e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 4 | -| iterations | 796 | -| time_elapsed | 20806 | -| total_timesteps | 101888 | -| train/ | | -| approx_kl | 0.0065917266 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 7950 | -| policy_gradient_loss | -0.00271 | -| std | 0.969 | -| value_loss | 7.08e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 797 | -| time_elapsed | 20811 | -| total_timesteps | 102016 | -| train/ | | -| approx_kl | 0.005185746 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 7960 | -| policy_gradient_loss | -0.00191 | -| std | 0.969 | -| value_loss | 5.63e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 798 | -| time_elapsed | 20821 | -| total_timesteps | 102144 | -| train/ | | -| approx_kl | 0.010989141 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | 0.000625 | -| n_updates | 7970 | -| policy_gradient_loss | 0.00011 | -| std | 0.968 | -| value_loss | 0.000873 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 799 | -| time_elapsed | 20825 | -| total_timesteps | 102272 | -| train/ | | -| approx_kl | 0.008659424 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -90.2 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 7980 | -| policy_gradient_loss | -0.0038 | -| std | 0.968 | -| value_loss | 6.05e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 800 | -| time_elapsed | 20830 | -| total_timesteps | 102400 | -| train/ | | -| approx_kl | 0.0033075367 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -67.4 | -| learning_rate | 0.0003 | -| loss | 0.0027 | -| n_updates | 7990 | -| policy_gradient_loss | 0.00199 | -| std | 0.969 | -| value_loss | 1.88e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 801 | -| time_elapsed | 20834 | -| total_timesteps | 102528 | -| train/ | | -| approx_kl | 0.00981584 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -3.02 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 8000 | -| policy_gradient_loss | -0.00346 | -| std | 0.968 | -| value_loss | 1.35e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 802 | -| time_elapsed | 20839 | -| total_timesteps | 102656 | -| train/ | | -| approx_kl | 0.0038160556 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 8010 | -| policy_gradient_loss | -0.00177 | -| std | 0.968 | -| value_loss | 6.48e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 803 | -| time_elapsed | 20843 | -| total_timesteps | 102784 | -| train/ | | -| approx_kl | 0.0032495419 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | 0.00216 | -| n_updates | 8020 | -| policy_gradient_loss | 0.00158 | -| std | 0.969 | -| value_loss | 6.59e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 4 | -| iterations | 804 | -| time_elapsed | 20848 | -| total_timesteps | 102912 | -| train/ | | -| approx_kl | 0.0069075595 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 8030 | -| policy_gradient_loss | -0.0034 | -| std | 0.968 | -| value_loss | 2.68e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 805 | -| time_elapsed | 20853 | -| total_timesteps | 103040 | -| train/ | | -| approx_kl | 0.008445466 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 8040 | -| policy_gradient_loss | -0.00146 | -| std | 0.968 | -| value_loss | 2.57e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 806 | -| time_elapsed | 20860 | -| total_timesteps | 103168 | -| train/ | | -| approx_kl | 0.005609523 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.606 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 8050 | -| policy_gradient_loss | -0.0034 | -| std | 0.968 | -| value_loss | 0.00645 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 807 | -| time_elapsed | 20865 | -| total_timesteps | 103296 | -| train/ | | -| approx_kl | 0.00034818798 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | -1.14e+03 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 8060 | -| policy_gradient_loss | 0.000831 | -| std | 0.966 | -| value_loss | 3.55e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 808 | -| time_elapsed | 20869 | -| total_timesteps | 103424 | -| train/ | | -| approx_kl | 0.0006022956 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -935 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 8070 | -| policy_gradient_loss | 0.000496 | -| std | 0.965 | -| value_loss | 1.28e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 809 | -| time_elapsed | 20873 | -| total_timesteps | 103552 | -| train/ | | -| approx_kl | 0.003269013 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -58.6 | -| learning_rate | 0.0003 | -| loss | 0.000651 | -| n_updates | 8080 | -| policy_gradient_loss | 0.000449 | -| std | 0.966 | -| value_loss | 1.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 810 | -| time_elapsed | 20876 | -| total_timesteps | 103680 | -| train/ | | -| approx_kl | 0.014914278 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 8090 | -| policy_gradient_loss | -0.00589 | -| std | 0.965 | -| value_loss | 6.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 811 | -| time_elapsed | 20880 | -| total_timesteps | 103808 | -| train/ | | -| approx_kl | 0.016874207 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 8100 | -| policy_gradient_loss | -0.00449 | -| std | 0.964 | -| value_loss | 1.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 812 | -| time_elapsed | 20885 | -| total_timesteps | 103936 | -| train/ | | -| approx_kl | 6.95684e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.00265 | -| learning_rate | 0.0003 | -| loss | -0.000318 | -| n_updates | 8110 | -| policy_gradient_loss | -8.08e-05 | -| std | 0.966 | -| value_loss | 1.73e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 813 | -| time_elapsed | 20889 | -| total_timesteps | 104064 | -| train/ | | -| approx_kl | 0.00044717174 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.00438 | -| learning_rate | 0.0003 | -| loss | -0.000333 | -| n_updates | 8120 | -| policy_gradient_loss | -0.000113 | -| std | 0.967 | -| value_loss | 2.07e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 814 | -| time_elapsed | 20896 | -| total_timesteps | 104192 | -| train/ | | -| approx_kl | 0.013093455 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -1.39 | -| explained_variance | 0.843 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 8130 | -| policy_gradient_loss | -0.00658 | -| std | 0.966 | -| value_loss | 0.000474 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 815 | -| time_elapsed | 20899 | -| total_timesteps | 104320 | -| train/ | | -| approx_kl | 0.026239535 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -680 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 8140 | -| policy_gradient_loss | -0.00993 | -| std | 0.966 | -| value_loss | 7.41e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 4 | -| iterations | 816 | -| time_elapsed | 20904 | -| total_timesteps | 104448 | -| train/ | | -| approx_kl | 0.0008777431 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -774 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 8150 | -| policy_gradient_loss | 0.00247 | -| std | 0.965 | -| value_loss | 1.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 817 | -| time_elapsed | 20909 | -| total_timesteps | 104576 | -| train/ | | -| approx_kl | 0.010679271 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 8160 | -| policy_gradient_loss | -0.00441 | -| std | 0.964 | -| value_loss | 8.24e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 818 | -| time_elapsed | 20911 | -| total_timesteps | 104704 | -| train/ | | -| approx_kl | 0.017139107 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 8170 | -| policy_gradient_loss | -0.006 | -| std | 0.964 | -| value_loss | 5.62e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 819 | -| time_elapsed | 20915 | -| total_timesteps | 104832 | -| train/ | | -| approx_kl | 0.0015595872 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.565 | -| learning_rate | 0.0003 | -| loss | 6.23e-06 | -| n_updates | 8180 | -| policy_gradient_loss | 8.19e-05 | -| std | 0.965 | -| value_loss | 1.41e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 820 | -| time_elapsed | 20919 | -| total_timesteps | 104960 | -| train/ | | -| approx_kl | 0.01384942 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 8190 | -| policy_gradient_loss | -0.00584 | -| std | 0.965 | -| value_loss | 1.23e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 821 | -| time_elapsed | 20924 | -| total_timesteps | 105088 | -| train/ | | -| approx_kl | 0.01553691 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 8200 | -| policy_gradient_loss | -0.00921 | -| std | 0.963 | -| value_loss | 6.75e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 822 | -| time_elapsed | 20934 | -| total_timesteps | 105216 | -| train/ | | -| approx_kl | 0.010856993 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.446 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 8210 | -| policy_gradient_loss | -0.00857 | -| std | 0.961 | -| value_loss | 0.000941 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 823 | -| time_elapsed | 20939 | -| total_timesteps | 105344 | -| train/ | | -| approx_kl | 0.002316581 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -41.9 | -| learning_rate | 0.0003 | -| loss | -0.00774 | -| n_updates | 8220 | -| policy_gradient_loss | -0.00171 | -| std | 0.96 | -| value_loss | 4.35e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 824 | -| time_elapsed | 20943 | -| total_timesteps | 105472 | -| train/ | | -| approx_kl | 0.0011246153 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -115 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 8230 | -| policy_gradient_loss | 0.00181 | -| std | 0.959 | -| value_loss | 2.01e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 825 | -| time_elapsed | 20948 | -| total_timesteps | 105600 | -| train/ | | -| approx_kl | 0.0038291048 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -3.3 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 8240 | -| policy_gradient_loss | -0.00103 | -| std | 0.958 | -| value_loss | 1.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 826 | -| time_elapsed | 20953 | -| total_timesteps | 105728 | -| train/ | | -| approx_kl | 0.005665146 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 8250 | -| policy_gradient_loss | -0.00424 | -| std | 0.958 | -| value_loss | 5.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 827 | -| time_elapsed | 20956 | -| total_timesteps | 105856 | -| train/ | | -| approx_kl | 0.020446744 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -1.38 | -| explained_variance | 0.00136 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 8260 | -| policy_gradient_loss | -0.00674 | -| std | 0.958 | -| value_loss | 6.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 5 | -| iterations | 828 | -| time_elapsed | 20961 | -| total_timesteps | 105984 | -| train/ | | -| approx_kl | 0.009041324 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.00695 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 8270 | -| policy_gradient_loss | -0.0029 | -| std | 0.955 | -| value_loss | 2.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 829 | -| time_elapsed | 20965 | -| total_timesteps | 106112 | -| train/ | | -| approx_kl | 0.004618683 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 8280 | -| policy_gradient_loss | -0.00233 | -| std | 0.95 | -| value_loss | 1.52e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 830 | -| time_elapsed | 20975 | -| total_timesteps | 106240 | -| train/ | | -| approx_kl | 0.00053168274 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.37 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 8290 | -| policy_gradient_loss | -0.000752 | -| std | 0.946 | -| value_loss | 0.00131 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 831 | -| time_elapsed | 20980 | -| total_timesteps | 106368 | -| train/ | | -| approx_kl | 0.0012100209 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -424 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 8300 | -| policy_gradient_loss | -0.000672 | -| std | 0.944 | -| value_loss | 1.29e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 832 | -| time_elapsed | 20984 | -| total_timesteps | 106496 | -| train/ | | -| approx_kl | 0.00043605827 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -232 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 8310 | -| policy_gradient_loss | -0.000367 | -| std | 0.941 | -| value_loss | 3.63e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 833 | -| time_elapsed | 20989 | -| total_timesteps | 106624 | -| train/ | | -| approx_kl | 0.0016501942 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -36.7 | -| learning_rate | 0.0003 | -| loss | -0.00537 | -| n_updates | 8320 | -| policy_gradient_loss | -0.00126 | -| std | 0.939 | -| value_loss | 4.91e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 834 | -| time_elapsed | 20992 | -| total_timesteps | 106752 | -| train/ | | -| approx_kl | 0.00014020177 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.36 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 8330 | -| policy_gradient_loss | 0.00108 | -| std | 0.937 | -| value_loss | 1.58e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 5 | -| iterations | 835 | -| time_elapsed | 20997 | -| total_timesteps | 106880 | -| train/ | | -| approx_kl | 0.01922475 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 8340 | -| policy_gradient_loss | -0.00789 | -| std | 0.936 | -| value_loss | 4.8e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 836 | -| time_elapsed | 21002 | -| total_timesteps | 107008 | -| train/ | | -| approx_kl | 0.0029347795 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00056 | -| n_updates | 8350 | -| policy_gradient_loss | -0.000271 | -| std | 0.933 | -| value_loss | 8.4e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 837 | -| time_elapsed | 21011 | -| total_timesteps | 107136 | -| train/ | | -| approx_kl | 0.0010660817 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | 0.55 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 8360 | -| policy_gradient_loss | -0.00157 | -| std | 0.93 | -| value_loss | 0.00711 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 838 | -| time_elapsed | 21014 | -| total_timesteps | 107264 | -| train/ | | -| approx_kl | 0.0026273518 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -1.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.000832 | -| n_updates | 8370 | -| policy_gradient_loss | -0.000391 | -| std | 0.929 | -| value_loss | 3.25e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 839 | -| time_elapsed | 21017 | -| total_timesteps | 107392 | -| train/ | | -| approx_kl | 0.011132494 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.00995 | -| n_updates | 8380 | -| policy_gradient_loss | -0.00474 | -| std | 0.93 | -| value_loss | 9.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 840 | -| time_elapsed | 21020 | -| total_timesteps | 107520 | -| train/ | | -| approx_kl | 0.011296708 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -36 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 8390 | -| policy_gradient_loss | -0.00389 | -| std | 0.931 | -| value_loss | 6.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 841 | -| time_elapsed | 21024 | -| total_timesteps | 107648 | -| train/ | | -| approx_kl | 0.007119281 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -8.78 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 8400 | -| policy_gradient_loss | -0.00109 | -| std | 0.931 | -| value_loss | 3.18e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 842 | -| time_elapsed | 21028 | -| total_timesteps | 107776 | -| train/ | | -| approx_kl | 0.00030701142 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 8410 | -| policy_gradient_loss | -0.00014 | -| std | 0.93 | -| value_loss | 1.1e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 5 | -| iterations | 843 | -| time_elapsed | 21032 | -| total_timesteps | 107904 | -| train/ | | -| approx_kl | 0.0012024152 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.35 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 8420 | -| policy_gradient_loss | -0.000122 | -| std | 0.929 | -| value_loss | 1.11e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 844 | -| time_elapsed | 21036 | -| total_timesteps | 108032 | -| train/ | | -| approx_kl | 0.00036945427 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -0.00592 | -| learning_rate | 0.0003 | -| loss | -0.000502 | -| n_updates | 8430 | -| policy_gradient_loss | -0.000251 | -| std | 0.926 | -| value_loss | 1.14e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 845 | -| time_elapsed | 21046 | -| total_timesteps | 108160 | -| train/ | | -| approx_kl | 0.00013868604 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.000146 | -| n_updates | 8440 | -| policy_gradient_loss | -0.000142 | -| std | 0.925 | -| value_loss | 0.000556 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 846 | -| time_elapsed | 21049 | -| total_timesteps | 108288 | -| train/ | | -| approx_kl | 0.0038666422 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -180 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 8450 | -| policy_gradient_loss | -0.00257 | -| std | 0.924 | -| value_loss | 1.96e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 847 | -| time_elapsed | 21053 | -| total_timesteps | 108416 | -| train/ | | -| approx_kl | 0.0001820135 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 8460 | -| policy_gradient_loss | 0.00118 | -| std | 0.923 | -| value_loss | 7.81e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 848 | -| time_elapsed | 21057 | -| total_timesteps | 108544 | -| train/ | | -| approx_kl | 0.000326416 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -60.6 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 8470 | -| policy_gradient_loss | 0.000729 | -| std | 0.924 | -| value_loss | 1.81e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 849 | -| time_elapsed | 21062 | -| total_timesteps | 108672 | -| train/ | | -| approx_kl | 7.541431e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -2.66 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 8480 | -| policy_gradient_loss | 0.000639 | -| std | 0.925 | -| value_loss | 1.07e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 850 | -| time_elapsed | 21067 | -| total_timesteps | 108800 | -| train/ | | -| approx_kl | 1.6906299e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -0.271 | -| learning_rate | 0.0003 | -| loss | 0.000166 | -| n_updates | 8490 | -| policy_gradient_loss | 0.000678 | -| std | 0.924 | -| value_loss | 3.72e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 5 | -| iterations | 851 | -| time_elapsed | 21072 | -| total_timesteps | 108928 | -| train/ | | -| approx_kl | 0.00023900485 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | 0.000846 | -| learning_rate | 0.0003 | -| loss | 9.48e-05 | -| n_updates | 8500 | -| policy_gradient_loss | 0.000101 | -| std | 0.921 | -| value_loss | 2.62e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 852 | -| time_elapsed | 21077 | -| total_timesteps | 109056 | -| train/ | | -| approx_kl | 0.00029525068 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | 0.01 | -| learning_rate | 0.0003 | -| loss | -0.000559 | -| n_updates | 8510 | -| policy_gradient_loss | -0.000223 | -| std | 0.92 | -| value_loss | 3.4e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 853 | -| time_elapsed | 21085 | -| total_timesteps | 109184 | -| train/ | | -| approx_kl | 0.007903554 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 8520 | -| policy_gradient_loss | -0.00704 | -| std | 0.92 | -| value_loss | 0.00493 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 854 | -| time_elapsed | 21089 | -| total_timesteps | 109312 | -| train/ | | -| approx_kl | 0.015977032 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -2.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 8530 | -| policy_gradient_loss | -0.00971 | -| std | 0.92 | -| value_loss | 2.71e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 855 | -| time_elapsed | 21093 | -| total_timesteps | 109440 | -| train/ | | -| approx_kl | 0.007143513 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -726 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 8540 | -| policy_gradient_loss | -0.00118 | -| std | 0.92 | -| value_loss | 5.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 856 | -| time_elapsed | 21097 | -| total_timesteps | 109568 | -| train/ | | -| approx_kl | 0.009811538 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -29 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 8550 | -| policy_gradient_loss | -0.00704 | -| std | 0.92 | -| value_loss | 5.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 857 | -| time_elapsed | 21100 | -| total_timesteps | 109696 | -| train/ | | -| approx_kl | 0.017221276 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -123 | -| learning_rate | 0.0003 | -| loss | -0.00767 | -| n_updates | 8560 | -| policy_gradient_loss | -0.00419 | -| std | 0.92 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 858 | -| time_elapsed | 21104 | -| total_timesteps | 109824 | -| train/ | | -| approx_kl | 0.01738115 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -1.49 | -| learning_rate | 0.0003 | -| loss | -0.0059 | -| n_updates | 8570 | -| policy_gradient_loss | -0.00442 | -| std | 0.921 | -| value_loss | 5.18e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 5 | -| iterations | 859 | -| time_elapsed | 21107 | -| total_timesteps | 109952 | -| train/ | | -| approx_kl | 0.0026557217 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.00756 | -| n_updates | 8580 | -| policy_gradient_loss | -0.0022 | -| std | 0.922 | -| value_loss | 3.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 860 | -| time_elapsed | 21112 | -| total_timesteps | 110080 | -| train/ | | -| approx_kl | 0.012137054 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 8590 | -| policy_gradient_loss | -0.00495 | -| std | 0.921 | -| value_loss | 1.25e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 861 | -| time_elapsed | 21119 | -| total_timesteps | 110208 | -| train/ | | -| approx_kl | 0.00017178478 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 8600 | -| policy_gradient_loss | 0.000653 | -| std | 0.92 | -| value_loss | 0.000249 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 862 | -| time_elapsed | 21124 | -| total_timesteps | 110336 | -| train/ | | -| approx_kl | 0.0004184055 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.34 | -| explained_variance | -69.6 | -| learning_rate | 0.0003 | -| loss | 0.00078 | -| n_updates | 8610 | -| policy_gradient_loss | 0.000694 | -| std | 0.919 | -| value_loss | 1.53e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 863 | -| time_elapsed | 21129 | -| total_timesteps | 110464 | -| train/ | | -| approx_kl | 0.0038991529 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -32.5 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 8620 | -| policy_gradient_loss | -0.00229 | -| std | 0.917 | -| value_loss | 2.88e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 864 | -| time_elapsed | 21133 | -| total_timesteps | 110592 | -| train/ | | -| approx_kl | 0.0035949484 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | -0.000516 | -| n_updates | 8630 | -| policy_gradient_loss | -0.000266 | -| std | 0.917 | -| value_loss | 1.38e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 865 | -| time_elapsed | 21135 | -| total_timesteps | 110720 | -| train/ | | -| approx_kl | 0.0009528082 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.629 | -| learning_rate | 0.0003 | -| loss | -0.000684 | -| n_updates | 8640 | -| policy_gradient_loss | -0.00035 | -| std | 0.917 | -| value_loss | 4.42e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 866 | -| time_elapsed | 21138 | -| total_timesteps | 110848 | -| train/ | | -| approx_kl | 0.0057581537 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 8650 | -| policy_gradient_loss | -0.00409 | -| std | 0.918 | -| value_loss | 5.43e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 867 | -| time_elapsed | 21142 | -| total_timesteps | 110976 | -| train/ | | -| approx_kl | 1.1250377e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | -0.000177 | -| n_updates | 8660 | -| policy_gradient_loss | 0.00168 | -| std | 0.917 | -| value_loss | 8.27e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 868 | -| time_elapsed | 21147 | -| total_timesteps | 111104 | -| train/ | | -| approx_kl | 1.206249e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.00516 | -| learning_rate | 0.0003 | -| loss | 0.000274 | -| n_updates | 8670 | -| policy_gradient_loss | 0.000637 | -| std | 0.917 | -| value_loss | 7.94e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 869 | -| time_elapsed | 21155 | -| total_timesteps | 111232 | -| train/ | | -| approx_kl | 0.008365753 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 8680 | -| policy_gradient_loss | -0.00694 | -| std | 0.917 | -| value_loss | 0.00199 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 870 | -| time_elapsed | 21158 | -| total_timesteps | 111360 | -| train/ | | -| approx_kl | 0.002980243 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.49e+03 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 8690 | -| policy_gradient_loss | 0.000659 | -| std | 0.916 | -| value_loss | 2.54e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 871 | -| time_elapsed | 21161 | -| total_timesteps | 111488 | -| train/ | | -| approx_kl | 0.00011986727 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.000616 | -| n_updates | 8700 | -| policy_gradient_loss | -0.000193 | -| std | 0.914 | -| value_loss | 4.18e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 872 | -| time_elapsed | 21166 | -| total_timesteps | 111616 | -| train/ | | -| approx_kl | 8.3525665e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -3.3 | -| learning_rate | 0.0003 | -| loss | 8.25e-05 | -| n_updates | 8710 | -| policy_gradient_loss | 0.000131 | -| std | 0.913 | -| value_loss | 7.2e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 873 | -| time_elapsed | 21169 | -| total_timesteps | 111744 | -| train/ | | -| approx_kl | 0.0027702888 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.00843 | -| n_updates | 8720 | -| policy_gradient_loss | -0.00304 | -| std | 0.914 | -| value_loss | 6.13e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 874 | -| time_elapsed | 21173 | -| total_timesteps | 111872 | -| train/ | | -| approx_kl | 0.01100155 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 8730 | -| policy_gradient_loss | -0.00922 | -| std | 0.914 | -| value_loss | 2.21e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 875 | -| time_elapsed | 21177 | -| total_timesteps | 112000 | -| train/ | | -| approx_kl | 0.0043658167 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.00427 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 8740 | -| policy_gradient_loss | -0.00115 | -| std | 0.913 | -| value_loss | 1.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 876 | -| time_elapsed | 21182 | -| total_timesteps | 112128 | -| train/ | | -| approx_kl | 0.008836826 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.000789 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 8750 | -| policy_gradient_loss | -0.0069 | -| std | 0.913 | -| value_loss | 6.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 877 | -| time_elapsed | 21189 | -| total_timesteps | 112256 | -| train/ | | -| approx_kl | 0.011519147 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.61 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 8760 | -| policy_gradient_loss | -0.00202 | -| std | 0.915 | -| value_loss | 0.000654 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 878 | -| time_elapsed | 21191 | -| total_timesteps | 112384 | -| train/ | | -| approx_kl | 0.0019109687 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.13e+03 | -| learning_rate | 0.0003 | -| loss | 0.000162 | -| n_updates | 8770 | -| policy_gradient_loss | 7.77e-05 | -| std | 0.915 | -| value_loss | 1.31e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 879 | -| time_elapsed | 21196 | -| total_timesteps | 112512 | -| train/ | | -| approx_kl | 0.011612223 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -690 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 8780 | -| policy_gradient_loss | -0.00341 | -| std | 0.914 | -| value_loss | 2.92e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 880 | -| time_elapsed | 21200 | -| total_timesteps | 112640 | -| train/ | | -| approx_kl | 0.0006062826 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 8790 | -| policy_gradient_loss | 0.000519 | -| std | 0.911 | -| value_loss | 1.8e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 881 | -| time_elapsed | 21204 | -| total_timesteps | 112768 | -| train/ | | -| approx_kl | 0.020487234 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -4.88 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 8800 | -| policy_gradient_loss | -0.0139 | -| std | 0.909 | -| value_loss | 1.79e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 882 | -| time_elapsed | 21207 | -| total_timesteps | 112896 | -| train/ | | -| approx_kl | 0.0025463128 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.44 | -| learning_rate | 0.0003 | -| loss | -0.000274 | -| n_updates | 8810 | -| policy_gradient_loss | -6.35e-05 | -| std | 0.91 | -| value_loss | 5.02e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 883 | -| time_elapsed | 21210 | -| total_timesteps | 113024 | -| train/ | | -| approx_kl | 0.006479245 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 8820 | -| policy_gradient_loss | -0.00373 | -| std | 0.911 | -| value_loss | 3.71e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 884 | -| time_elapsed | 21218 | -| total_timesteps | 113152 | -| train/ | | -| approx_kl | 8.713128e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 8830 | -| policy_gradient_loss | 0.000397 | -| std | 0.912 | -| value_loss | 0.000123 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 885 | -| time_elapsed | 21223 | -| total_timesteps | 113280 | -| train/ | | -| approx_kl | 5.4318924e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -663 | -| learning_rate | 0.0003 | -| loss | 0.000409 | -| n_updates | 8840 | -| policy_gradient_loss | 0.000659 | -| std | 0.911 | -| value_loss | 1.19e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 886 | -| time_elapsed | 21226 | -| total_timesteps | 113408 | -| train/ | | -| approx_kl | 0.006654149 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -678 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 8850 | -| policy_gradient_loss | -0.00544 | -| std | 0.91 | -| value_loss | 3.02e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 887 | -| time_elapsed | 21231 | -| total_timesteps | 113536 | -| train/ | | -| approx_kl | 6.283121e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -18.7 | -| learning_rate | 0.0003 | -| loss | 0.00094 | -| n_updates | 8860 | -| policy_gradient_loss | 0.00202 | -| std | 0.909 | -| value_loss | 1.33e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 888 | -| time_elapsed | 21235 | -| total_timesteps | 113664 | -| train/ | | -| approx_kl | 0.0005063405 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 8870 | -| policy_gradient_loss | -0.000171 | -| std | 0.908 | -| value_loss | 5.64e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 889 | -| time_elapsed | 21239 | -| total_timesteps | 113792 | -| train/ | | -| approx_kl | 0.0012277104 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.397 | -| learning_rate | 0.0003 | -| loss | 0.000212 | -| n_updates | 8880 | -| policy_gradient_loss | 0.000265 | -| std | 0.91 | -| value_loss | 2.54e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 890 | -| time_elapsed | 21244 | -| total_timesteps | 113920 | -| train/ | | -| approx_kl | 0.00036311056 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.00241 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 8890 | -| policy_gradient_loss | -0.000463 | -| std | 0.914 | -| value_loss | 2.39e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 891 | -| time_elapsed | 21248 | -| total_timesteps | 114048 | -| train/ | | -| approx_kl | 0.006266731 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.00492 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 8900 | -| policy_gradient_loss | -0.00574 | -| std | 0.914 | -| value_loss | 2.03e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 892 | -| time_elapsed | 21255 | -| total_timesteps | 114176 | -| train/ | | -| approx_kl | 0.00014485372 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.812 | -| learning_rate | 0.0003 | -| loss | 0.000198 | -| n_updates | 8910 | -| policy_gradient_loss | 0.000646 | -| std | 0.914 | -| value_loss | 0.0014 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 893 | -| time_elapsed | 21259 | -| total_timesteps | 114304 | -| train/ | | -| approx_kl | 0.0023149154 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -3.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 8920 | -| policy_gradient_loss | -0.00108 | -| std | 0.914 | -| value_loss | 1.3e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 894 | -| time_elapsed | 21265 | -| total_timesteps | 114432 | -| train/ | | -| approx_kl | 2.4757348e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.5e+03 | -| learning_rate | 0.0003 | -| loss | -0.000439 | -| n_updates | 8930 | -| policy_gradient_loss | 0.000257 | -| std | 0.916 | -| value_loss | 2.94e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 895 | -| time_elapsed | 21270 | -| total_timesteps | 114560 | -| train/ | | -| approx_kl | 0.0056577893 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 8940 | -| policy_gradient_loss | -0.00481 | -| std | 0.918 | -| value_loss | 2.08e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 896 | -| time_elapsed | 21275 | -| total_timesteps | 114688 | -| train/ | | -| approx_kl | 0.00454662 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -32 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 8950 | -| policy_gradient_loss | -0.00218 | -| std | 0.918 | -| value_loss | 2.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 897 | -| time_elapsed | 21279 | -| total_timesteps | 114816 | -| train/ | | -| approx_kl | 0.00804354 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 8960 | -| policy_gradient_loss | -0.00386 | -| std | 0.918 | -| value_loss | 8.17e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 898 | -| time_elapsed | 21283 | -| total_timesteps | 114944 | -| train/ | | -| approx_kl | 0.0021729977 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.384 | -| learning_rate | 0.0003 | -| loss | 0.000253 | -| n_updates | 8970 | -| policy_gradient_loss | 0.000159 | -| std | 0.918 | -| value_loss | 3.3e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 899 | -| time_elapsed | 21287 | -| total_timesteps | 115072 | -| train/ | | -| approx_kl | 0.002625531 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00656 | -| n_updates | 8980 | -| policy_gradient_loss | -0.00235 | -| std | 0.918 | -| value_loss | 1.15e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 900 | -| time_elapsed | 21294 | -| total_timesteps | 115200 | -| train/ | | -| approx_kl | 0.0027814605 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.000393 | -| n_updates | 8990 | -| policy_gradient_loss | -0.000206 | -| std | 0.918 | -| value_loss | 0.000167 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 901 | -| time_elapsed | 21299 | -| total_timesteps | 115328 | -| train/ | | -| approx_kl | 0.006241563 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 9000 | -| policy_gradient_loss | -0.00587 | -| std | 0.917 | -| value_loss | 1.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 902 | -| time_elapsed | 21303 | -| total_timesteps | 115456 | -| train/ | | -| approx_kl | 2.877973e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -18.3 | -| learning_rate | 0.0003 | -| loss | 0.000781 | -| n_updates | 9010 | -| policy_gradient_loss | 0.00196 | -| std | 0.916 | -| value_loss | 2.53e-08 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 903 | -| time_elapsed | 21306 | -| total_timesteps | 115584 | -| train/ | | -| approx_kl | 0.000109410845 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.54 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 9020 | -| policy_gradient_loss | 0.000147 | -| std | 0.915 | -| value_loss | 7.46e-09 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 904 | -| time_elapsed | 21312 | -| total_timesteps | 115712 | -| train/ | | -| approx_kl | 7.205317e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.532 | -| learning_rate | 0.0003 | -| loss | 0.000373 | -| n_updates | 9030 | -| policy_gradient_loss | 0.000479 | -| std | 0.913 | -| value_loss | 5.91e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 905 | -| time_elapsed | 21316 | -| total_timesteps | 115840 | -| train/ | | -| approx_kl | 0.004812702 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 9040 | -| policy_gradient_loss | -0.00579 | -| std | 0.911 | -| value_loss | 1.3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 5 | -| iterations | 906 | -| time_elapsed | 21319 | -| total_timesteps | 115968 | -| train/ | | -| approx_kl | 0.009988895 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 9050 | -| policy_gradient_loss | -0.00588 | -| std | 0.908 | -| value_loss | 1.1e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 907 | -| time_elapsed | 21324 | -| total_timesteps | 116096 | -| train/ | | -| approx_kl | 1.4059246e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.00421 | -| learning_rate | 0.0003 | -| loss | 0.000135 | -| n_updates | 9060 | -| policy_gradient_loss | 0.000322 | -| std | 0.906 | -| value_loss | 1.83e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 908 | -| time_elapsed | 21333 | -| total_timesteps | 116224 | -| train/ | | -| approx_kl | 2.161134e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | 0.00071 | -| n_updates | 9070 | -| policy_gradient_loss | 1.55e-05 | -| std | 0.905 | -| value_loss | 0.00216 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 909 | -| time_elapsed | 21339 | -| total_timesteps | 116352 | -| train/ | | -| approx_kl | 0.0005250075 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -7.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 9080 | -| policy_gradient_loss | -0.000506 | -| std | 0.905 | -| value_loss | 4.36e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 910 | -| time_elapsed | 21343 | -| total_timesteps | 116480 | -| train/ | | -| approx_kl | 0.0026665772 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -1.47e+04 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 9090 | -| policy_gradient_loss | -0.00129 | -| std | 0.906 | -| value_loss | 4.74e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 911 | -| time_elapsed | 21348 | -| total_timesteps | 116608 | -| train/ | | -| approx_kl | 0.0031261258 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -844 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 9100 | -| policy_gradient_loss | -0.00136 | -| std | 0.905 | -| value_loss | 1.03e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 912 | -| time_elapsed | 21352 | -| total_timesteps | 116736 | -| train/ | | -| approx_kl | 0.00058089383 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -80.6 | -| learning_rate | 0.0003 | -| loss | 0.000371 | -| n_updates | 9110 | -| policy_gradient_loss | 0.000254 | -| std | 0.903 | -| value_loss | 4.14e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 913 | -| time_elapsed | 21357 | -| total_timesteps | 116864 | -| train/ | | -| approx_kl | 6.8927184e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -30.7 | -| learning_rate | 0.0003 | -| loss | 1.8e-06 | -| n_updates | 9120 | -| policy_gradient_loss | 1.61e-05 | -| std | 0.903 | -| value_loss | 2.53e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 5 | -| iterations | 914 | -| time_elapsed | 21362 | -| total_timesteps | 116992 | -| train/ | | -| approx_kl | 0.0022392026 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 9130 | -| policy_gradient_loss | -0.00174 | -| std | 0.906 | -| value_loss | 2.15e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 915 | -| time_elapsed | 21365 | -| total_timesteps | 117120 | -| train/ | | -| approx_kl | 3.1749718e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -4.98 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 9140 | -| policy_gradient_loss | 0.000353 | -| std | 0.911 | -| value_loss | 2.03e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 916 | -| time_elapsed | 21374 | -| total_timesteps | 117248 | -| train/ | | -| approx_kl | 0.0021358654 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 9150 | -| policy_gradient_loss | -0.000924 | -| std | 0.913 | -| value_loss | 0.000523 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 917 | -| time_elapsed | 21378 | -| total_timesteps | 117376 | -| train/ | | -| approx_kl | 0.0001061433 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.79e+03 | -| learning_rate | 0.0003 | -| loss | 0.000371 | -| n_updates | 9160 | -| policy_gradient_loss | 0.000336 | -| std | 0.912 | -| value_loss | 2.53e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 918 | -| time_elapsed | 21382 | -| total_timesteps | 117504 | -| train/ | | -| approx_kl | 0.0015001944 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.75e+03 | -| learning_rate | 0.0003 | -| loss | -0.00763 | -| n_updates | 9170 | -| policy_gradient_loss | -0.00266 | -| std | 0.912 | -| value_loss | 1.99e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 919 | -| time_elapsed | 21387 | -| total_timesteps | 117632 | -| train/ | | -| approx_kl | 0.01042346 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -110 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 9180 | -| policy_gradient_loss | -0.00864 | -| std | 0.912 | -| value_loss | 3.24e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 920 | -| time_elapsed | 21389 | -| total_timesteps | 117760 | -| train/ | | -| approx_kl | 1.7010607e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -8.32 | -| learning_rate | 0.0003 | -| loss | 0.000661 | -| n_updates | 9190 | -| policy_gradient_loss | 0.00318 | -| std | 0.91 | -| value_loss | 7.97e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 921 | -| time_elapsed | 21393 | -| total_timesteps | 117888 | -| train/ | | -| approx_kl | 0.001178924 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | 8.14e-05 | -| n_updates | 9200 | -| policy_gradient_loss | 4.58e-05 | -| std | 0.908 | -| value_loss | 3.29e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 922 | -| time_elapsed | 21397 | -| total_timesteps | 118016 | -| train/ | | -| approx_kl | 0.00010578707 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -3.51e-05 | -| n_updates | 9210 | -| policy_gradient_loss | -1.79e-05 | -| std | 0.908 | -| value_loss | 8.12e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 923 | -| time_elapsed | 21405 | -| total_timesteps | 118144 | -| train/ | | -| approx_kl | 0.00034014974 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 9220 | -| policy_gradient_loss | -0.000539 | -| std | 0.907 | -| value_loss | 0.00165 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 924 | -| time_elapsed | 21409 | -| total_timesteps | 118272 | -| train/ | | -| approx_kl | 9.473227e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -2.36e+03 | -| learning_rate | 0.0003 | -| loss | 0.000269 | -| n_updates | 9230 | -| policy_gradient_loss | 0.000201 | -| std | 0.907 | -| value_loss | 4.92e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 925 | -| time_elapsed | 21412 | -| total_timesteps | 118400 | -| train/ | | -| approx_kl | 0.0008253935 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -322 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 9240 | -| policy_gradient_loss | -0.000919 | -| std | 0.908 | -| value_loss | 3.41e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 926 | -| time_elapsed | 21416 | -| total_timesteps | 118528 | -| train/ | | -| approx_kl | 0.0005350448 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -93.5 | -| learning_rate | 0.0003 | -| loss | 0.000519 | -| n_updates | 9250 | -| policy_gradient_loss | 0.000379 | -| std | 0.907 | -| value_loss | 1.82e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 927 | -| time_elapsed | 21419 | -| total_timesteps | 118656 | -| train/ | | -| approx_kl | 0.00080529135 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.687 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 9260 | -| policy_gradient_loss | -0.000629 | -| std | 0.906 | -| value_loss | 2.78e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 928 | -| time_elapsed | 21422 | -| total_timesteps | 118784 | -| train/ | | -| approx_kl | 0.0033714399 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -4.11 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 9270 | -| policy_gradient_loss | -0.00159 | -| std | 0.906 | -| value_loss | 1.12e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 5 | -| iterations | 929 | -| time_elapsed | 21426 | -| total_timesteps | 118912 | -| train/ | | -| approx_kl | 0.00020354427 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 9280 | -| policy_gradient_loss | 5.41e-05 | -| std | 0.908 | -| value_loss | 7.81e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 930 | -| time_elapsed | 21430 | -| total_timesteps | 119040 | -| train/ | | -| approx_kl | 0.0074494197 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00971 | -| n_updates | 9290 | -| policy_gradient_loss | -0.00608 | -| std | 0.91 | -| value_loss | 2.83e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 931 | -| time_elapsed | 21439 | -| total_timesteps | 119168 | -| train/ | | -| approx_kl | 0.00046928832 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 9300 | -| policy_gradient_loss | 0.000284 | -| std | 0.912 | -| value_loss | 0.00319 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 932 | -| time_elapsed | 21444 | -| total_timesteps | 119296 | -| train/ | | -| approx_kl | 0.0023943218 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -3.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.00986 | -| n_updates | 9310 | -| policy_gradient_loss | -0.00393 | -| std | 0.913 | -| value_loss | 0.000125 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 933 | -| time_elapsed | 21448 | -| total_timesteps | 119424 | -| train/ | | -| approx_kl | 0.0025220928 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.25e+03 | -| learning_rate | 0.0003 | -| loss | 0.000324 | -| n_updates | 9320 | -| policy_gradient_loss | 0.00017 | -| std | 0.912 | -| value_loss | 1.7e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 934 | -| time_elapsed | 21453 | -| total_timesteps | 119552 | -| train/ | | -| approx_kl | 0.003993588 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -8.09 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 9330 | -| policy_gradient_loss | -0.00583 | -| std | 0.912 | -| value_loss | 2.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 935 | -| time_elapsed | 21455 | -| total_timesteps | 119680 | -| train/ | | -| approx_kl | 0.009753177 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -20.5 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 9340 | -| policy_gradient_loss | -0.00444 | -| std | 0.912 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 936 | -| time_elapsed | 21458 | -| total_timesteps | 119808 | -| train/ | | -| approx_kl | 0.009112366 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 9350 | -| policy_gradient_loss | -0.00184 | -| std | 0.911 | -| value_loss | 5.77e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 937 | -| time_elapsed | 21462 | -| total_timesteps | 119936 | -| train/ | | -| approx_kl | 0.0051904046 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 9360 | -| policy_gradient_loss | -0.00278 | -| std | 0.91 | -| value_loss | 5.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 938 | -| time_elapsed | 21466 | -| total_timesteps | 120064 | -| train/ | | -| approx_kl | 0.015925704 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 9370 | -| policy_gradient_loss | -0.00482 | -| std | 0.91 | -| value_loss | 1.75e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 939 | -| time_elapsed | 21474 | -| total_timesteps | 120192 | -| train/ | | -| approx_kl | 0.0072963103 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 9380 | -| policy_gradient_loss | -0.00465 | -| std | 0.911 | -| value_loss | 0.00155 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 940 | -| time_elapsed | 21479 | -| total_timesteps | 120320 | -| train/ | | -| approx_kl | 1.7468352e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -2.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.00047 | -| n_updates | 9390 | -| policy_gradient_loss | 0.00182 | -| std | 0.911 | -| value_loss | 2.23e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 941 | -| time_elapsed | 21482 | -| total_timesteps | 120448 | -| train/ | | -| approx_kl | 0.0006294772 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.37e+03 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 9400 | -| policy_gradient_loss | 6.14e-05 | -| std | 0.911 | -| value_loss | 5.07e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 942 | -| time_elapsed | 21486 | -| total_timesteps | 120576 | -| train/ | | -| approx_kl | 0.004110593 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.33 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | -4.41e-05 | -| n_updates | 9410 | -| policy_gradient_loss | -3.56e-05 | -| std | 0.91 | -| value_loss | 5.53e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 943 | -| time_elapsed | 21489 | -| total_timesteps | 120704 | -| train/ | | -| approx_kl | 5.6754332e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.000394 | -| n_updates | 9420 | -| policy_gradient_loss | 1.98e-06 | -| std | 0.91 | -| value_loss | 5e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 944 | -| time_elapsed | 21493 | -| total_timesteps | 120832 | -| train/ | | -| approx_kl | 0.010359211 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | -0.0291 | -| n_updates | 9430 | -| policy_gradient_loss | -0.0139 | -| std | 0.909 | -| value_loss | 3.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 5 | -| iterations | 945 | -| time_elapsed | 21495 | -| total_timesteps | 120960 | -| train/ | | -| approx_kl | 0.004173488 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -0.497 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 9440 | -| policy_gradient_loss | 0.00119 | -| std | 0.908 | -| value_loss | 5.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 946 | -| time_elapsed | 21499 | -| total_timesteps | 121088 | -| train/ | | -| approx_kl | 0.008593349 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | 0.00516 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 9450 | -| policy_gradient_loss | -0.00792 | -| std | 0.907 | -| value_loss | 3.36e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 947 | -| time_elapsed | 21506 | -| total_timesteps | 121216 | -| train/ | | -| approx_kl | 0.00027927756 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | 7.67e-05 | -| n_updates | 9460 | -| policy_gradient_loss | 0.00141 | -| std | 0.906 | -| value_loss | 0.000223 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 948 | -| time_elapsed | 21511 | -| total_timesteps | 121344 | -| train/ | | -| approx_kl | 0.0025274376 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -2.49e+04 | -| learning_rate | 0.0003 | -| loss | -0.00602 | -| n_updates | 9470 | -| policy_gradient_loss | -0.00125 | -| std | 0.906 | -| value_loss | 4.78e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 949 | -| time_elapsed | 21516 | -| total_timesteps | 121472 | -| train/ | | -| approx_kl | 0.0015186854 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -5.3e+04 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 9480 | -| policy_gradient_loss | 0.00133 | -| std | 0.906 | -| value_loss | 7.16e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 950 | -| time_elapsed | 21519 | -| total_timesteps | 121600 | -| train/ | | -| approx_kl | 0.014215305 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -845 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 9490 | -| policy_gradient_loss | -0.00486 | -| std | 0.906 | -| value_loss | 8.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 951 | -| time_elapsed | 21523 | -| total_timesteps | 121728 | -| train/ | | -| approx_kl | 0.007768784 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -176 | -| learning_rate | 0.0003 | -| loss | 0.000156 | -| n_updates | 9500 | -| policy_gradient_loss | -1.08e-05 | -| std | 0.904 | -| value_loss | 6.43e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 952 | -| time_elapsed | 21527 | -| total_timesteps | 121856 | -| train/ | | -| approx_kl | 0.010052118 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -1.32 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 9510 | -| policy_gradient_loss | -0.00968 | -| std | 0.902 | -| value_loss | 1.09e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 953 | -| time_elapsed | 21529 | -| total_timesteps | 121984 | -| train/ | | -| approx_kl | 0.010026146 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | -0.0059 | -| n_updates | 9520 | -| policy_gradient_loss | -0.00359 | -| std | 0.9 | -| value_loss | 3.73e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 954 | -| time_elapsed | 21533 | -| total_timesteps | 122112 | -| train/ | | -| approx_kl | 0.0023739296 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | -0.000137 | -| n_updates | 9530 | -| policy_gradient_loss | -8.49e-06 | -| std | 0.9 | -| value_loss | 5.02e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 955 | -| time_elapsed | 21543 | -| total_timesteps | 122240 | -| train/ | | -| approx_kl | 0.0014650673 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -18.4 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 9540 | -| policy_gradient_loss | -0.0055 | -| std | 0.898 | -| value_loss | 0.00464 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 956 | -| time_elapsed | 21548 | -| total_timesteps | 122368 | -| train/ | | -| approx_kl | 8.7395776e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -421 | -| learning_rate | 0.0003 | -| loss | 0.000429 | -| n_updates | 9550 | -| policy_gradient_loss | 0.000697 | -| std | 0.896 | -| value_loss | 2.08e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 957 | -| time_elapsed | 21551 | -| total_timesteps | 122496 | -| train/ | | -| approx_kl | 0.0018055583 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -146 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 9560 | -| policy_gradient_loss | -0.0014 | -| std | 0.894 | -| value_loss | 3.47e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 958 | -| time_elapsed | 21555 | -| total_timesteps | 122624 | -| train/ | | -| approx_kl | 5.0976407e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -2.82 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 9570 | -| policy_gradient_loss | 0.00181 | -| std | 0.893 | -| value_loss | 6.78e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 959 | -| time_elapsed | 21559 | -| total_timesteps | 122752 | -| train/ | | -| approx_kl | 0.00036564423 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -2.51 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 9580 | -| policy_gradient_loss | 0.000247 | -| std | 0.892 | -| value_loss | 2.55e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 5 | -| iterations | 960 | -| time_elapsed | 21563 | -| total_timesteps | 122880 | -| train/ | | -| approx_kl | 0.012994185 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | -0.00978 | -| n_updates | 9590 | -| policy_gradient_loss | -0.00565 | -| std | 0.894 | -| value_loss | 9.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 961 | -| time_elapsed | 21567 | -| total_timesteps | 123008 | -| train/ | | -| approx_kl | 0.015216118 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 9600 | -| policy_gradient_loss | -0.0102 | -| std | 0.895 | -| value_loss | 3.52e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 962 | -| time_elapsed | 21577 | -| total_timesteps | 123136 | -| train/ | | -| approx_kl | 0.00045205327 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | 0.0312 | -| learning_rate | 0.0003 | -| loss | 0.000974 | -| n_updates | 9610 | -| policy_gradient_loss | 0.000681 | -| std | 0.895 | -| value_loss | 0.00122 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 963 | -| time_elapsed | 21581 | -| total_timesteps | 123264 | -| train/ | | -| approx_kl | 0.0074266857 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -2.84e+04 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 9620 | -| policy_gradient_loss | -0.00709 | -| std | 0.896 | -| value_loss | 1.04e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 964 | -| time_elapsed | 21586 | -| total_timesteps | 123392 | -| train/ | | -| approx_kl | 0.010289872 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -6.85e+03 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 9630 | -| policy_gradient_loss | -0.00286 | -| std | 0.896 | -| value_loss | 2.54e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 965 | -| time_elapsed | 21590 | -| total_timesteps | 123520 | -| train/ | | -| approx_kl | 0.00095408875 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -104 | -| learning_rate | 0.0003 | -| loss | 0.000978 | -| n_updates | 9640 | -| policy_gradient_loss | 0.000671 | -| std | 0.895 | -| value_loss | 3.8e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 966 | -| time_elapsed | 21594 | -| total_timesteps | 123648 | -| train/ | | -| approx_kl | 0.0010068654 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -24.4 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 9650 | -| policy_gradient_loss | -0.000717 | -| std | 0.895 | -| value_loss | 1.26e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 967 | -| time_elapsed | 21598 | -| total_timesteps | 123776 | -| train/ | | -| approx_kl | 6.653555e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -5.36 | -| learning_rate | 0.0003 | -| loss | -0.000624 | -| n_updates | 9660 | -| policy_gradient_loss | 0.000228 | -| std | 0.895 | -| value_loss | 5.58e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 5 | -| iterations | 968 | -| time_elapsed | 21602 | -| total_timesteps | 123904 | -| train/ | | -| approx_kl | 0.00081023667 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.00809 | -| n_updates | 9670 | -| policy_gradient_loss | -0.00151 | -| std | 0.896 | -| value_loss | 4.19e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 969 | -| time_elapsed | 21606 | -| total_timesteps | 124032 | -| train/ | | -| approx_kl | 0.0028724489 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | -0.000417 | -| n_updates | 9680 | -| policy_gradient_loss | -0.000236 | -| std | 0.896 | -| value_loss | 1.52e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 970 | -| time_elapsed | 21614 | -| total_timesteps | 124160 | -| train/ | | -| approx_kl | 0.0012201155 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | -0.00063 | -| n_updates | 9690 | -| policy_gradient_loss | -0.000465 | -| std | 0.896 | -| value_loss | 0.000703 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 971 | -| time_elapsed | 21618 | -| total_timesteps | 124288 | -| train/ | | -| approx_kl | 0.008672782 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -137 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 9700 | -| policy_gradient_loss | -0.00563 | -| std | 0.896 | -| value_loss | 6.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 972 | -| time_elapsed | 21622 | -| total_timesteps | 124416 | -| train/ | | -| approx_kl | 0.017000517 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -134 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 9710 | -| policy_gradient_loss | -0.00399 | -| std | 0.897 | -| value_loss | 1.74e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 973 | -| time_elapsed | 21626 | -| total_timesteps | 124544 | -| train/ | | -| approx_kl | 2.2226945e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -1.61 | -| learning_rate | 0.0003 | -| loss | -0.000495 | -| n_updates | 9720 | -| policy_gradient_loss | 0.000898 | -| std | 0.899 | -| value_loss | 9.54e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 974 | -| time_elapsed | 21631 | -| total_timesteps | 124672 | -| train/ | | -| approx_kl | 0.0012749694 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.599 | -| learning_rate | 0.0003 | -| loss | 0.000541 | -| n_updates | 9730 | -| policy_gradient_loss | 0.000419 | -| std | 0.898 | -| value_loss | 1.21e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 975 | -| time_elapsed | 21635 | -| total_timesteps | 124800 | -| train/ | | -| approx_kl | 0.00037935236 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | -0.000645 | -| n_updates | 9740 | -| policy_gradient_loss | -0.000182 | -| std | 0.898 | -| value_loss | 7.27e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 5 | -| iterations | 976 | -| time_elapsed | 21639 | -| total_timesteps | 124928 | -| train/ | | -| approx_kl | 0.0013430305 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.089 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 9750 | -| policy_gradient_loss | -0.00056 | -| std | 0.898 | -| value_loss | 3.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 977 | -| time_elapsed | 21643 | -| total_timesteps | 125056 | -| train/ | | -| approx_kl | 0.0030719526 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.0777 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 9760 | -| policy_gradient_loss | -0.00171 | -| std | 0.897 | -| value_loss | 1.07e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 978 | -| time_elapsed | 21651 | -| total_timesteps | 125184 | -| train/ | | -| approx_kl | 0.00022843666 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | 0.815 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 9770 | -| policy_gradient_loss | -0.000812 | -| std | 0.896 | -| value_loss | 0.00159 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 979 | -| time_elapsed | 21655 | -| total_timesteps | 125312 | -| train/ | | -| approx_kl | 0.00019067898 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -2.12e+03 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 9780 | -| policy_gradient_loss | 0.000237 | -| std | 0.895 | -| value_loss | 2.44e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 980 | -| time_elapsed | 21658 | -| total_timesteps | 125440 | -| train/ | | -| approx_kl | 0.00018879818 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -1.13e+04 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 9790 | -| policy_gradient_loss | 0.000258 | -| std | 0.895 | -| value_loss | 4.67e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 981 | -| time_elapsed | 21662 | -| total_timesteps | 125568 | -| train/ | | -| approx_kl | 0.00013712514 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -324 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 9800 | -| policy_gradient_loss | 0.000668 | -| std | 0.897 | -| value_loss | 1.85e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 982 | -| time_elapsed | 21665 | -| total_timesteps | 125696 | -| train/ | | -| approx_kl | 0.0018752064 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -1.96e+03 | -| learning_rate | 0.0003 | -| loss | -0.000507 | -| n_updates | 9810 | -| policy_gradient_loss | -0.000288 | -| std | 0.897 | -| value_loss | 6.47e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 983 | -| time_elapsed | 21669 | -| total_timesteps | 125824 | -| train/ | | -| approx_kl | 0.0070435135 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 9820 | -| policy_gradient_loss | -0.00429 | -| std | 0.898 | -| value_loss | 5e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 5 | -| iterations | 984 | -| time_elapsed | 21674 | -| total_timesteps | 125952 | -| train/ | | -| approx_kl | 0.009959246 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -75.6 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 9830 | -| policy_gradient_loss | -0.00363 | -| std | 0.899 | -| value_loss | 5.48e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 985 | -| time_elapsed | 21679 | -| total_timesteps | 126080 | -| train/ | | -| approx_kl | 0.014110908 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.541 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 9840 | -| policy_gradient_loss | -0.00999 | -| std | 0.899 | -| value_loss | 4.38e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 986 | -| time_elapsed | 21688 | -| total_timesteps | 126208 | -| train/ | | -| approx_kl | 0.00086359447 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | 0.832 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 9850 | -| policy_gradient_loss | 0.00059 | -| std | 0.898 | -| value_loss | 0.00234 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 987 | -| time_elapsed | 21693 | -| total_timesteps | 126336 | -| train/ | | -| approx_kl | 0.0076053175 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -1.17e+04 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 9860 | -| policy_gradient_loss | -0.00477 | -| std | 0.895 | -| value_loss | 7.82e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 988 | -| time_elapsed | 21697 | -| total_timesteps | 126464 | -| train/ | | -| approx_kl | 0.013537832 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -7.36e+03 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 9870 | -| policy_gradient_loss | -0.008 | -| std | 0.893 | -| value_loss | 8.53e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 989 | -| time_elapsed | 21701 | -| total_timesteps | 126592 | -| train/ | | -| approx_kl | 0.012102801 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -302 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 9880 | -| policy_gradient_loss | -0.00998 | -| std | 0.893 | -| value_loss | 3.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 990 | -| time_elapsed | 21705 | -| total_timesteps | 126720 | -| train/ | | -| approx_kl | 0.009388525 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -4.91 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 9890 | -| policy_gradient_loss | -0.00402 | -| std | 0.893 | -| value_loss | 6.18e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 991 | -| time_elapsed | 21710 | -| total_timesteps | 126848 | -| train/ | | -| approx_kl | 0.0058371583 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 9900 | -| policy_gradient_loss | -0.00144 | -| std | 0.893 | -| value_loss | 8.53e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 992 | -| time_elapsed | 21715 | -| total_timesteps | 126976 | -| train/ | | -| approx_kl | 9.007612e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -9.86 | -| learning_rate | 0.0003 | -| loss | -0.000618 | -| n_updates | 9910 | -| policy_gradient_loss | 1.79e-05 | -| std | 0.892 | -| value_loss | 0.000116 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 993 | -| time_elapsed | 21720 | -| total_timesteps | 127104 | -| train/ | | -| approx_kl | 0.0008783811 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.925 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 9920 | -| policy_gradient_loss | -0.000739 | -| std | 0.891 | -| value_loss | 7.26e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 994 | -| time_elapsed | 21729 | -| total_timesteps | 127232 | -| train/ | | -| approx_kl | 0.005174112 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -2.52 | -| learning_rate | 0.0003 | -| loss | -0.00487 | -| n_updates | 9930 | -| policy_gradient_loss | -0.00295 | -| std | 0.891 | -| value_loss | 0.0043 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 995 | -| time_elapsed | 21734 | -| total_timesteps | 127360 | -| train/ | | -| approx_kl | 3.532553e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -6.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.000607 | -| n_updates | 9940 | -| policy_gradient_loss | 0.000986 | -| std | 0.892 | -| value_loss | 0.000114 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 996 | -| time_elapsed | 21737 | -| total_timesteps | 127488 | -| train/ | | -| approx_kl | 0.00024206098 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.25e+03 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 9950 | -| policy_gradient_loss | 0.000225 | -| std | 0.893 | -| value_loss | 1.6e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 997 | -| time_elapsed | 21742 | -| total_timesteps | 127616 | -| train/ | | -| approx_kl | 0.00014679087 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -12.7 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 9960 | -| policy_gradient_loss | 0.000391 | -| std | 0.895 | -| value_loss | 1.69e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 998 | -| time_elapsed | 21745 | -| total_timesteps | 127744 | -| train/ | | -| approx_kl | 0.006973547 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.253 | -| learning_rate | 0.0003 | -| loss | -0.00958 | -| n_updates | 9970 | -| policy_gradient_loss | -0.00491 | -| std | 0.896 | -| value_loss | 8.48e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 999 | -| time_elapsed | 21749 | -| total_timesteps | 127872 | -| train/ | | -| approx_kl | 0.0021727495 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.31 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.000248 | -| n_updates | 9980 | -| policy_gradient_loss | 0.000164 | -| std | 0.893 | -| value_loss | 4.79e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1000 | -| time_elapsed | 21753 | -| total_timesteps | 128000 | -| train/ | | -| approx_kl | 4.790118e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00883 | -| learning_rate | 0.0003 | -| loss | -0.000561 | -| n_updates | 9990 | -| policy_gradient_loss | -0.000201 | -| std | 0.89 | -| value_loss | 3.43e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1001 | -| time_elapsed | 21757 | -| total_timesteps | 128128 | -| train/ | | -| approx_kl | 0.003774067 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 9.49e-05 | -| learning_rate | 0.0003 | -| loss | -0.00752 | -| n_updates | 10000 | -| policy_gradient_loss | -0.00329 | -| std | 0.888 | -| value_loss | 1.83e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1002 | -| time_elapsed | 21767 | -| total_timesteps | 128256 | -| train/ | | -| approx_kl | 4.3349806e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.59 | -| learning_rate | 0.0003 | -| loss | 0.00203 | -| n_updates | 10010 | -| policy_gradient_loss | 0.000519 | -| std | 0.888 | -| value_loss | 0.00701 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1003 | -| time_elapsed | 21772 | -| total_timesteps | 128384 | -| train/ | | -| approx_kl | 0.005731546 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -2.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 10020 | -| policy_gradient_loss | -0.00565 | -| std | 0.887 | -| value_loss | 9.74e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1004 | -| time_elapsed | 21777 | -| total_timesteps | 128512 | -| train/ | | -| approx_kl | 0.0003569047 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.45e+03 | -| learning_rate | 0.0003 | -| loss | 0.0017 | -| n_updates | 10030 | -| policy_gradient_loss | 0.00153 | -| std | 0.887 | -| value_loss | 2.73e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1005 | -| time_elapsed | 21781 | -| total_timesteps | 128640 | -| train/ | | -| approx_kl | 0.0002999357 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -17.6 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 10040 | -| policy_gradient_loss | -0.000428 | -| std | 0.885 | -| value_loss | 3.7e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1006 | -| time_elapsed | 21785 | -| total_timesteps | 128768 | -| train/ | | -| approx_kl | 9.756815e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -194 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 10050 | -| policy_gradient_loss | 7.67e-05 | -| std | 0.882 | -| value_loss | 1.91e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 5 | -| iterations | 1007 | -| time_elapsed | 21788 | -| total_timesteps | 128896 | -| train/ | | -| approx_kl | 4.9445312e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | 1.99e-05 | -| n_updates | 10060 | -| policy_gradient_loss | 0.000298 | -| std | 0.88 | -| value_loss | 1.2e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1008 | -| time_elapsed | 21792 | -| total_timesteps | 129024 | -| train/ | | -| approx_kl | 0.00011099875 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -4.67 | -| learning_rate | 0.0003 | -| loss | -0.000503 | -| n_updates | 10070 | -| policy_gradient_loss | -1.58e-05 | -| std | 0.879 | -| value_loss | 5.69e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1009 | -| time_elapsed | 21800 | -| total_timesteps | 129152 | -| train/ | | -| approx_kl | 0.004553576 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.02 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 10080 | -| policy_gradient_loss | -0.00545 | -| std | 0.878 | -| value_loss | 0.00316 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1010 | -| time_elapsed | 21803 | -| total_timesteps | 129280 | -| train/ | | -| approx_kl | 0.00021130918 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -6.07e+03 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 10090 | -| policy_gradient_loss | 0.00134 | -| std | 0.878 | -| value_loss | 2.79e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1011 | -| time_elapsed | 21807 | -| total_timesteps | 129408 | -| train/ | | -| approx_kl | 0.0006242315 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.000194 | -| n_updates | 10100 | -| policy_gradient_loss | -0.000101 | -| std | 0.877 | -| value_loss | 5.32e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1012 | -| time_elapsed | 21810 | -| total_timesteps | 129536 | -| train/ | | -| approx_kl | 0.0029731425 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 10110 | -| policy_gradient_loss | -0.00356 | -| std | 0.877 | -| value_loss | 9.76e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1013 | -| time_elapsed | 21815 | -| total_timesteps | 129664 | -| train/ | | -| approx_kl | 8.65059e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -11 | -| learning_rate | 0.0003 | -| loss | 0.000498 | -| n_updates | 10120 | -| policy_gradient_loss | 0.00177 | -| std | 0.877 | -| value_loss | 7.5e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1014 | -| time_elapsed | 21818 | -| total_timesteps | 129792 | -| train/ | | -| approx_kl | 0.00363713 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 10130 | -| policy_gradient_loss | -0.00223 | -| std | 0.877 | -| value_loss | 8.61e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 5 | -| iterations | 1015 | -| time_elapsed | 21821 | -| total_timesteps | 129920 | -| train/ | | -| approx_kl | 0.0026182714 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | -0.000541 | -| n_updates | 10140 | -| policy_gradient_loss | -0.000301 | -| std | 0.876 | -| value_loss | 4.11e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1016 | -| time_elapsed | 21824 | -| total_timesteps | 130048 | -| train/ | | -| approx_kl | 0.00054782955 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00178 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 10150 | -| policy_gradient_loss | -0.000768 | -| std | 0.875 | -| value_loss | 3.26e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1017 | -| time_elapsed | 21830 | -| total_timesteps | 130176 | -| train/ | | -| approx_kl | 2.6950147e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 10160 | -| policy_gradient_loss | 0.000389 | -| std | 0.875 | -| value_loss | 0.00167 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1018 | -| time_elapsed | 21834 | -| total_timesteps | 130304 | -| train/ | | -| approx_kl | 0.00024255877 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.85e+03 | -| learning_rate | 0.0003 | -| loss | 0.000442 | -| n_updates | 10170 | -| policy_gradient_loss | 0.000385 | -| std | 0.876 | -| value_loss | 4.15e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1019 | -| time_elapsed | 21838 | -| total_timesteps | 130432 | -| train/ | | -| approx_kl | 0.00054233754 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -5.96e+03 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 10180 | -| policy_gradient_loss | -0.000482 | -| std | 0.879 | -| value_loss | 1.03e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1020 | -| time_elapsed | 21842 | -| total_timesteps | 130560 | -| train/ | | -| approx_kl | 0.004572851 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -41.8 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 10190 | -| policy_gradient_loss | -0.00656 | -| std | 0.878 | -| value_loss | 2.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1021 | -| time_elapsed | 21846 | -| total_timesteps | 130688 | -| train/ | | -| approx_kl | 0.0033374843 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -483 | -| learning_rate | 0.0003 | -| loss | 0.000246 | -| n_updates | 10200 | -| policy_gradient_loss | -4.08e-05 | -| std | 0.877 | -| value_loss | 6.88e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1022 | -| time_elapsed | 21850 | -| total_timesteps | 130816 | -| train/ | | -| approx_kl | 0.0001473194 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -8.94 | -| learning_rate | 0.0003 | -| loss | -0.000164 | -| n_updates | 10210 | -| policy_gradient_loss | -8.53e-05 | -| std | 0.876 | -| value_loss | 6.97e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 5 | -| iterations | 1023 | -| time_elapsed | 21854 | -| total_timesteps | 130944 | -| train/ | | -| approx_kl | 0.004110524 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.621 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 10220 | -| policy_gradient_loss | -0.00652 | -| std | 0.876 | -| value_loss | 3.18e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 5 | -| iterations | 1024 | -| time_elapsed | 21858 | -| total_timesteps | 131072 | -| train/ | | -| approx_kl | 0.014247708 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | -0.00793 | -| n_updates | 10230 | -| policy_gradient_loss | -0.00589 | -| std | 0.877 | -| value_loss | 2.19e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1025 | -| time_elapsed | 21865 | -| total_timesteps | 131200 | -| train/ | | -| approx_kl | 0.00029339176 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 10240 | -| policy_gradient_loss | -0.000335 | -| std | 0.878 | -| value_loss | 0.00202 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1026 | -| time_elapsed | 21869 | -| total_timesteps | 131328 | -| train/ | | -| approx_kl | 0.0066112024 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.45e+04 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 10250 | -| policy_gradient_loss | -0.00249 | -| std | 0.879 | -| value_loss | 1.88e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1027 | -| time_elapsed | 21873 | -| total_timesteps | 131456 | -| train/ | | -| approx_kl | 0.00010272162 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.29e+03 | -| learning_rate | 0.0003 | -| loss | 0.000609 | -| n_updates | 10260 | -| policy_gradient_loss | 0.000854 | -| std | 0.881 | -| value_loss | 2.94e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1028 | -| time_elapsed | 21878 | -| total_timesteps | 131584 | -| train/ | | -| approx_kl | 5.7546422e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -92.9 | -| learning_rate | 0.0003 | -| loss | -0.000354 | -| n_updates | 10270 | -| policy_gradient_loss | 9.82e-05 | -| std | 0.881 | -| value_loss | 2.35e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1029 | -| time_elapsed | 21883 | -| total_timesteps | 131712 | -| train/ | | -| approx_kl | 0.00514976 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -37.2 | -| learning_rate | 0.0003 | -| loss | -0.00648 | -| n_updates | 10280 | -| policy_gradient_loss | -0.003 | -| std | 0.88 | -| value_loss | 4.13e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1030 | -| time_elapsed | 21886 | -| total_timesteps | 131840 | -| train/ | | -| approx_kl | 1.5166588e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | 8.94e-05 | -| n_updates | 10290 | -| policy_gradient_loss | 0.00303 | -| std | 0.879 | -| value_loss | 9.51e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1031 | -| time_elapsed | 21890 | -| total_timesteps | 131968 | -| train/ | | -| approx_kl | 0.0026779906 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 10300 | -| policy_gradient_loss | -0.000787 | -| std | 0.879 | -| value_loss | 2.51e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1032 | -| time_elapsed | 21894 | -| total_timesteps | 132096 | -| train/ | | -| approx_kl | 0.00060879486 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00399 | -| learning_rate | 0.0003 | -| loss | 4.13e-05 | -| n_updates | 10310 | -| policy_gradient_loss | 6.24e-05 | -| std | 0.881 | -| value_loss | 1.23e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1033 | -| time_elapsed | 21902 | -| total_timesteps | 132224 | -| train/ | | -| approx_kl | 0.001920823 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 10320 | -| policy_gradient_loss | -0.00154 | -| std | 0.883 | -| value_loss | 2.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1034 | -| time_elapsed | 21906 | -| total_timesteps | 132352 | -| train/ | | -| approx_kl | 0.001419785 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -692 | -| learning_rate | 0.0003 | -| loss | 0.000189 | -| n_updates | 10330 | -| policy_gradient_loss | 0.000109 | -| std | 0.882 | -| value_loss | 7.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1035 | -| time_elapsed | 21910 | -| total_timesteps | 132480 | -| train/ | | -| approx_kl | 0.000917946 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -49 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 10340 | -| policy_gradient_loss | -0.000614 | -| std | 0.882 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1036 | -| time_elapsed | 21913 | -| total_timesteps | 132608 | -| train/ | | -| approx_kl | 0.0042461106 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 10350 | -| policy_gradient_loss | -0.00179 | -| std | 0.883 | -| value_loss | 8.47e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1037 | -| time_elapsed | 21916 | -| total_timesteps | 132736 | -| train/ | | -| approx_kl | 0.0051152706 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 10360 | -| policy_gradient_loss | -0.00364 | -| std | 0.885 | -| value_loss | 3.66e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1038 | -| time_elapsed | 21920 | -| total_timesteps | 132864 | -| train/ | | -| approx_kl | 4.233606e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | 0.000779 | -| n_updates | 10370 | -| policy_gradient_loss | 0.00139 | -| std | 0.885 | -| value_loss | 2.29e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 6 | -| iterations | 1039 | -| time_elapsed | 21925 | -| total_timesteps | 132992 | -| train/ | | -| approx_kl | 0.004860458 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00533 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 10380 | -| policy_gradient_loss | -0.00573 | -| std | 0.884 | -| value_loss | 1.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1040 | -| time_elapsed | 21929 | -| total_timesteps | 133120 | -| train/ | | -| approx_kl | 0.009668553 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 10390 | -| policy_gradient_loss | -0.00843 | -| std | 0.884 | -| value_loss | 1.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1041 | -| time_elapsed | 21938 | -| total_timesteps | 133248 | -| train/ | | -| approx_kl | 0.010695675 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 10400 | -| policy_gradient_loss | -0.00453 | -| std | 0.883 | -| value_loss | 0.00262 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1042 | -| time_elapsed | 21944 | -| total_timesteps | 133376 | -| train/ | | -| approx_kl | 0.002420938 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -488 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 10410 | -| policy_gradient_loss | 0.000824 | -| std | 0.883 | -| value_loss | 2.8e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1043 | -| time_elapsed | 21949 | -| total_timesteps | 133504 | -| train/ | | -| approx_kl | 0.002698293 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -58.5 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 10420 | -| policy_gradient_loss | -0.00171 | -| std | 0.882 | -| value_loss | 3.95e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1044 | -| time_elapsed | 21953 | -| total_timesteps | 133632 | -| train/ | | -| approx_kl | 0.0002993499 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -17.5 | -| learning_rate | 0.0003 | -| loss | 0.000238 | -| n_updates | 10430 | -| policy_gradient_loss | 0.000371 | -| std | 0.879 | -| value_loss | 3.24e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1045 | -| time_elapsed | 21958 | -| total_timesteps | 133760 | -| train/ | | -| approx_kl | 0.0008711503 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.64 | -| learning_rate | 0.0003 | -| loss | -0.000824 | -| n_updates | 10440 | -| policy_gradient_loss | -0.000388 | -| std | 0.876 | -| value_loss | 5.79e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 6 | -| iterations | 1046 | -| time_elapsed | 21962 | -| total_timesteps | 133888 | -| train/ | | -| approx_kl | 0.00051494315 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.385 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 10450 | -| policy_gradient_loss | -0.000493 | -| std | 0.875 | -| value_loss | 3.98e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1047 | -| time_elapsed | 21966 | -| total_timesteps | 134016 | -| train/ | | -| approx_kl | 0.00036618905 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 10460 | -| policy_gradient_loss | -0.000142 | -| std | 0.872 | -| value_loss | 2.97e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1048 | -| time_elapsed | 21974 | -| total_timesteps | 134144 | -| train/ | | -| approx_kl | 0.0041080983 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -14.7 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 10470 | -| policy_gradient_loss | -0.00152 | -| std | 0.872 | -| value_loss | 0.00509 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1049 | -| time_elapsed | 21977 | -| total_timesteps | 134272 | -| train/ | | -| approx_kl | 5.2252784e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.98e+03 | -| learning_rate | 0.0003 | -| loss | 0.000366 | -| n_updates | 10480 | -| policy_gradient_loss | 0.000538 | -| std | 0.871 | -| value_loss | 9.64e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1050 | -| time_elapsed | 21981 | -| total_timesteps | 134400 | -| train/ | | -| approx_kl | 0.0045174733 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.49e+03 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 10490 | -| policy_gradient_loss | -0.00447 | -| std | 0.87 | -| value_loss | 1.54e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1051 | -| time_elapsed | 21984 | -| total_timesteps | 134528 | -| train/ | | -| approx_kl | 0.0013171528 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 10500 | -| policy_gradient_loss | 0.00103 | -| std | 0.868 | -| value_loss | 2.61e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1052 | -| time_elapsed | 21989 | -| total_timesteps | 134656 | -| train/ | | -| approx_kl | 0.0014715651 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 10510 | -| policy_gradient_loss | -0.0013 | -| std | 0.864 | -| value_loss | 4.94e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1053 | -| time_elapsed | 21993 | -| total_timesteps | 134784 | -| train/ | | -| approx_kl | 6.9772825e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 10520 | -| policy_gradient_loss | -4.74e-06 | -| std | 0.86 | -| value_loss | 2.52e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1054 | -| time_elapsed | 21996 | -| total_timesteps | 134912 | -| train/ | | -| approx_kl | 0.0021351408 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00734 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 10530 | -| policy_gradient_loss | -0.000757 | -| std | 0.859 | -| value_loss | 1.15e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1055 | -| time_elapsed | 22001 | -| total_timesteps | 135040 | -| train/ | | -| approx_kl | 0.00030223653 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0014 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 10540 | -| policy_gradient_loss | -0.000308 | -| std | 0.861 | -| value_loss | 8.89e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1056 | -| time_elapsed | 22011 | -| total_timesteps | 135168 | -| train/ | | -| approx_kl | 0.0058778836 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 10550 | -| policy_gradient_loss | -0.00345 | -| std | 0.863 | -| value_loss | 0.00101 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1057 | -| time_elapsed | 22015 | -| total_timesteps | 135296 | -| train/ | | -| approx_kl | 0.00049375976 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -3.07e+03 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 10560 | -| policy_gradient_loss | 0.00125 | -| std | 0.863 | -| value_loss | 3.7e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1058 | -| time_elapsed | 22019 | -| total_timesteps | 135424 | -| train/ | | -| approx_kl | 0.0046084044 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -2.03e+03 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 10570 | -| policy_gradient_loss | -0.00599 | -| std | 0.863 | -| value_loss | 1.11e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1059 | -| time_elapsed | 22023 | -| total_timesteps | 135552 | -| train/ | | -| approx_kl | 0.0024536536 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -58.6 | -| learning_rate | 0.0003 | -| loss | 0.000572 | -| n_updates | 10580 | -| policy_gradient_loss | 0.000378 | -| std | 0.863 | -| value_loss | 3.24e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1060 | -| time_elapsed | 22027 | -| total_timesteps | 135680 | -| train/ | | -| approx_kl | 0.0012165545 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 10590 | -| policy_gradient_loss | -0.000958 | -| std | 0.865 | -| value_loss | 3.3e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1061 | -| time_elapsed | 22031 | -| total_timesteps | 135808 | -| train/ | | -| approx_kl | 4.549511e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 3.4e-05 | -| n_updates | 10600 | -| policy_gradient_loss | 0.000513 | -| std | 0.867 | -| value_loss | 2.77e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 6 | -| iterations | 1062 | -| time_elapsed | 22035 | -| total_timesteps | 135936 | -| train/ | | -| approx_kl | 0.0025653378 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 10610 | -| policy_gradient_loss | -0.00183 | -| std | 0.869 | -| value_loss | 2.3e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1063 | -| time_elapsed | 22039 | -| total_timesteps | 136064 | -| train/ | | -| approx_kl | 0.007760143 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0026 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 10620 | -| policy_gradient_loss | -0.00623 | -| std | 0.868 | -| value_loss | 2.02e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1064 | -| time_elapsed | 22046 | -| total_timesteps | 136192 | -| train/ | | -| approx_kl | 5.5490993e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.614 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 10630 | -| policy_gradient_loss | 0.00106 | -| std | 0.868 | -| value_loss | 0.00411 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1065 | -| time_elapsed | 22050 | -| total_timesteps | 136320 | -| train/ | | -| approx_kl | 0.00222321 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.42e+03 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 10640 | -| policy_gradient_loss | -0.00065 | -| std | 0.87 | -| value_loss | 1.67e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1066 | -| time_elapsed | 22054 | -| total_timesteps | 136448 | -| train/ | | -| approx_kl | 0.00082666613 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -750 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 10650 | -| policy_gradient_loss | -0.00113 | -| std | 0.871 | -| value_loss | 4.71e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1067 | -| time_elapsed | 22058 | -| total_timesteps | 136576 | -| train/ | | -| approx_kl | 0.004002879 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -40.8 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 10660 | -| policy_gradient_loss | -0.000874 | -| std | 0.872 | -| value_loss | 1.46e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1068 | -| time_elapsed | 22062 | -| total_timesteps | 136704 | -| train/ | | -| approx_kl | 9.596627e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -57.6 | -| learning_rate | 0.0003 | -| loss | 0.000387 | -| n_updates | 10670 | -| policy_gradient_loss | 0.000402 | -| std | 0.872 | -| value_loss | 3.59e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1069 | -| time_elapsed | 22067 | -| total_timesteps | 136832 | -| train/ | | -| approx_kl | 0.0013833363 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.14e+03 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 10680 | -| policy_gradient_loss | -0.000618 | -| std | 0.87 | -| value_loss | 5.45e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 6 | -| iterations | 1070 | -| time_elapsed | 22071 | -| total_timesteps | 136960 | -| train/ | | -| approx_kl | 0.0026374692 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.87 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 10690 | -| policy_gradient_loss | -0.00138 | -| std | 0.868 | -| value_loss | 3.37e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1071 | -| time_elapsed | 22075 | -| total_timesteps | 137088 | -| train/ | | -| approx_kl | 0.0007371404 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.438 | -| learning_rate | 0.0003 | -| loss | -5.52e-05 | -| n_updates | 10700 | -| policy_gradient_loss | 3.66e-05 | -| std | 0.865 | -| value_loss | 1.18e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1072 | -| time_elapsed | 22083 | -| total_timesteps | 137216 | -| train/ | | -| approx_kl | 0.0033399323 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.43 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 10710 | -| policy_gradient_loss | -0.00615 | -| std | 0.861 | -| value_loss | 0.00219 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1073 | -| time_elapsed | 22087 | -| total_timesteps | 137344 | -| train/ | | -| approx_kl | 0.006018175 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -260 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 10720 | -| policy_gradient_loss | -0.00108 | -| std | 0.86 | -| value_loss | 8.31e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1074 | -| time_elapsed | 22091 | -| total_timesteps | 137472 | -| train/ | | -| approx_kl | 0.00187949 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -303 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 10730 | -| policy_gradient_loss | -0.00113 | -| std | 0.859 | -| value_loss | 2.42e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1075 | -| time_elapsed | 22095 | -| total_timesteps | 137600 | -| train/ | | -| approx_kl | 0.0001054029 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 10740 | -| policy_gradient_loss | 0.00112 | -| std | 0.857 | -| value_loss | 6.52e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1076 | -| time_elapsed | 22099 | -| total_timesteps | 137728 | -| train/ | | -| approx_kl | 0.012395233 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 10750 | -| policy_gradient_loss | -0.00369 | -| std | 0.857 | -| value_loss | 5.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1077 | -| time_elapsed | 22102 | -| total_timesteps | 137856 | -| train/ | | -| approx_kl | 0.013812207 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00114 | -| learning_rate | 0.0003 | -| loss | -0.00803 | -| n_updates | 10760 | -| policy_gradient_loss | -0.00533 | -| std | 0.858 | -| value_loss | 4.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 6 | -| iterations | 1078 | -| time_elapsed | 22106 | -| total_timesteps | 137984 | -| train/ | | -| approx_kl | 0.017167974 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00258 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 10770 | -| policy_gradient_loss | -0.0161 | -| std | 0.858 | -| value_loss | 3.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1079 | -| time_elapsed | 22108 | -| total_timesteps | 138112 | -| train/ | | -| approx_kl | 0.013716801 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 10780 | -| policy_gradient_loss | -0.0104 | -| std | 0.858 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1080 | -| time_elapsed | 22117 | -| total_timesteps | 138240 | -| train/ | | -| approx_kl | 0.0027209506 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | 0.000971 | -| n_updates | 10790 | -| policy_gradient_loss | 0.000431 | -| std | 0.859 | -| value_loss | 0.00104 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1081 | -| time_elapsed | 22120 | -| total_timesteps | 138368 | -| train/ | | -| approx_kl | 0.0062550926 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.29e+03 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 10800 | -| policy_gradient_loss | -0.00331 | -| std | 0.86 | -| value_loss | 9.82e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1082 | -| time_elapsed | 22124 | -| total_timesteps | 138496 | -| train/ | | -| approx_kl | 0.014499454 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.35e+03 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 10810 | -| policy_gradient_loss | -0.00856 | -| std | 0.861 | -| value_loss | 2.61e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1083 | -| time_elapsed | 22128 | -| total_timesteps | 138624 | -| train/ | | -| approx_kl | 0.0046764617 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -448 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 10820 | -| policy_gradient_loss | -0.0124 | -| std | 0.863 | -| value_loss | 1.87e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1084 | -| time_elapsed | 22131 | -| total_timesteps | 138752 | -| train/ | | -| approx_kl | 0.0011921981 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -165 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 10830 | -| policy_gradient_loss | -0.00151 | -| std | 0.864 | -| value_loss | 9.16e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 6 | -| iterations | 1085 | -| time_elapsed | 22136 | -| total_timesteps | 138880 | -| train/ | | -| approx_kl | 0.008264072 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 10840 | -| policy_gradient_loss | -0.00283 | -| std | 0.866 | -| value_loss | 1.34e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1086 | -| time_elapsed | 22140 | -| total_timesteps | 139008 | -| train/ | | -| approx_kl | 0.00073761493 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 10850 | -| policy_gradient_loss | 0.000861 | -| std | 0.866 | -| value_loss | 9.38e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1087 | -| time_elapsed | 22152 | -| total_timesteps | 139136 | -| train/ | | -| approx_kl | 0.001235025 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.676 | -| learning_rate | 0.0003 | -| loss | -0.000688 | -| n_updates | 10860 | -| policy_gradient_loss | -0.00101 | -| std | 0.865 | -| value_loss | 0.0037 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1088 | -| time_elapsed | 22155 | -| total_timesteps | 139264 | -| train/ | | -| approx_kl | 0.0008152458 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -3.15e+03 | -| learning_rate | 0.0003 | -| loss | -0.00794 | -| n_updates | 10870 | -| policy_gradient_loss | -0.00167 | -| std | 0.862 | -| value_loss | 3.32e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1089 | -| time_elapsed | 22160 | -| total_timesteps | 139392 | -| train/ | | -| approx_kl | 0.0052489783 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -545 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 10880 | -| policy_gradient_loss | -0.000917 | -| std | 0.86 | -| value_loss | 1.16e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1090 | -| time_elapsed | 22163 | -| total_timesteps | 139520 | -| train/ | | -| approx_kl | 0.0014927769 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -13.2 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 10890 | -| policy_gradient_loss | -0.00162 | -| std | 0.861 | -| value_loss | 3.66e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1091 | -| time_elapsed | 22167 | -| total_timesteps | 139648 | -| train/ | | -| approx_kl | 2.4757814e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | -0.000664 | -| n_updates | 10900 | -| policy_gradient_loss | 0.000955 | -| std | 0.861 | -| value_loss | 1.43e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1092 | -| time_elapsed | 22172 | -| total_timesteps | 139776 | -| train/ | | -| approx_kl | 0.00050764857 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 10910 | -| policy_gradient_loss | -0.000128 | -| std | 0.86 | -| value_loss | 1.27e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 6 | -| iterations | 1093 | -| time_elapsed | 22176 | -| total_timesteps | 139904 | -| train/ | | -| approx_kl | 0.01020968 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00694 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 10920 | -| policy_gradient_loss | -0.00655 | -| std | 0.86 | -| value_loss | 4.87e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1094 | -| time_elapsed | 22179 | -| total_timesteps | 140032 | -| train/ | | -| approx_kl | 3.839843e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00363 | -| learning_rate | 0.0003 | -| loss | -0.00014 | -| n_updates | 10930 | -| policy_gradient_loss | 0.00163 | -| std | 0.858 | -| value_loss | 3.92e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1095 | -| time_elapsed | 22189 | -| total_timesteps | 140160 | -| train/ | | -| approx_kl | 0.00027813064 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.000888 | -| n_updates | 10940 | -| policy_gradient_loss | -0.000233 | -| std | 0.858 | -| value_loss | 0.00355 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1096 | -| time_elapsed | 22194 | -| total_timesteps | 140288 | -| train/ | | -| approx_kl | 3.506057e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -550 | -| learning_rate | 0.0003 | -| loss | 0.000356 | -| n_updates | 10950 | -| policy_gradient_loss | 0.000651 | -| std | 0.859 | -| value_loss | 4.32e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1097 | -| time_elapsed | 22198 | -| total_timesteps | 140416 | -| train/ | | -| approx_kl | 0.00011135731 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.03e+03 | -| learning_rate | 0.0003 | -| loss | 0.000153 | -| n_updates | 10960 | -| policy_gradient_loss | 0.000131 | -| std | 0.86 | -| value_loss | 1e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1098 | -| time_elapsed | 22202 | -| total_timesteps | 140544 | -| train/ | | -| approx_kl | 0.00015320163 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -129 | -| learning_rate | 0.0003 | -| loss | -0.000324 | -| n_updates | 10970 | -| policy_gradient_loss | -0.000124 | -| std | 0.86 | -| value_loss | 6.12e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1099 | -| time_elapsed | 22207 | -| total_timesteps | 140672 | -| train/ | | -| approx_kl | 0.00069575384 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -67.5 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 10980 | -| policy_gradient_loss | -0.00068 | -| std | 0.858 | -| value_loss | 6.96e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1100 | -| time_elapsed | 22211 | -| total_timesteps | 140800 | -| train/ | | -| approx_kl | 0.00038320757 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -4.22 | -| learning_rate | 0.0003 | -| loss | -0.000515 | -| n_updates | 10990 | -| policy_gradient_loss | -6.74e-05 | -| std | 0.853 | -| value_loss | 1.53e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 6 | -| iterations | 1101 | -| time_elapsed | 22215 | -| total_timesteps | 140928 | -| train/ | | -| approx_kl | 0.0042448645 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.935 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 11000 | -| policy_gradient_loss | -0.00294 | -| std | 0.85 | -| value_loss | 7.01e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1102 | -| time_elapsed | 22220 | -| total_timesteps | 141056 | -| train/ | | -| approx_kl | 7.2922558e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | -0.000291 | -| n_updates | 11010 | -| policy_gradient_loss | 0.00111 | -| std | 0.847 | -| value_loss | 4.39e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1103 | -| time_elapsed | 22227 | -| total_timesteps | 141184 | -| train/ | | -| approx_kl | 6.826129e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.638 | -| learning_rate | 0.0003 | -| loss | 0.000786 | -| n_updates | 11020 | -| policy_gradient_loss | -0.000835 | -| std | 0.85 | -| value_loss | 0.0114 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1104 | -| time_elapsed | 22232 | -| total_timesteps | 141312 | -| train/ | | -| approx_kl | 0.0037999726 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -627 | -| learning_rate | 0.0003 | -| loss | -0.004 | -| n_updates | 11030 | -| policy_gradient_loss | -0.00207 | -| std | 0.854 | -| value_loss | 0.000783 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1105 | -| time_elapsed | 22235 | -| total_timesteps | 141440 | -| train/ | | -| approx_kl | 0.00014294079 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -537 | -| learning_rate | 0.0003 | -| loss | 0.000683 | -| n_updates | 11040 | -| policy_gradient_loss | 0.000748 | -| std | 0.856 | -| value_loss | 0.000102 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1106 | -| time_elapsed | 22239 | -| total_timesteps | 141568 | -| train/ | | -| approx_kl | 0.0005427138 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -434 | -| learning_rate | 0.0003 | -| loss | -0.000276 | -| n_updates | 11050 | -| policy_gradient_loss | -0.00013 | -| std | 0.855 | -| value_loss | 2.62e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1107 | -| time_elapsed | 22243 | -| total_timesteps | 141696 | -| train/ | | -| approx_kl | 0.0017065522 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -127 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 11060 | -| policy_gradient_loss | -0.00264 | -| std | 0.852 | -| value_loss | 1.65e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1108 | -| time_elapsed | 22247 | -| total_timesteps | 141824 | -| train/ | | -| approx_kl | 0.0023718565 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -248 | -| learning_rate | 0.0003 | -| loss | 0.000418 | -| n_updates | 11070 | -| policy_gradient_loss | 0.00032 | -| std | 0.853 | -| value_loss | 4.15e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 6 | -| iterations | 1109 | -| time_elapsed | 22251 | -| total_timesteps | 141952 | -| train/ | | -| approx_kl | 0.0017833957 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -73.2 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 11080 | -| policy_gradient_loss | -0.00198 | -| std | 0.853 | -| value_loss | 1.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1110 | -| time_elapsed | 22255 | -| total_timesteps | 142080 | -| train/ | | -| approx_kl | 0.009050503 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -6.63 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 11090 | -| policy_gradient_loss | -0.00948 | -| std | 0.854 | -| value_loss | 7.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1111 | -| time_elapsed | 22263 | -| total_timesteps | 142208 | -| train/ | | -| approx_kl | 0.009678839 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | -0.00699 | -| n_updates | 11100 | -| policy_gradient_loss | -0.00506 | -| std | 0.853 | -| value_loss | 0.00782 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1112 | -| time_elapsed | 22268 | -| total_timesteps | 142336 | -| train/ | | -| approx_kl | 0.009501858 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -832 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 11110 | -| policy_gradient_loss | -0.00534 | -| std | 0.852 | -| value_loss | 0.000289 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1113 | -| time_elapsed | 22272 | -| total_timesteps | 142464 | -| train/ | | -| approx_kl | 0.00022587832 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -428 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 11120 | -| policy_gradient_loss | 0.00312 | -| std | 0.852 | -| value_loss | 2.96e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1114 | -| time_elapsed | 22277 | -| total_timesteps | 142592 | -| train/ | | -| approx_kl | 0.006442783 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 11130 | -| policy_gradient_loss | -0.00307 | -| std | 0.852 | -| value_loss | 8.98e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1115 | -| time_elapsed | 22280 | -| total_timesteps | 142720 | -| train/ | | -| approx_kl | 0.005074238 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.478 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 11140 | -| policy_gradient_loss | -0.00236 | -| std | 0.849 | -| value_loss | 5.59e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1116 | -| time_elapsed | 22284 | -| total_timesteps | 142848 | -| train/ | | -| approx_kl | 0.0003300677 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 11150 | -| policy_gradient_loss | -6.95e-05 | -| std | 0.848 | -| value_loss | 2.53e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1117 | -| time_elapsed | 22288 | -| total_timesteps | 142976 | -| train/ | | -| approx_kl | 0.0006070612 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.000746 | -| n_updates | 11160 | -| policy_gradient_loss | 0.000538 | -| std | 0.847 | -| value_loss | 1.67e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1118 | -| time_elapsed | 22293 | -| total_timesteps | 143104 | -| train/ | | -| approx_kl | 0.0019943495 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.000469 | -| learning_rate | 0.0003 | -| loss | -0.00721 | -| n_updates | 11170 | -| policy_gradient_loss | -0.00264 | -| std | 0.847 | -| value_loss | 1.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1119 | -| time_elapsed | 22304 | -| total_timesteps | 143232 | -| train/ | | -| approx_kl | 0.009730006 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 11180 | -| policy_gradient_loss | -0.0102 | -| std | 0.849 | -| value_loss | 0.00323 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1120 | -| time_elapsed | 22307 | -| total_timesteps | 143360 | -| train/ | | -| approx_kl | 1.06636435e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -6.94e+03 | -| learning_rate | 0.0003 | -| loss | -0.00037 | -| n_updates | 11190 | -| policy_gradient_loss | 0.000784 | -| std | 0.85 | -| value_loss | 3.73e-06 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1121 | -| time_elapsed | 22311 | -| total_timesteps | 143488 | -| train/ | | -| approx_kl | 5.4212287e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -8.53e+03 | -| learning_rate | 0.0003 | -| loss | -0.000257 | -| n_updates | 11200 | -| policy_gradient_loss | 0.000368 | -| std | 0.852 | -| value_loss | 1.06e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1122 | -| time_elapsed | 22315 | -| total_timesteps | 143616 | -| train/ | | -| approx_kl | 1.3644807e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -71.2 | -| learning_rate | 0.0003 | -| loss | -0.000607 | -| n_updates | 11210 | -| policy_gradient_loss | -5.28e-05 | -| std | 0.855 | -| value_loss | 6.48e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1123 | -| time_elapsed | 22320 | -| total_timesteps | 143744 | -| train/ | | -| approx_kl | 0.0015819343 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -52.9 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 11220 | -| policy_gradient_loss | -0.0041 | -| std | 0.859 | -| value_loss | 4.73e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1124 | -| time_elapsed | 22324 | -| total_timesteps | 143872 | -| train/ | | -| approx_kl | 0.013825081 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -5.79 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 11230 | -| policy_gradient_loss | -0.0108 | -| std | 0.861 | -| value_loss | 6.98e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1125 | -| time_elapsed | 22328 | -| total_timesteps | 144000 | -| train/ | | -| approx_kl | 0.0058885766 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.531 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 11240 | -| policy_gradient_loss | -0.0012 | -| std | 0.862 | -| value_loss | 2.04e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1126 | -| time_elapsed | 22333 | -| total_timesteps | 144128 | -| train/ | | -| approx_kl | 0.00018173968 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00138 | -| learning_rate | 0.0003 | -| loss | -0.000772 | -| n_updates | 11250 | -| policy_gradient_loss | 3.23e-05 | -| std | 0.861 | -| value_loss | 1.04e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1127 | -| time_elapsed | 22342 | -| total_timesteps | 144256 | -| train/ | | -| approx_kl | 0.0020371787 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 11260 | -| policy_gradient_loss | -0.00215 | -| std | 0.86 | -| value_loss | 0.000655 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1128 | -| time_elapsed | 22347 | -| total_timesteps | 144384 | -| train/ | | -| approx_kl | 0.0013515805 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 11270 | -| policy_gradient_loss | 0.000894 | -| std | 0.86 | -| value_loss | 6.3e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1129 | -| time_elapsed | 22351 | -| total_timesteps | 144512 | -| train/ | | -| approx_kl | 0.0076518366 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -69.4 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 11280 | -| policy_gradient_loss | -0.00873 | -| std | 0.86 | -| value_loss | 1.68e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1130 | -| time_elapsed | 22356 | -| total_timesteps | 144640 | -| train/ | | -| approx_kl | 2.0029023e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.000465 | -| n_updates | 11290 | -| policy_gradient_loss | 0.000361 | -| std | 0.862 | -| value_loss | 2.1e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1131 | -| time_elapsed | 22359 | -| total_timesteps | 144768 | -| train/ | | -| approx_kl | 0.0013566185 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.000731 | -| n_updates | 11300 | -| policy_gradient_loss | -0.000312 | -| std | 0.865 | -| value_loss | 1.02e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 6 | -| iterations | 1132 | -| time_elapsed | 22362 | -| total_timesteps | 144896 | -| train/ | | -| approx_kl | 0.0025138222 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.00282 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 11310 | -| policy_gradient_loss | -0.00167 | -| std | 0.869 | -| value_loss | 6.31e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1133 | -| time_elapsed | 22366 | -| total_timesteps | 145024 | -| train/ | | -| approx_kl | 0.011613462 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0025 | -| learning_rate | 0.0003 | -| loss | -0.00932 | -| n_updates | 11320 | -| policy_gradient_loss | -0.00614 | -| std | 0.871 | -| value_loss | 4.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1134 | -| time_elapsed | 22376 | -| total_timesteps | 145152 | -| train/ | | -| approx_kl | 0.012977507 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.811 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 11330 | -| policy_gradient_loss | -0.00738 | -| std | 0.872 | -| value_loss | 0.00335 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1135 | -| time_elapsed | 22380 | -| total_timesteps | 145280 | -| train/ | | -| approx_kl | 0.017101325 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -2.21e+03 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 11340 | -| policy_gradient_loss | -0.00862 | -| std | 0.872 | -| value_loss | 1.81e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1136 | -| time_elapsed | 22385 | -| total_timesteps | 145408 | -| train/ | | -| approx_kl | 0.00024242979 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -3.31e+03 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 11350 | -| policy_gradient_loss | 0.00183 | -| std | 0.872 | -| value_loss | 5.48e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1137 | -| time_elapsed | 22390 | -| total_timesteps | 145536 | -| train/ | | -| approx_kl | 0.009662941 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -5.13 | -| learning_rate | 0.0003 | -| loss | -0.00838 | -| n_updates | 11360 | -| policy_gradient_loss | -0.00522 | -| std | 0.873 | -| value_loss | 2.4e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1138 | -| time_elapsed | 22393 | -| total_timesteps | 145664 | -| train/ | | -| approx_kl | 5.526468e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -90.5 | -| learning_rate | 0.0003 | -| loss | -0.000149 | -| n_updates | 11370 | -| policy_gradient_loss | 0.000556 | -| std | 0.874 | -| value_loss | 3.68e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1139 | -| time_elapsed | 22398 | -| total_timesteps | 145792 | -| train/ | | -| approx_kl | 0.002194509 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.565 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 11380 | -| policy_gradient_loss | -0.00107 | -| std | 0.873 | -| value_loss | 2.82e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 6 | -| iterations | 1140 | -| time_elapsed | 22403 | -| total_timesteps | 145920 | -| train/ | | -| approx_kl | 0.0018400452 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.000466 | -| n_updates | 11390 | -| policy_gradient_loss | -0.000206 | -| std | 0.874 | -| value_loss | 4.56e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1141 | -| time_elapsed | 22408 | -| total_timesteps | 146048 | -| train/ | | -| approx_kl | 0.00017176522 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0889 | -| learning_rate | 0.0003 | -| loss | -0.000815 | -| n_updates | 11400 | -| policy_gradient_loss | -0.000123 | -| std | 0.873 | -| value_loss | 4.91e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1142 | -| time_elapsed | 22415 | -| total_timesteps | 146176 | -| train/ | | -| approx_kl | 0.00015142886 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | 0.000664 | -| n_updates | 11410 | -| policy_gradient_loss | -0.000152 | -| std | 0.87 | -| value_loss | 0.00363 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1143 | -| time_elapsed | 22420 | -| total_timesteps | 146304 | -| train/ | | -| approx_kl | 0.00044444343 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -532 | -| learning_rate | 0.0003 | -| loss | 0.000306 | -| n_updates | 11420 | -| policy_gradient_loss | 0.000201 | -| std | 0.87 | -| value_loss | 2.68e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1144 | -| time_elapsed | 22424 | -| total_timesteps | 146432 | -| train/ | | -| approx_kl | 0.00067142583 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -338 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 11430 | -| policy_gradient_loss | -0.000618 | -| std | 0.871 | -| value_loss | 4.44e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1145 | -| time_elapsed | 22427 | -| total_timesteps | 146560 | -| train/ | | -| approx_kl | 0.0075359913 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -55.4 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 11440 | -| policy_gradient_loss | -0.00298 | -| std | 0.873 | -| value_loss | 2.97e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1146 | -| time_elapsed | 22431 | -| total_timesteps | 146688 | -| train/ | | -| approx_kl | 0.01443697 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -22.2 | -| learning_rate | 0.0003 | -| loss | -0.0257 | -| n_updates | 11450 | -| policy_gradient_loss | -0.0136 | -| std | 0.874 | -| value_loss | 7.53e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1147 | -| time_elapsed | 22434 | -| total_timesteps | 146816 | -| train/ | | -| approx_kl | 0.0009872657 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 11460 | -| policy_gradient_loss | 0.00143 | -| std | 0.874 | -| value_loss | 2.39e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 6 | -| iterations | 1148 | -| time_elapsed | 22439 | -| total_timesteps | 146944 | -| train/ | | -| approx_kl | 0.004626362 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.438 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 11470 | -| policy_gradient_loss | -0.00226 | -| std | 0.875 | -| value_loss | 3.96e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1149 | -| time_elapsed | 22444 | -| total_timesteps | 147072 | -| train/ | | -| approx_kl | 0.00013866602 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.00115 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 11480 | -| policy_gradient_loss | 0.00103 | -| std | 0.873 | -| value_loss | 7.18e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1150 | -| time_elapsed | 22449 | -| total_timesteps | 147200 | -| train/ | | -| approx_kl | 4.4633634e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.831 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 11490 | -| policy_gradient_loss | 0.000652 | -| std | 0.872 | -| value_loss | 0.00324 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1151 | -| time_elapsed | 22453 | -| total_timesteps | 147328 | -| train/ | | -| approx_kl | 0.014160838 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 11500 | -| policy_gradient_loss | -0.00356 | -| std | 0.871 | -| value_loss | 1.51e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1152 | -| time_elapsed | 22456 | -| total_timesteps | 147456 | -| train/ | | -| approx_kl | 0.00035754126 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 11510 | -| policy_gradient_loss | 0.000755 | -| std | 0.87 | -| value_loss | 5.93e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1153 | -| time_elapsed | 22460 | -| total_timesteps | 147584 | -| train/ | | -| approx_kl | 0.00046094134 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 11520 | -| policy_gradient_loss | 0.000364 | -| std | 0.871 | -| value_loss | 1.39e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1154 | -| time_elapsed | 22465 | -| total_timesteps | 147712 | -| train/ | | -| approx_kl | 0.0031707962 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.000423 | -| n_updates | 11530 | -| policy_gradient_loss | 0.000244 | -| std | 0.871 | -| value_loss | 2.35e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1155 | -| time_elapsed | 22469 | -| total_timesteps | 147840 | -| train/ | | -| approx_kl | 0.005022387 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 11540 | -| policy_gradient_loss | -0.00412 | -| std | 0.87 | -| value_loss | 1.58e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 6 | -| iterations | 1156 | -| time_elapsed | 22473 | -| total_timesteps | 147968 | -| train/ | | -| approx_kl | 0.00078563346 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0072 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 11550 | -| policy_gradient_loss | 0.00121 | -| std | 0.869 | -| value_loss | 6.46e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1157 | -| time_elapsed | 22478 | -| total_timesteps | 148096 | -| train/ | | -| approx_kl | 0.0040604365 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 11560 | -| policy_gradient_loss | -0.00517 | -| std | 0.868 | -| value_loss | 3.88e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1158 | -| time_elapsed | 22488 | -| total_timesteps | 148224 | -| train/ | | -| approx_kl | 0.014413608 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.321 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 11570 | -| policy_gradient_loss | -0.012 | -| std | 0.867 | -| value_loss | 0.00331 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1159 | -| time_elapsed | 22492 | -| total_timesteps | 148352 | -| train/ | | -| approx_kl | 0.0016784966 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -2.75e+03 | -| learning_rate | 0.0003 | -| loss | 0.000863 | -| n_updates | 11580 | -| policy_gradient_loss | 0.000548 | -| std | 0.866 | -| value_loss | 2.63e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1160 | -| time_elapsed | 22497 | -| total_timesteps | 148480 | -| train/ | | -| approx_kl | 0.0036485791 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -3.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 11590 | -| policy_gradient_loss | -0.00212 | -| std | 0.866 | -| value_loss | 4.9e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1161 | -| time_elapsed | 22501 | -| total_timesteps | 148608 | -| train/ | | -| approx_kl | 0.000403387 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -38.3 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 11600 | -| policy_gradient_loss | 0.00117 | -| std | 0.867 | -| value_loss | 1.68e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1162 | -| time_elapsed | 22505 | -| total_timesteps | 148736 | -| train/ | | -| approx_kl | 0.0024585081 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -33 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 11610 | -| policy_gradient_loss | -0.00109 | -| std | 0.868 | -| value_loss | 5.07e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1163 | -| time_elapsed | 22508 | -| total_timesteps | 148864 | -| train/ | | -| approx_kl | 0.00042137317 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0661 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 11620 | -| policy_gradient_loss | -8.55e-05 | -| std | 0.867 | -| value_loss | 1.73e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1164 | -| time_elapsed | 22511 | -| total_timesteps | 148992 | -| train/ | | -| approx_kl | 0.0005097613 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 11630 | -| policy_gradient_loss | 7.8e-05 | -| std | 0.867 | -| value_loss | 2.21e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1165 | -| time_elapsed | 22516 | -| total_timesteps | 149120 | -| train/ | | -| approx_kl | 0.00017039757 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 11640 | -| policy_gradient_loss | 0.000405 | -| std | 0.869 | -| value_loss | 5.11e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1166 | -| time_elapsed | 22527 | -| total_timesteps | 149248 | -| train/ | | -| approx_kl | 8.649239e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 11650 | -| policy_gradient_loss | -0.000226 | -| std | 0.871 | -| value_loss | 0.00221 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1167 | -| time_elapsed | 22531 | -| total_timesteps | 149376 | -| train/ | | -| approx_kl | 0.002493259 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -494 | -| learning_rate | 0.0003 | -| loss | -0.000939 | -| n_updates | 11660 | -| policy_gradient_loss | -0.000458 | -| std | 0.874 | -| value_loss | 3.61e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1168 | -| time_elapsed | 22534 | -| total_timesteps | 149504 | -| train/ | | -| approx_kl | 0.00085266214 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -108 | -| learning_rate | 0.0003 | -| loss | -0.00047 | -| n_updates | 11670 | -| policy_gradient_loss | -0.000231 | -| std | 0.877 | -| value_loss | 5.18e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1169 | -| time_elapsed | 22536 | -| total_timesteps | 149632 | -| train/ | | -| approx_kl | 0.0012998492 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 11680 | -| policy_gradient_loss | -0.000663 | -| std | 0.878 | -| value_loss | 7.43e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1170 | -| time_elapsed | 22538 | -| total_timesteps | 149760 | -| train/ | | -| approx_kl | 0.009456202 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -4.51 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 11690 | -| policy_gradient_loss | -0.00925 | -| std | 0.879 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1171 | -| time_elapsed | 22541 | -| total_timesteps | 149888 | -| train/ | | -| approx_kl | 0.013908384 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | -0.0091 | -| n_updates | 11700 | -| policy_gradient_loss | -0.00703 | -| std | 0.879 | -| value_loss | 8.48e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1172 | -| time_elapsed | 22546 | -| total_timesteps | 150016 | -| train/ | | -| approx_kl | 0.0023185192 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 11710 | -| policy_gradient_loss | -0.000636 | -| std | 0.882 | -| value_loss | 1.65e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1173 | -| time_elapsed | 22556 | -| total_timesteps | 150144 | -| train/ | | -| approx_kl | 0.0010080812 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.197 | -| learning_rate | 0.0003 | -| loss | -0.00532 | -| n_updates | 11720 | -| policy_gradient_loss | -0.00185 | -| std | 0.882 | -| value_loss | 0.00252 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1174 | -| time_elapsed | 22560 | -| total_timesteps | 150272 | -| train/ | | -| approx_kl | 0.00019738125 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -5.14e+03 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 11730 | -| policy_gradient_loss | 0.000416 | -| std | 0.881 | -| value_loss | 3.61e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1175 | -| time_elapsed | 22564 | -| total_timesteps | 150400 | -| train/ | | -| approx_kl | 0.0026347805 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -6.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.000342 | -| n_updates | 11740 | -| policy_gradient_loss | -0.000214 | -| std | 0.88 | -| value_loss | 6.3e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1176 | -| time_elapsed | 22567 | -| total_timesteps | 150528 | -| train/ | | -| approx_kl | 0.00018434646 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.000905 | -| n_updates | 11750 | -| policy_gradient_loss | -0.000212 | -| std | 0.878 | -| value_loss | 6.82e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1177 | -| time_elapsed | 22572 | -| total_timesteps | 150656 | -| train/ | | -| approx_kl | 0.0008303807 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.15e+03 | -| learning_rate | 0.0003 | -| loss | -7.25e-06 | -| n_updates | 11760 | -| policy_gradient_loss | 1.66e-05 | -| std | 0.877 | -| value_loss | 5.24e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1178 | -| time_elapsed | 22576 | -| total_timesteps | 150784 | -| train/ | | -| approx_kl | 0.0037319474 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.00506 | -| n_updates | 11770 | -| policy_gradient_loss | -0.00218 | -| std | 0.878 | -| value_loss | 7.04e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 6 | -| iterations | 1179 | -| time_elapsed | 22580 | -| total_timesteps | 150912 | -| train/ | | -| approx_kl | 0.0004453943 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.87 | -| learning_rate | 0.0003 | -| loss | 0.00107 | -| n_updates | 11780 | -| policy_gradient_loss | 0.0009 | -| std | 0.877 | -| value_loss | 2.79e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1180 | -| time_elapsed | 22584 | -| total_timesteps | 151040 | -| train/ | | -| approx_kl | 0.006157913 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 11790 | -| policy_gradient_loss | -0.00528 | -| std | 0.876 | -| value_loss | 1.7e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1181 | -| time_elapsed | 22593 | -| total_timesteps | 151168 | -| train/ | | -| approx_kl | 0.0009835414 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -8.1 | -| learning_rate | 0.0003 | -| loss | 0.00304 | -| n_updates | 11800 | -| policy_gradient_loss | 0.00135 | -| std | 0.877 | -| value_loss | 0.00342 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1182 | -| time_elapsed | 22595 | -| total_timesteps | 151296 | -| train/ | | -| approx_kl | 0.0036735102 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -7.57e+03 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 11810 | -| policy_gradient_loss | -0.00298 | -| std | 0.878 | -| value_loss | 3.72e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1183 | -| time_elapsed | 22598 | -| total_timesteps | 151424 | -| train/ | | -| approx_kl | 0.000180698 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -6.37e+03 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 11820 | -| policy_gradient_loss | 0.00139 | -| std | 0.877 | -| value_loss | 7.94e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1184 | -| time_elapsed | 22602 | -| total_timesteps | 151552 | -| train/ | | -| approx_kl | 0.00063568447 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -79.9 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 11830 | -| policy_gradient_loss | -0.000562 | -| std | 0.876 | -| value_loss | 1.43e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1185 | -| time_elapsed | 22606 | -| total_timesteps | 151680 | -| train/ | | -| approx_kl | 0.0078495275 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 11840 | -| policy_gradient_loss | -0.00549 | -| std | 0.875 | -| value_loss | 2.73e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1186 | -| time_elapsed | 22611 | -| total_timesteps | 151808 | -| train/ | | -| approx_kl | 0.0018579704 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 11850 | -| policy_gradient_loss | 0.000877 | -| std | 0.875 | -| value_loss | 3.4e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1187 | -| time_elapsed | 22615 | -| total_timesteps | 151936 | -| train/ | | -| approx_kl | 0.003024639 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00611 | -| n_updates | 11860 | -| policy_gradient_loss | -0.00259 | -| std | 0.874 | -| value_loss | 1.86e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1188 | -| time_elapsed | 22619 | -| total_timesteps | 152064 | -| train/ | | -| approx_kl | 0.005066312 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 11870 | -| policy_gradient_loss | -0.0011 | -| std | 0.874 | -| value_loss | 8.64e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1189 | -| time_elapsed | 22626 | -| total_timesteps | 152192 | -| train/ | | -| approx_kl | 4.029181e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.706 | -| learning_rate | 0.0003 | -| loss | 0.00176 | -| n_updates | 11880 | -| policy_gradient_loss | 0.000148 | -| std | 0.873 | -| value_loss | 0.00375 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1190 | -| time_elapsed | 22629 | -| total_timesteps | 152320 | -| train/ | | -| approx_kl | 0.0022929953 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.42e+03 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 11890 | -| policy_gradient_loss | -0.00271 | -| std | 0.872 | -| value_loss | 1.99e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1191 | -| time_elapsed | 22633 | -| total_timesteps | 152448 | -| train/ | | -| approx_kl | 7.749535e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.21e+04 | -| learning_rate | 0.0003 | -| loss | -0.00069 | -| n_updates | 11900 | -| policy_gradient_loss | 0.00145 | -| std | 0.87 | -| value_loss | 7.15e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1192 | -| time_elapsed | 22637 | -| total_timesteps | 152576 | -| train/ | | -| approx_kl | 0.007546182 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.19e+04 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 11910 | -| policy_gradient_loss | -0.00603 | -| std | 0.869 | -| value_loss | 2.53e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1193 | -| time_elapsed | 22640 | -| total_timesteps | 152704 | -| train/ | | -| approx_kl | 0.00216256 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -7.49 | -| learning_rate | 0.0003 | -| loss | 0.00118 | -| n_updates | 11920 | -| policy_gradient_loss | 0.000769 | -| std | 0.869 | -| value_loss | 1.18e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1194 | -| time_elapsed | 22645 | -| total_timesteps | 152832 | -| train/ | | -| approx_kl | 2.905773e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -9.78 | -| learning_rate | 0.0003 | -| loss | -0.000103 | -| n_updates | 11930 | -| policy_gradient_loss | 2.84e-06 | -| std | 0.868 | -| value_loss | 2.64e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 6 | -| iterations | 1195 | -| time_elapsed | 22649 | -| total_timesteps | 152960 | -| train/ | | -| approx_kl | 0.00051466515 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 11940 | -| policy_gradient_loss | -0.000641 | -| std | 0.866 | -| value_loss | 5.4e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1196 | -| time_elapsed | 22653 | -| total_timesteps | 153088 | -| train/ | | -| approx_kl | 0.0023615058 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 11950 | -| policy_gradient_loss | -0.00106 | -| std | 0.867 | -| value_loss | 1.89e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1197 | -| time_elapsed | 22660 | -| total_timesteps | 153216 | -| train/ | | -| approx_kl | 0.0008641109 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 11960 | -| policy_gradient_loss | -6.82e-05 | -| std | 0.869 | -| value_loss | 0.000235 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1198 | -| time_elapsed | 22664 | -| total_timesteps | 153344 | -| train/ | | -| approx_kl | 0.000705556 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -4.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.000981 | -| n_updates | 11970 | -| policy_gradient_loss | -0.000443 | -| std | 0.87 | -| value_loss | 2.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1199 | -| time_elapsed | 22667 | -| total_timesteps | 153472 | -| train/ | | -| approx_kl | 0.004060399 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -3.87e+03 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 11980 | -| policy_gradient_loss | -0.00617 | -| std | 0.871 | -| value_loss | 5.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1200 | -| time_elapsed | 22671 | -| total_timesteps | 153600 | -| train/ | | -| approx_kl | 0.008102403 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -104 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 11990 | -| policy_gradient_loss | -0.00399 | -| std | 0.872 | -| value_loss | 8.2e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1201 | -| time_elapsed | 22677 | -| total_timesteps | 153728 | -| train/ | | -| approx_kl | 5.39436e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 12000 | -| policy_gradient_loss | 0.00213 | -| std | 0.871 | -| value_loss | 4.33e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1202 | -| time_elapsed | 22681 | -| total_timesteps | 153856 | -| train/ | | -| approx_kl | 1.9494444e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | 0.000248 | -| n_updates | 12010 | -| policy_gradient_loss | 0.000428 | -| std | 0.871 | -| value_loss | 4.48e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 6 | -| iterations | 1203 | -| time_elapsed | 22686 | -| total_timesteps | 153984 | -| train/ | | -| approx_kl | 0.00061906455 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 12020 | -| policy_gradient_loss | -0.000559 | -| std | 0.871 | -| value_loss | 2.11e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1204 | -| time_elapsed | 22690 | -| total_timesteps | 154112 | -| train/ | | -| approx_kl | 5.9744343e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.00815 | -| learning_rate | 0.0003 | -| loss | 5.98e-05 | -| n_updates | 12030 | -| policy_gradient_loss | 0.000499 | -| std | 0.87 | -| value_loss | 1.81e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1205 | -| time_elapsed | 22701 | -| total_timesteps | 154240 | -| train/ | | -| approx_kl | 0.0017640288 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.844 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 12040 | -| policy_gradient_loss | -0.00126 | -| std | 0.87 | -| value_loss | 0.000367 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1206 | -| time_elapsed | 22705 | -| total_timesteps | 154368 | -| train/ | | -| approx_kl | 0.00025374768 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -7.74e+03 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 12050 | -| policy_gradient_loss | -5.83e-05 | -| std | 0.871 | -| value_loss | 4.63e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1207 | -| time_elapsed | 22709 | -| total_timesteps | 154496 | -| train/ | | -| approx_kl | 0.004141363 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -668 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 12060 | -| policy_gradient_loss | -0.00187 | -| std | 0.87 | -| value_loss | 1.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1208 | -| time_elapsed | 22713 | -| total_timesteps | 154624 | -| train/ | | -| approx_kl | 9.330455e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -17.7 | -| learning_rate | 0.0003 | -| loss | -2.97e-05 | -| n_updates | 12070 | -| policy_gradient_loss | 0.000506 | -| std | 0.868 | -| value_loss | 3.26e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1209 | -| time_elapsed | 22716 | -| total_timesteps | 154752 | -| train/ | | -| approx_kl | 0.0048833694 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 12080 | -| policy_gradient_loss | -0.00349 | -| std | 0.868 | -| value_loss | 9.34e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 6 | -| iterations | 1210 | -| time_elapsed | 22720 | -| total_timesteps | 154880 | -| train/ | | -| approx_kl | 7.5892545e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.291 | -| learning_rate | 0.0003 | -| loss | 0.000659 | -| n_updates | 12090 | -| policy_gradient_loss | 0.000717 | -| std | 0.869 | -| value_loss | 6.47e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1211 | -| time_elapsed | 22724 | -| total_timesteps | 155008 | -| train/ | | -| approx_kl | 0.0033305706 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.00745 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 12100 | -| policy_gradient_loss | -0.00307 | -| std | 0.869 | -| value_loss | 4.67e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1212 | -| time_elapsed | 22736 | -| total_timesteps | 155136 | -| train/ | | -| approx_kl | 0.0001657498 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 12110 | -| policy_gradient_loss | 0.00114 | -| std | 0.87 | -| value_loss | 1.95e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1213 | -| time_elapsed | 22742 | -| total_timesteps | 155264 | -| train/ | | -| approx_kl | 1.6198494e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -17.1 | -| learning_rate | 0.0003 | -| loss | -0.000311 | -| n_updates | 12120 | -| policy_gradient_loss | 7.93e-05 | -| std | 0.871 | -| value_loss | 6.17e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1214 | -| time_elapsed | 22747 | -| total_timesteps | 155392 | -| train/ | | -| approx_kl | 0.0005883989 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -6.82 | -| learning_rate | 0.0003 | -| loss | -0.00624 | -| n_updates | 12130 | -| policy_gradient_loss | -0.00166 | -| std | 0.871 | -| value_loss | 2.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1215 | -| time_elapsed | 22752 | -| total_timesteps | 155520 | -| train/ | | -| approx_kl | 0.003278114 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 12140 | -| policy_gradient_loss | -0.00256 | -| std | 0.875 | -| value_loss | 5.8e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1216 | -| time_elapsed | 22756 | -| total_timesteps | 155648 | -| train/ | | -| approx_kl | 8.360017e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.000405 | -| n_updates | 12150 | -| policy_gradient_loss | 0.00159 | -| std | 0.878 | -| value_loss | 5.47e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1217 | -| time_elapsed | 22760 | -| total_timesteps | 155776 | -| train/ | | -| approx_kl | 0.0011364664 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | -0.000624 | -| n_updates | 12160 | -| policy_gradient_loss | -0.000325 | -| std | 0.879 | -| value_loss | 5.96e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 6 | -| iterations | 1218 | -| time_elapsed | 22764 | -| total_timesteps | 155904 | -| train/ | | -| approx_kl | 0.00011061318 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.0005 | -| learning_rate | 0.0003 | -| loss | -0.000762 | -| n_updates | 12170 | -| policy_gradient_loss | -8.05e-05 | -| std | 0.879 | -| value_loss | 2.99e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1219 | -| time_elapsed | 22769 | -| total_timesteps | 156032 | -| train/ | | -| approx_kl | 0.00045065535 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00472 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 12180 | -| policy_gradient_loss | -0.00128 | -| std | 0.877 | -| value_loss | 3.28e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1220 | -| time_elapsed | 22777 | -| total_timesteps | 156160 | -| train/ | | -| approx_kl | 0.0039538676 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 12190 | -| policy_gradient_loss | -0.00326 | -| std | 0.876 | -| value_loss | 0.000961 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1221 | -| time_elapsed | 22781 | -| total_timesteps | 156288 | -| train/ | | -| approx_kl | 7.28704e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -9.65e+03 | -| learning_rate | 0.0003 | -| loss | 0.000763 | -| n_updates | 12200 | -| policy_gradient_loss | 0.00103 | -| std | 0.875 | -| value_loss | 8.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1222 | -| time_elapsed | 22786 | -| total_timesteps | 156416 | -| train/ | | -| approx_kl | 0.003946145 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.92e+03 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 12210 | -| policy_gradient_loss | -0.00348 | -| std | 0.873 | -| value_loss | 2.19e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1223 | -| time_elapsed | 22790 | -| total_timesteps | 156544 | -| train/ | | -| approx_kl | 6.671669e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -1.82e+03 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 12220 | -| policy_gradient_loss | 0.00184 | -| std | 0.873 | -| value_loss | 1.99e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1224 | -| time_elapsed | 22795 | -| total_timesteps | 156672 | -| train/ | | -| approx_kl | 0.0017572884 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 12230 | -| policy_gradient_loss | -0.000869 | -| std | 0.873 | -| value_loss | 1.06e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1225 | -| time_elapsed | 22799 | -| total_timesteps | 156800 | -| train/ | | -| approx_kl | 0.0036140215 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 12240 | -| policy_gradient_loss | -0.00224 | -| std | 0.876 | -| value_loss | 3.69e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1226 | -| time_elapsed | 22802 | -| total_timesteps | 156928 | -| train/ | | -| approx_kl | 0.00025083404 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | 0.000903 | -| n_updates | 12250 | -| policy_gradient_loss | 0.000686 | -| std | 0.878 | -| value_loss | 1.33e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1227 | -| time_elapsed | 22806 | -| total_timesteps | 157056 | -| train/ | | -| approx_kl | 0.0008181846 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00256 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 12260 | -| policy_gradient_loss | -0.000803 | -| std | 0.88 | -| value_loss | 5.05e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1228 | -| time_elapsed | 22811 | -| total_timesteps | 157184 | -| train/ | | -| approx_kl | 2.682861e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | 0.00025 | -| n_updates | 12270 | -| policy_gradient_loss | 0.000323 | -| std | 0.882 | -| value_loss | 3.94e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1229 | -| time_elapsed | 22814 | -| total_timesteps | 157312 | -| train/ | | -| approx_kl | 0.0015337868 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 12280 | -| policy_gradient_loss | -0.00126 | -| std | 0.883 | -| value_loss | 9.89e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1230 | -| time_elapsed | 22819 | -| total_timesteps | 157440 | -| train/ | | -| approx_kl | 0.0016878336 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -6.76 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 12290 | -| policy_gradient_loss | -0.000593 | -| std | 0.884 | -| value_loss | 3.41e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1231 | -| time_elapsed | 22824 | -| total_timesteps | 157568 | -| train/ | | -| approx_kl | 0.0021093325 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -2.44 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 12300 | -| policy_gradient_loss | -0.00187 | -| std | 0.884 | -| value_loss | 8.02e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1232 | -| time_elapsed | 22828 | -| total_timesteps | 157696 | -| train/ | | -| approx_kl | 2.551172e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | -0.000946 | -| n_updates | 12310 | -| policy_gradient_loss | 0.000962 | -| std | 0.884 | -| value_loss | 5.17e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1233 | -| time_elapsed | 22832 | -| total_timesteps | 157824 | -| train/ | | -| approx_kl | 0.0013974993 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 12320 | -| policy_gradient_loss | -0.000628 | -| std | 0.882 | -| value_loss | 1.95e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 6 | -| iterations | 1234 | -| time_elapsed | 22837 | -| total_timesteps | 157952 | -| train/ | | -| approx_kl | 0.0032834508 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 12330 | -| policy_gradient_loss | -0.00353 | -| std | 0.883 | -| value_loss | 1.34e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1235 | -| time_elapsed | 22840 | -| total_timesteps | 158080 | -| train/ | | -| approx_kl | 0.008743364 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 12340 | -| policy_gradient_loss | -0.00706 | -| std | 0.885 | -| value_loss | 1.22e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1236 | -| time_elapsed | 22848 | -| total_timesteps | 158208 | -| train/ | | -| approx_kl | 0.00083148666 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.626 | -| learning_rate | 0.0003 | -| loss | -0.000796 | -| n_updates | 12350 | -| policy_gradient_loss | -0.000445 | -| std | 0.886 | -| value_loss | 0.00424 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1237 | -| time_elapsed | 22852 | -| total_timesteps | 158336 | -| train/ | | -| approx_kl | 0.0021638786 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -636 | -| learning_rate | 0.0003 | -| loss | -0.00631 | -| n_updates | 12360 | -| policy_gradient_loss | -0.00236 | -| std | 0.887 | -| value_loss | 4.58e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1238 | -| time_elapsed | 22856 | -| total_timesteps | 158464 | -| train/ | | -| approx_kl | 1.4528632e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -717 | -| learning_rate | 0.0003 | -| loss | -0.000218 | -| n_updates | 12370 | -| policy_gradient_loss | 0.00101 | -| std | 0.886 | -| value_loss | 1.57e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1239 | -| time_elapsed | 22860 | -| total_timesteps | 158592 | -| train/ | | -| approx_kl | 4.6190806e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.06e+03 | -| learning_rate | 0.0003 | -| loss | 0.000414 | -| n_updates | 12380 | -| policy_gradient_loss | 0.000497 | -| std | 0.885 | -| value_loss | 6.4e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1240 | -| time_elapsed | 22864 | -| total_timesteps | 158720 | -| train/ | | -| approx_kl | 0.0009688218 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -48.1 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 12390 | -| policy_gradient_loss | -0.00111 | -| std | 0.886 | -| value_loss | 1.21e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1241 | -| time_elapsed | 22867 | -| total_timesteps | 158848 | -| train/ | | -| approx_kl | 0.0022793482 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -224 | -| learning_rate | 0.0003 | -| loss | -0.000947 | -| n_updates | 12400 | -| policy_gradient_loss | -0.000531 | -| std | 0.884 | -| value_loss | 2.09e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 6 | -| iterations | 1242 | -| time_elapsed | 22870 | -| total_timesteps | 158976 | -| train/ | | -| approx_kl | 0.0014254316 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.884 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 12410 | -| policy_gradient_loss | -0.000701 | -| std | 0.884 | -| value_loss | 6.91e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1243 | -| time_elapsed | 22874 | -| total_timesteps | 159104 | -| train/ | | -| approx_kl | 0.0006495081 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.429 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 12420 | -| policy_gradient_loss | -0.00146 | -| std | 0.885 | -| value_loss | 5.57e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1244 | -| time_elapsed | 22883 | -| total_timesteps | 159232 | -| train/ | | -| approx_kl | 0.00019997498 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.00738 | -| n_updates | 12430 | -| policy_gradient_loss | -0.0023 | -| std | 0.884 | -| value_loss | 8.21e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1245 | -| time_elapsed | 22887 | -| total_timesteps | 159360 | -| train/ | | -| approx_kl | 0.001016594 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -3.16e+03 | -| learning_rate | 0.0003 | -| loss | -0.00039 | -| n_updates | 12440 | -| policy_gradient_loss | -0.000146 | -| std | 0.885 | -| value_loss | 7.78e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1246 | -| time_elapsed | 22891 | -| total_timesteps | 159488 | -| train/ | | -| approx_kl | 0.0014529238 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -997 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 12450 | -| policy_gradient_loss | -0.00125 | -| std | 0.886 | -| value_loss | 1.7e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1247 | -| time_elapsed | 22895 | -| total_timesteps | 159616 | -| train/ | | -| approx_kl | 0.0012683948 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.000208 | -| n_updates | 12460 | -| policy_gradient_loss | 1.16e-05 | -| std | 0.889 | -| value_loss | 1.92e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1248 | -| time_elapsed | 22900 | -| total_timesteps | 159744 | -| train/ | | -| approx_kl | 0.00076326355 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -6.25 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 12470 | -| policy_gradient_loss | -0.000842 | -| std | 0.891 | -| value_loss | 2.9e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 6 | -| iterations | 1249 | -| time_elapsed | 22902 | -| total_timesteps | 159872 | -| train/ | | -| approx_kl | 0.005500047 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 12480 | -| policy_gradient_loss | -0.00198 | -| std | 0.891 | -| value_loss | 2.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 6 | -| iterations | 1250 | -| time_elapsed | 22906 | -| total_timesteps | 160000 | -| train/ | | -| approx_kl | 0.011851164 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00885 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 12490 | -| policy_gradient_loss | -0.00211 | -| std | 0.891 | -| value_loss | 2.23e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 6 | -| iterations | 1251 | -| time_elapsed | 22911 | -| total_timesteps | 160128 | -| train/ | | -| approx_kl | 0.0048115067 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.000307 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 12500 | -| policy_gradient_loss | -0.00181 | -| std | 0.89 | -| value_loss | 3.23e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 6 | -| iterations | 1252 | -| time_elapsed | 22919 | -| total_timesteps | 160256 | -| train/ | | -| approx_kl | 0.0006535086 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.843 | -| learning_rate | 0.0003 | -| loss | 0.000124 | -| n_updates | 12510 | -| policy_gradient_loss | -0.000282 | -| std | 0.888 | -| value_loss | 0.00202 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 6 | -| iterations | 1253 | -| time_elapsed | 22924 | -| total_timesteps | 160384 | -| train/ | | -| approx_kl | 0.0015923213 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -2.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 12520 | -| policy_gradient_loss | -0.00271 | -| std | 0.886 | -| value_loss | 5.27e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1254 | -| time_elapsed | 22927 | -| total_timesteps | 160512 | -| train/ | | -| approx_kl | 9.801239e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -9.26e+03 | -| learning_rate | 0.0003 | -| loss | -0.000997 | -| n_updates | 12530 | -| policy_gradient_loss | 0.00184 | -| std | 0.884 | -| value_loss | 1.45e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1255 | -| time_elapsed | 22930 | -| total_timesteps | 160640 | -| train/ | | -| approx_kl | 0.00035964698 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -95.9 | -| learning_rate | 0.0003 | -| loss | 0.000706 | -| n_updates | 12540 | -| policy_gradient_loss | 0.000528 | -| std | 0.883 | -| value_loss | 7.38e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1256 | -| time_elapsed | 22934 | -| total_timesteps | 160768 | -| train/ | | -| approx_kl | 5.9715007e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -37.8 | -| learning_rate | 0.0003 | -| loss | -0.000118 | -| n_updates | 12550 | -| policy_gradient_loss | -4.66e-05 | -| std | 0.883 | -| value_loss | 3.74e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1257 | -| time_elapsed | 22937 | -| total_timesteps | 160896 | -| train/ | | -| approx_kl | 0.0024659783 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.00658 | -| n_updates | 12560 | -| policy_gradient_loss | -0.00259 | -| std | 0.884 | -| value_loss | 4.25e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1258 | -| time_elapsed | 22941 | -| total_timesteps | 161024 | -| train/ | | -| approx_kl | 0.004451482 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.773 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 12570 | -| policy_gradient_loss | -0.00107 | -| std | 0.887 | -| value_loss | 7.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1259 | -| time_elapsed | 22950 | -| total_timesteps | 161152 | -| train/ | | -| approx_kl | 0.027027454 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 12580 | -| policy_gradient_loss | -0.0121 | -| std | 0.889 | -| value_loss | 0.00555 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1260 | -| time_elapsed | 22955 | -| total_timesteps | 161280 | -| train/ | | -| approx_kl | 0.01155613 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -2.2e+03 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 12590 | -| policy_gradient_loss | -0.0026 | -| std | 0.89 | -| value_loss | 0.000106 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1261 | -| time_elapsed | 22960 | -| total_timesteps | 161408 | -| train/ | | -| approx_kl | 0.0019385582 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -961 | -| learning_rate | 0.0003 | -| loss | 1.01e-05 | -| n_updates | 12600 | -| policy_gradient_loss | 9.51e-06 | -| std | 0.888 | -| value_loss | 1.62e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1262 | -| time_elapsed | 22965 | -| total_timesteps | 161536 | -| train/ | | -| approx_kl | 0.000658236 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -5.17 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 12610 | -| policy_gradient_loss | -0.000608 | -| std | 0.885 | -| value_loss | 2.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1263 | -| time_elapsed | 22969 | -| total_timesteps | 161664 | -| train/ | | -| approx_kl | 0.002473421 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.398 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 12620 | -| policy_gradient_loss | -0.00239 | -| std | 0.88 | -| value_loss | 8.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1264 | -| time_elapsed | 22974 | -| total_timesteps | 161792 | -| train/ | | -| approx_kl | 0.008808354 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | -0.00527 | -| n_updates | 12630 | -| policy_gradient_loss | -0.00389 | -| std | 0.877 | -| value_loss | 5.64e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 7 | -| iterations | 1265 | -| time_elapsed | 22979 | -| total_timesteps | 161920 | -| train/ | | -| approx_kl | 0.008550532 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00229 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 12640 | -| policy_gradient_loss | -0.00322 | -| std | 0.876 | -| value_loss | 3.7e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1266 | -| time_elapsed | 22983 | -| total_timesteps | 162048 | -| train/ | | -| approx_kl | 0.0007483326 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00198 | -| learning_rate | 0.0003 | -| loss | 0.000326 | -| n_updates | 12650 | -| policy_gradient_loss | 0.00021 | -| std | 0.877 | -| value_loss | 2.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1267 | -| time_elapsed | 22991 | -| total_timesteps | 162176 | -| train/ | | -| approx_kl | 0.006457116 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.761 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 12660 | -| policy_gradient_loss | -0.0174 | -| std | 0.877 | -| value_loss | 0.00228 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1268 | -| time_elapsed | 22995 | -| total_timesteps | 162304 | -| train/ | | -| approx_kl | 0.0023889667 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.89e+03 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 12670 | -| policy_gradient_loss | -0.00166 | -| std | 0.877 | -| value_loss | 1.33e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1269 | -| time_elapsed | 23000 | -| total_timesteps | 162432 | -| train/ | | -| approx_kl | 0.0008145729 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.99e+03 | -| learning_rate | 0.0003 | -| loss | 0.000933 | -| n_updates | 12680 | -| policy_gradient_loss | 0.00073 | -| std | 0.879 | -| value_loss | 3.85e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1270 | -| time_elapsed | 23004 | -| total_timesteps | 162560 | -| train/ | | -| approx_kl | 0.00044530956 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -16.8 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 12690 | -| policy_gradient_loss | -0.000463 | -| std | 0.881 | -| value_loss | 1.01e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1271 | -| time_elapsed | 23009 | -| total_timesteps | 162688 | -| train/ | | -| approx_kl | 0.0011025779 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | -0.00591 | -| n_updates | 12700 | -| policy_gradient_loss | -0.00148 | -| std | 0.883 | -| value_loss | 5.81e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1272 | -| time_elapsed | 23012 | -| total_timesteps | 162816 | -| train/ | | -| approx_kl | 0.012149632 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.894 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 12710 | -| policy_gradient_loss | -0.00551 | -| std | 0.884 | -| value_loss | 3.19e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1273 | -| time_elapsed | 23016 | -| total_timesteps | 162944 | -| train/ | | -| approx_kl | 0.0013261023 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | -0.00729 | -| n_updates | 12720 | -| policy_gradient_loss | -0.00172 | -| std | 0.882 | -| value_loss | 9.97e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1274 | -| time_elapsed | 23019 | -| total_timesteps | 163072 | -| train/ | | -| approx_kl | 0.011550938 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 12730 | -| policy_gradient_loss | -0.00831 | -| std | 0.88 | -| value_loss | 4.21e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1275 | -| time_elapsed | 23025 | -| total_timesteps | 163200 | -| train/ | | -| approx_kl | 0.0038697342 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 12740 | -| policy_gradient_loss | -0.00941 | -| std | 0.877 | -| value_loss | 0.000284 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1276 | -| time_elapsed | 23030 | -| total_timesteps | 163328 | -| train/ | | -| approx_kl | 0.0027001644 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -220 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 12750 | -| policy_gradient_loss | -0.00148 | -| std | 0.877 | -| value_loss | 4.01e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1277 | -| time_elapsed | 23034 | -| total_timesteps | 163456 | -| train/ | | -| approx_kl | 0.018154522 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -157 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 12760 | -| policy_gradient_loss | -0.00545 | -| std | 0.877 | -| value_loss | 1.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1278 | -| time_elapsed | 23037 | -| total_timesteps | 163584 | -| train/ | | -| approx_kl | 0.02076505 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 12770 | -| policy_gradient_loss | -0.00427 | -| std | 0.876 | -| value_loss | 1.43e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1279 | -| time_elapsed | 23040 | -| total_timesteps | 163712 | -| train/ | | -| approx_kl | 0.0083938185 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 12780 | -| policy_gradient_loss | -0.0033 | -| std | 0.875 | -| value_loss | 1.26e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1280 | -| time_elapsed | 23044 | -| total_timesteps | 163840 | -| train/ | | -| approx_kl | 3.4406316e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.395 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 12790 | -| policy_gradient_loss | 0.00275 | -| std | 0.875 | -| value_loss | 1.35e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 7 | -| iterations | 1281 | -| time_elapsed | 23048 | -| total_timesteps | 163968 | -| train/ | | -| approx_kl | 0.017359536 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 12800 | -| policy_gradient_loss | -0.00998 | -| std | 0.875 | -| value_loss | 4.6e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1282 | -| time_elapsed | 23052 | -| total_timesteps | 164096 | -| train/ | | -| approx_kl | 0.02247686 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 12810 | -| policy_gradient_loss | -0.00831 | -| std | 0.876 | -| value_loss | 7.91e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1283 | -| time_elapsed | 23061 | -| total_timesteps | 164224 | -| train/ | | -| approx_kl | 0.0017104074 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.549 | -| learning_rate | 0.0003 | -| loss | 0.00028 | -| n_updates | 12820 | -| policy_gradient_loss | 4.88e-05 | -| std | 0.878 | -| value_loss | 0.000765 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1284 | -| time_elapsed | 23064 | -| total_timesteps | 164352 | -| train/ | | -| approx_kl | 0.012232726 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -3.17e+03 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 12830 | -| policy_gradient_loss | -0.00665 | -| std | 0.879 | -| value_loss | 8.77e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1285 | -| time_elapsed | 23068 | -| total_timesteps | 164480 | -| train/ | | -| approx_kl | 0.00022705598 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -3.63e+04 | -| learning_rate | 0.0003 | -| loss | 0.00082 | -| n_updates | 12840 | -| policy_gradient_loss | 0.00137 | -| std | 0.879 | -| value_loss | 2.39e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1286 | -| time_elapsed | 23073 | -| total_timesteps | 164608 | -| train/ | | -| approx_kl | 0.0039286106 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -4.88e+03 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 12850 | -| policy_gradient_loss | -0.00131 | -| std | 0.878 | -| value_loss | 6.31e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1287 | -| time_elapsed | 23078 | -| total_timesteps | 164736 | -| train/ | | -| approx_kl | 0.043816887 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.27e+03 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 12860 | -| policy_gradient_loss | -0.0104 | -| std | 0.877 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1288 | -| time_elapsed | 23081 | -| total_timesteps | 164864 | -| train/ | | -| approx_kl | 0.025169253 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 12870 | -| policy_gradient_loss | -0.00311 | -| std | 0.877 | -| value_loss | 4.42e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 7 | -| iterations | 1289 | -| time_elapsed | 23085 | -| total_timesteps | 164992 | -| train/ | | -| approx_kl | 0.0060306005 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 12880 | -| policy_gradient_loss | -0.00127 | -| std | 0.875 | -| value_loss | 8.29e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1290 | -| time_elapsed | 23089 | -| total_timesteps | 165120 | -| train/ | | -| approx_kl | 0.012607065 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0621 | -| learning_rate | 0.0003 | -| loss | -0.00985 | -| n_updates | 12890 | -| policy_gradient_loss | -0.00511 | -| std | 0.874 | -| value_loss | 6.43e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1291 | -| time_elapsed | 23099 | -| total_timesteps | 165248 | -| train/ | | -| approx_kl | 0.00089913094 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.58 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 12900 | -| policy_gradient_loss | -0.00292 | -| std | 0.874 | -| value_loss | 0.00845 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1292 | -| time_elapsed | 23103 | -| total_timesteps | 165376 | -| train/ | | -| approx_kl | 0.04228582 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -2.69e+03 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 12910 | -| policy_gradient_loss | -0.00568 | -| std | 0.874 | -| value_loss | 0.000105 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1293 | -| time_elapsed | 23107 | -| total_timesteps | 165504 | -| train/ | | -| approx_kl | 0.0028034928 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -778 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 12920 | -| policy_gradient_loss | 0.000516 | -| std | 0.875 | -| value_loss | 2.39e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1294 | -| time_elapsed | 23109 | -| total_timesteps | 165632 | -| train/ | | -| approx_kl | 0.001647152 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -7.57 | -| learning_rate | 0.0003 | -| loss | -0.00666 | -| n_updates | 12930 | -| policy_gradient_loss | 0.000164 | -| std | 0.875 | -| value_loss | 1.59e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1295 | -| time_elapsed | 23113 | -| total_timesteps | 165760 | -| train/ | | -| approx_kl | 0.0025829067 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | 0.00183 | -| n_updates | 12940 | -| policy_gradient_loss | 0.00135 | -| std | 0.875 | -| value_loss | 4.34e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 7 | -| iterations | 1296 | -| time_elapsed | 23116 | -| total_timesteps | 165888 | -| train/ | | -| approx_kl | 0.0019201147 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 12950 | -| policy_gradient_loss | -0.000669 | -| std | 0.877 | -| value_loss | 2.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1297 | -| time_elapsed | 23119 | -| total_timesteps | 166016 | -| train/ | | -| approx_kl | 0.033836953 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 12960 | -| policy_gradient_loss | -0.0143 | -| std | 0.879 | -| value_loss | 1.19e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1298 | -| time_elapsed | 23128 | -| total_timesteps | 166144 | -| train/ | | -| approx_kl | 0.00027361512 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 12970 | -| policy_gradient_loss | -0.00135 | -| std | 0.882 | -| value_loss | 0.000641 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1299 | -| time_elapsed | 23132 | -| total_timesteps | 166272 | -| train/ | | -| approx_kl | 0.005720603 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -230 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 12980 | -| policy_gradient_loss | -0.00122 | -| std | 0.882 | -| value_loss | 1.16e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1300 | -| time_elapsed | 23136 | -| total_timesteps | 166400 | -| train/ | | -| approx_kl | 0.009115989 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -226 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 12990 | -| policy_gradient_loss | -0.00351 | -| std | 0.882 | -| value_loss | 1.63e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1301 | -| time_elapsed | 23140 | -| total_timesteps | 166528 | -| train/ | | -| approx_kl | 2.4489593e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.000926 | -| n_updates | 13000 | -| policy_gradient_loss | 0.00334 | -| std | 0.88 | -| value_loss | 7.58e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1302 | -| time_elapsed | 23144 | -| total_timesteps | 166656 | -| train/ | | -| approx_kl | 0.001998058 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 13010 | -| policy_gradient_loss | -0.000915 | -| std | 0.878 | -| value_loss | 5.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1303 | -| time_elapsed | 23149 | -| total_timesteps | 166784 | -| train/ | | -| approx_kl | 0.0064876713 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.000353 | -| n_updates | 13020 | -| policy_gradient_loss | -0.000289 | -| std | 0.876 | -| value_loss | 3.77e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 7 | -| iterations | 1304 | -| time_elapsed | 23153 | -| total_timesteps | 166912 | -| train/ | | -| approx_kl | 0.00059399195 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.000314 | -| n_updates | 13030 | -| policy_gradient_loss | -0.000133 | -| std | 0.877 | -| value_loss | 1.74e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1305 | -| time_elapsed | 23157 | -| total_timesteps | 167040 | -| train/ | | -| approx_kl | 0.0061271815 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 13040 | -| policy_gradient_loss | -0.00332 | -| std | 0.878 | -| value_loss | 6.57e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1306 | -| time_elapsed | 23164 | -| total_timesteps | 167168 | -| train/ | | -| approx_kl | 0.00829909 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 13050 | -| policy_gradient_loss | -0.00348 | -| std | 0.878 | -| value_loss | 0.00154 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1307 | -| time_elapsed | 23169 | -| total_timesteps | 167296 | -| train/ | | -| approx_kl | 0.0010761968 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -9.5 | -| learning_rate | 0.0003 | -| loss | -0.00431 | -| n_updates | 13060 | -| policy_gradient_loss | -0.00034 | -| std | 0.88 | -| value_loss | 1.98e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1308 | -| time_elapsed | 23173 | -| total_timesteps | 167424 | -| train/ | | -| approx_kl | 0.00031191343 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -12.1 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 13070 | -| policy_gradient_loss | 0.00108 | -| std | 0.88 | -| value_loss | 8.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1309 | -| time_elapsed | 23176 | -| total_timesteps | 167552 | -| train/ | | -| approx_kl | 0.008301677 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 13080 | -| policy_gradient_loss | -0.00124 | -| std | 0.881 | -| value_loss | 3.18e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1310 | -| time_elapsed | 23180 | -| total_timesteps | 167680 | -| train/ | | -| approx_kl | 0.0032069245 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.537 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 13090 | -| policy_gradient_loss | -0.00092 | -| std | 0.88 | -| value_loss | 7.11e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1311 | -| time_elapsed | 23184 | -| total_timesteps | 167808 | -| train/ | | -| approx_kl | 0.003825659 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | -0.00696 | -| n_updates | 13100 | -| policy_gradient_loss | -0.00205 | -| std | 0.878 | -| value_loss | 2.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 7 | -| iterations | 1312 | -| time_elapsed | 23189 | -| total_timesteps | 167936 | -| train/ | | -| approx_kl | 0.004024903 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.000579 | -| n_updates | 13110 | -| policy_gradient_loss | 0.000328 | -| std | 0.876 | -| value_loss | 2.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1313 | -| time_elapsed | 23193 | -| total_timesteps | 168064 | -| train/ | | -| approx_kl | 0.0063917562 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00541 | -| n_updates | 13120 | -| policy_gradient_loss | -0.00265 | -| std | 0.872 | -| value_loss | 4.23e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1314 | -| time_elapsed | 23200 | -| total_timesteps | 168192 | -| train/ | | -| approx_kl | 0.00059071183 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.632 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 13130 | -| policy_gradient_loss | -0.00315 | -| std | 0.872 | -| value_loss | 0.00977 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1315 | -| time_elapsed | 23203 | -| total_timesteps | 168320 | -| train/ | | -| approx_kl | 0.0013819672 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -462 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 13140 | -| policy_gradient_loss | -0.000925 | -| std | 0.873 | -| value_loss | 0.000328 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1316 | -| time_elapsed | 23207 | -| total_timesteps | 168448 | -| train/ | | -| approx_kl | 0.0010728859 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -441 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 13150 | -| policy_gradient_loss | 6.62e-05 | -| std | 0.875 | -| value_loss | 4.17e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1317 | -| time_elapsed | 23210 | -| total_timesteps | 168576 | -| train/ | | -| approx_kl | 0.008223861 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.11e+03 | -| learning_rate | 0.0003 | -| loss | -0.000927 | -| n_updates | 13160 | -| policy_gradient_loss | -0.000687 | -| std | 0.875 | -| value_loss | 4.99e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1318 | -| time_elapsed | 23213 | -| total_timesteps | 168704 | -| train/ | | -| approx_kl | 0.00033131195 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -27.3 | -| learning_rate | 0.0003 | -| loss | -0.000745 | -| n_updates | 13170 | -| policy_gradient_loss | -7.75e-05 | -| std | 0.874 | -| value_loss | 1.16e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1319 | -| time_elapsed | 23217 | -| total_timesteps | 168832 | -| train/ | | -| approx_kl | 0.0016625058 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -50.5 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 13180 | -| policy_gradient_loss | -0.000452 | -| std | 0.874 | -| value_loss | 3.97e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 7 | -| iterations | 1320 | -| time_elapsed | 23222 | -| total_timesteps | 168960 | -| train/ | | -| approx_kl | 0.0038938122 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.25 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 13190 | -| policy_gradient_loss | -0.00456 | -| std | 0.876 | -| value_loss | 9.2e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1321 | -| time_elapsed | 23226 | -| total_timesteps | 169088 | -| train/ | | -| approx_kl | 0.013907355 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -2.79 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 13200 | -| policy_gradient_loss | -0.00925 | -| std | 0.877 | -| value_loss | 4.34e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1322 | -| time_elapsed | 23234 | -| total_timesteps | 169216 | -| train/ | | -| approx_kl | 0.0020392379 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 13210 | -| policy_gradient_loss | -0.00623 | -| std | 0.878 | -| value_loss | 0.00193 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1323 | -| time_elapsed | 23238 | -| total_timesteps | 169344 | -| train/ | | -| approx_kl | 0.0033019208 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -1.39e+03 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 13220 | -| policy_gradient_loss | -0.00168 | -| std | 0.879 | -| value_loss | 2.65e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1324 | -| time_elapsed | 23243 | -| total_timesteps | 169472 | -| train/ | | -| approx_kl | 0.023724617 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -674 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 13230 | -| policy_gradient_loss | -0.00793 | -| std | 0.879 | -| value_loss | 9.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1325 | -| time_elapsed | 23247 | -| total_timesteps | 169600 | -| train/ | | -| approx_kl | 0.010585545 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -336 | -| learning_rate | 0.0003 | -| loss | 0.00088 | -| n_updates | 13240 | -| policy_gradient_loss | 0.000212 | -| std | 0.878 | -| value_loss | 2.14e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1326 | -| time_elapsed | 23252 | -| total_timesteps | 169728 | -| train/ | | -| approx_kl | 0.0011480586 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -33.7 | -| learning_rate | 0.0003 | -| loss | -0.000456 | -| n_updates | 13250 | -| policy_gradient_loss | -0.000198 | -| std | 0.877 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1327 | -| time_elapsed | 23256 | -| total_timesteps | 169856 | -| train/ | | -| approx_kl | 0.005119481 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -634 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 13260 | -| policy_gradient_loss | -0.00396 | -| std | 0.877 | -| value_loss | 5.86e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 7 | -| iterations | 1328 | -| time_elapsed | 23261 | -| total_timesteps | 169984 | -| train/ | | -| approx_kl | 0.00011612009 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -14.2 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 13270 | -| policy_gradient_loss | 0.00141 | -| std | 0.877 | -| value_loss | 5.74e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1329 | -| time_elapsed | 23265 | -| total_timesteps | 170112 | -| train/ | | -| approx_kl | 0.019319663 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 13280 | -| policy_gradient_loss | -0.00787 | -| std | 0.877 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1330 | -| time_elapsed | 23275 | -| total_timesteps | 170240 | -| train/ | | -| approx_kl | 0.002076439 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.61 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 13290 | -| policy_gradient_loss | -0.0078 | -| std | 0.876 | -| value_loss | 0.0031 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1331 | -| time_elapsed | 23279 | -| total_timesteps | 170368 | -| train/ | | -| approx_kl | 0.0072744587 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -876 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 13300 | -| policy_gradient_loss | -0.00428 | -| std | 0.876 | -| value_loss | 0.000125 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1332 | -| time_elapsed | 23284 | -| total_timesteps | 170496 | -| train/ | | -| approx_kl | 0.00026849844 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -155 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 13310 | -| policy_gradient_loss | 0.00157 | -| std | 0.875 | -| value_loss | 1.55e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1333 | -| time_elapsed | 23287 | -| total_timesteps | 170624 | -| train/ | | -| approx_kl | 0.0011192341 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -5.8 | -| learning_rate | 0.0003 | -| loss | 0.000249 | -| n_updates | 13320 | -| policy_gradient_loss | 0.000161 | -| std | 0.874 | -| value_loss | 5.3e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1334 | -| time_elapsed | 23291 | -| total_timesteps | 170752 | -| train/ | | -| approx_kl | 0.0073743276 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -8.42 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 13330 | -| policy_gradient_loss | -0.00261 | -| std | 0.874 | -| value_loss | 1.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 7 | -| iterations | 1335 | -| time_elapsed | 23295 | -| total_timesteps | 170880 | -| train/ | | -| approx_kl | 0.019035237 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.00696 | -| n_updates | 13340 | -| policy_gradient_loss | -0.00646 | -| std | 0.874 | -| value_loss | 1.54e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1336 | -| time_elapsed | 23299 | -| total_timesteps | 171008 | -| train/ | | -| approx_kl | 1.6672537e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0966 | -| learning_rate | 0.0003 | -| loss | -0.000582 | -| n_updates | 13350 | -| policy_gradient_loss | -0.000178 | -| std | 0.877 | -| value_loss | 1.36e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1337 | -| time_elapsed | 23309 | -| total_timesteps | 171136 | -| train/ | | -| approx_kl | 0.0009363787 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -3.1 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 13360 | -| policy_gradient_loss | -0.0011 | -| std | 0.881 | -| value_loss | 0.00358 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1338 | -| time_elapsed | 23314 | -| total_timesteps | 171264 | -| train/ | | -| approx_kl | 0.003940843 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -33.1 | -| learning_rate | 0.0003 | -| loss | -0.00626 | -| n_updates | 13370 | -| policy_gradient_loss | -0.00441 | -| std | 0.884 | -| value_loss | 6.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1339 | -| time_elapsed | 23319 | -| total_timesteps | 171392 | -| train/ | | -| approx_kl | 0.009239922 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -1.62e+03 | -| learning_rate | 0.0003 | -| loss | -0.00903 | -| n_updates | 13380 | -| policy_gradient_loss | -0.0033 | -| std | 0.885 | -| value_loss | 1.12e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1340 | -| time_elapsed | 23324 | -| total_timesteps | 171520 | -| train/ | | -| approx_kl | 0.0152272675 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -873 | -| learning_rate | 0.0003 | -| loss | -0.000772 | -| n_updates | 13390 | -| policy_gradient_loss | -0.000895 | -| std | 0.884 | -| value_loss | 2.15e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1341 | -| time_elapsed | 23328 | -| total_timesteps | 171648 | -| train/ | | -| approx_kl | 3.961986e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -104 | -| learning_rate | 0.0003 | -| loss | -0.000295 | -| n_updates | 13400 | -| policy_gradient_loss | 5.17e-05 | -| std | 0.884 | -| value_loss | 3.99e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1342 | -| time_elapsed | 23331 | -| total_timesteps | 171776 | -| train/ | | -| approx_kl | 0.011635139 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -345 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 13410 | -| policy_gradient_loss | -0.00458 | -| std | 0.885 | -| value_loss | 9.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 7 | -| iterations | 1343 | -| time_elapsed | 23334 | -| total_timesteps | 171904 | -| train/ | | -| approx_kl | 0.016259097 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 13420 | -| policy_gradient_loss | -0.00365 | -| std | 0.886 | -| value_loss | 3.28e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1344 | -| time_elapsed | 23339 | -| total_timesteps | 172032 | -| train/ | | -| approx_kl | 0.012331057 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -6.11 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 13430 | -| policy_gradient_loss | -0.00417 | -| std | 0.885 | -| value_loss | 8.25e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1345 | -| time_elapsed | 23346 | -| total_timesteps | 172160 | -| train/ | | -| approx_kl | 0.0037010424 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 13440 | -| policy_gradient_loss | -0.000674 | -| std | 0.884 | -| value_loss | 0.000182 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1346 | -| time_elapsed | 23350 | -| total_timesteps | 172288 | -| train/ | | -| approx_kl | 0.011915064 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -88.8 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 13450 | -| policy_gradient_loss | -0.00504 | -| std | 0.883 | -| value_loss | 1.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1347 | -| time_elapsed | 23355 | -| total_timesteps | 172416 | -| train/ | | -| approx_kl | 0.01743337 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 13460 | -| policy_gradient_loss | -0.0092 | -| std | 0.882 | -| value_loss | 5.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1348 | -| time_elapsed | 23358 | -| total_timesteps | 172544 | -| train/ | | -| approx_kl | 0.018664492 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 13470 | -| policy_gradient_loss | -0.00607 | -| std | 0.882 | -| value_loss | 1.39e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1349 | -| time_elapsed | 23363 | -| total_timesteps | 172672 | -| train/ | | -| approx_kl | 0.00022660941 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 13480 | -| policy_gradient_loss | 0.00194 | -| std | 0.881 | -| value_loss | 3.68e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1350 | -| time_elapsed | 23367 | -| total_timesteps | 172800 | -| train/ | | -| approx_kl | 0.010261066 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00691 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 13490 | -| policy_gradient_loss | -0.00227 | -| std | 0.879 | -| value_loss | 5.13e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 7 | -| iterations | 1351 | -| time_elapsed | 23370 | -| total_timesteps | 172928 | -| train/ | | -| approx_kl | 0.0019298065 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00817 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 13500 | -| policy_gradient_loss | -0.00206 | -| std | 0.878 | -| value_loss | 4.71e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1352 | -| time_elapsed | 23374 | -| total_timesteps | 173056 | -| train/ | | -| approx_kl | 0.011672407 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00421 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 13510 | -| policy_gradient_loss | -0.00546 | -| std | 0.88 | -| value_loss | 3.15e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1353 | -| time_elapsed | 23380 | -| total_timesteps | 173184 | -| train/ | | -| approx_kl | 0.0006835791 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.901 | -| learning_rate | 0.0003 | -| loss | -0.00099 | -| n_updates | 13520 | -| policy_gradient_loss | -0.0006 | -| std | 0.88 | -| value_loss | 0.00147 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1354 | -| time_elapsed | 23385 | -| total_timesteps | 173312 | -| train/ | | -| approx_kl | 0.0010136822 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.0238 | -| learning_rate | 0.0003 | -| loss | 0.00517 | -| n_updates | 13530 | -| policy_gradient_loss | -0.000193 | -| std | 0.878 | -| value_loss | 0.0123 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1355 | -| time_elapsed | 23389 | -| total_timesteps | 173440 | -| train/ | | -| approx_kl | 0.00042518368 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.521 | -| learning_rate | 0.0003 | -| loss | -0.000647 | -| n_updates | 13540 | -| policy_gradient_loss | -0.000247 | -| std | 0.875 | -| value_loss | 0.00025 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1356 | -| time_elapsed | 23394 | -| total_timesteps | 173568 | -| train/ | | -| approx_kl | 0.0023590978 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.00144 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 13550 | -| policy_gradient_loss | -0.00228 | -| std | 0.873 | -| value_loss | 8.24e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1357 | -| time_elapsed | 23398 | -| total_timesteps | 173696 | -| train/ | | -| approx_kl | 0.0001749848 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.00233 | -| learning_rate | 0.0003 | -| loss | 0.00097 | -| n_updates | 13560 | -| policy_gradient_loss | 0.0011 | -| std | 0.873 | -| value_loss | 7.17e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1358 | -| time_elapsed | 23402 | -| total_timesteps | 173824 | -| train/ | | -| approx_kl | 0.0049282587 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.00112 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 13570 | -| policy_gradient_loss | -0.00152 | -| std | 0.875 | -| value_loss | 6.73e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1359 | -| time_elapsed | 23406 | -| total_timesteps | 173952 | -| train/ | | -| approx_kl | 0.0012327712 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0043 | -| learning_rate | 0.0003 | -| loss | 0.00026 | -| n_updates | 13580 | -| policy_gradient_loss | 0.00014 | -| std | 0.875 | -| value_loss | 7e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1360 | -| time_elapsed | 23410 | -| total_timesteps | 174080 | -| train/ | | -| approx_kl | 2.8836075e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00404 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 13590 | -| policy_gradient_loss | -0.000585 | -| std | 0.879 | -| value_loss | 6.38e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1361 | -| time_elapsed | 23417 | -| total_timesteps | 174208 | -| train/ | | -| approx_kl | 0.0012118276 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.218 | -| learning_rate | 0.0003 | -| loss | 0.00448 | -| n_updates | 13600 | -| policy_gradient_loss | -0.000865 | -| std | 0.884 | -| value_loss | 0.0132 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1362 | -| time_elapsed | 23420 | -| total_timesteps | 174336 | -| train/ | | -| approx_kl | 0.009456824 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 13610 | -| policy_gradient_loss | -0.00397 | -| std | 0.886 | -| value_loss | 7.05e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1363 | -| time_elapsed | 23425 | -| total_timesteps | 174464 | -| train/ | | -| approx_kl | 0.00022682967 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.0012 | -| learning_rate | 0.0003 | -| loss | -0.000624 | -| n_updates | 13620 | -| policy_gradient_loss | -2.72e-05 | -| std | 0.886 | -| value_loss | 5.68e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1364 | -| time_elapsed | 23429 | -| total_timesteps | 174592 | -| train/ | | -| approx_kl | 0.010644085 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.00527 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 13630 | -| policy_gradient_loss | -0.00489 | -| std | 0.885 | -| value_loss | 5.46e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1365 | -| time_elapsed | 23433 | -| total_timesteps | 174720 | -| train/ | | -| approx_kl | 0.0042812885 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00255 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 13640 | -| policy_gradient_loss | -0.00118 | -| std | 0.883 | -| value_loss | 4.56e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1366 | -| time_elapsed | 23436 | -| total_timesteps | 174848 | -| train/ | | -| approx_kl | 4.615169e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.000458 | -| learning_rate | 0.0003 | -| loss | -0.000236 | -| n_updates | 13650 | -| policy_gradient_loss | 0.00026 | -| std | 0.884 | -| value_loss | 3.75e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 7 | -| iterations | 1367 | -| time_elapsed | 23440 | -| total_timesteps | 174976 | -| train/ | | -| approx_kl | 0.0022828556 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.000983 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 13660 | -| policy_gradient_loss | -0.00125 | -| std | 0.885 | -| value_loss | 3.35e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1368 | -| time_elapsed | 23445 | -| total_timesteps | 175104 | -| train/ | | -| approx_kl | 0.012043963 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00359 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 13670 | -| policy_gradient_loss | -0.00368 | -| std | 0.885 | -| value_loss | 2.83e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1369 | -| time_elapsed | 23453 | -| total_timesteps | 175232 | -| train/ | | -| approx_kl | 0.0039372863 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.424 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 13680 | -| policy_gradient_loss | -0.0039 | -| std | 0.884 | -| value_loss | 0.00706 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1370 | -| time_elapsed | 23457 | -| total_timesteps | 175360 | -| train/ | | -| approx_kl | 0.0020382213 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | -0.00613 | -| n_updates | 13690 | -| policy_gradient_loss | -0.00201 | -| std | 0.886 | -| value_loss | 0.0015 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1371 | -| time_elapsed | 23461 | -| total_timesteps | 175488 | -| train/ | | -| approx_kl | 0.0050119604 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | 0.015 | -| learning_rate | 0.0003 | -| loss | 0.0048 | -| n_updates | 13700 | -| policy_gradient_loss | -0.000777 | -| std | 0.89 | -| value_loss | 0.0155 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1372 | -| time_elapsed | 23465 | -| total_timesteps | 175616 | -| train/ | | -| approx_kl | 0.005505239 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.0903 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 13710 | -| policy_gradient_loss | -0.00241 | -| std | 0.89 | -| value_loss | 0.00151 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1373 | -| time_elapsed | 23469 | -| total_timesteps | 175744 | -| train/ | | -| approx_kl | 0.0077392026 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.000331 | -| n_updates | 13720 | -| policy_gradient_loss | -0.00112 | -| std | 0.889 | -| value_loss | 0.000925 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 7 | -| iterations | 1374 | -| time_elapsed | 23472 | -| total_timesteps | 175872 | -| train/ | | -| approx_kl | 0.0030714073 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00636 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 13730 | -| policy_gradient_loss | -0.00145 | -| std | 0.887 | -| value_loss | 0.000247 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1375 | -| time_elapsed | 23477 | -| total_timesteps | 176000 | -| train/ | | -| approx_kl | 7.4194744e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.3 | -| explained_variance | -0.00583 | -| learning_rate | 0.0003 | -| loss | -0.000188 | -| n_updates | 13740 | -| policy_gradient_loss | 0.000325 | -| std | 0.884 | -| value_loss | 0.000202 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1376 | -| time_elapsed | 23482 | -| total_timesteps | 176128 | -| train/ | | -| approx_kl | 0.010496648 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00176 | -| learning_rate | 0.0003 | -| loss | -0.0076 | -| n_updates | 13750 | -| policy_gradient_loss | -0.00402 | -| std | 0.883 | -| value_loss | 0.000608 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1377 | -| time_elapsed | 23490 | -| total_timesteps | 176256 | -| train/ | | -| approx_kl | 0.012308001 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.175 | -| learning_rate | 0.0003 | -| loss | 0.00556 | -| n_updates | 13760 | -| policy_gradient_loss | -0.00454 | -| std | 0.883 | -| value_loss | 0.0223 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1378 | -| time_elapsed | 23494 | -| total_timesteps | 176384 | -| train/ | | -| approx_kl | 0.0029861839 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.00212 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 13770 | -| policy_gradient_loss | -0.00159 | -| std | 0.882 | -| value_loss | 0.00192 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1379 | -| time_elapsed | 23498 | -| total_timesteps | 176512 | -| train/ | | -| approx_kl | 0.00028358772 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00215 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 13780 | -| policy_gradient_loss | 0.000566 | -| std | 0.881 | -| value_loss | 0.000338 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1380 | -| time_elapsed | 23501 | -| total_timesteps | 176640 | -| train/ | | -| approx_kl | 0.013108242 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00985 | -| n_updates | 13790 | -| policy_gradient_loss | -0.00739 | -| std | 0.881 | -| value_loss | 0.000383 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1381 | -| time_elapsed | 23506 | -| total_timesteps | 176768 | -| train/ | | -| approx_kl | 8.213334e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 1.1e-05 | -| n_updates | 13800 | -| policy_gradient_loss | 0.000165 | -| std | 0.881 | -| value_loss | 0.000326 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 7 | -| iterations | 1382 | -| time_elapsed | 23510 | -| total_timesteps | 176896 | -| train/ | | -| approx_kl | 0.008024506 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 13810 | -| policy_gradient_loss | -0.00366 | -| std | 0.88 | -| value_loss | 0.000253 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1383 | -| time_elapsed | 23514 | -| total_timesteps | 177024 | -| train/ | | -| approx_kl | 0.0016744253 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 13820 | -| policy_gradient_loss | 0.000781 | -| std | 0.879 | -| value_loss | 0.000133 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1384 | -| time_elapsed | 23523 | -| total_timesteps | 177152 | -| train/ | | -| approx_kl | 0.015754085 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.362 | -| learning_rate | 0.0003 | -| loss | -0.000935 | -| n_updates | 13830 | -| policy_gradient_loss | -0.00262 | -| std | 0.879 | -| value_loss | 0.00916 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1385 | -| time_elapsed | 23527 | -| total_timesteps | 177280 | -| train/ | | -| approx_kl | 0.00527145 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | 0.00829 | -| learning_rate | 0.0003 | -| loss | 0.0803 | -| n_updates | 13840 | -| policy_gradient_loss | -0.000639 | -| std | 0.878 | -| value_loss | 0.166 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1386 | -| time_elapsed | 23532 | -| total_timesteps | 177408 | -| train/ | | -| approx_kl | 0.00047721062 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0535 | -| learning_rate | 0.0003 | -| loss | -0.000907 | -| n_updates | 13850 | -| policy_gradient_loss | -0.000337 | -| std | 0.876 | -| value_loss | 0.00123 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1387 | -| time_elapsed | 23536 | -| total_timesteps | 177536 | -| train/ | | -| approx_kl | 0.0011012051 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.29 | -| explained_variance | -0.0865 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 13860 | -| policy_gradient_loss | -0.00175 | -| std | 0.874 | -| value_loss | 0.0025 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1388 | -| time_elapsed | 23539 | -| total_timesteps | 177664 | -| train/ | | -| approx_kl | 0.01975792 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.00278 | -| learning_rate | 0.0003 | -| loss | -0.00864 | -| n_updates | 13870 | -| policy_gradient_loss | -0.00722 | -| std | 0.873 | -| value_loss | 0.000471 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1389 | -| time_elapsed | 23541 | -| total_timesteps | 177792 | -| train/ | | -| approx_kl | 0.0012491266 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.000439 | -| n_updates | 13880 | -| policy_gradient_loss | 0.000161 | -| std | 0.872 | -| value_loss | 0.000412 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 7 | -| iterations | 1390 | -| time_elapsed | 23544 | -| total_timesteps | 177920 | -| train/ | | -| approx_kl | 0.005507659 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 13890 | -| policy_gradient_loss | -0.00504 | -| std | 0.872 | -| value_loss | 0.000427 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1391 | -| time_elapsed | 23548 | -| total_timesteps | 178048 | -| train/ | | -| approx_kl | 0.0016085985 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 13900 | -| policy_gradient_loss | 0.00103 | -| std | 0.87 | -| value_loss | 0.000161 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1392 | -| time_elapsed | 23556 | -| total_timesteps | 178176 | -| train/ | | -| approx_kl | 0.006669247 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.35 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 13910 | -| policy_gradient_loss | -0.00433 | -| std | 0.868 | -| value_loss | 0.0104 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1393 | -| time_elapsed | 23561 | -| total_timesteps | 178304 | -| train/ | | -| approx_kl | 4.1360036e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 13920 | -| policy_gradient_loss | 0.00179 | -| std | 0.867 | -| value_loss | 0.166 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1394 | -| time_elapsed | 23565 | -| total_timesteps | 178432 | -| train/ | | -| approx_kl | 0.004292769 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | -0.00421 | -| learning_rate | 0.0003 | -| loss | 0.00143 | -| n_updates | 13930 | -| policy_gradient_loss | -0.000748 | -| std | 0.867 | -| value_loss | 0.00544 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1395 | -| time_elapsed | 23569 | -| total_timesteps | 178560 | -| train/ | | -| approx_kl | 0.0038745077 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.00314 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 13940 | -| policy_gradient_loss | -0.00617 | -| std | 0.868 | -| value_loss | 0.376 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1396 | -| time_elapsed | 23573 | -| total_timesteps | 178688 | -| train/ | | -| approx_kl | 3.7432183e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.28 | -| explained_variance | 0.00516 | -| learning_rate | 0.0003 | -| loss | 0.0789 | -| n_updates | 13950 | -| policy_gradient_loss | 0.00139 | -| std | 0.866 | -| value_loss | 0.168 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1397 | -| time_elapsed | 23577 | -| total_timesteps | 178816 | -| train/ | | -| approx_kl | 0.004194076 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00149 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 13960 | -| policy_gradient_loss | -0.00103 | -| std | 0.864 | -| value_loss | 0.0113 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 7 | -| iterations | 1398 | -| time_elapsed | 23580 | -| total_timesteps | 178944 | -| train/ | | -| approx_kl | 0.0014454303 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00373 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 13970 | -| policy_gradient_loss | -0.000629 | -| std | 0.862 | -| value_loss | 0.117 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1399 | -| time_elapsed | 23586 | -| total_timesteps | 179072 | -| train/ | | -| approx_kl | 0.018880777 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00179 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 13980 | -| policy_gradient_loss | -0.0122 | -| std | 0.86 | -| value_loss | 0.0102 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1400 | -| time_elapsed | 23593 | -| total_timesteps | 179200 | -| train/ | | -| approx_kl | 0.007288869 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.0316 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 13990 | -| policy_gradient_loss | -0.00304 | -| std | 0.859 | -| value_loss | 0.0559 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1401 | -| time_elapsed | 23598 | -| total_timesteps | 179328 | -| train/ | | -| approx_kl | 0.00052478677 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0018 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 14000 | -| policy_gradient_loss | 0.000507 | -| std | 0.859 | -| value_loss | 0.00293 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1402 | -| time_elapsed | 23602 | -| total_timesteps | 179456 | -| train/ | | -| approx_kl | 0.0060081226 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00686 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 14010 | -| policy_gradient_loss | -0.0065 | -| std | 0.86 | -| value_loss | 0.00262 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1403 | -| time_elapsed | 23606 | -| total_timesteps | 179584 | -| train/ | | -| approx_kl | 0.010617136 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00869 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 14020 | -| policy_gradient_loss | -0.00339 | -| std | 0.86 | -| value_loss | 0.00148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1404 | -| time_elapsed | 23609 | -| total_timesteps | 179712 | -| train/ | | -| approx_kl | 0.005859733 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 14030 | -| policy_gradient_loss | -0.00245 | -| std | 0.859 | -| value_loss | 0.000995 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1405 | -| time_elapsed | 23612 | -| total_timesteps | 179840 | -| train/ | | -| approx_kl | 0.006775146 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0926 | -| learning_rate | 0.0003 | -| loss | -0.000494 | -| n_updates | 14040 | -| policy_gradient_loss | -0.00117 | -| std | 0.858 | -| value_loss | 0.000672 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1406 | -| time_elapsed | 23614 | -| total_timesteps | 179968 | -| train/ | | -| approx_kl | 0.003416996 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 14050 | -| policy_gradient_loss | -0.00188 | -| std | 0.857 | -| value_loss | 0.000368 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1407 | -| time_elapsed | 23617 | -| total_timesteps | 180096 | -| train/ | | -| approx_kl | 0.016809318 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 14060 | -| policy_gradient_loss | -0.00806 | -| std | 0.856 | -| value_loss | 0.000445 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1408 | -| time_elapsed | 23626 | -| total_timesteps | 180224 | -| train/ | | -| approx_kl | 0.5445146 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.023 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 14070 | -| policy_gradient_loss | -0.00726 | -| std | 0.855 | -| value_loss | 0.194 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1409 | -| time_elapsed | 23631 | -| total_timesteps | 180352 | -| train/ | | -| approx_kl | 0.002019329 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00642 | -| learning_rate | 0.0003 | -| loss | 0.464 | -| n_updates | 14080 | -| policy_gradient_loss | 0.0013 | -| std | 0.854 | -| value_loss | 1.15 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1410 | -| time_elapsed | 23636 | -| total_timesteps | 180480 | -| train/ | | -| approx_kl | 0.0020753099 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.000415 | -| learning_rate | 0.0003 | -| loss | 0.066 | -| n_updates | 14090 | -| policy_gradient_loss | -0.0013 | -| std | 0.856 | -| value_loss | 0.139 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1411 | -| time_elapsed | 23641 | -| total_timesteps | 180608 | -| train/ | | -| approx_kl | 0.0030528735 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.000603 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 14100 | -| policy_gradient_loss | -0.000378 | -| std | 0.859 | -| value_loss | 0.0847 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1412 | -| time_elapsed | 23646 | -| total_timesteps | 180736 | -| train/ | | -| approx_kl | 0.0026696152 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00235 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 14110 | -| policy_gradient_loss | -0.00139 | -| std | 0.861 | -| value_loss | 0.278 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1413 | -| time_elapsed | 23651 | -| total_timesteps | 180864 | -| train/ | | -| approx_kl | 0.004793052 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 14120 | -| policy_gradient_loss | -0.00127 | -| std | 0.861 | -| value_loss | 0.0845 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 7 | -| iterations | 1414 | -| time_elapsed | 23655 | -| total_timesteps | 180992 | -| train/ | | -| approx_kl | 0.0020539472 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00903 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 14130 | -| policy_gradient_loss | -0.000551 | -| std | 0.861 | -| value_loss | 0.0383 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1415 | -| time_elapsed | 23660 | -| total_timesteps | 181120 | -| train/ | | -| approx_kl | 0.008154264 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 14140 | -| policy_gradient_loss | -0.00686 | -| std | 0.862 | -| value_loss | 0.0279 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1416 | -| time_elapsed | 23669 | -| total_timesteps | 181248 | -| train/ | | -| approx_kl | 0.028369922 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.0093 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 14150 | -| policy_gradient_loss | -0.00468 | -| std | 0.863 | -| value_loss | 0.0937 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1417 | -| time_elapsed | 23674 | -| total_timesteps | 181376 | -| train/ | | -| approx_kl | 0.006469258 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.000786 | -| learning_rate | 0.0003 | -| loss | 0.000301 | -| n_updates | 14160 | -| policy_gradient_loss | -0.000904 | -| std | 0.861 | -| value_loss | 0.0103 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1418 | -| time_elapsed | 23678 | -| total_timesteps | 181504 | -| train/ | | -| approx_kl | 0.010537792 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 14170 | -| policy_gradient_loss | -0.00398 | -| std | 0.858 | -| value_loss | 0.00677 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1419 | -| time_elapsed | 23682 | -| total_timesteps | 181632 | -| train/ | | -| approx_kl | 0.011291783 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 14180 | -| policy_gradient_loss | -0.00295 | -| std | 0.858 | -| value_loss | 0.00472 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1420 | -| time_elapsed | 23685 | -| total_timesteps | 181760 | -| train/ | | -| approx_kl | 1.9539148e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 14190 | -| policy_gradient_loss | 0.00039 | -| std | 0.86 | -| value_loss | 0.00334 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1421 | -| time_elapsed | 23688 | -| total_timesteps | 181888 | -| train/ | | -| approx_kl | 0.0063660494 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 14200 | -| policy_gradient_loss | -0.00149 | -| std | 0.859 | -| value_loss | 0.00222 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1422 | -| time_elapsed | 23692 | -| total_timesteps | 182016 | -| train/ | | -| approx_kl | 0.009748024 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0932 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 14210 | -| policy_gradient_loss | -0.00656 | -| std | 0.857 | -| value_loss | 0.00223 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1423 | -| time_elapsed | 23703 | -| total_timesteps | 182144 | -| train/ | | -| approx_kl | 0.00073375273 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.477 | -| learning_rate | 0.0003 | -| loss | -0.00887 | -| n_updates | 14220 | -| policy_gradient_loss | -0.00546 | -| std | 0.856 | -| value_loss | 0.00865 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1424 | -| time_elapsed | 23707 | -| total_timesteps | 182272 | -| train/ | | -| approx_kl | 0.0020675175 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.1 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 14230 | -| policy_gradient_loss | -0.000919 | -| std | 0.856 | -| value_loss | 0.000614 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1425 | -| time_elapsed | 23711 | -| total_timesteps | 182400 | -| train/ | | -| approx_kl | 0.00018113013 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 14240 | -| policy_gradient_loss | 0.00106 | -| std | 0.857 | -| value_loss | 0.00061 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1426 | -| time_elapsed | 23715 | -| total_timesteps | 182528 | -| train/ | | -| approx_kl | 0.0042024236 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.000113 | -| n_updates | 14250 | -| policy_gradient_loss | -7.56e-05 | -| std | 0.856 | -| value_loss | 0.00025 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1427 | -| time_elapsed | 23719 | -| total_timesteps | 182656 | -| train/ | | -| approx_kl | 0.0013562958 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00581 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 14260 | -| policy_gradient_loss | -0.000616 | -| std | 0.855 | -| value_loss | 0.000194 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1428 | -| time_elapsed | 23723 | -| total_timesteps | 182784 | -| train/ | | -| approx_kl | 0.0031052926 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00456 | -| learning_rate | 0.0003 | -| loss | -0.000859 | -| n_updates | 14270 | -| policy_gradient_loss | -0.000628 | -| std | 0.852 | -| value_loss | 0.000172 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1429 | -| time_elapsed | 23728 | -| total_timesteps | 182912 | -| train/ | | -| approx_kl | 0.004211148 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00651 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 14280 | -| policy_gradient_loss | -0.00195 | -| std | 0.85 | -| value_loss | 0.000148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1430 | -| time_elapsed | 23731 | -| total_timesteps | 183040 | -| train/ | | -| approx_kl | 0.011597281 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.00519 | -| n_updates | 14290 | -| policy_gradient_loss | -0.0041 | -| std | 0.849 | -| value_loss | 0.000125 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1431 | -| time_elapsed | 23739 | -| total_timesteps | 183168 | -| train/ | | -| approx_kl | 0.0085961595 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.618 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 14300 | -| policy_gradient_loss | -0.00385 | -| std | 0.849 | -| value_loss | 0.00384 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1432 | -| time_elapsed | 23743 | -| total_timesteps | 183296 | -| train/ | | -| approx_kl | 0.006186505 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00145 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 14310 | -| policy_gradient_loss | -0.00218 | -| std | 0.85 | -| value_loss | 6.48e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1433 | -| time_elapsed | 23747 | -| total_timesteps | 183424 | -| train/ | | -| approx_kl | 0.0048326496 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.0196 | -| learning_rate | 0.0003 | -| loss | -0.000713 | -| n_updates | 14320 | -| policy_gradient_loss | -0.000554 | -| std | 0.849 | -| value_loss | 8.17e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1434 | -| time_elapsed | 23751 | -| total_timesteps | 183552 | -| train/ | | -| approx_kl | 0.0034018955 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00045 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 14330 | -| policy_gradient_loss | -0.00416 | -| std | 0.851 | -| value_loss | 7.34e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1435 | -| time_elapsed | 23755 | -| total_timesteps | 183680 | -| train/ | | -| approx_kl | 0.014806016 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00998 | -| n_updates | 14340 | -| policy_gradient_loss | -0.00638 | -| std | 0.851 | -| value_loss | 7.37e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1436 | -| time_elapsed | 23758 | -| total_timesteps | 183808 | -| train/ | | -| approx_kl | 0.0002649282 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 14350 | -| policy_gradient_loss | 0.000289 | -| std | 0.85 | -| value_loss | 4.98e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1437 | -| time_elapsed | 23760 | -| total_timesteps | 183936 | -| train/ | | -| approx_kl | 0.0002999166 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00953 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 14360 | -| policy_gradient_loss | 0.000348 | -| std | 0.85 | -| value_loss | 3.82e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1438 | -| time_elapsed | 23764 | -| total_timesteps | 184064 | -| train/ | | -| approx_kl | 0.010204395 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 14370 | -| policy_gradient_loss | -0.0029 | -| std | 0.848 | -| value_loss | 3.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1439 | -| time_elapsed | 23771 | -| total_timesteps | 184192 | -| train/ | | -| approx_kl | 0.007516532 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.117 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 14380 | -| policy_gradient_loss | -0.00337 | -| std | 0.844 | -| value_loss | 0.117 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1440 | -| time_elapsed | 23775 | -| total_timesteps | 184320 | -| train/ | | -| approx_kl | 0.0007641632 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 14390 | -| policy_gradient_loss | -0.00105 | -| std | 0.841 | -| value_loss | 0.0056 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1441 | -| time_elapsed | 23778 | -| total_timesteps | 184448 | -| train/ | | -| approx_kl | 0.01614029 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0031 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 14400 | -| policy_gradient_loss | -0.0106 | -| std | 0.84 | -| value_loss | 0.00152 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1442 | -| time_elapsed | 23784 | -| total_timesteps | 184576 | -| train/ | | -| approx_kl | 0.0089418255 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.007 | -| n_updates | 14410 | -| policy_gradient_loss | -0.00503 | -| std | 0.84 | -| value_loss | 0.000728 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1443 | -| time_elapsed | 23788 | -| total_timesteps | 184704 | -| train/ | | -| approx_kl | 0.0042834277 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 14420 | -| policy_gradient_loss | -0.00116 | -| std | 0.841 | -| value_loss | 0.00067 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1444 | -| time_elapsed | 23791 | -| total_timesteps | 184832 | -| train/ | | -| approx_kl | 2.2440683e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | 0.000203 | -| n_updates | 14430 | -| policy_gradient_loss | 0.00037 | -| std | 0.84 | -| value_loss | 0.00028 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 7 | -| iterations | 1445 | -| time_elapsed | 23795 | -| total_timesteps | 184960 | -| train/ | | -| approx_kl | 0.007704031 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0986 | -| learning_rate | 0.0003 | -| loss | -0.00671 | -| n_updates | 14440 | -| policy_gradient_loss | -0.00351 | -| std | 0.838 | -| value_loss | 0.000231 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1446 | -| time_elapsed | 23800 | -| total_timesteps | 185088 | -| train/ | | -| approx_kl | 0.0036558802 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | 0.000524 | -| n_updates | 14450 | -| policy_gradient_loss | 0.000111 | -| std | 0.836 | -| value_loss | 0.000124 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1447 | -| time_elapsed | 23808 | -| total_timesteps | 185216 | -| train/ | | -| approx_kl | 0.0066607906 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.35 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 14460 | -| policy_gradient_loss | -0.00627 | -| std | 0.837 | -| value_loss | 0.00159 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1448 | -| time_elapsed | 23812 | -| total_timesteps | 185344 | -| train/ | | -| approx_kl | 0.00013416726 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 14470 | -| policy_gradient_loss | 0.000502 | -| std | 0.838 | -| value_loss | 4.62e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1449 | -| time_elapsed | 23815 | -| total_timesteps | 185472 | -| train/ | | -| approx_kl | 0.0074239317 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.000688 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 14480 | -| policy_gradient_loss | -0.00235 | -| std | 0.838 | -| value_loss | 3.5e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1450 | -| time_elapsed | 23818 | -| total_timesteps | 185600 | -| train/ | | -| approx_kl | 0.00034867693 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 14490 | -| policy_gradient_loss | -0.000442 | -| std | 0.841 | -| value_loss | 2.79e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1451 | -| time_elapsed | 23821 | -| total_timesteps | 185728 | -| train/ | | -| approx_kl | 0.009626411 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0604 | -| learning_rate | 0.0003 | -| loss | -0.00498 | -| n_updates | 14500 | -| policy_gradient_loss | -0.00331 | -| std | 0.843 | -| value_loss | 2.09e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1452 | -| time_elapsed | 23824 | -| total_timesteps | 185856 | -| train/ | | -| approx_kl | 0.011849258 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 14510 | -| policy_gradient_loss | -0.00747 | -| std | 0.845 | -| value_loss | 2.05e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 7 | -| iterations | 1453 | -| time_elapsed | 23827 | -| total_timesteps | 185984 | -| train/ | | -| approx_kl | 0.011066415 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 14520 | -| policy_gradient_loss | -0.00396 | -| std | 0.844 | -| value_loss | 5.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1454 | -| time_elapsed | 23831 | -| total_timesteps | 186112 | -| train/ | | -| approx_kl | 0.00784926 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.00996 | -| n_updates | 14530 | -| policy_gradient_loss | -0.0056 | -| std | 0.843 | -| value_loss | 7.07e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1455 | -| time_elapsed | 23841 | -| total_timesteps | 186240 | -| train/ | | -| approx_kl | 0.0009944956 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.37 | -| learning_rate | 0.0003 | -| loss | 0.00543 | -| n_updates | 14540 | -| policy_gradient_loss | -0.00114 | -| std | 0.844 | -| value_loss | 0.0218 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1456 | -| time_elapsed | 23847 | -| total_timesteps | 186368 | -| train/ | | -| approx_kl | 0.00013883831 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0287 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 14550 | -| policy_gradient_loss | -3.77e-05 | -| std | 0.844 | -| value_loss | 0.0736 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1457 | -| time_elapsed | 23851 | -| total_timesteps | 186496 | -| train/ | | -| approx_kl | 0.0129511515 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 14560 | -| policy_gradient_loss | -0.0058 | -| std | 0.843 | -| value_loss | 0.00655 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1458 | -| time_elapsed | 23854 | -| total_timesteps | 186624 | -| train/ | | -| approx_kl | 0.0010805349 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0078 | -| learning_rate | 0.0003 | -| loss | 0.565 | -| n_updates | 14570 | -| policy_gradient_loss | 0.00116 | -| std | 0.843 | -| value_loss | 1.28 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1459 | -| time_elapsed | 23857 | -| total_timesteps | 186752 | -| train/ | | -| approx_kl | 0.0047452445 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00862 | -| learning_rate | 0.0003 | -| loss | 0.069 | -| n_updates | 14580 | -| policy_gradient_loss | -0.00198 | -| std | 0.844 | -| value_loss | 0.147 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 7 | -| iterations | 1460 | -| time_elapsed | 23861 | -| total_timesteps | 186880 | -| train/ | | -| approx_kl | 2.6762486e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.00462 | -| n_updates | 14590 | -| policy_gradient_loss | 0.00229 | -| std | 0.845 | -| value_loss | 0.0119 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1461 | -| time_elapsed | 23865 | -| total_timesteps | 187008 | -| train/ | | -| approx_kl | 0.00012551947 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00173 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 14600 | -| policy_gradient_loss | 0.000314 | -| std | 0.847 | -| value_loss | 0.237 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1462 | -| time_elapsed | 23876 | -| total_timesteps | 187136 | -| train/ | | -| approx_kl | 0.00077152625 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0177 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 14610 | -| policy_gradient_loss | -0.000461 | -| std | 0.849 | -| value_loss | 0.092 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1463 | -| time_elapsed | 23879 | -| total_timesteps | 187264 | -| train/ | | -| approx_kl | 0.004768778 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00903 | -| learning_rate | 0.0003 | -| loss | 0.0351 | -| n_updates | 14620 | -| policy_gradient_loss | -0.000734 | -| std | 0.85 | -| value_loss | 0.0722 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1464 | -| time_elapsed | 23885 | -| total_timesteps | 187392 | -| train/ | | -| approx_kl | 0.008110451 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00267 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 14630 | -| policy_gradient_loss | -0.00772 | -| std | 0.851 | -| value_loss | 0.0311 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1465 | -| time_elapsed | 23889 | -| total_timesteps | 187520 | -| train/ | | -| approx_kl | 0.004569239 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00432 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 14640 | -| policy_gradient_loss | -0.00117 | -| std | 0.851 | -| value_loss | 0.00808 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1466 | -| time_elapsed | 23892 | -| total_timesteps | 187648 | -| train/ | | -| approx_kl | 0.0012136484 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 14650 | -| policy_gradient_loss | 4.61e-05 | -| std | 0.851 | -| value_loss | 0.0196 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1467 | -| time_elapsed | 23897 | -| total_timesteps | 187776 | -| train/ | | -| approx_kl | 0.0010104105 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00819 | -| learning_rate | 0.0003 | -| loss | 0.00492 | -| n_updates | 14660 | -| policy_gradient_loss | -0.000322 | -| std | 0.851 | -| value_loss | 0.0127 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.6 | -| time/ | | -| fps | 7 | -| iterations | 1468 | -| time_elapsed | 23900 | -| total_timesteps | 187904 | -| train/ | | -| approx_kl | 0.008914628 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00378 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 14670 | -| policy_gradient_loss | -0.00467 | -| std | 0.851 | -| value_loss | 0.0104 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1469 | -| time_elapsed | 23904 | -| total_timesteps | 188032 | -| train/ | | -| approx_kl | 0.00079461886 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00428 | -| learning_rate | 0.0003 | -| loss | -0.000955 | -| n_updates | 14680 | -| policy_gradient_loss | -0.000345 | -| std | 0.852 | -| value_loss | 0.0089 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1470 | -| time_elapsed | 23913 | -| total_timesteps | 188160 | -| train/ | | -| approx_kl | 0.0039570755 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00315 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 14690 | -| policy_gradient_loss | -3.8e-05 | -| std | 0.852 | -| value_loss | 0.326 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1471 | -| time_elapsed | 23917 | -| total_timesteps | 188288 | -| train/ | | -| approx_kl | 0.006875211 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.000471 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 14700 | -| policy_gradient_loss | -0.00145 | -| std | 0.849 | -| value_loss | 0.0158 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1472 | -| time_elapsed | 23920 | -| total_timesteps | 188416 | -| train/ | | -| approx_kl | 0.0018702629 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.000838 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 14710 | -| policy_gradient_loss | -0.00145 | -| std | 0.847 | -| value_loss | 0.00694 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1473 | -| time_elapsed | 23923 | -| total_timesteps | 188544 | -| train/ | | -| approx_kl | 0.006249755 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00303 | -| learning_rate | 0.0003 | -| loss | 0.000167 | -| n_updates | 14720 | -| policy_gradient_loss | -0.000709 | -| std | 0.847 | -| value_loss | 0.00539 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1474 | -| time_elapsed | 23927 | -| total_timesteps | 188672 | -| train/ | | -| approx_kl | 0.004390832 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0066 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 14730 | -| policy_gradient_loss | -0.00377 | -| std | 0.848 | -| value_loss | 0.00405 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1475 | -| time_elapsed | 23933 | -| total_timesteps | 188800 | -| train/ | | -| approx_kl | 1.2839213e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00117 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 14740 | -| policy_gradient_loss | 0.00327 | -| std | 0.849 | -| value_loss | 0.00393 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.72 | -| time/ | | -| fps | 7 | -| iterations | 1476 | -| time_elapsed | 23937 | -| total_timesteps | 188928 | -| train/ | | -| approx_kl | 7.407274e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00916 | -| learning_rate | 0.0003 | -| loss | 0.247 | -| n_updates | 14750 | -| policy_gradient_loss | 0.000987 | -| std | 0.849 | -| value_loss | 0.555 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1477 | -| time_elapsed | 23939 | -| total_timesteps | 189056 | -| train/ | | -| approx_kl | 0.010220061 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00507 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 14760 | -| policy_gradient_loss | -0.00606 | -| std | 0.847 | -| value_loss | 0.0894 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1478 | -| time_elapsed | 23947 | -| total_timesteps | 189184 | -| train/ | | -| approx_kl | 0.006162269 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0208 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 14770 | -| policy_gradient_loss | -0.00493 | -| std | 0.847 | -| value_loss | 0.0575 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1479 | -| time_elapsed | 23951 | -| total_timesteps | 189312 | -| train/ | | -| approx_kl | 0.0020114728 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00139 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 14780 | -| policy_gradient_loss | -0.00189 | -| std | 0.849 | -| value_loss | 0.018 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1480 | -| time_elapsed | 23956 | -| total_timesteps | 189440 | -| train/ | | -| approx_kl | 0.0066855378 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00349 | -| learning_rate | 0.0003 | -| loss | 0.642 | -| n_updates | 14790 | -| policy_gradient_loss | -0.00488 | -| std | 0.849 | -| value_loss | 1.41 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1481 | -| time_elapsed | 23960 | -| total_timesteps | 189568 | -| train/ | | -| approx_kl | 0.0062799826 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0047 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 14800 | -| policy_gradient_loss | -0.00383 | -| std | 0.848 | -| value_loss | 0.509 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1482 | -| time_elapsed | 23965 | -| total_timesteps | 189696 | -| train/ | | -| approx_kl | 0.0016326942 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00771 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 14810 | -| policy_gradient_loss | -0.000132 | -| std | 0.848 | -| value_loss | 0.0438 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1483 | -| time_elapsed | 23967 | -| total_timesteps | 189824 | -| train/ | | -| approx_kl | 0.0017199446 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00063 | -| learning_rate | 0.0003 | -| loss | 0.00023 | -| n_updates | 14820 | -| policy_gradient_loss | -0.000451 | -| std | 0.847 | -| value_loss | 0.015 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.79 | -| time/ | | -| fps | 7 | -| iterations | 1484 | -| time_elapsed | 23971 | -| total_timesteps | 189952 | -| train/ | | -| approx_kl | 0.0025254227 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00278 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 14830 | -| policy_gradient_loss | -0.00381 | -| std | 0.845 | -| value_loss | 0.0101 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1485 | -| time_elapsed | 23975 | -| total_timesteps | 190080 | -| train/ | | -| approx_kl | 0.0025186348 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00494 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 14840 | -| policy_gradient_loss | 0.000393 | -| std | 0.845 | -| value_loss | 0.00656 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1486 | -| time_elapsed | 23983 | -| total_timesteps | 190208 | -| train/ | | -| approx_kl | 0.0046010795 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0616 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 14850 | -| policy_gradient_loss | -0.00915 | -| std | 0.846 | -| value_loss | 0.0622 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1487 | -| time_elapsed | 23986 | -| total_timesteps | 190336 | -| train/ | | -| approx_kl | 0.008396329 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00692 | -| learning_rate | 0.0003 | -| loss | 0.00418 | -| n_updates | 14860 | -| policy_gradient_loss | -0.00275 | -| std | 0.847 | -| value_loss | 0.021 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1488 | -| time_elapsed | 23989 | -| total_timesteps | 190464 | -| train/ | | -| approx_kl | 0.0001805611 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.000125 | -| learning_rate | 0.0003 | -| loss | 0.384 | -| n_updates | 14870 | -| policy_gradient_loss | 0.000233 | -| std | 0.848 | -| value_loss | 0.872 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1489 | -| time_elapsed | 23993 | -| total_timesteps | 190592 | -| train/ | | -| approx_kl | 0.0008736234 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00549 | -| learning_rate | 0.0003 | -| loss | 0.0341 | -| n_updates | 14880 | -| policy_gradient_loss | -0.000323 | -| std | 0.848 | -| value_loss | 0.0893 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1490 | -| time_elapsed | 23996 | -| total_timesteps | 190720 | -| train/ | | -| approx_kl | 0.0046480787 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00412 | -| learning_rate | 0.0003 | -| loss | 0.33 | -| n_updates | 14890 | -| policy_gradient_loss | -0.00695 | -| std | 0.848 | -| value_loss | 0.892 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1491 | -| time_elapsed | 23999 | -| total_timesteps | 190848 | -| train/ | | -| approx_kl | 0.004870458 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00427 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 14900 | -| policy_gradient_loss | -0.00123 | -| std | 0.851 | -| value_loss | 0.0478 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 7 | -| iterations | 1492 | -| time_elapsed | 24003 | -| total_timesteps | 190976 | -| train/ | | -| approx_kl | 0.000555153 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00268 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 14910 | -| policy_gradient_loss | -0.000426 | -| std | 0.853 | -| value_loss | 0.0184 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1493 | -| time_elapsed | 24006 | -| total_timesteps | 191104 | -| train/ | | -| approx_kl | 8.021435e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00067 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 14920 | -| policy_gradient_loss | 0.000249 | -| std | 0.854 | -| value_loss | 0.0198 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1494 | -| time_elapsed | 24015 | -| total_timesteps | 191232 | -| train/ | | -| approx_kl | 0.0077125914 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00859 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 14930 | -| policy_gradient_loss | -0.00467 | -| std | 0.853 | -| value_loss | 0.114 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1495 | -| time_elapsed | 24020 | -| total_timesteps | 191360 | -| train/ | | -| approx_kl | 0.0015795911 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00397 | -| learning_rate | 0.0003 | -| loss | 0.0253 | -| n_updates | 14940 | -| policy_gradient_loss | 0.000471 | -| std | 0.852 | -| value_loss | 0.0551 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1496 | -| time_elapsed | 24024 | -| total_timesteps | 191488 | -| train/ | | -| approx_kl | 0.00043472555 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.000608 | -| learning_rate | 0.0003 | -| loss | 0.0046 | -| n_updates | 14950 | -| policy_gradient_loss | -0.000182 | -| std | 0.851 | -| value_loss | 0.0128 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1497 | -| time_elapsed | 24029 | -| total_timesteps | 191616 | -| train/ | | -| approx_kl | 0.00044002943 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00272 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 14960 | -| policy_gradient_loss | -0.000476 | -| std | 0.851 | -| value_loss | 0.546 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1498 | -| time_elapsed | 24034 | -| total_timesteps | 191744 | -| train/ | | -| approx_kl | 0.005934284 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00238 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 14970 | -| policy_gradient_loss | -0.00217 | -| std | 0.849 | -| value_loss | 0.0323 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 7 | -| iterations | 1499 | -| time_elapsed | 24037 | -| total_timesteps | 191872 | -| train/ | | -| approx_kl | 0.001025212 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 7.49e-05 | -| learning_rate | 0.0003 | -| loss | -0.000107 | -| n_updates | 14980 | -| policy_gradient_loss | -0.000409 | -| std | 0.848 | -| value_loss | 0.0142 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 7 | -| iterations | 1500 | -| time_elapsed | 24041 | -| total_timesteps | 192000 | -| train/ | | -| approx_kl | 0.007049594 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.000166 | -| learning_rate | 0.0003 | -| loss | -0.000306 | -| n_updates | 14990 | -| policy_gradient_loss | -0.00176 | -| std | 0.848 | -| value_loss | 0.011 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 7 | -| iterations | 1501 | -| time_elapsed | 24045 | -| total_timesteps | 192128 | -| train/ | | -| approx_kl | 0.0012204787 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 7.34e-05 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 15000 | -| policy_gradient_loss | -0.000406 | -| std | 0.848 | -| value_loss | 0.0633 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 7 | -| iterations | 1502 | -| time_elapsed | 24055 | -| total_timesteps | 192256 | -| train/ | | -| approx_kl | 0.0017593754 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0427 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 15010 | -| policy_gradient_loss | -0.00269 | -| std | 0.849 | -| value_loss | 0.005 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 7 | -| iterations | 1503 | -| time_elapsed | 24060 | -| total_timesteps | 192384 | -| train/ | | -| approx_kl | 0.0016973563 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00208 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 15020 | -| policy_gradient_loss | -0.00106 | -| std | 0.85 | -| value_loss | 0.00288 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 7 | -| iterations | 1504 | -| time_elapsed | 24064 | -| total_timesteps | 192512 | -| train/ | | -| approx_kl | 0.0068211695 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00794 | -| learning_rate | 0.0003 | -| loss | 0.00955 | -| n_updates | 15030 | -| policy_gradient_loss | -0.00155 | -| std | 0.853 | -| value_loss | 0.022 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 8 | -| iterations | 1505 | -| time_elapsed | 24068 | -| total_timesteps | 192640 | -| train/ | | -| approx_kl | 0.0065235724 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00112 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 15040 | -| policy_gradient_loss | -0.0057 | -| std | 0.856 | -| value_loss | 0.00447 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 8 | -| iterations | 1506 | -| time_elapsed | 24073 | -| total_timesteps | 192768 | -| train/ | | -| approx_kl | 2.9898249e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00132 | -| learning_rate | 0.0003 | -| loss | 0.000963 | -| n_updates | 15050 | -| policy_gradient_loss | 0.00173 | -| std | 0.857 | -| value_loss | 0.00295 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.3 | -| time/ | | -| fps | 8 | -| iterations | 1507 | -| time_elapsed | 24076 | -| total_timesteps | 192896 | -| train/ | | -| approx_kl | 0.008243019 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | 0.234 | -| n_updates | 15060 | -| policy_gradient_loss | -0.00983 | -| std | 0.858 | -| value_loss | 0.589 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1508 | -| time_elapsed | 24080 | -| total_timesteps | 193024 | -| train/ | | -| approx_kl | 0.005789708 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00288 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 15070 | -| policy_gradient_loss | -0.000734 | -| std | 0.858 | -| value_loss | 0.0549 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1509 | -| time_elapsed | 24089 | -| total_timesteps | 193152 | -| train/ | | -| approx_kl | 0.00628792 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 15080 | -| policy_gradient_loss | -0.00486 | -| std | 0.858 | -| value_loss | 0.0482 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1510 | -| time_elapsed | 24094 | -| total_timesteps | 193280 | -| train/ | | -| approx_kl | 0.0089719705 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00017 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 15090 | -| policy_gradient_loss | -0.00118 | -| std | 0.858 | -| value_loss | 0.0116 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1511 | -| time_elapsed | 24098 | -| total_timesteps | 193408 | -| train/ | | -| approx_kl | 0.004110527 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.000647 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 15100 | -| policy_gradient_loss | -0.00147 | -| std | 0.859 | -| value_loss | 0.00828 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1512 | -| time_elapsed | 24101 | -| total_timesteps | 193536 | -| train/ | | -| approx_kl | 0.00019600522 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00197 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 15110 | -| policy_gradient_loss | 0.000358 | -| std | 0.858 | -| value_loss | 0.00646 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1513 | -| time_elapsed | 24105 | -| total_timesteps | 193664 | -| train/ | | -| approx_kl | 0.0016810768 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00459 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 15120 | -| policy_gradient_loss | 0.000256 | -| std | 0.856 | -| value_loss | 0.00475 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1514 | -| time_elapsed | 24109 | -| total_timesteps | 193792 | -| train/ | | -| approx_kl | 0.0038617956 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00693 | -| n_updates | 15130 | -| policy_gradient_loss | -0.00286 | -| std | 0.856 | -| value_loss | 0.0031 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1515 | -| time_elapsed | 24112 | -| total_timesteps | 193920 | -| train/ | | -| approx_kl | 0.013455881 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.00845 | -| n_updates | 15140 | -| policy_gradient_loss | -0.00613 | -| std | 0.858 | -| value_loss | 0.0019 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1516 | -| time_elapsed | 24114 | -| total_timesteps | 194048 | -| train/ | | -| approx_kl | 0.000783117 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 15150 | -| policy_gradient_loss | -0.000376 | -| std | 0.86 | -| value_loss | 0.00131 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1517 | -| time_elapsed | 24122 | -| total_timesteps | 194176 | -| train/ | | -| approx_kl | 0.0036489586 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.107 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 15160 | -| policy_gradient_loss | 0.000218 | -| std | 0.861 | -| value_loss | 0.00583 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1518 | -| time_elapsed | 24127 | -| total_timesteps | 194304 | -| train/ | | -| approx_kl | 0.00027252128 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | 0.000447 | -| n_updates | 15170 | -| policy_gradient_loss | 0.000121 | -| std | 0.861 | -| value_loss | 0.000538 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1519 | -| time_elapsed | 24130 | -| total_timesteps | 194432 | -| train/ | | -| approx_kl | 0.004570855 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 15180 | -| policy_gradient_loss | -0.00348 | -| std | 0.861 | -| value_loss | 0.000206 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1520 | -| time_elapsed | 24134 | -| total_timesteps | 194560 | -| train/ | | -| approx_kl | 1.9506551e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | 0.000234 | -| n_updates | 15190 | -| policy_gradient_loss | 0.00217 | -| std | 0.861 | -| value_loss | 0.000106 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1521 | -| time_elapsed | 24137 | -| total_timesteps | 194688 | -| train/ | | -| approx_kl | 0.00058357045 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 15200 | -| policy_gradient_loss | -0.000242 | -| std | 0.862 | -| value_loss | 6.48e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1522 | -| time_elapsed | 24140 | -| total_timesteps | 194816 | -| train/ | | -| approx_kl | 0.010172074 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | -0.000733 | -| n_updates | 15210 | -| policy_gradient_loss | -0.00201 | -| std | 0.864 | -| value_loss | 3.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1523 | -| time_elapsed | 24145 | -| total_timesteps | 194944 | -| train/ | | -| approx_kl | 0.0046913405 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.0074 | -| n_updates | 15220 | -| policy_gradient_loss | -0.003 | -| std | 0.864 | -| value_loss | 3.73e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1524 | -| time_elapsed | 24149 | -| total_timesteps | 195072 | -| train/ | | -| approx_kl | 0.014569356 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 15230 | -| policy_gradient_loss | -0.00808 | -| std | 0.863 | -| value_loss | 3.34e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1525 | -| time_elapsed | 24157 | -| total_timesteps | 195200 | -| train/ | | -| approx_kl | 0.0076462496 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.507 | -| learning_rate | 0.0003 | -| loss | 0.000205 | -| n_updates | 15240 | -| policy_gradient_loss | -0.0012 | -| std | 0.862 | -| value_loss | 0.00598 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1526 | -| time_elapsed | 24161 | -| total_timesteps | 195328 | -| train/ | | -| approx_kl | 0.0017175698 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 15250 | -| policy_gradient_loss | -0.000533 | -| std | 0.861 | -| value_loss | 1.52e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1527 | -| time_elapsed | 24165 | -| total_timesteps | 195456 | -| train/ | | -| approx_kl | 0.0070537906 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 15260 | -| policy_gradient_loss | -0.00212 | -| std | 0.861 | -| value_loss | 9.14e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1528 | -| time_elapsed | 24170 | -| total_timesteps | 195584 | -| train/ | | -| approx_kl | 0.007872706 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0699 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 15270 | -| policy_gradient_loss | -0.00698 | -| std | 0.862 | -| value_loss | 1.03e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1529 | -| time_elapsed | 24175 | -| total_timesteps | 195712 | -| train/ | | -| approx_kl | 0.01310863 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.45 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 15280 | -| policy_gradient_loss | -0.0022 | -| std | 0.862 | -| value_loss | 2.59e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1530 | -| time_elapsed | 24178 | -| total_timesteps | 195840 | -| train/ | | -| approx_kl | 0.004081196 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 15290 | -| policy_gradient_loss | -0.0025 | -| std | 0.863 | -| value_loss | 2.28e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1531 | -| time_elapsed | 24183 | -| total_timesteps | 195968 | -| train/ | | -| approx_kl | 0.00013823994 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0958 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 15300 | -| policy_gradient_loss | 0.0015 | -| std | 0.863 | -| value_loss | 3.24e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1532 | -| time_elapsed | 24187 | -| total_timesteps | 196096 | -| train/ | | -| approx_kl | 0.0003572069 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.477 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 15310 | -| policy_gradient_loss | 0.000199 | -| std | 0.863 | -| value_loss | 1.07e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1533 | -| time_elapsed | 24195 | -| total_timesteps | 196224 | -| train/ | | -| approx_kl | 0.0035495558 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.54 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 15320 | -| policy_gradient_loss | -0.00639 | -| std | 0.864 | -| value_loss | 0.00131 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1534 | -| time_elapsed | 24200 | -| total_timesteps | 196352 | -| train/ | | -| approx_kl | 0.0019348608 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.00192 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 15330 | -| policy_gradient_loss | -0.00104 | -| std | 0.864 | -| value_loss | 0.00427 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1535 | -| time_elapsed | 24204 | -| total_timesteps | 196480 | -| train/ | | -| approx_kl | 0.015008641 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 15340 | -| policy_gradient_loss | -0.0127 | -| std | 0.864 | -| value_loss | 0.00057 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1536 | -| time_elapsed | 24208 | -| total_timesteps | 196608 | -| train/ | | -| approx_kl | 0.0005860282 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | 0.000341 | -| n_updates | 15350 | -| policy_gradient_loss | 0.000171 | -| std | 0.865 | -| value_loss | 0.000185 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1537 | -| time_elapsed | 24213 | -| total_timesteps | 196736 | -| train/ | | -| approx_kl | 0.0048332363 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.696 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 15360 | -| policy_gradient_loss | -0.00276 | -| std | 0.866 | -| value_loss | 3.25e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1538 | -| time_elapsed | 24217 | -| total_timesteps | 196864 | -| train/ | | -| approx_kl | 0.0030963025 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | 0.000946 | -| n_updates | 15370 | -| policy_gradient_loss | 0.000524 | -| std | 0.865 | -| value_loss | 1.56e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 8 | -| iterations | 1539 | -| time_elapsed | 24220 | -| total_timesteps | 196992 | -| train/ | | -| approx_kl | 0.0028499505 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 15380 | -| policy_gradient_loss | -0.00383 | -| std | 0.863 | -| value_loss | 1.54e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1540 | -| time_elapsed | 24224 | -| total_timesteps | 197120 | -| train/ | | -| approx_kl | 0.0037199073 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | -0.000203 | -| n_updates | 15390 | -| policy_gradient_loss | -0.000139 | -| std | 0.861 | -| value_loss | 4.81e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1541 | -| time_elapsed | 24234 | -| total_timesteps | 197248 | -| train/ | | -| approx_kl | 0.06027631 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00387 | -| learning_rate | 0.0003 | -| loss | 0.705 | -| n_updates | 15400 | -| policy_gradient_loss | -0.00305 | -| std | 0.86 | -| value_loss | 1.66 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1542 | -| time_elapsed | 24237 | -| total_timesteps | 197376 | -| train/ | | -| approx_kl | 0.00082098506 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 15410 | -| policy_gradient_loss | -0.000731 | -| std | 0.858 | -| value_loss | 0.0612 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1543 | -| time_elapsed | 24241 | -| total_timesteps | 197504 | -| train/ | | -| approx_kl | 0.00037355395 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.000623 | -| learning_rate | 0.0003 | -| loss | 0.302 | -| n_updates | 15420 | -| policy_gradient_loss | 0.00113 | -| std | 0.859 | -| value_loss | 0.659 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1544 | -| time_elapsed | 24245 | -| total_timesteps | 197632 | -| train/ | | -| approx_kl | 0.0011608098 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00794 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 15430 | -| policy_gradient_loss | -0.000512 | -| std | 0.859 | -| value_loss | 0.0202 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1545 | -| time_elapsed | 24249 | -| total_timesteps | 197760 | -| train/ | | -| approx_kl | 6.756652e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | 0.000683 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 15440 | -| policy_gradient_loss | 0.000212 | -| std | 0.858 | -| value_loss | 0.0103 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 8 | -| iterations | 1546 | -| time_elapsed | 24254 | -| total_timesteps | 197888 | -| train/ | | -| approx_kl | 0.001233737 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.27 | -| explained_variance | -0.00259 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 15450 | -| policy_gradient_loss | -0.000145 | -| std | 0.857 | -| value_loss | 0.0078 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1547 | -| time_elapsed | 24258 | -| total_timesteps | 198016 | -| train/ | | -| approx_kl | 0.0025207936 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00147 | -| learning_rate | 0.0003 | -| loss | 0.0032 | -| n_updates | 15460 | -| policy_gradient_loss | -0.0022 | -| std | 0.855 | -| value_loss | 0.018 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1548 | -| time_elapsed | 24269 | -| total_timesteps | 198144 | -| train/ | | -| approx_kl | 0.011204197 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 15470 | -| policy_gradient_loss | -0.00724 | -| std | 0.853 | -| value_loss | 0.0553 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1549 | -| time_elapsed | 24271 | -| total_timesteps | 198272 | -| train/ | | -| approx_kl | 0.001504927 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00209 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 15480 | -| policy_gradient_loss | 0.000521 | -| std | 0.85 | -| value_loss | 0.0361 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1550 | -| time_elapsed | 24273 | -| total_timesteps | 198400 | -| train/ | | -| approx_kl | 0.0018035858 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 3.76e-06 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 15490 | -| policy_gradient_loss | -0.0011 | -| std | 0.848 | -| value_loss | 0.00959 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1551 | -| time_elapsed | 24275 | -| total_timesteps | 198528 | -| train/ | | -| approx_kl | 0.013192654 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.000357 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 15500 | -| policy_gradient_loss | -0.00955 | -| std | 0.847 | -| value_loss | 0.00687 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1552 | -| time_elapsed | 24277 | -| total_timesteps | 198656 | -| train/ | | -| approx_kl | 5.488051e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00139 | -| learning_rate | 0.0003 | -| loss | 0.000427 | -| n_updates | 15510 | -| policy_gradient_loss | 0.00143 | -| std | 0.847 | -| value_loss | 0.00599 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1553 | -| time_elapsed | 24279 | -| total_timesteps | 198784 | -| train/ | | -| approx_kl | 0.0025618137 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00199 | -| learning_rate | 0.0003 | -| loss | 0.000511 | -| n_updates | 15520 | -| policy_gradient_loss | -0.000362 | -| std | 0.848 | -| value_loss | 0.00488 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 8 | -| iterations | 1554 | -| time_elapsed | 24281 | -| total_timesteps | 198912 | -| train/ | | -| approx_kl | 0.0038696053 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00477 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 15530 | -| policy_gradient_loss | -0.00142 | -| std | 0.848 | -| value_loss | 0.00327 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1555 | -| time_elapsed | 24284 | -| total_timesteps | 199040 | -| train/ | | -| approx_kl | 0.00080419704 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 15540 | -| policy_gradient_loss | -0.000489 | -| std | 0.85 | -| value_loss | 0.00207 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1556 | -| time_elapsed | 24292 | -| total_timesteps | 199168 | -| train/ | | -| approx_kl | 0.0027968613 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.0895 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 15550 | -| policy_gradient_loss | -0.00363 | -| std | 0.851 | -| value_loss | 0.0173 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1557 | -| time_elapsed | 24296 | -| total_timesteps | 199296 | -| train/ | | -| approx_kl | 0.00021676254 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00194 | -| learning_rate | 0.0003 | -| loss | 0.918 | -| n_updates | 15560 | -| policy_gradient_loss | -0.000532 | -| std | 0.853 | -| value_loss | 2.01 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1558 | -| time_elapsed | 24300 | -| total_timesteps | 199424 | -| train/ | | -| approx_kl | 0.0041953563 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00579 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 15570 | -| policy_gradient_loss | -0.00139 | -| std | 0.853 | -| value_loss | 0.0116 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1559 | -| time_elapsed | 24303 | -| total_timesteps | 199552 | -| train/ | | -| approx_kl | 2.3860484e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | 0.00167 | -| learning_rate | 0.0003 | -| loss | 0.00163 | -| n_updates | 15580 | -| policy_gradient_loss | 0.000409 | -| std | 0.853 | -| value_loss | 0.0054 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1560 | -| time_elapsed | 24306 | -| total_timesteps | 199680 | -| train/ | | -| approx_kl | 0.00084536197 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.000989 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 15590 | -| policy_gradient_loss | -0.000804 | -| std | 0.852 | -| value_loss | 0.00442 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1561 | -| time_elapsed | 24310 | -| total_timesteps | 199808 | -| train/ | | -| approx_kl | 0.000489824 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00179 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 15600 | -| policy_gradient_loss | 0.000732 | -| std | 0.85 | -| value_loss | 0.00367 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 8 | -| iterations | 1562 | -| time_elapsed | 24314 | -| total_timesteps | 199936 | -| train/ | | -| approx_kl | 0.006889051 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.00351 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 15610 | -| policy_gradient_loss | -0.00568 | -| std | 0.848 | -| value_loss | 0.00297 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1563 | -| time_elapsed | 24319 | -| total_timesteps | 200064 | -| train/ | | -| approx_kl | 5.2797142e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00512 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 15620 | -| policy_gradient_loss | 0.00238 | -| std | 0.848 | -| value_loss | 0.00248 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1564 | -| time_elapsed | 24327 | -| total_timesteps | 200192 | -| train/ | | -| approx_kl | 0.011257349 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 15630 | -| policy_gradient_loss | -0.00142 | -| std | 0.848 | -| value_loss | 0.0126 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1565 | -| time_elapsed | 24331 | -| total_timesteps | 200320 | -| train/ | | -| approx_kl | 0.0026440825 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00312 | -| learning_rate | 0.0003 | -| loss | 0.259 | -| n_updates | 15640 | -| policy_gradient_loss | -0.000572 | -| std | 0.846 | -| value_loss | 0.59 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1566 | -| time_elapsed | 24334 | -| total_timesteps | 200448 | -| train/ | | -| approx_kl | 0.0023139236 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.000191 | -| learning_rate | 0.0003 | -| loss | -0.000928 | -| n_updates | 15650 | -| policy_gradient_loss | -0.00289 | -| std | 0.843 | -| value_loss | 0.0114 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1567 | -| time_elapsed | 24338 | -| total_timesteps | 200576 | -| train/ | | -| approx_kl | 2.6648864e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.000561 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 15660 | -| policy_gradient_loss | 0.000835 | -| std | 0.841 | -| value_loss | 0.00657 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1568 | -| time_elapsed | 24342 | -| total_timesteps | 200704 | -| train/ | | -| approx_kl | 0.0108576175 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.000406 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 15670 | -| policy_gradient_loss | -0.00443 | -| std | 0.84 | -| value_loss | 0.00516 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1569 | -| time_elapsed | 24345 | -| total_timesteps | 200832 | -| train/ | | -| approx_kl | 0.00048043113 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.000628 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 15680 | -| policy_gradient_loss | -0.00027 | -| std | 0.84 | -| value_loss | 0.00469 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 8 | -| iterations | 1570 | -| time_elapsed | 24349 | -| total_timesteps | 200960 | -| train/ | | -| approx_kl | 0.009371413 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.00062 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 15690 | -| policy_gradient_loss | -0.00254 | -| std | 0.839 | -| value_loss | 0.00427 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1571 | -| time_elapsed | 24353 | -| total_timesteps | 201088 | -| train/ | | -| approx_kl | 0.0016142763 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.00105 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 15700 | -| policy_gradient_loss | -0.0014 | -| std | 0.839 | -| value_loss | 0.00366 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1572 | -| time_elapsed | 24360 | -| total_timesteps | 201216 | -| train/ | | -| approx_kl | 0.0064845434 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 15710 | -| policy_gradient_loss | -0.00583 | -| std | 0.84 | -| value_loss | 0.0183 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1573 | -| time_elapsed | 24364 | -| total_timesteps | 201344 | -| train/ | | -| approx_kl | 0.0013501165 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00229 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 15720 | -| policy_gradient_loss | -0.00156 | -| std | 0.843 | -| value_loss | 0.00277 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1574 | -| time_elapsed | 24368 | -| total_timesteps | 201472 | -| train/ | | -| approx_kl | 0.012383411 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00361 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 15730 | -| policy_gradient_loss | -0.00379 | -| std | 0.844 | -| value_loss | 0.00231 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1575 | -| time_elapsed | 24373 | -| total_timesteps | 201600 | -| train/ | | -| approx_kl | 0.00040089106 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00715 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 15740 | -| policy_gradient_loss | -0.000147 | -| std | 0.843 | -| value_loss | 0.00158 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1576 | -| time_elapsed | 24376 | -| total_timesteps | 201728 | -| train/ | | -| approx_kl | 0.002157793 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 15750 | -| policy_gradient_loss | -0.000235 | -| std | 0.842 | -| value_loss | 0.000975 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1577 | -| time_elapsed | 24381 | -| total_timesteps | 201856 | -| train/ | | -| approx_kl | 0.0067730267 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 15760 | -| policy_gradient_loss | -0.00863 | -| std | 0.841 | -| value_loss | 0.000681 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1578 | -| time_elapsed | 24384 | -| total_timesteps | 201984 | -| train/ | | -| approx_kl | 0.00480461 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | 0.00027 | -| n_updates | 15770 | -| policy_gradient_loss | -0.000139 | -| std | 0.841 | -| value_loss | 0.000432 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1579 | -| time_elapsed | 24388 | -| total_timesteps | 202112 | -| train/ | | -| approx_kl | 0.003953532 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 15780 | -| policy_gradient_loss | -0.00347 | -| std | 0.842 | -| value_loss | 0.00026 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1580 | -| time_elapsed | 24397 | -| total_timesteps | 202240 | -| train/ | | -| approx_kl | 0.008366566 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.18 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 15790 | -| policy_gradient_loss | -0.00311 | -| std | 0.843 | -| value_loss | 0.00198 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1581 | -| time_elapsed | 24400 | -| total_timesteps | 202368 | -| train/ | | -| approx_kl | 6.574718e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 15800 | -| policy_gradient_loss | -0.000354 | -| std | 0.849 | -| value_loss | 0.000125 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1582 | -| time_elapsed | 24404 | -| total_timesteps | 202496 | -| train/ | | -| approx_kl | 0.0063905837 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.00878 | -| n_updates | 15810 | -| policy_gradient_loss | -0.00402 | -| std | 0.853 | -| value_loss | 6.89e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1583 | -| time_elapsed | 24409 | -| total_timesteps | 202624 | -| train/ | | -| approx_kl | 0.011322587 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.00996 | -| n_updates | 15820 | -| policy_gradient_loss | -0.00737 | -| std | 0.854 | -| value_loss | 4.28e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1584 | -| time_elapsed | 24413 | -| total_timesteps | 202752 | -| train/ | | -| approx_kl | 0.008560495 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.006 | -| n_updates | 15830 | -| policy_gradient_loss | -0.0033 | -| std | 0.853 | -| value_loss | 2.67e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 8 | -| iterations | 1585 | -| time_elapsed | 24416 | -| total_timesteps | 202880 | -| train/ | | -| approx_kl | 0.00038900087 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 15840 | -| policy_gradient_loss | 0.000158 | -| std | 0.851 | -| value_loss | 2.17e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1586 | -| time_elapsed | 24420 | -| total_timesteps | 203008 | -| train/ | | -| approx_kl | 5.919207e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.26 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | -0.0003 | -| n_updates | 15850 | -| policy_gradient_loss | 0.000401 | -| std | 0.847 | -| value_loss | 1.01e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1587 | -| time_elapsed | 24430 | -| total_timesteps | 203136 | -| train/ | | -| approx_kl | 0.0022050883 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.639 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 15860 | -| policy_gradient_loss | -0.00234 | -| std | 0.845 | -| value_loss | 0.000587 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1588 | -| time_elapsed | 24434 | -| total_timesteps | 203264 | -| train/ | | -| approx_kl | 0.008350981 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 15870 | -| policy_gradient_loss | -0.00423 | -| std | 0.844 | -| value_loss | 6.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1589 | -| time_elapsed | 24438 | -| total_timesteps | 203392 | -| train/ | | -| approx_kl | 0.018536245 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | -0.0078 | -| n_updates | 15880 | -| policy_gradient_loss | -0.00914 | -| std | 0.844 | -| value_loss | 7.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1590 | -| time_elapsed | 24443 | -| total_timesteps | 203520 | -| train/ | | -| approx_kl | 0.0055628354 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 15890 | -| policy_gradient_loss | -0.00176 | -| std | 0.845 | -| value_loss | 4.04e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1591 | -| time_elapsed | 24447 | -| total_timesteps | 203648 | -| train/ | | -| approx_kl | 0.0016555237 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0906 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 15900 | -| policy_gradient_loss | -0.00101 | -| std | 0.847 | -| value_loss | 8.12e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1592 | -| time_elapsed | 24453 | -| total_timesteps | 203776 | -| train/ | | -| approx_kl | 0.009154547 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 15910 | -| policy_gradient_loss | -0.00228 | -| std | 0.847 | -| value_loss | 2.43e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1593 | -| time_elapsed | 24457 | -| total_timesteps | 203904 | -| train/ | | -| approx_kl | 0.0041088946 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | -0.00942 | -| n_updates | 15920 | -| policy_gradient_loss | -0.00375 | -| std | 0.846 | -| value_loss | 3.02e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1594 | -| time_elapsed | 24461 | -| total_timesteps | 204032 | -| train/ | | -| approx_kl | 1.1073425e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | -0.000137 | -| n_updates | 15930 | -| policy_gradient_loss | 0.00141 | -| std | 0.846 | -| value_loss | 1.07e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1595 | -| time_elapsed | 24472 | -| total_timesteps | 204160 | -| train/ | | -| approx_kl | 0.008201846 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.344 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 15940 | -| policy_gradient_loss | -0.0016 | -| std | 0.846 | -| value_loss | 0.00744 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1596 | -| time_elapsed | 24476 | -| total_timesteps | 204288 | -| train/ | | -| approx_kl | 0.010761648 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -55.8 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 15950 | -| policy_gradient_loss | -0.00652 | -| std | 0.846 | -| value_loss | 2.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1597 | -| time_elapsed | 24480 | -| total_timesteps | 204416 | -| train/ | | -| approx_kl | 4.350627e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -47.4 | -| learning_rate | 0.0003 | -| loss | 0.00177 | -| n_updates | 15960 | -| policy_gradient_loss | 0.00518 | -| std | 0.845 | -| value_loss | 1.33e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1598 | -| time_elapsed | 24483 | -| total_timesteps | 204544 | -| train/ | | -| approx_kl | 7.0949085e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -76.3 | -| learning_rate | 0.0003 | -| loss | 0.000227 | -| n_updates | 15970 | -| policy_gradient_loss | 0.000458 | -| std | 0.844 | -| value_loss | 8.59e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1599 | -| time_elapsed | 24487 | -| total_timesteps | 204672 | -| train/ | | -| approx_kl | 0.0025960328 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -18.3 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 15980 | -| policy_gradient_loss | -0.00523 | -| std | 0.842 | -| value_loss | 1.44e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1600 | -| time_elapsed | 24491 | -| total_timesteps | 204800 | -| train/ | | -| approx_kl | 0.009022632 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 15990 | -| policy_gradient_loss | -0.00204 | -| std | 0.841 | -| value_loss | 1.44e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 8 | -| iterations | 1601 | -| time_elapsed | 24496 | -| total_timesteps | 204928 | -| train/ | | -| approx_kl | 0.002908193 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.00513 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 16000 | -| policy_gradient_loss | -0.00076 | -| std | 0.84 | -| value_loss | 1.3e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1602 | -| time_elapsed | 24499 | -| total_timesteps | 205056 | -| train/ | | -| approx_kl | 0.0014731167 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.000614 | -| n_updates | 16010 | -| policy_gradient_loss | -0.000326 | -| std | 0.838 | -| value_loss | 5.91e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1603 | -| time_elapsed | 24507 | -| total_timesteps | 205184 | -| train/ | | -| approx_kl | 0.0008133589 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.509 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 16020 | -| policy_gradient_loss | -0.00285 | -| std | 0.837 | -| value_loss | 0.00255 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1604 | -| time_elapsed | 24510 | -| total_timesteps | 205312 | -| train/ | | -| approx_kl | 0.004557898 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -4 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 16030 | -| policy_gradient_loss | -0.00207 | -| std | 0.835 | -| value_loss | 1.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1605 | -| time_elapsed | 24515 | -| total_timesteps | 205440 | -| train/ | | -| approx_kl | 0.012495188 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.556 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 16040 | -| policy_gradient_loss | -0.00482 | -| std | 0.835 | -| value_loss | 4.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1606 | -| time_elapsed | 24519 | -| total_timesteps | 205568 | -| train/ | | -| approx_kl | 0.011723084 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0717 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 16050 | -| policy_gradient_loss | -0.00318 | -| std | 0.835 | -| value_loss | 1.26e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1607 | -| time_elapsed | 24523 | -| total_timesteps | 205696 | -| train/ | | -| approx_kl | 0.0032832613 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 16060 | -| policy_gradient_loss | -0.000634 | -| std | 0.834 | -| value_loss | 1.26e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1608 | -| time_elapsed | 24527 | -| total_timesteps | 205824 | -| train/ | | -| approx_kl | 0.007663021 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 16070 | -| policy_gradient_loss | -0.0023 | -| std | 0.835 | -| value_loss | 6.86e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1609 | -| time_elapsed | 24530 | -| total_timesteps | 205952 | -| train/ | | -| approx_kl | 0.016954582 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 16080 | -| policy_gradient_loss | -0.00935 | -| std | 0.836 | -| value_loss | 6.15e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1610 | -| time_elapsed | 24535 | -| total_timesteps | 206080 | -| train/ | | -| approx_kl | 0.00050363643 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 16090 | -| policy_gradient_loss | 0.00043 | -| std | 0.838 | -| value_loss | 2.37e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1611 | -| time_elapsed | 24542 | -| total_timesteps | 206208 | -| train/ | | -| approx_kl | 0.019452346 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.197 | -| learning_rate | 0.0003 | -| loss | 0.00461 | -| n_updates | 16100 | -| policy_gradient_loss | -0.00384 | -| std | 0.84 | -| value_loss | 0.0244 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1612 | -| time_elapsed | 24546 | -| total_timesteps | 206336 | -| train/ | | -| approx_kl | 2.1748245e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 16110 | -| policy_gradient_loss | 5.33e-05 | -| std | 0.84 | -| value_loss | 0.00535 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1613 | -| time_elapsed | 24550 | -| total_timesteps | 206464 | -| train/ | | -| approx_kl | 0.0048213317 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0024 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 16120 | -| policy_gradient_loss | -0.00286 | -| std | 0.84 | -| value_loss | 0.0042 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1614 | -| time_elapsed | 24555 | -| total_timesteps | 206592 | -| train/ | | -| approx_kl | 3.4174882e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00931 | -| learning_rate | 0.0003 | -| loss | 0.00186 | -| n_updates | 16130 | -| policy_gradient_loss | 0.00223 | -| std | 0.841 | -| value_loss | 0.00429 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1615 | -| time_elapsed | 24559 | -| total_timesteps | 206720 | -| train/ | | -| approx_kl | 0.00051549263 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 16140 | -| policy_gradient_loss | -1.03e-05 | -| std | 0.841 | -| value_loss | 0.00262 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1616 | -| time_elapsed | 24562 | -| total_timesteps | 206848 | -| train/ | | -| approx_kl | 0.010012926 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00189 | -| learning_rate | 0.0003 | -| loss | -0.00817 | -| n_updates | 16150 | -| policy_gradient_loss | -0.00728 | -| std | 0.842 | -| value_loss | 0.00194 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 8 | -| iterations | 1617 | -| time_elapsed | 24566 | -| total_timesteps | 206976 | -| train/ | | -| approx_kl | 0.00396542 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.00661 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 16160 | -| policy_gradient_loss | -0.00252 | -| std | 0.842 | -| value_loss | 0.00102 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1618 | -| time_elapsed | 24570 | -| total_timesteps | 207104 | -| train/ | | -| approx_kl | 0.00012382818 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.000726 | -| n_updates | 16170 | -| policy_gradient_loss | 0.000915 | -| std | 0.842 | -| value_loss | 0.000585 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1619 | -| time_elapsed | 24578 | -| total_timesteps | 207232 | -| train/ | | -| approx_kl | 0.002684609 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.0316 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 16180 | -| policy_gradient_loss | -0.00146 | -| std | 0.842 | -| value_loss | 0.0741 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1620 | -| time_elapsed | 24582 | -| total_timesteps | 207360 | -| train/ | | -| approx_kl | 4.514726e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 16190 | -| policy_gradient_loss | 0.000592 | -| std | 0.841 | -| value_loss | 0.00363 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1621 | -| time_elapsed | 24586 | -| total_timesteps | 207488 | -| train/ | | -| approx_kl | 0.016629465 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.00565 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 16200 | -| policy_gradient_loss | -0.0135 | -| std | 0.839 | -| value_loss | 0.00138 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1622 | -| time_elapsed | 24589 | -| total_timesteps | 207616 | -| train/ | | -| approx_kl | 0.012754086 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.00929 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 16210 | -| policy_gradient_loss | -0.00734 | -| std | 0.837 | -| value_loss | 0.000986 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1623 | -| time_elapsed | 24593 | -| total_timesteps | 207744 | -| train/ | | -| approx_kl | 0.0025458643 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.000743 | -| n_updates | 16220 | -| policy_gradient_loss | 0.00053 | -| std | 0.838 | -| value_loss | 0.000552 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 8 | -| iterations | 1624 | -| time_elapsed | 24597 | -| total_timesteps | 207872 | -| train/ | | -| approx_kl | 0.0047582495 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 16230 | -| policy_gradient_loss | -0.00639 | -| std | 0.84 | -| value_loss | 0.000368 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1625 | -| time_elapsed | 24601 | -| total_timesteps | 208000 | -| train/ | | -| approx_kl | 3.3590477e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.000437 | -| n_updates | 16240 | -| policy_gradient_loss | 0.00167 | -| std | 0.842 | -| value_loss | 0.000246 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1626 | -| time_elapsed | 24604 | -| total_timesteps | 208128 | -| train/ | | -| approx_kl | 0.011149326 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -1.25 | -| explained_variance | 0.00637 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 16250 | -| policy_gradient_loss | -0.00361 | -| std | 0.841 | -| value_loss | 0.00117 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1627 | -| time_elapsed | 24613 | -| total_timesteps | 208256 | -| train/ | | -| approx_kl | 0.004480107 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.359 | -| learning_rate | 0.0003 | -| loss | -0.00042 | -| n_updates | 16260 | -| policy_gradient_loss | -0.000998 | -| std | 0.839 | -| value_loss | 0.00355 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1628 | -| time_elapsed | 24617 | -| total_timesteps | 208384 | -| train/ | | -| approx_kl | 0.0015972974 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 16270 | -| policy_gradient_loss | -0.000923 | -| std | 0.838 | -| value_loss | 7.14e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1629 | -| time_elapsed | 24622 | -| total_timesteps | 208512 | -| train/ | | -| approx_kl | 0.010433238 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 16280 | -| policy_gradient_loss | -0.00305 | -| std | 0.84 | -| value_loss | 3.29e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1630 | -| time_elapsed | 24626 | -| total_timesteps | 208640 | -| train/ | | -| approx_kl | 0.0007668622 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.000363 | -| n_updates | 16290 | -| policy_gradient_loss | -0.000147 | -| std | 0.839 | -| value_loss | 1.64e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1631 | -| time_elapsed | 24630 | -| total_timesteps | 208768 | -| train/ | | -| approx_kl | 0.0014105286 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 16300 | -| policy_gradient_loss | -0.000651 | -| std | 0.837 | -| value_loss | 8.46e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1632 | -| time_elapsed | 24634 | -| total_timesteps | 208896 | -| train/ | | -| approx_kl | 0.0001298748 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.000975 | -| n_updates | 16310 | -| policy_gradient_loss | 0.000128 | -| std | 0.836 | -| value_loss | 5.36e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1633 | -| time_elapsed | 24638 | -| total_timesteps | 209024 | -| train/ | | -| approx_kl | 0.0017227684 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | -0.000374 | -| n_updates | 16320 | -| policy_gradient_loss | -0.000225 | -| std | 0.834 | -| value_loss | 2.88e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1634 | -| time_elapsed | 24647 | -| total_timesteps | 209152 | -| train/ | | -| approx_kl | 0.00022535585 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.24 | -| explained_variance | 0.338 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 16330 | -| policy_gradient_loss | -0.000937 | -| std | 0.832 | -| value_loss | 0.00835 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1635 | -| time_elapsed | 24650 | -| total_timesteps | 209280 | -| train/ | | -| approx_kl | 0.0019721766 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | 0.138 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 16340 | -| policy_gradient_loss | -0.000924 | -| std | 0.831 | -| value_loss | 5.84e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1636 | -| time_elapsed | 24652 | -| total_timesteps | 209408 | -| train/ | | -| approx_kl | 0.0005626478 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | -0.45 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 16350 | -| policy_gradient_loss | -0.000244 | -| std | 0.83 | -| value_loss | 1.59e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1637 | -| time_elapsed | 24656 | -| total_timesteps | 209536 | -| train/ | | -| approx_kl | 0.01347903 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | -0.443 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 16360 | -| policy_gradient_loss | -0.0078 | -| std | 0.83 | -| value_loss | 7.6e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1638 | -| time_elapsed | 24659 | -| total_timesteps | 209664 | -| train/ | | -| approx_kl | 9.131897e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.000845 | -| n_updates | 16370 | -| policy_gradient_loss | 0.000589 | -| std | 0.83 | -| value_loss | 5.48e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1639 | -| time_elapsed | 24663 | -| total_timesteps | 209792 | -| train/ | | -| approx_kl | 0.010154853 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 16380 | -| policy_gradient_loss | -0.00713 | -| std | 0.829 | -| value_loss | 3.08e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1640 | -| time_elapsed | 24667 | -| total_timesteps | 209920 | -| train/ | | -| approx_kl | 0.0003445819 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 16390 | -| policy_gradient_loss | 0.00023 | -| std | 0.827 | -| value_loss | 1.64e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1641 | -| time_elapsed | 24671 | -| total_timesteps | 210048 | -| train/ | | -| approx_kl | 0.010858305 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | -0.00826 | -| n_updates | 16400 | -| policy_gradient_loss | -0.0064 | -| std | 0.826 | -| value_loss | 1.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1642 | -| time_elapsed | 24678 | -| total_timesteps | 210176 | -| train/ | | -| approx_kl | 0.002971021 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.23 | -| explained_variance | 0.685 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 16410 | -| policy_gradient_loss | -0.000972 | -| std | 0.824 | -| value_loss | 0.00074 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1643 | -| time_elapsed | 24683 | -| total_timesteps | 210304 | -| train/ | | -| approx_kl | 4.1515566e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.877 | -| learning_rate | 0.0003 | -| loss | -0.000479 | -| n_updates | 16420 | -| policy_gradient_loss | -0.000136 | -| std | 0.822 | -| value_loss | 1.41e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1644 | -| time_elapsed | 24686 | -| total_timesteps | 210432 | -| train/ | | -| approx_kl | 0.0018192017 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 16430 | -| policy_gradient_loss | -0.00234 | -| std | 0.82 | -| value_loss | 1.44e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1645 | -| time_elapsed | 24689 | -| total_timesteps | 210560 | -| train/ | | -| approx_kl | 0.0072761616 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 16440 | -| policy_gradient_loss | -0.000965 | -| std | 0.821 | -| value_loss | 5.94e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1646 | -| time_elapsed | 24692 | -| total_timesteps | 210688 | -| train/ | | -| approx_kl | 0.0007961523 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 16450 | -| policy_gradient_loss | -0.000889 | -| std | 0.822 | -| value_loss | 6.11e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1647 | -| time_elapsed | 24696 | -| total_timesteps | 210816 | -| train/ | | -| approx_kl | 0.0041485275 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 16460 | -| policy_gradient_loss | -0.000835 | -| std | 0.82 | -| value_loss | 2.36e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1648 | -| time_elapsed | 24700 | -| total_timesteps | 210944 | -| train/ | | -| approx_kl | 0.0015492388 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 16470 | -| policy_gradient_loss | -0.000818 | -| std | 0.817 | -| value_loss | 1.91e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1649 | -| time_elapsed | 24705 | -| total_timesteps | 211072 | -| train/ | | -| approx_kl | 0.007897049 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.22 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | -0.00783 | -| n_updates | 16480 | -| policy_gradient_loss | -0.00424 | -| std | 0.814 | -| value_loss | 6.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1650 | -| time_elapsed | 24711 | -| total_timesteps | 211200 | -| train/ | | -| approx_kl | 0.009132633 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | 0.302 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 16490 | -| policy_gradient_loss | -0.0117 | -| std | 0.811 | -| value_loss | 0.015 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1651 | -| time_elapsed | 24716 | -| total_timesteps | 211328 | -| train/ | | -| approx_kl | 0.00013815239 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.571 | -| learning_rate | 0.0003 | -| loss | -0.000331 | -| n_updates | 16500 | -| policy_gradient_loss | -0.000167 | -| std | 0.809 | -| value_loss | 2.81e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1652 | -| time_elapsed | 24719 | -| total_timesteps | 211456 | -| train/ | | -| approx_kl | 0.004218172 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.558 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 16510 | -| policy_gradient_loss | -0.00305 | -| std | 0.807 | -| value_loss | 2.69e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1653 | -| time_elapsed | 24723 | -| total_timesteps | 211584 | -| train/ | | -| approx_kl | 1.7909333e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.368 | -| learning_rate | 0.0003 | -| loss | 0.000255 | -| n_updates | 16520 | -| policy_gradient_loss | 0.0021 | -| std | 0.806 | -| value_loss | 1.07e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1654 | -| time_elapsed | 24727 | -| total_timesteps | 211712 | -| train/ | | -| approx_kl | 0.00038678572 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.336 | -| learning_rate | 0.0003 | -| loss | 0.000499 | -| n_updates | 16530 | -| policy_gradient_loss | 0.000468 | -| std | 0.805 | -| value_loss | 6.17e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1655 | -| time_elapsed | 24731 | -| total_timesteps | 211840 | -| train/ | | -| approx_kl | 0.0031531574 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 16540 | -| policy_gradient_loss | -0.00409 | -| std | 0.804 | -| value_loss | 5.85e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 8 | -| iterations | 1656 | -| time_elapsed | 24736 | -| total_timesteps | 211968 | -| train/ | | -| approx_kl | 2.9797666e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.000417 | -| n_updates | 16550 | -| policy_gradient_loss | 0.00197 | -| std | 0.803 | -| value_loss | 2.31e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1657 | -| time_elapsed | 24740 | -| total_timesteps | 212096 | -| train/ | | -| approx_kl | 0.0024080877 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.28 | -| learning_rate | 0.0003 | -| loss | -0.000254 | -| n_updates | 16560 | -| policy_gradient_loss | -0.000106 | -| std | 0.803 | -| value_loss | 1.39e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1658 | -| time_elapsed | 24748 | -| total_timesteps | 212224 | -| train/ | | -| approx_kl | 0.008500013 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | 0.466 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 16570 | -| policy_gradient_loss | -0.0149 | -| std | 0.805 | -| value_loss | 0.00329 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1659 | -| time_elapsed | 24752 | -| total_timesteps | 212352 | -| train/ | | -| approx_kl | 0.0015951595 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | 0.00932 | -| learning_rate | 0.0003 | -| loss | -0.000631 | -| n_updates | 16580 | -| policy_gradient_loss | -0.00101 | -| std | 0.806 | -| value_loss | 0.00554 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1660 | -| time_elapsed | 24757 | -| total_timesteps | 212480 | -| train/ | | -| approx_kl | 0.0113786515 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.414 | -| learning_rate | 0.0003 | -| loss | -0.00911 | -| n_updates | 16590 | -| policy_gradient_loss | -0.00676 | -| std | 0.807 | -| value_loss | 0.000133 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1661 | -| time_elapsed | 24761 | -| total_timesteps | 212608 | -| train/ | | -| approx_kl | 0.00123592 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 1.75e-05 | -| n_updates | 16600 | -| policy_gradient_loss | -2.75e-05 | -| std | 0.807 | -| value_loss | 0.000111 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1662 | -| time_elapsed | 24766 | -| total_timesteps | 212736 | -| train/ | | -| approx_kl | 6.170012e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | 1.5e-05 | -| n_updates | 16610 | -| policy_gradient_loss | 2.63e-05 | -| std | 0.806 | -| value_loss | 7.31e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1663 | -| time_elapsed | 24770 | -| total_timesteps | 212864 | -| train/ | | -| approx_kl | 0.0036744121 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 16620 | -| policy_gradient_loss | -0.00547 | -| std | 0.806 | -| value_loss | 3.97e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 8 | -| iterations | 1664 | -| time_elapsed | 24774 | -| total_timesteps | 212992 | -| train/ | | -| approx_kl | 4.2091124e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00029 | -| n_updates | 16630 | -| policy_gradient_loss | 0.00166 | -| std | 0.805 | -| value_loss | 2.3e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1665 | -| time_elapsed | 24777 | -| total_timesteps | 213120 | -| train/ | | -| approx_kl | 0.009220261 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 16640 | -| policy_gradient_loss | -0.00391 | -| std | 0.806 | -| value_loss | 1.52e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1666 | -| time_elapsed | 24788 | -| total_timesteps | 213248 | -| train/ | | -| approx_kl | 0.001403023 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | 0.372 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 16650 | -| policy_gradient_loss | -0.00767 | -| std | 0.809 | -| value_loss | 0.00669 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1667 | -| time_elapsed | 24792 | -| total_timesteps | 213376 | -| train/ | | -| approx_kl | 0.004807468 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.0887 | -| learning_rate | 0.0003 | -| loss | -0.00784 | -| n_updates | 16660 | -| policy_gradient_loss | -0.00358 | -| std | 0.812 | -| value_loss | 2.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1668 | -| time_elapsed | 24797 | -| total_timesteps | 213504 | -| train/ | | -| approx_kl | 3.879424e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.272 | -| learning_rate | 0.0003 | -| loss | 0.000129 | -| n_updates | 16670 | -| policy_gradient_loss | 0.000801 | -| std | 0.811 | -| value_loss | 1.97e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1669 | -| time_elapsed | 24800 | -| total_timesteps | 213632 | -| train/ | | -| approx_kl | 0.00050111767 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.007 | -| learning_rate | 0.0003 | -| loss | 2.8e-05 | -| n_updates | 16680 | -| policy_gradient_loss | 3.41e-05 | -| std | 0.809 | -| value_loss | 0.000241 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1670 | -| time_elapsed | 24804 | -| total_timesteps | 213760 | -| train/ | | -| approx_kl | 0.0039288737 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.00763 | -| n_updates | 16690 | -| policy_gradient_loss | -0.00309 | -| std | 0.807 | -| value_loss | 0.000517 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 8 | -| iterations | 1671 | -| time_elapsed | 24809 | -| total_timesteps | 213888 | -| train/ | | -| approx_kl | 2.0214356e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.0499 | -| learning_rate | 0.0003 | -| loss | 0.000476 | -| n_updates | 16700 | -| policy_gradient_loss | 0.00369 | -| std | 0.806 | -| value_loss | 0.000161 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1672 | -| time_elapsed | 24815 | -| total_timesteps | 214016 | -| train/ | | -| approx_kl | 0.00019706693 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.000903 | -| n_updates | 16710 | -| policy_gradient_loss | 0.000182 | -| std | 0.806 | -| value_loss | 5.47e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1673 | -| time_elapsed | 24826 | -| total_timesteps | 214144 | -| train/ | | -| approx_kl | 0.008947482 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | 0.283 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 16720 | -| policy_gradient_loss | -0.0136 | -| std | 0.807 | -| value_loss | 0.0109 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1674 | -| time_elapsed | 24831 | -| total_timesteps | 214272 | -| train/ | | -| approx_kl | 0.0069337282 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | 0.0173 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 16730 | -| policy_gradient_loss | -0.004 | -| std | 0.808 | -| value_loss | 0.0133 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1675 | -| time_elapsed | 24835 | -| total_timesteps | 214400 | -| train/ | | -| approx_kl | 1.473492e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.0007 | -| n_updates | 16740 | -| policy_gradient_loss | 0.00239 | -| std | 0.809 | -| value_loss | 0.000718 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1676 | -| time_elapsed | 24840 | -| total_timesteps | 214528 | -| train/ | | -| approx_kl | 0.00033290405 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -3.18e-05 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 16750 | -| policy_gradient_loss | 0.000121 | -| std | 0.809 | -| value_loss | 0.000227 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1677 | -| time_elapsed | 24844 | -| total_timesteps | 214656 | -| train/ | | -| approx_kl | 0.011540328 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.026 | -| n_updates | 16760 | -| policy_gradient_loss | -0.0143 | -| std | 0.809 | -| value_loss | 0.000136 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1678 | -| time_elapsed | 24848 | -| total_timesteps | 214784 | -| train/ | | -| approx_kl | 0.014309282 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -1.21 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 16770 | -| policy_gradient_loss | -0.00725 | -| std | 0.808 | -| value_loss | 9.14e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.8 | -| time/ | | -| fps | 8 | -| iterations | 1679 | -| time_elapsed | 24851 | -| total_timesteps | 214912 | -| train/ | | -| approx_kl | 0.0070510427 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.00667 | -| n_updates | 16780 | -| policy_gradient_loss | -0.00351 | -| std | 0.807 | -| value_loss | 6.15e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1680 | -| time_elapsed | 24855 | -| total_timesteps | 215040 | -| train/ | | -| approx_kl | 0.003283 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.000152 | -| n_updates | 16790 | -| policy_gradient_loss | -0.000107 | -| std | 0.806 | -| value_loss | 4.15e-05 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1681 | -| time_elapsed | 24864 | -| total_timesteps | 215168 | -| train/ | | -| approx_kl | 0.00064827036 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | 0.316 | -| learning_rate | 0.0003 | -| loss | 0.00156 | -| n_updates | 16800 | -| policy_gradient_loss | -0.00105 | -| std | 0.804 | -| value_loss | 0.00757 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1682 | -| time_elapsed | 24869 | -| total_timesteps | 215296 | -| train/ | | -| approx_kl | 0.0037534046 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 16810 | -| policy_gradient_loss | -0.00203 | -| std | 0.802 | -| value_loss | 1.23e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1683 | -| time_elapsed | 24871 | -| total_timesteps | 215424 | -| train/ | | -| approx_kl | 5.5823475e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | -0.000652 | -| n_updates | 16820 | -| policy_gradient_loss | 0.00284 | -| std | 0.801 | -| value_loss | 4.49e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1684 | -| time_elapsed | 24875 | -| total_timesteps | 215552 | -| train/ | | -| approx_kl | 0.000405021 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 16830 | -| policy_gradient_loss | 0.000117 | -| std | 0.8 | -| value_loss | 2.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1685 | -| time_elapsed | 24879 | -| total_timesteps | 215680 | -| train/ | | -| approx_kl | 0.008742505 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 16840 | -| policy_gradient_loss | -0.00144 | -| std | 0.801 | -| value_loss | 1.59e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1686 | -| time_elapsed | 24882 | -| total_timesteps | 215808 | -| train/ | | -| approx_kl | 9.828387e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.000223 | -| n_updates | 16850 | -| policy_gradient_loss | -5.32e-05 | -| std | 0.8 | -| value_loss | 1.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1687 | -| time_elapsed | 24887 | -| total_timesteps | 215936 | -| train/ | | -| approx_kl | 0.0046276036 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 16860 | -| policy_gradient_loss | -0.00418 | -| std | 0.8 | -| value_loss | 7.86e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1688 | -| time_elapsed | 24892 | -| total_timesteps | 216064 | -| train/ | | -| approx_kl | 1.5218742e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.2 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.000442 | -| n_updates | 16870 | -| policy_gradient_loss | 0.00134 | -| std | 0.799 | -| value_loss | 3.89e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1689 | -| time_elapsed | 24899 | -| total_timesteps | 216192 | -| train/ | | -| approx_kl | 0.003223498 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | 0.561 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 16880 | -| policy_gradient_loss | -0.00575 | -| std | 0.798 | -| value_loss | 0.00237 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1690 | -| time_elapsed | 24903 | -| total_timesteps | 216320 | -| train/ | | -| approx_kl | 7.47242e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -5.73 | -| learning_rate | 0.0003 | -| loss | 0.00023 | -| n_updates | 16890 | -| policy_gradient_loss | 0.000228 | -| std | 0.798 | -| value_loss | 2.62e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1691 | -| time_elapsed | 24907 | -| total_timesteps | 216448 | -| train/ | | -| approx_kl | 3.9326493e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -6.18 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 16900 | -| policy_gradient_loss | -1.29e-05 | -| std | 0.798 | -| value_loss | 1.12e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1692 | -| time_elapsed | 24911 | -| total_timesteps | 216576 | -| train/ | | -| approx_kl | 0.0047067846 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.00983 | -| n_updates | 16910 | -| policy_gradient_loss | -0.00356 | -| std | 0.796 | -| value_loss | 5.07e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1693 | -| time_elapsed | 24915 | -| total_timesteps | 216704 | -| train/ | | -| approx_kl | 6.2603503e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -0.638 | -| learning_rate | 0.0003 | -| loss | -0.000277 | -| n_updates | 16920 | -| policy_gradient_loss | 0.00139 | -| std | 0.795 | -| value_loss | 1.89e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1694 | -| time_elapsed | 24919 | -| total_timesteps | 216832 | -| train/ | | -| approx_kl | 0.012542253 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -0.335 | -| learning_rate | 0.0003 | -| loss | -0.00736 | -| n_updates | 16930 | -| policy_gradient_loss | -0.00461 | -| std | 0.795 | -| value_loss | 1.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1695 | -| time_elapsed | 24923 | -| total_timesteps | 216960 | -| train/ | | -| approx_kl | 0.017443912 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | -0.00882 | -| n_updates | 16940 | -| policy_gradient_loss | -0.0062 | -| std | 0.795 | -| value_loss | 5.85e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1696 | -| time_elapsed | 24927 | -| total_timesteps | 217088 | -| train/ | | -| approx_kl | 0.01674723 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 16950 | -| policy_gradient_loss | -0.00867 | -| std | 0.795 | -| value_loss | 3.4e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1697 | -| time_elapsed | 24936 | -| total_timesteps | 217216 | -| train/ | | -| approx_kl | 0.0016605803 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | 0.332 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 16960 | -| policy_gradient_loss | -0.0057 | -| std | 0.795 | -| value_loss | 0.015 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1698 | -| time_elapsed | 24940 | -| total_timesteps | 217344 | -| train/ | | -| approx_kl | 0.0049111242 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -16.3 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 16970 | -| policy_gradient_loss | -0.00141 | -| std | 0.795 | -| value_loss | 1.38e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1699 | -| time_elapsed | 24943 | -| total_timesteps | 217472 | -| train/ | | -| approx_kl | 0.0015497007 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -19.8 | -| learning_rate | 0.0003 | -| loss | -0.00717 | -| n_updates | 16980 | -| policy_gradient_loss | -0.000909 | -| std | 0.793 | -| value_loss | 1.01e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1700 | -| time_elapsed | 24946 | -| total_timesteps | 217600 | -| train/ | | -| approx_kl | 0.007386889 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -5.44 | -| learning_rate | 0.0003 | -| loss | -4.56e-05 | -| n_updates | 16990 | -| policy_gradient_loss | -0.000324 | -| std | 0.792 | -| value_loss | 1.73e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1701 | -| time_elapsed | 24948 | -| total_timesteps | 217728 | -| train/ | | -| approx_kl | 0.0058529247 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.19 | -| explained_variance | -0.733 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 17000 | -| policy_gradient_loss | -0.00285 | -| std | 0.791 | -| value_loss | 1.03e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1702 | -| time_elapsed | 24951 | -| total_timesteps | 217856 | -| train/ | | -| approx_kl | 5.3779688e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -0.817 | -| learning_rate | 0.0003 | -| loss | 0.000214 | -| n_updates | 17010 | -| policy_gradient_loss | 0.00107 | -| std | 0.789 | -| value_loss | 3.04e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1703 | -| time_elapsed | 24954 | -| total_timesteps | 217984 | -| train/ | | -| approx_kl | 0.0012596054 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 17020 | -| policy_gradient_loss | -0.000522 | -| std | 0.789 | -| value_loss | 3.04e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1704 | -| time_elapsed | 24958 | -| total_timesteps | 218112 | -| train/ | | -| approx_kl | 0.01664973 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 17030 | -| policy_gradient_loss | -0.00582 | -| std | 0.789 | -| value_loss | 9.37e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1705 | -| time_elapsed | 24969 | -| total_timesteps | 218240 | -| train/ | | -| approx_kl | 0.0015076413 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | 0.483 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 17040 | -| policy_gradient_loss | -0.0118 | -| std | 0.789 | -| value_loss | 0.00567 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1706 | -| time_elapsed | 24972 | -| total_timesteps | 218368 | -| train/ | | -| approx_kl | 0.0056477813 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -48 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 17050 | -| policy_gradient_loss | -0.00177 | -| std | 0.789 | -| value_loss | 3.36e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1707 | -| time_elapsed | 24976 | -| total_timesteps | 218496 | -| train/ | | -| approx_kl | 3.639469e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -52 | -| learning_rate | 0.0003 | -| loss | -0.000305 | -| n_updates | 17060 | -| policy_gradient_loss | 0.000531 | -| std | 0.789 | -| value_loss | 1.48e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1708 | -| time_elapsed | 24980 | -| total_timesteps | 218624 | -| train/ | | -| approx_kl | 0.009791672 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -30.4 | -| learning_rate | 0.0003 | -| loss | -0.00866 | -| n_updates | 17070 | -| policy_gradient_loss | -0.00743 | -| std | 0.788 | -| value_loss | 2.46e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1709 | -| time_elapsed | 24984 | -| total_timesteps | 218752 | -| train/ | | -| approx_kl | 0.0100849075 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 17080 | -| policy_gradient_loss | -0.0059 | -| std | 0.787 | -| value_loss | 4.19e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1710 | -| time_elapsed | 24989 | -| total_timesteps | 218880 | -| train/ | | -| approx_kl | 0.0012443815 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -3.45 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 17090 | -| policy_gradient_loss | 0.00144 | -| std | 0.787 | -| value_loss | 9.24e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1711 | -| time_elapsed | 24993 | -| total_timesteps | 219008 | -| train/ | | -| approx_kl | 0.018141147 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 17100 | -| policy_gradient_loss | -0.0101 | -| std | 0.787 | -| value_loss | 4.79e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1712 | -| time_elapsed | 25003 | -| total_timesteps | 219136 | -| train/ | | -| approx_kl | 0.0019328566 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | 0.402 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 17110 | -| policy_gradient_loss | -0.00731 | -| std | 0.786 | -| value_loss | 0.0124 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1713 | -| time_elapsed | 25008 | -| total_timesteps | 219264 | -| train/ | | -| approx_kl | 0.009087348 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -56.6 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 17120 | -| policy_gradient_loss | -0.00474 | -| std | 0.785 | -| value_loss | 1.74e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1714 | -| time_elapsed | 25013 | -| total_timesteps | 219392 | -| train/ | | -| approx_kl | 0.017470252 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -27.2 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 17130 | -| policy_gradient_loss | -0.00543 | -| std | 0.785 | -| value_loss | 2.68e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1715 | -| time_elapsed | 25016 | -| total_timesteps | 219520 | -| train/ | | -| approx_kl | 0.0015292931 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -33.4 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 17140 | -| policy_gradient_loss | -0.000682 | -| std | 0.784 | -| value_loss | 1.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1716 | -| time_elapsed | 25019 | -| total_timesteps | 219648 | -| train/ | | -| approx_kl | 0.012427088 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -1.18 | -| explained_variance | -4.08 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 17150 | -| policy_gradient_loss | -0.00577 | -| std | 0.783 | -| value_loss | 3.24e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1717 | -| time_elapsed | 25022 | -| total_timesteps | 219776 | -| train/ | | -| approx_kl | 0.00020237407 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -1.76 | -| learning_rate | 0.0003 | -| loss | -0.000308 | -| n_updates | 17160 | -| policy_gradient_loss | -0.000112 | -| std | 0.781 | -| value_loss | 5.95e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1718 | -| time_elapsed | 25026 | -| total_timesteps | 219904 | -| train/ | | -| approx_kl | 0.009831164 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00823 | -| n_updates | 17170 | -| policy_gradient_loss | -0.0044 | -| std | 0.78 | -| value_loss | 5.28e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1719 | -| time_elapsed | 25029 | -| total_timesteps | 220032 | -| train/ | | -| approx_kl | 0.0009951317 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 17180 | -| policy_gradient_loss | -7.51e-05 | -| std | 0.779 | -| value_loss | 3.52e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1720 | -| time_elapsed | 25037 | -| total_timesteps | 220160 | -| train/ | | -| approx_kl | 0.026284274 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | 0.626 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 17190 | -| policy_gradient_loss | -0.0148 | -| std | 0.779 | -| value_loss | 0.00232 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1721 | -| time_elapsed | 25041 | -| total_timesteps | 220288 | -| train/ | | -| approx_kl | 0.014514927 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 17200 | -| policy_gradient_loss | -0.00317 | -| std | 0.778 | -| value_loss | 2.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1722 | -| time_elapsed | 25046 | -| total_timesteps | 220416 | -| train/ | | -| approx_kl | 0.005080797 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -2.26 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 17210 | -| policy_gradient_loss | -0.00158 | -| std | 0.776 | -| value_loss | 4.07e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1723 | -| time_elapsed | 25051 | -| total_timesteps | 220544 | -| train/ | | -| approx_kl | 0.00067886943 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.0209 | -| learning_rate | 0.0003 | -| loss | -0.00374 | -| n_updates | 17220 | -| policy_gradient_loss | 8.71e-05 | -| std | 0.775 | -| value_loss | 3.7e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1724 | -| time_elapsed | 25056 | -| total_timesteps | 220672 | -| train/ | | -| approx_kl | 0.013216269 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.335 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 17230 | -| policy_gradient_loss | -0.00553 | -| std | 0.774 | -| value_loss | 1.03e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1725 | -| time_elapsed | 25061 | -| total_timesteps | 220800 | -| train/ | | -| approx_kl | 0.0046863793 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 17240 | -| policy_gradient_loss | -0.00159 | -| std | 0.773 | -| value_loss | 7.7e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1726 | -| time_elapsed | 25066 | -| total_timesteps | 220928 | -| train/ | | -| approx_kl | 0.017181912 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 17250 | -| policy_gradient_loss | -0.0093 | -| std | 0.771 | -| value_loss | 1.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1727 | -| time_elapsed | 25070 | -| total_timesteps | 221056 | -| train/ | | -| approx_kl | 0.00875853 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.697 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 17260 | -| policy_gradient_loss | -0.00675 | -| std | 0.77 | -| value_loss | 3.51e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1728 | -| time_elapsed | 25077 | -| total_timesteps | 221184 | -| train/ | | -| approx_kl | 0.0015426236 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.441 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 17270 | -| policy_gradient_loss | -0.0148 | -| std | 0.77 | -| value_loss | 0.0104 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1729 | -| time_elapsed | 25082 | -| total_timesteps | 221312 | -| train/ | | -| approx_kl | 0.0063370513 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -42 | -| learning_rate | 0.0003 | -| loss | -0.00916 | -| n_updates | 17280 | -| policy_gradient_loss | -0.00404 | -| std | 0.77 | -| value_loss | 2.78e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1730 | -| time_elapsed | 25086 | -| total_timesteps | 221440 | -| train/ | | -| approx_kl | 0.0030551162 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -38.9 | -| learning_rate | 0.0003 | -| loss | 0.000859 | -| n_updates | 17290 | -| policy_gradient_loss | 0.000509 | -| std | 0.77 | -| value_loss | 8.96e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1731 | -| time_elapsed | 25091 | -| total_timesteps | 221568 | -| train/ | | -| approx_kl | 0.00709591 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -34.6 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 17300 | -| policy_gradient_loss | -0.00377 | -| std | 0.77 | -| value_loss | 1.67e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1732 | -| time_elapsed | 25094 | -| total_timesteps | 221696 | -| train/ | | -| approx_kl | 0.0140430555 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -36.6 | -| learning_rate | 0.0003 | -| loss | -0.031 | -| n_updates | 17310 | -| policy_gradient_loss | -0.0168 | -| std | 0.77 | -| value_loss | 7.25e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1733 | -| time_elapsed | 25099 | -| total_timesteps | 221824 | -| train/ | | -| approx_kl | 3.2256357e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 17320 | -| policy_gradient_loss | 0.00443 | -| std | 0.769 | -| value_loss | 5.1e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1734 | -| time_elapsed | 25102 | -| total_timesteps | 221952 | -| train/ | | -| approx_kl | 0.004751142 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -3.44 | -| learning_rate | 0.0003 | -| loss | -0.000882 | -| n_updates | 17330 | -| policy_gradient_loss | -0.000516 | -| std | 0.768 | -| value_loss | 1.05e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1735 | -| time_elapsed | 25107 | -| total_timesteps | 222080 | -| train/ | | -| approx_kl | 0.0030217464 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 17340 | -| policy_gradient_loss | -0.00119 | -| std | 0.766 | -| value_loss | 5.06e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1736 | -| time_elapsed | 25114 | -| total_timesteps | 222208 | -| train/ | | -| approx_kl | 0.009877836 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.774 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 17350 | -| policy_gradient_loss | -0.0071 | -| std | 0.764 | -| value_loss | 0.000802 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1737 | -| time_elapsed | 25117 | -| total_timesteps | 222336 | -| train/ | | -| approx_kl | 0.009220706 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 17360 | -| policy_gradient_loss | -0.0036 | -| std | 0.765 | -| value_loss | 2.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1738 | -| time_elapsed | 25121 | -| total_timesteps | 222464 | -| train/ | | -| approx_kl | 0.001515423 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.774 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 17370 | -| policy_gradient_loss | 0.000828 | -| std | 0.765 | -| value_loss | 2.29e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1739 | -| time_elapsed | 25126 | -| total_timesteps | 222592 | -| train/ | | -| approx_kl | 0.0066481824 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 17380 | -| policy_gradient_loss | -0.00297 | -| std | 0.765 | -| value_loss | 1.32e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1740 | -| time_elapsed | 25130 | -| total_timesteps | 222720 | -| train/ | | -| approx_kl | 0.0029355376 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.000338 | -| n_updates | 17390 | -| policy_gradient_loss | -7.87e-05 | -| std | 0.768 | -| value_loss | 1.19e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1741 | -| time_elapsed | 25134 | -| total_timesteps | 222848 | -| train/ | | -| approx_kl | 0.0074759005 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 17400 | -| policy_gradient_loss | -0.00249 | -| std | 0.77 | -| value_loss | 1.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1742 | -| time_elapsed | 25139 | -| total_timesteps | 222976 | -| train/ | | -| approx_kl | 0.013932832 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0909 | -| learning_rate | 0.0003 | -| loss | -0.00896 | -| n_updates | 17410 | -| policy_gradient_loss | -0.0057 | -| std | 0.772 | -| value_loss | 9.3e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1743 | -| time_elapsed | 25144 | -| total_timesteps | 223104 | -| train/ | | -| approx_kl | 0.00069690123 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 17420 | -| policy_gradient_loss | 7.59e-05 | -| std | 0.773 | -| value_loss | 6.39e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1744 | -| time_elapsed | 25153 | -| total_timesteps | 223232 | -| train/ | | -| approx_kl | 0.012538051 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.519 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 17430 | -| policy_gradient_loss | -0.0155 | -| std | 0.773 | -| value_loss | 0.00756 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1745 | -| time_elapsed | 25156 | -| total_timesteps | 223360 | -| train/ | | -| approx_kl | 0.00062091835 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -36.4 | -| learning_rate | 0.0003 | -| loss | -0.00345 | -| n_updates | 17440 | -| policy_gradient_loss | -0.000111 | -| std | 0.773 | -| value_loss | 2.47e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1746 | -| time_elapsed | 25160 | -| total_timesteps | 223488 | -| train/ | | -| approx_kl | 0.02492643 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -33.3 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 17450 | -| policy_gradient_loss | -0.012 | -| std | 0.773 | -| value_loss | 7.36e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1747 | -| time_elapsed | 25162 | -| total_timesteps | 223616 | -| train/ | | -| approx_kl | 0.025246745 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -30.6 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 17460 | -| policy_gradient_loss | -0.00751 | -| std | 0.774 | -| value_loss | 8.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1748 | -| time_elapsed | 25165 | -| total_timesteps | 223744 | -| train/ | | -| approx_kl | 0.019319635 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -9.83 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 17470 | -| policy_gradient_loss | -0.00662 | -| std | 0.774 | -| value_loss | 9.11e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.81 | -| time/ | | -| fps | 8 | -| iterations | 1749 | -| time_elapsed | 25168 | -| total_timesteps | 223872 | -| train/ | | -| approx_kl | 0.014148639 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 17480 | -| policy_gradient_loss | -0.00821 | -| std | 0.774 | -| value_loss | 3.77e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1750 | -| time_elapsed | 25171 | -| total_timesteps | 224000 | -| train/ | | -| approx_kl | 0.013460407 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 17490 | -| policy_gradient_loss | -0.00703 | -| std | 0.774 | -| value_loss | 8.12e-10 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1751 | -| time_elapsed | 25175 | -| total_timesteps | 224128 | -| train/ | | -| approx_kl | 0.000103070866 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 17500 | -| policy_gradient_loss | 0.000677 | -| std | 0.773 | -| value_loss | 3.36e-09 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1752 | -| time_elapsed | 25183 | -| total_timesteps | 224256 | -| train/ | | -| approx_kl | 0.0135946665 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00513 | -| learning_rate | 0.0003 | -| loss | 0.0915 | -| n_updates | 17510 | -| policy_gradient_loss | -0.00298 | -| std | 0.771 | -| value_loss | 0.307 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1753 | -| time_elapsed | 25187 | -| total_timesteps | 224384 | -| train/ | | -| approx_kl | 0.001069962 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.00396 | -| n_updates | 17520 | -| policy_gradient_loss | -0.000136 | -| std | 0.77 | -| value_loss | 0.0096 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1754 | -| time_elapsed | 25190 | -| total_timesteps | 224512 | -| train/ | | -| approx_kl | 0.0052624955 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.000923 | -| learning_rate | 0.0003 | -| loss | 0.633 | -| n_updates | 17530 | -| policy_gradient_loss | -0.00465 | -| std | 0.77 | -| value_loss | 1.46 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1755 | -| time_elapsed | 25195 | -| total_timesteps | 224640 | -| train/ | | -| approx_kl | 0.010730758 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.0126 | -| learning_rate | 0.0003 | -| loss | 0.00571 | -| n_updates | 17540 | -| policy_gradient_loss | -0.00195 | -| std | 0.77 | -| value_loss | 0.0275 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1756 | -| time_elapsed | 25199 | -| total_timesteps | 224768 | -| train/ | | -| approx_kl | 0.007647923 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.000469 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 17550 | -| policy_gradient_loss | -0.00342 | -| std | 0.77 | -| value_loss | 0.448 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.82 | -| time/ | | -| fps | 8 | -| iterations | 1757 | -| time_elapsed | 25203 | -| total_timesteps | 224896 | -| train/ | | -| approx_kl | 0.0013961485 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.00105 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 17560 | -| policy_gradient_loss | -0.000838 | -| std | 0.771 | -| value_loss | 0.0476 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1758 | -| time_elapsed | 25208 | -| total_timesteps | 225024 | -| train/ | | -| approx_kl | 0.008304274 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.00246 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 17570 | -| policy_gradient_loss | -0.00082 | -| std | 0.77 | -| value_loss | 0.0294 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1759 | -| time_elapsed | 25216 | -| total_timesteps | 225152 | -| train/ | | -| approx_kl | 0.0023413259 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 17580 | -| policy_gradient_loss | -0.00241 | -| std | 0.769 | -| value_loss | 0.0958 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1760 | -| time_elapsed | 25222 | -| total_timesteps | 225280 | -| train/ | | -| approx_kl | 0.0018069018 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.000704 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 17590 | -| policy_gradient_loss | 0.000158 | -| std | 0.769 | -| value_loss | 0.25 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1761 | -| time_elapsed | 25225 | -| total_timesteps | 225408 | -| train/ | | -| approx_kl | 0.0039928597 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.00283 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 17600 | -| policy_gradient_loss | -0.00265 | -| std | 0.771 | -| value_loss | 0.0583 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1762 | -| time_elapsed | 25228 | -| total_timesteps | 225536 | -| train/ | | -| approx_kl | 0.002331268 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.00191 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 17610 | -| policy_gradient_loss | -0.000813 | -| std | 0.773 | -| value_loss | 0.267 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1763 | -| time_elapsed | 25230 | -| total_timesteps | 225664 | -| train/ | | -| approx_kl | 0.012177491 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 17620 | -| policy_gradient_loss | -0.00257 | -| std | 0.775 | -| value_loss | 0.0818 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1764 | -| time_elapsed | 25234 | -| total_timesteps | 225792 | -| train/ | | -| approx_kl | 0.0077504893 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.000718 | -| learning_rate | 0.0003 | -| loss | 0.0792 | -| n_updates | 17630 | -| policy_gradient_loss | -0.00195 | -| std | 0.774 | -| value_loss | 0.162 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.06 | -| time/ | | -| fps | 8 | -| iterations | 1765 | -| time_elapsed | 25237 | -| total_timesteps | 225920 | -| train/ | | -| approx_kl | 0.008314473 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00362 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 17640 | -| policy_gradient_loss | -0.00707 | -| std | 0.774 | -| value_loss | 0.0489 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1766 | -| time_elapsed | 25241 | -| total_timesteps | 226048 | -| train/ | | -| approx_kl | 0.011613078 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00983 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 17650 | -| policy_gradient_loss | -0.00548 | -| std | 0.775 | -| value_loss | 0.0185 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1767 | -| time_elapsed | 25247 | -| total_timesteps | 226176 | -| train/ | | -| approx_kl | 0.005488595 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.000813 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 17660 | -| policy_gradient_loss | -0.00204 | -| std | 0.775 | -| value_loss | 0.123 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1768 | -| time_elapsed | 25251 | -| total_timesteps | 226304 | -| train/ | | -| approx_kl | 0.00037027383 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00534 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 17670 | -| policy_gradient_loss | 0.000189 | -| std | 0.776 | -| value_loss | 0.00708 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1769 | -| time_elapsed | 25255 | -| total_timesteps | 226432 | -| train/ | | -| approx_kl | 0.014610893 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00793 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 17680 | -| policy_gradient_loss | -0.00369 | -| std | 0.776 | -| value_loss | 0.00652 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1770 | -| time_elapsed | 25259 | -| total_timesteps | 226560 | -| train/ | | -| approx_kl | 0.0075009707 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 17690 | -| policy_gradient_loss | -0.00209 | -| std | 0.777 | -| value_loss | 0.00396 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1771 | -| time_elapsed | 25262 | -| total_timesteps | 226688 | -| train/ | | -| approx_kl | 0.00216913 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00289 | -| n_updates | 17700 | -| policy_gradient_loss | -0.00112 | -| std | 0.778 | -| value_loss | 0.00264 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1772 | -| time_elapsed | 25265 | -| total_timesteps | 226816 | -| train/ | | -| approx_kl | 8.814689e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.000529 | -| n_updates | 17710 | -| policy_gradient_loss | 0.00123 | -| std | 0.778 | -| value_loss | 0.00168 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 8 | -| iterations | 1773 | -| time_elapsed | 25268 | -| total_timesteps | 226944 | -| train/ | | -| approx_kl | 2.0278618e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | 0.000144 | -| n_updates | 17720 | -| policy_gradient_loss | 0.000504 | -| std | 0.779 | -| value_loss | 0.000921 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 8 | -| iterations | 1774 | -| time_elapsed | 25271 | -| total_timesteps | 227072 | -| train/ | | -| approx_kl | 8.666422e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.000226 | -| n_updates | 17730 | -| policy_gradient_loss | 0.000196 | -| std | 0.781 | -| value_loss | 0.000947 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 8 | -| iterations | 1775 | -| time_elapsed | 25278 | -| total_timesteps | 227200 | -| train/ | | -| approx_kl | 0.0026817694 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | 0.366 | -| learning_rate | 0.0003 | -| loss | 0.000237 | -| n_updates | 17740 | -| policy_gradient_loss | -0.0036 | -| std | 0.781 | -| value_loss | 0.0186 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 8 | -| iterations | 1776 | -| time_elapsed | 25281 | -| total_timesteps | 227328 | -| train/ | | -| approx_kl | 0.0039408416 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 17750 | -| policy_gradient_loss | -0.0011 | -| std | 0.781 | -| value_loss | 0.000708 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 8 | -| iterations | 1777 | -| time_elapsed | 25285 | -| total_timesteps | 227456 | -| train/ | | -| approx_kl | 0.003950195 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 17760 | -| policy_gradient_loss | -0.00137 | -| std | 0.777 | -| value_loss | 0.000419 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 8 | -| iterations | 1778 | -| time_elapsed | 25290 | -| total_timesteps | 227584 | -| train/ | | -| approx_kl | 0.0025102864 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.17 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | -0.00865 | -| n_updates | 17770 | -| policy_gradient_loss | -0.00199 | -| std | 0.775 | -| value_loss | 0.000532 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1779 | -| time_elapsed | 25296 | -| total_timesteps | 227712 | -| train/ | | -| approx_kl | 0.0065333024 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | 8.5e-06 | -| n_updates | 17780 | -| policy_gradient_loss | -0.000156 | -| std | 0.775 | -| value_loss | 0.000157 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1780 | -| time_elapsed | 25301 | -| total_timesteps | 227840 | -| train/ | | -| approx_kl | 0.0055443477 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00434 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 17790 | -| policy_gradient_loss | -0.00159 | -| std | 0.773 | -| value_loss | 0.000107 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1781 | -| time_elapsed | 25306 | -| total_timesteps | 227968 | -| train/ | | -| approx_kl | 0.00077753654 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.00685 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 17800 | -| policy_gradient_loss | -0.000234 | -| std | 0.77 | -| value_loss | 8.46e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1782 | -| time_elapsed | 25309 | -| total_timesteps | 228096 | -| train/ | | -| approx_kl | 0.0027086772 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | 0.000322 | -| n_updates | 17810 | -| policy_gradient_loss | 0.000342 | -| std | 0.771 | -| value_loss | 7.3e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1783 | -| time_elapsed | 25319 | -| total_timesteps | 228224 | -| train/ | | -| approx_kl | 0.01604573 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.696 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 17820 | -| policy_gradient_loss | -0.0119 | -| std | 0.772 | -| value_loss | 0.00391 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1784 | -| time_elapsed | 25325 | -| total_timesteps | 228352 | -| train/ | | -| approx_kl | 0.017915592 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 17830 | -| policy_gradient_loss | -0.00501 | -| std | 0.772 | -| value_loss | 8.71e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1785 | -| time_elapsed | 25329 | -| total_timesteps | 228480 | -| train/ | | -| approx_kl | 0.0007101516 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.000109 | -| n_updates | 17840 | -| policy_gradient_loss | -5.38e-05 | -| std | 0.77 | -| value_loss | 4.02e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1786 | -| time_elapsed | 25333 | -| total_timesteps | 228608 | -| train/ | | -| approx_kl | 0.005039095 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 17850 | -| policy_gradient_loss | -0.00711 | -| std | 0.769 | -| value_loss | 3.31e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1787 | -| time_elapsed | 25337 | -| total_timesteps | 228736 | -| train/ | | -| approx_kl | 0.015015591 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 17860 | -| policy_gradient_loss | -0.00455 | -| std | 0.769 | -| value_loss | 1.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1788 | -| time_elapsed | 25343 | -| total_timesteps | 228864 | -| train/ | | -| approx_kl | 0.004527153 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 17870 | -| policy_gradient_loss | -0.00169 | -| std | 0.769 | -| value_loss | 1.47e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1789 | -| time_elapsed | 25347 | -| total_timesteps | 228992 | -| train/ | | -| approx_kl | 0.017278578 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 17880 | -| policy_gradient_loss | -0.00447 | -| std | 0.769 | -| value_loss | 1.34e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1790 | -| time_elapsed | 25351 | -| total_timesteps | 229120 | -| train/ | | -| approx_kl | 0.003040677 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.0034 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 17890 | -| policy_gradient_loss | -0.000936 | -| std | 0.769 | -| value_loss | 1.18e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1791 | -| time_elapsed | 25361 | -| total_timesteps | 229248 | -| train/ | | -| approx_kl | 0.0077219727 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.00562 | -| n_updates | 17900 | -| policy_gradient_loss | -0.00503 | -| std | 0.768 | -| value_loss | 0.0025 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1792 | -| time_elapsed | 25365 | -| total_timesteps | 229376 | -| train/ | | -| approx_kl | 0.0034836172 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 17910 | -| policy_gradient_loss | -0.00397 | -| std | 0.768 | -| value_loss | 1.3e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1793 | -| time_elapsed | 25367 | -| total_timesteps | 229504 | -| train/ | | -| approx_kl | 0.02048999 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 17920 | -| policy_gradient_loss | -0.0137 | -| std | 0.768 | -| value_loss | 1.43e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1794 | -| time_elapsed | 25371 | -| total_timesteps | 229632 | -| train/ | | -| approx_kl | 1.1403579e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.446 | -| learning_rate | 0.0003 | -| loss | 0.000111 | -| n_updates | 17930 | -| policy_gradient_loss | 0.00028 | -| std | 0.768 | -| value_loss | 3.88e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1795 | -| time_elapsed | 25375 | -| total_timesteps | 229760 | -| train/ | | -| approx_kl | 0.002874955 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 17940 | -| policy_gradient_loss | -0.0017 | -| std | 0.77 | -| value_loss | 3.23e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1796 | -| time_elapsed | 25379 | -| total_timesteps | 229888 | -| train/ | | -| approx_kl | 9.119976e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.0029 | -| learning_rate | 0.0003 | -| loss | -0.000197 | -| n_updates | 17950 | -| policy_gradient_loss | 0.000797 | -| std | 0.77 | -| value_loss | 2.68e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1797 | -| time_elapsed | 25384 | -| total_timesteps | 230016 | -| train/ | | -| approx_kl | 0.006504246 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 17960 | -| policy_gradient_loss | -0.0014 | -| std | 0.767 | -| value_loss | 2.96e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1798 | -| time_elapsed | 25394 | -| total_timesteps | 230144 | -| train/ | | -| approx_kl | 0.0041968813 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.00682 | -| n_updates | 17970 | -| policy_gradient_loss | -0.00356 | -| std | 0.764 | -| value_loss | 0.000728 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1799 | -| time_elapsed | 25397 | -| total_timesteps | 230272 | -| train/ | | -| approx_kl | 0.012423525 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.218 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 17980 | -| policy_gradient_loss | -0.00331 | -| std | 0.762 | -| value_loss | 1.85e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1800 | -| time_elapsed | 25401 | -| total_timesteps | 230400 | -| train/ | | -| approx_kl | 0.0010114051 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | -0.000727 | -| n_updates | 17990 | -| policy_gradient_loss | -0.000327 | -| std | 0.76 | -| value_loss | 1.3e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1801 | -| time_elapsed | 25404 | -| total_timesteps | 230528 | -| train/ | | -| approx_kl | 0.005416745 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 18000 | -| policy_gradient_loss | -0.00219 | -| std | 0.761 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1802 | -| time_elapsed | 25407 | -| total_timesteps | 230656 | -| train/ | | -| approx_kl | 0.008621292 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 18010 | -| policy_gradient_loss | -0.00375 | -| std | 0.763 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1803 | -| time_elapsed | 25411 | -| total_timesteps | 230784 | -| train/ | | -| approx_kl | 0.016291104 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.088 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 18020 | -| policy_gradient_loss | -0.0129 | -| std | 0.765 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.23 | -| time/ | | -| fps | 9 | -| iterations | 1804 | -| time_elapsed | 25415 | -| total_timesteps | 230912 | -| train/ | | -| approx_kl | 4.053302e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.023 | -| learning_rate | 0.0003 | -| loss | -0.000392 | -| n_updates | 18030 | -| policy_gradient_loss | -2.19e-05 | -| std | 0.766 | -| value_loss | 4.52e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1805 | -| time_elapsed | 25419 | -| total_timesteps | 231040 | -| train/ | | -| approx_kl | 0.0026520002 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | -0.00839 | -| n_updates | 18040 | -| policy_gradient_loss | -0.00261 | -| std | 0.768 | -| value_loss | 5.03e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1806 | -| time_elapsed | 25427 | -| total_timesteps | 231168 | -| train/ | | -| approx_kl | 0.00037371973 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.117 | -| learning_rate | 0.0003 | -| loss | 0.00794 | -| n_updates | 18050 | -| policy_gradient_loss | 0.000478 | -| std | 0.768 | -| value_loss | 0.0177 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1807 | -| time_elapsed | 25432 | -| total_timesteps | 231296 | -| train/ | | -| approx_kl | 0.0017670849 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | 0.00742 | -| learning_rate | 0.0003 | -| loss | 0.0491 | -| n_updates | 18060 | -| policy_gradient_loss | -0.000231 | -| std | 0.768 | -| value_loss | 0.104 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1808 | -| time_elapsed | 25436 | -| total_timesteps | 231424 | -| train/ | | -| approx_kl | 0.0007488318 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.16 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.000932 | -| n_updates | 18070 | -| policy_gradient_loss | -6.82e-05 | -| std | 0.767 | -| value_loss | 0.00191 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1809 | -| time_elapsed | 25440 | -| total_timesteps | 231552 | -| train/ | | -| approx_kl | 0.0059714615 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0959 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 18080 | -| policy_gradient_loss | -0.0018 | -| std | 0.765 | -| value_loss | 0.000413 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1810 | -| time_elapsed | 25445 | -| total_timesteps | 231680 | -| train/ | | -| approx_kl | 0.00976708 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 18090 | -| policy_gradient_loss | -0.00244 | -| std | 0.763 | -| value_loss | 0.000335 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1811 | -| time_elapsed | 25449 | -| total_timesteps | 231808 | -| train/ | | -| approx_kl | 0.0050880928 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 18100 | -| policy_gradient_loss | -0.000789 | -| std | 0.761 | -| value_loss | 0.000211 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.22 | -| time/ | | -| fps | 9 | -| iterations | 1812 | -| time_elapsed | 25453 | -| total_timesteps | 231936 | -| train/ | | -| approx_kl | 0.0037916559 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.00952 | -| n_updates | 18110 | -| policy_gradient_loss | -0.00315 | -| std | 0.76 | -| value_loss | 0.000222 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1813 | -| time_elapsed | 25458 | -| total_timesteps | 232064 | -| train/ | | -| approx_kl | 0.013846189 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 18120 | -| policy_gradient_loss | -0.0111 | -| std | 0.759 | -| value_loss | 5.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1814 | -| time_elapsed | 25466 | -| total_timesteps | 232192 | -| train/ | | -| approx_kl | 0.0016654003 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.783 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 18130 | -| policy_gradient_loss | -0.00307 | -| std | 0.759 | -| value_loss | 0.00164 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1815 | -| time_elapsed | 25470 | -| total_timesteps | 232320 | -| train/ | | -| approx_kl | 0.000965497 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0948 | -| learning_rate | 0.0003 | -| loss | 0.000911 | -| n_updates | 18140 | -| policy_gradient_loss | 0.000753 | -| std | 0.758 | -| value_loss | 3.46e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1816 | -| time_elapsed | 25474 | -| total_timesteps | 232448 | -| train/ | | -| approx_kl | 0.00047997804 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.000791 | -| n_updates | 18150 | -| policy_gradient_loss | -0.000175 | -| std | 0.758 | -| value_loss | 3.22e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1817 | -| time_elapsed | 25478 | -| total_timesteps | 232576 | -| train/ | | -| approx_kl | 0.0044003716 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 18160 | -| policy_gradient_loss | -0.0012 | -| std | 0.761 | -| value_loss | 2.97e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1818 | -| time_elapsed | 25482 | -| total_timesteps | 232704 | -| train/ | | -| approx_kl | 0.0047033615 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0695 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 18170 | -| policy_gradient_loss | -0.0011 | -| std | 0.763 | -| value_loss | 2.38e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1819 | -| time_elapsed | 25486 | -| total_timesteps | 232832 | -| train/ | | -| approx_kl | 0.009516206 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 18180 | -| policy_gradient_loss | -0.00215 | -| std | 0.762 | -| value_loss | 1.84e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1820 | -| time_elapsed | 25489 | -| total_timesteps | 232960 | -| train/ | | -| approx_kl | 0.0034349975 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0766 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 18190 | -| policy_gradient_loss | -0.000962 | -| std | 0.761 | -| value_loss | 1.23e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1821 | -| time_elapsed | 25493 | -| total_timesteps | 233088 | -| train/ | | -| approx_kl | 0.0020682104 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 18200 | -| policy_gradient_loss | -8.12e-05 | -| std | 0.759 | -| value_loss | 9.8e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1822 | -| time_elapsed | 25503 | -| total_timesteps | 233216 | -| train/ | | -| approx_kl | 0.0048121945 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.525 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 18210 | -| policy_gradient_loss | -0.00467 | -| std | 0.758 | -| value_loss | 0.0177 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1823 | -| time_elapsed | 25507 | -| total_timesteps | 233344 | -| train/ | | -| approx_kl | 0.00014456874 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -2.98 | -| learning_rate | 0.0003 | -| loss | -0.000483 | -| n_updates | 18220 | -| policy_gradient_loss | 0.000123 | -| std | 0.758 | -| value_loss | 1.25e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1824 | -| time_elapsed | 25511 | -| total_timesteps | 233472 | -| train/ | | -| approx_kl | 0.006646827 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -2.89 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 18230 | -| policy_gradient_loss | -0.00138 | -| std | 0.759 | -| value_loss | 7.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1825 | -| time_elapsed | 25514 | -| total_timesteps | 233600 | -| train/ | | -| approx_kl | 0.015196322 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 18240 | -| policy_gradient_loss | -0.00622 | -| std | 0.76 | -| value_loss | 4.33e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1826 | -| time_elapsed | 25518 | -| total_timesteps | 233728 | -| train/ | | -| approx_kl | 0.00011993479 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.000365 | -| n_updates | 18250 | -| policy_gradient_loss | 6.88e-05 | -| std | 0.76 | -| value_loss | 3.22e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1827 | -| time_elapsed | 25522 | -| total_timesteps | 233856 | -| train/ | | -| approx_kl | 0.0031816415 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 18260 | -| policy_gradient_loss | -0.00193 | -| std | 0.76 | -| value_loss | 3.23e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1828 | -| time_elapsed | 25526 | -| total_timesteps | 233984 | -| train/ | | -| approx_kl | 0.006393915 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 18270 | -| policy_gradient_loss | -0.000109 | -| std | 0.762 | -| value_loss | 1.92e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1829 | -| time_elapsed | 25529 | -| total_timesteps | 234112 | -| train/ | | -| approx_kl | 0.0053533884 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.0778 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 18280 | -| policy_gradient_loss | -0.00579 | -| std | 0.763 | -| value_loss | 1.94e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1830 | -| time_elapsed | 25539 | -| total_timesteps | 234240 | -| train/ | | -| approx_kl | 0.0177817 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 18290 | -| policy_gradient_loss | -0.0142 | -| std | 0.763 | -| value_loss | 0.00314 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1831 | -| time_elapsed | 25544 | -| total_timesteps | 234368 | -| train/ | | -| approx_kl | 0.009407807 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 18300 | -| policy_gradient_loss | -0.00497 | -| std | 0.764 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1832 | -| time_elapsed | 25548 | -| total_timesteps | 234496 | -| train/ | | -| approx_kl | 0.015849082 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 18310 | -| policy_gradient_loss | -0.0109 | -| std | 0.765 | -| value_loss | 6.61e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1833 | -| time_elapsed | 25551 | -| total_timesteps | 234624 | -| train/ | | -| approx_kl | 0.0031698332 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 18320 | -| policy_gradient_loss | -0.000955 | -| std | 0.764 | -| value_loss | 5.79e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1834 | -| time_elapsed | 25556 | -| total_timesteps | 234752 | -| train/ | | -| approx_kl | 0.0017950409 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.0305 | -| learning_rate | 0.0003 | -| loss | -0.000313 | -| n_updates | 18330 | -| policy_gradient_loss | -0.000182 | -| std | 0.761 | -| value_loss | 4.79e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.24 | -| time/ | | -| fps | 9 | -| iterations | 1835 | -| time_elapsed | 25559 | -| total_timesteps | 234880 | -| train/ | | -| approx_kl | 0.010786412 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 18340 | -| policy_gradient_loss | -0.00899 | -| std | 0.761 | -| value_loss | 3.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1836 | -| time_elapsed | 25564 | -| total_timesteps | 235008 | -| train/ | | -| approx_kl | 0.010306795 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 18350 | -| policy_gradient_loss | -0.00158 | -| std | 0.759 | -| value_loss | 3.45e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1837 | -| time_elapsed | 25574 | -| total_timesteps | 235136 | -| train/ | | -| approx_kl | 0.00046774698 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 18360 | -| policy_gradient_loss | -0.00809 | -| std | 0.759 | -| value_loss | 0.00176 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1838 | -| time_elapsed | 25579 | -| total_timesteps | 235264 | -| train/ | | -| approx_kl | 0.0018689078 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.663 | -| learning_rate | 0.0003 | -| loss | -0.000896 | -| n_updates | 18370 | -| policy_gradient_loss | -0.000752 | -| std | 0.762 | -| value_loss | 1.11e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1839 | -| time_elapsed | 25584 | -| total_timesteps | 235392 | -| train/ | | -| approx_kl | 0.0005026348 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -35.7 | -| learning_rate | 0.0003 | -| loss | -0.000204 | -| n_updates | 18380 | -| policy_gradient_loss | -6.86e-05 | -| std | 0.763 | -| value_loss | 5.35e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1840 | -| time_elapsed | 25590 | -| total_timesteps | 235520 | -| train/ | | -| approx_kl | 0.0012388723 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | -8.86 | -| learning_rate | 0.0003 | -| loss | -0.000821 | -| n_updates | 18390 | -| policy_gradient_loss | -0.000406 | -| std | 0.761 | -| value_loss | 4.35e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1841 | -| time_elapsed | 25594 | -| total_timesteps | 235648 | -| train/ | | -| approx_kl | 0.011238968 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 18400 | -| policy_gradient_loss | -0.00959 | -| std | 0.759 | -| value_loss | 1.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1842 | -| time_elapsed | 25599 | -| total_timesteps | 235776 | -| train/ | | -| approx_kl | 0.01850614 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 18410 | -| policy_gradient_loss | -0.013 | -| std | 0.758 | -| value_loss | 2.12e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1843 | -| time_elapsed | 25602 | -| total_timesteps | 235904 | -| train/ | | -| approx_kl | 0.002201072 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 18420 | -| policy_gradient_loss | -0.00151 | -| std | 0.759 | -| value_loss | 5.82e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1844 | -| time_elapsed | 25606 | -| total_timesteps | 236032 | -| train/ | | -| approx_kl | 0.012954646 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | -0.00519 | -| n_updates | 18430 | -| policy_gradient_loss | -0.00514 | -| std | 0.76 | -| value_loss | 5e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1845 | -| time_elapsed | 25614 | -| total_timesteps | 236160 | -| train/ | | -| approx_kl | 0.0027919463 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.74 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 18440 | -| policy_gradient_loss | -0.00697 | -| std | 0.759 | -| value_loss | 0.00197 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1846 | -| time_elapsed | 25619 | -| total_timesteps | 236288 | -| train/ | | -| approx_kl | 7.777009e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -5.88 | -| learning_rate | 0.0003 | -| loss | -0.000558 | -| n_updates | 18450 | -| policy_gradient_loss | 0.000535 | -| std | 0.759 | -| value_loss | 3.75e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1847 | -| time_elapsed | 25624 | -| total_timesteps | 236416 | -| train/ | | -| approx_kl | 0.0013464708 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.791 | -| learning_rate | 0.0003 | -| loss | 0.0002 | -| n_updates | 18460 | -| policy_gradient_loss | 0.000211 | -| std | 0.761 | -| value_loss | 1.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1848 | -| time_elapsed | 25628 | -| total_timesteps | 236544 | -| train/ | | -| approx_kl | 0.007632371 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.0252 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 18470 | -| policy_gradient_loss | -0.00467 | -| std | 0.762 | -| value_loss | 7.12e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1849 | -| time_elapsed | 25632 | -| total_timesteps | 236672 | -| train/ | | -| approx_kl | 4.6718866e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.15 | -| explained_variance | 0.0177 | -| learning_rate | 0.0003 | -| loss | -7.46e-05 | -| n_updates | 18480 | -| policy_gradient_loss | 0.000992 | -| std | 0.76 | -| value_loss | 2.59e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1850 | -| time_elapsed | 25637 | -| total_timesteps | 236800 | -| train/ | | -| approx_kl | 0.00080355303 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 18490 | -| policy_gradient_loss | -0.000299 | -| std | 0.758 | -| value_loss | 2.73e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1851 | -| time_elapsed | 25640 | -| total_timesteps | 236928 | -| train/ | | -| approx_kl | 0.0056446907 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.000159 | -| n_updates | 18500 | -| policy_gradient_loss | -0.000313 | -| std | 0.758 | -| value_loss | 1.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1852 | -| time_elapsed | 25644 | -| total_timesteps | 237056 | -| train/ | | -| approx_kl | 0.00019736588 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -0.00822 | -| learning_rate | 0.0003 | -| loss | -7.19e-05 | -| n_updates | 18510 | -| policy_gradient_loss | -3.68e-05 | -| std | 0.758 | -| value_loss | 1.15e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1853 | -| time_elapsed | 25653 | -| total_timesteps | 237184 | -| train/ | | -| approx_kl | 0.004134619 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.00985 | -| n_updates | 18520 | -| policy_gradient_loss | -0.00397 | -| std | 0.758 | -| value_loss | 0.000585 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1854 | -| time_elapsed | 25657 | -| total_timesteps | 237312 | -| train/ | | -| approx_kl | 0.012727419 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -17.7 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 18530 | -| policy_gradient_loss | -0.003 | -| std | 0.756 | -| value_loss | 4.69e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1855 | -| time_elapsed | 25661 | -| total_timesteps | 237440 | -| train/ | | -| approx_kl | 0.00018546497 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | 0.000318 | -| n_updates | 18540 | -| policy_gradient_loss | 0.000411 | -| std | 0.754 | -| value_loss | 2.04e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1856 | -| time_elapsed | 25665 | -| total_timesteps | 237568 | -| train/ | | -| approx_kl | 0.006189815 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 18550 | -| policy_gradient_loss | -0.0033 | -| std | 0.755 | -| value_loss | 3.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1857 | -| time_elapsed | 25670 | -| total_timesteps | 237696 | -| train/ | | -| approx_kl | 0.004769113 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.021 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 18560 | -| policy_gradient_loss | -0.00134 | -| std | 0.755 | -| value_loss | 2.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1858 | -| time_elapsed | 25675 | -| total_timesteps | 237824 | -| train/ | | -| approx_kl | 0.005829352 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | 0.00687 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 18570 | -| policy_gradient_loss | -0.00106 | -| std | 0.753 | -| value_loss | 2.37e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1859 | -| time_elapsed | 25679 | -| total_timesteps | 237952 | -| train/ | | -| approx_kl | 0.0020907796 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.00488 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 18580 | -| policy_gradient_loss | -0.00148 | -| std | 0.752 | -| value_loss | 2.28e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1860 | -| time_elapsed | 25683 | -| total_timesteps | 238080 | -| train/ | | -| approx_kl | 0.011279745 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 18590 | -| policy_gradient_loss | -0.0028 | -| std | 0.752 | -| value_loss | 1.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1861 | -| time_elapsed | 25691 | -| total_timesteps | 238208 | -| train/ | | -| approx_kl | 0.010149427 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 18600 | -| policy_gradient_loss | -0.00616 | -| std | 0.753 | -| value_loss | 0.00192 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1862 | -| time_elapsed | 25696 | -| total_timesteps | 238336 | -| train/ | | -| approx_kl | 0.00072949985 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -61.6 | -| learning_rate | 0.0003 | -| loss | 0.000914 | -| n_updates | 18610 | -| policy_gradient_loss | 0.000772 | -| std | 0.753 | -| value_loss | 2.19e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1863 | -| time_elapsed | 25700 | -| total_timesteps | 238464 | -| train/ | | -| approx_kl | 0.0042019933 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.14 | -| explained_variance | -63.2 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 18620 | -| policy_gradient_loss | -0.00331 | -| std | 0.753 | -| value_loss | 9.75e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1864 | -| time_elapsed | 25703 | -| total_timesteps | 238592 | -| train/ | | -| approx_kl | 0.00742287 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -64.5 | -| learning_rate | 0.0003 | -| loss | -0.000121 | -| n_updates | 18630 | -| policy_gradient_loss | -0.000302 | -| std | 0.751 | -| value_loss | 6.65e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1865 | -| time_elapsed | 25705 | -| total_timesteps | 238720 | -| train/ | | -| approx_kl | 0.00061525684 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -45.4 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 18640 | -| policy_gradient_loss | -0.000433 | -| std | 0.749 | -| value_loss | 1.03e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1866 | -| time_elapsed | 25708 | -| total_timesteps | 238848 | -| train/ | | -| approx_kl | 0.0024385164 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -5.24 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 18650 | -| policy_gradient_loss | -0.00159 | -| std | 0.748 | -| value_loss | 3.56e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1867 | -| time_elapsed | 25710 | -| total_timesteps | 238976 | -| train/ | | -| approx_kl | 0.012308353 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 18660 | -| policy_gradient_loss | -0.00167 | -| std | 0.747 | -| value_loss | 3.22e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1868 | -| time_elapsed | 25715 | -| total_timesteps | 239104 | -| train/ | | -| approx_kl | 0.008888798 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | 0.00834 | -| learning_rate | 0.0003 | -| loss | -0.00908 | -| n_updates | 18670 | -| policy_gradient_loss | -0.0045 | -| std | 0.745 | -| value_loss | 3.29e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1869 | -| time_elapsed | 25723 | -| total_timesteps | 239232 | -| train/ | | -| approx_kl | 0.00012313854 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.225 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 18680 | -| policy_gradient_loss | 0.000365 | -| std | 0.743 | -| value_loss | 0.045 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1870 | -| time_elapsed | 25727 | -| total_timesteps | 239360 | -| train/ | | -| approx_kl | 0.0045514833 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00127 | -| learning_rate | 0.0003 | -| loss | 0.000699 | -| n_updates | 18690 | -| policy_gradient_loss | -0.000206 | -| std | 0.743 | -| value_loss | 0.00257 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1871 | -| time_elapsed | 25731 | -| total_timesteps | 239488 | -| train/ | | -| approx_kl | 0.009720497 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 18700 | -| policy_gradient_loss | -0.00565 | -| std | 0.745 | -| value_loss | 0.000711 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1872 | -| time_elapsed | 25735 | -| total_timesteps | 239616 | -| train/ | | -| approx_kl | 0.0028107455 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 18710 | -| policy_gradient_loss | -0.00254 | -| std | 0.747 | -| value_loss | 0.000422 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1873 | -| time_elapsed | 25738 | -| total_timesteps | 239744 | -| train/ | | -| approx_kl | 3.58643e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.0005 | -| n_updates | 18720 | -| policy_gradient_loss | 0.000692 | -| std | 0.749 | -| value_loss | 0.000261 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.25 | -| time/ | | -| fps | 9 | -| iterations | 1874 | -| time_elapsed | 25741 | -| total_timesteps | 239872 | -| train/ | | -| approx_kl | 0.00037441542 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.0942 | -| learning_rate | 0.0003 | -| loss | 0.000688 | -| n_updates | 18730 | -| policy_gradient_loss | 0.000584 | -| std | 0.749 | -| value_loss | 0.000219 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1875 | -| time_elapsed | 25744 | -| total_timesteps | 240000 | -| train/ | | -| approx_kl | 0.009482957 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 18740 | -| policy_gradient_loss | -0.00768 | -| std | 0.748 | -| value_loss | 0.00025 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1876 | -| time_elapsed | 25748 | -| total_timesteps | 240128 | -| train/ | | -| approx_kl | 0.00013750419 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 18750 | -| policy_gradient_loss | 0.00118 | -| std | 0.748 | -| value_loss | 0.000447 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1877 | -| time_elapsed | 25756 | -| total_timesteps | 240256 | -| train/ | | -| approx_kl | 0.0058824657 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 18760 | -| policy_gradient_loss | -0.000496 | -| std | 0.746 | -| value_loss | 0.099 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1878 | -| time_elapsed | 25760 | -| total_timesteps | 240384 | -| train/ | | -| approx_kl | 0.002109895 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 18770 | -| policy_gradient_loss | 0.000173 | -| std | 0.745 | -| value_loss | 0.00514 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1879 | -| time_elapsed | 25764 | -| total_timesteps | 240512 | -| train/ | | -| approx_kl | 0.004958998 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00661 | -| learning_rate | 0.0003 | -| loss | -0.00962 | -| n_updates | 18780 | -| policy_gradient_loss | -0.00425 | -| std | 0.745 | -| value_loss | 0.00256 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1880 | -| time_elapsed | 25767 | -| total_timesteps | 240640 | -| train/ | | -| approx_kl | 4.0400773e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00038 | -| n_updates | 18790 | -| policy_gradient_loss | 0.00111 | -| std | 0.746 | -| value_loss | 0.00163 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1881 | -| time_elapsed | 25771 | -| total_timesteps | 240768 | -| train/ | | -| approx_kl | 0.00071819173 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 18800 | -| policy_gradient_loss | 0.000474 | -| std | 0.747 | -| value_loss | 0.00104 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.27 | -| time/ | | -| fps | 9 | -| iterations | 1882 | -| time_elapsed | 25776 | -| total_timesteps | 240896 | -| train/ | | -| approx_kl | 0.004403249 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.0818 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 18810 | -| policy_gradient_loss | -0.00286 | -| std | 0.745 | -| value_loss | 0.000669 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1883 | -| time_elapsed | 25781 | -| total_timesteps | 241024 | -| train/ | | -| approx_kl | 0.013773745 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 18820 | -| policy_gradient_loss | -0.00792 | -| std | 0.744 | -| value_loss | 0.00038 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1884 | -| time_elapsed | 25790 | -| total_timesteps | 241152 | -| train/ | | -| approx_kl | 0.004061426 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.466 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 18830 | -| policy_gradient_loss | -0.00132 | -| std | 0.743 | -| value_loss | 0.00264 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1885 | -| time_elapsed | 25795 | -| total_timesteps | 241280 | -| train/ | | -| approx_kl | 0.00348632 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.143 | -| learning_rate | 0.0003 | -| loss | -0.000976 | -| n_updates | 18840 | -| policy_gradient_loss | -0.000487 | -| std | 0.743 | -| value_loss | 0.000196 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1886 | -| time_elapsed | 25798 | -| total_timesteps | 241408 | -| train/ | | -| approx_kl | 0.0065660127 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.0224 | -| learning_rate | 0.0003 | -| loss | 0.00295 | -| n_updates | 18850 | -| policy_gradient_loss | -0.0016 | -| std | 0.744 | -| value_loss | 0.0109 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1887 | -| time_elapsed | 25802 | -| total_timesteps | 241536 | -| train/ | | -| approx_kl | 2.3851171e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -8.08e-05 | -| n_updates | 18860 | -| policy_gradient_loss | -7.87e-05 | -| std | 0.742 | -| value_loss | 0.00135 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1888 | -| time_elapsed | 25806 | -| total_timesteps | 241664 | -| train/ | | -| approx_kl | 0.0039048414 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | -0.000635 | -| n_updates | 18870 | -| policy_gradient_loss | -0.00116 | -| std | 0.741 | -| value_loss | 0.00122 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1889 | -| time_elapsed | 25810 | -| total_timesteps | 241792 | -| train/ | | -| approx_kl | 1.5059952e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00955 | -| learning_rate | 0.0003 | -| loss | 0.00186 | -| n_updates | 18880 | -| policy_gradient_loss | 1.82e-05 | -| std | 0.741 | -| value_loss | 0.00401 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.3 | -| time/ | | -| fps | 9 | -| iterations | 1890 | -| time_elapsed | 25814 | -| total_timesteps | 241920 | -| train/ | | -| approx_kl | 0.000105815474 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.041 | -| n_updates | 18890 | -| policy_gradient_loss | -6.75e-05 | -| std | 0.742 | -| value_loss | 0.0894 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1891 | -| time_elapsed | 25817 | -| total_timesteps | 242048 | -| train/ | | -| approx_kl | 0.010929221 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00827 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 18900 | -| policy_gradient_loss | -0.0101 | -| std | 0.742 | -| value_loss | 0.0824 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1892 | -| time_elapsed | 25825 | -| total_timesteps | 242176 | -| train/ | | -| approx_kl | 0.008306885 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00665 | -| learning_rate | 0.0003 | -| loss | 0.564 | -| n_updates | 18910 | -| policy_gradient_loss | -0.00358 | -| std | 0.741 | -| value_loss | 1.25 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1893 | -| time_elapsed | 25828 | -| total_timesteps | 242304 | -| train/ | | -| approx_kl | 0.0037472928 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00237 | -| learning_rate | 0.0003 | -| loss | 0.19 | -| n_updates | 18920 | -| policy_gradient_loss | -0.000817 | -| std | 0.74 | -| value_loss | 0.442 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1894 | -| time_elapsed | 25833 | -| total_timesteps | 242432 | -| train/ | | -| approx_kl | 0.010697538 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.000332 | -| learning_rate | 0.0003 | -| loss | 0.0896 | -| n_updates | 18930 | -| policy_gradient_loss | -0.00287 | -| std | 0.74 | -| value_loss | 0.179 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1895 | -| time_elapsed | 25837 | -| total_timesteps | 242560 | -| train/ | | -| approx_kl | 0.0021428443 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00265 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 18940 | -| policy_gradient_loss | -0.00117 | -| std | 0.741 | -| value_loss | 0.0145 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1896 | -| time_elapsed | 25841 | -| total_timesteps | 242688 | -| train/ | | -| approx_kl | 0.00080344407 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.000189 | -| learning_rate | 0.0003 | -| loss | 0.541 | -| n_updates | 18950 | -| policy_gradient_loss | 0.00327 | -| std | 0.741 | -| value_loss | 1.27 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1897 | -| time_elapsed | 25846 | -| total_timesteps | 242816 | -| train/ | | -| approx_kl | 0.008292744 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00013 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 18960 | -| policy_gradient_loss | -0.0047 | -| std | 0.741 | -| value_loss | 0.304 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 9 | -| iterations | 1898 | -| time_elapsed | 25849 | -| total_timesteps | 242944 | -| train/ | | -| approx_kl | 0.0042312793 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00341 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 18970 | -| policy_gradient_loss | -0.000522 | -| std | 0.741 | -| value_loss | 0.024 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1899 | -| time_elapsed | 25854 | -| total_timesteps | 243072 | -| train/ | | -| approx_kl | 0.013858282 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00303 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 18980 | -| policy_gradient_loss | -0.0134 | -| std | 0.742 | -| value_loss | 0.0261 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1900 | -| time_elapsed | 25864 | -| total_timesteps | 243200 | -| train/ | | -| approx_kl | 0.011404114 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00315 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 18990 | -| policy_gradient_loss | -0.0122 | -| std | 0.743 | -| value_loss | 0.145 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1901 | -| time_elapsed | 25868 | -| total_timesteps | 243328 | -| train/ | | -| approx_kl | 0.011135666 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.000741 | -| learning_rate | 0.0003 | -| loss | 0.000861 | -| n_updates | 19000 | -| policy_gradient_loss | -0.00183 | -| std | 0.743 | -| value_loss | 0.0133 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1902 | -| time_elapsed | 25873 | -| total_timesteps | 243456 | -| train/ | | -| approx_kl | 0.0067869932 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0033 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 19010 | -| policy_gradient_loss | -0.00529 | -| std | 0.743 | -| value_loss | 0.0115 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1903 | -| time_elapsed | 25877 | -| total_timesteps | 243584 | -| train/ | | -| approx_kl | 0.016226346 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00555 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 19020 | -| policy_gradient_loss | -0.00388 | -| std | 0.742 | -| value_loss | 0.00788 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1904 | -| time_elapsed | 25881 | -| total_timesteps | 243712 | -| train/ | | -| approx_kl | 0.0077766967 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 19030 | -| policy_gradient_loss | -0.00369 | -| std | 0.743 | -| value_loss | 0.00449 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1905 | -| time_elapsed | 25886 | -| total_timesteps | 243840 | -| train/ | | -| approx_kl | 0.0037587662 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0926 | -| learning_rate | 0.0003 | -| loss | -1.42e-05 | -| n_updates | 19040 | -| policy_gradient_loss | -0.000782 | -| std | 0.744 | -| value_loss | 0.0034 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1906 | -| time_elapsed | 25889 | -| total_timesteps | 243968 | -| train/ | | -| approx_kl | 0.009458556 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 19050 | -| policy_gradient_loss | -0.00402 | -| std | 0.745 | -| value_loss | 0.00324 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1907 | -| time_elapsed | 25894 | -| total_timesteps | 244096 | -| train/ | | -| approx_kl | 0.0018156948 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 19060 | -| policy_gradient_loss | -0.00178 | -| std | 0.746 | -| value_loss | 0.00143 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1908 | -| time_elapsed | 25904 | -| total_timesteps | 244224 | -| train/ | | -| approx_kl | 0.0067744856 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.13 | -| explained_variance | 0.448 | -| learning_rate | 0.0003 | -| loss | 0.00109 | -| n_updates | 19070 | -| policy_gradient_loss | -0.00165 | -| std | 0.745 | -| value_loss | 0.00829 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1909 | -| time_elapsed | 25909 | -| total_timesteps | 244352 | -| train/ | | -| approx_kl | 0.0073572346 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0773 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 19080 | -| policy_gradient_loss | -0.00674 | -| std | 0.744 | -| value_loss | 0.00151 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1910 | -| time_elapsed | 25912 | -| total_timesteps | 244480 | -| train/ | | -| approx_kl | 7.022172e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | -0.000129 | -| n_updates | 19090 | -| policy_gradient_loss | 0.00174 | -| std | 0.745 | -| value_loss | 0.0004 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1911 | -| time_elapsed | 25915 | -| total_timesteps | 244608 | -| train/ | | -| approx_kl | 0.00070310803 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 19100 | -| policy_gradient_loss | 1.89e-07 | -| std | 0.745 | -| value_loss | 0.000288 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1912 | -| time_elapsed | 25919 | -| total_timesteps | 244736 | -| train/ | | -| approx_kl | 0.0144100785 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 19110 | -| policy_gradient_loss | -0.00438 | -| std | 0.743 | -| value_loss | 0.000256 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1913 | -| time_elapsed | 25921 | -| total_timesteps | 244864 | -| train/ | | -| approx_kl | 0.003315379 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 19120 | -| policy_gradient_loss | -0.00166 | -| std | 0.743 | -| value_loss | 0.000209 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1914 | -| time_elapsed | 25924 | -| total_timesteps | 244992 | -| train/ | | -| approx_kl | 0.0017219922 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 19130 | -| policy_gradient_loss | 0.000705 | -| std | 0.742 | -| value_loss | 0.000163 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1915 | -| time_elapsed | 25927 | -| total_timesteps | 245120 | -| train/ | | -| approx_kl | 0.0047822683 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00539 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 19140 | -| policy_gradient_loss | -0.00214 | -| std | 0.742 | -| value_loss | 0.00013 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1916 | -| time_elapsed | 25937 | -| total_timesteps | 245248 | -| train/ | | -| approx_kl | 0.0015735002 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | 0.000226 | -| n_updates | 19150 | -| policy_gradient_loss | 0.000177 | -| std | 0.741 | -| value_loss | 0.000956 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1917 | -| time_elapsed | 25941 | -| total_timesteps | 245376 | -| train/ | | -| approx_kl | 0.0004034685 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.0202 | -| learning_rate | 0.0003 | -| loss | -0.000461 | -| n_updates | 19160 | -| policy_gradient_loss | -0.000151 | -| std | 0.741 | -| value_loss | 9.19e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1918 | -| time_elapsed | 25946 | -| total_timesteps | 245504 | -| train/ | | -| approx_kl | 0.0046972553 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.0213 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 19170 | -| policy_gradient_loss | -0.00113 | -| std | 0.743 | -| value_loss | 8.51e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1919 | -| time_elapsed | 25949 | -| total_timesteps | 245632 | -| train/ | | -| approx_kl | 0.006486716 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.00166 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 19180 | -| policy_gradient_loss | -0.00585 | -| std | 0.744 | -| value_loss | 7.55e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1920 | -| time_elapsed | 25955 | -| total_timesteps | 245760 | -| train/ | | -| approx_kl | 0.011085844 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 19190 | -| policy_gradient_loss | -0.00212 | -| std | 0.743 | -| value_loss | 6.3e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 1921 | -| time_elapsed | 25959 | -| total_timesteps | 245888 | -| train/ | | -| approx_kl | 0.00045192335 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00347 | -| learning_rate | 0.0003 | -| loss | -0.000251 | -| n_updates | 19200 | -| policy_gradient_loss | -9.41e-05 | -| std | 0.743 | -| value_loss | 4.85e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1922 | -| time_elapsed | 25963 | -| total_timesteps | 246016 | -| train/ | | -| approx_kl | 0.003998179 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 19210 | -| policy_gradient_loss | -0.00316 | -| std | 0.744 | -| value_loss | 4.33e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1923 | -| time_elapsed | 25973 | -| total_timesteps | 246144 | -| train/ | | -| approx_kl | 0.026323982 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 19220 | -| policy_gradient_loss | -0.0076 | -| std | 0.744 | -| value_loss | 0.000539 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1924 | -| time_elapsed | 25977 | -| total_timesteps | 246272 | -| train/ | | -| approx_kl | 0.0062122587 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 19230 | -| policy_gradient_loss | -0.00277 | -| std | 0.743 | -| value_loss | 2.08e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1925 | -| time_elapsed | 25980 | -| total_timesteps | 246400 | -| train/ | | -| approx_kl | 0.013446613 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 19240 | -| policy_gradient_loss | -0.00957 | -| std | 0.743 | -| value_loss | 2.12e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1926 | -| time_elapsed | 25984 | -| total_timesteps | 246528 | -| train/ | | -| approx_kl | 0.00014428934 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | 0.000496 | -| n_updates | 19250 | -| policy_gradient_loss | 0.000599 | -| std | 0.743 | -| value_loss | 1.54e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1927 | -| time_elapsed | 25988 | -| total_timesteps | 246656 | -| train/ | | -| approx_kl | 0.011424568 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.00855 | -| n_updates | 19260 | -| policy_gradient_loss | -0.00522 | -| std | 0.743 | -| value_loss | 1.2e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1928 | -| time_elapsed | 25992 | -| total_timesteps | 246784 | -| train/ | | -| approx_kl | 0.0009751371 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 19270 | -| policy_gradient_loss | -0.000476 | -| std | 0.743 | -| value_loss | 1.3e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 1929 | -| time_elapsed | 25995 | -| total_timesteps | 246912 | -| train/ | | -| approx_kl | 0.0001478903 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0808 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 19280 | -| policy_gradient_loss | 0.000494 | -| std | 0.742 | -| value_loss | 9.58e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1930 | -| time_elapsed | 25998 | -| total_timesteps | 247040 | -| train/ | | -| approx_kl | 2.4301466e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.000116 | -| n_updates | 19290 | -| policy_gradient_loss | 0.000504 | -| std | 0.74 | -| value_loss | 7.53e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1931 | -| time_elapsed | 26005 | -| total_timesteps | 247168 | -| train/ | | -| approx_kl | 0.0016755373 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | 0.826 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 19300 | -| policy_gradient_loss | -0.0025 | -| std | 0.738 | -| value_loss | 0.0013 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1932 | -| time_elapsed | 26009 | -| total_timesteps | 247296 | -| train/ | | -| approx_kl | 0.01279561 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 19310 | -| policy_gradient_loss | -0.0027 | -| std | 0.736 | -| value_loss | 5.03e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1933 | -| time_elapsed | 26012 | -| total_timesteps | 247424 | -| train/ | | -| approx_kl | 0.0054803477 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 19320 | -| policy_gradient_loss | -0.00602 | -| std | 0.736 | -| value_loss | 4.57e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1934 | -| time_elapsed | 26014 | -| total_timesteps | 247552 | -| train/ | | -| approx_kl | 0.012349928 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | -0.00541 | -| n_updates | 19330 | -| policy_gradient_loss | -0.00529 | -| std | 0.736 | -| value_loss | 2.99e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1935 | -| time_elapsed | 26016 | -| total_timesteps | 247680 | -| train/ | | -| approx_kl | 0.0027505103 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 19340 | -| policy_gradient_loss | -0.000497 | -| std | 0.736 | -| value_loss | 2.47e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1936 | -| time_elapsed | 26020 | -| total_timesteps | 247808 | -| train/ | | -| approx_kl | 0.0019650464 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | -0.00563 | -| n_updates | 19350 | -| policy_gradient_loss | -0.00138 | -| std | 0.736 | -| value_loss | 2.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1937 | -| time_elapsed | 26024 | -| total_timesteps | 247936 | -| train/ | | -| approx_kl | 0.015207598 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 19360 | -| policy_gradient_loss | -0.0113 | -| std | 0.736 | -| value_loss | 2.13e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1938 | -| time_elapsed | 26029 | -| total_timesteps | 248064 | -| train/ | | -| approx_kl | 0.0036733625 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 19370 | -| policy_gradient_loss | -0.00107 | -| std | 0.735 | -| value_loss | 1.33e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1939 | -| time_elapsed | 26035 | -| total_timesteps | 248192 | -| train/ | | -| approx_kl | 0.00077168085 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | 0.645 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 19380 | -| policy_gradient_loss | -0.0042 | -| std | 0.736 | -| value_loss | 0.00692 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1940 | -| time_elapsed | 26038 | -| total_timesteps | 248320 | -| train/ | | -| approx_kl | 0.0065949718 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -6.6 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 19390 | -| policy_gradient_loss | -0.00148 | -| std | 0.739 | -| value_loss | 3.07e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1941 | -| time_elapsed | 26040 | -| total_timesteps | 248448 | -| train/ | | -| approx_kl | 0.0023904657 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -7.47 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 19400 | -| policy_gradient_loss | -0.000554 | -| std | 0.741 | -| value_loss | 1.88e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1942 | -| time_elapsed | 26043 | -| total_timesteps | 248576 | -| train/ | | -| approx_kl | 0.010809321 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 19410 | -| policy_gradient_loss | -0.0108 | -| std | 0.743 | -| value_loss | 1.35e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1943 | -| time_elapsed | 26046 | -| total_timesteps | 248704 | -| train/ | | -| approx_kl | 0.0014272262 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.00368 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 19420 | -| policy_gradient_loss | 0.000945 | -| std | 0.742 | -| value_loss | 3.69e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1944 | -| time_elapsed | 26049 | -| total_timesteps | 248832 | -| train/ | | -| approx_kl | 0.002249871 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.12 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | -0.00226 | -| n_updates | 19430 | -| policy_gradient_loss | -0.0011 | -| std | 0.739 | -| value_loss | 3.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1945 | -| time_elapsed | 26052 | -| total_timesteps | 248960 | -| train/ | | -| approx_kl | 0.010968337 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 19440 | -| policy_gradient_loss | -0.00421 | -| std | 0.737 | -| value_loss | 3.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1946 | -| time_elapsed | 26055 | -| total_timesteps | 249088 | -| train/ | | -| approx_kl | 0.0022117314 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.0564 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 19450 | -| policy_gradient_loss | -0.000352 | -| std | 0.736 | -| value_loss | 2.33e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1947 | -| time_elapsed | 26061 | -| total_timesteps | 249216 | -| train/ | | -| approx_kl | 0.013274309 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | 0.761 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 19460 | -| policy_gradient_loss | -0.0122 | -| std | 0.736 | -| value_loss | 0.000791 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1948 | -| time_elapsed | 26065 | -| total_timesteps | 249344 | -| train/ | | -| approx_kl | 0.0009904294 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -39.2 | -| learning_rate | 0.0003 | -| loss | 0.000462 | -| n_updates | 19470 | -| policy_gradient_loss | 0.000392 | -| std | 0.734 | -| value_loss | 7.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1949 | -| time_elapsed | 26068 | -| total_timesteps | 249472 | -| train/ | | -| approx_kl | 0.009050834 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -46 | -| learning_rate | 0.0003 | -| loss | -0.00991 | -| n_updates | 19480 | -| policy_gradient_loss | -0.00468 | -| std | 0.732 | -| value_loss | 2.98e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1950 | -| time_elapsed | 26072 | -| total_timesteps | 249600 | -| train/ | | -| approx_kl | 3.641937e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -13.7 | -| learning_rate | 0.0003 | -| loss | -8.91e-05 | -| n_updates | 19490 | -| policy_gradient_loss | 0.00188 | -| std | 0.73 | -| value_loss | 2.77e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1951 | -| time_elapsed | 26076 | -| total_timesteps | 249728 | -| train/ | | -| approx_kl | 0.0006507044 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -0.761 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 19500 | -| policy_gradient_loss | -4.72e-05 | -| std | 0.729 | -| value_loss | 5.18e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1952 | -| time_elapsed | 26079 | -| total_timesteps | 249856 | -| train/ | | -| approx_kl | 0.00022730185 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | 0.0177 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 19510 | -| policy_gradient_loss | 0.000494 | -| std | 0.729 | -| value_loss | 3.92e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 1953 | -| time_elapsed | 26083 | -| total_timesteps | 249984 | -| train/ | | -| approx_kl | 0.013709877 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | 0.00381 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 19520 | -| policy_gradient_loss | -0.00394 | -| std | 0.728 | -| value_loss | 3.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1954 | -| time_elapsed | 26088 | -| total_timesteps | 250112 | -| train/ | | -| approx_kl | 0.008089265 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 19530 | -| policy_gradient_loss | -0.00273 | -| std | 0.728 | -| value_loss | 3.61e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1955 | -| time_elapsed | 26098 | -| total_timesteps | 250240 | -| train/ | | -| approx_kl | 0.0072251856 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | 0.642 | -| learning_rate | 0.0003 | -| loss | -0.0264 | -| n_updates | 19540 | -| policy_gradient_loss | -0.0158 | -| std | 0.728 | -| value_loss | 0.0085 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1956 | -| time_elapsed | 26102 | -| total_timesteps | 250368 | -| train/ | | -| approx_kl | 0.0075234943 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -3.26 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 19550 | -| policy_gradient_loss | -0.000609 | -| std | 0.73 | -| value_loss | 5.97e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1957 | -| time_elapsed | 26107 | -| total_timesteps | 250496 | -| train/ | | -| approx_kl | 2.6898924e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -30.5 | -| learning_rate | 0.0003 | -| loss | -0.000148 | -| n_updates | 19560 | -| policy_gradient_loss | 3.16e-05 | -| std | 0.732 | -| value_loss | 2.61e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1958 | -| time_elapsed | 26110 | -| total_timesteps | 250624 | -| train/ | | -| approx_kl | 0.004120838 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.00637 | -| n_updates | 19570 | -| policy_gradient_loss | -0.00227 | -| std | 0.733 | -| value_loss | 4.15e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1959 | -| time_elapsed | 26114 | -| total_timesteps | 250752 | -| train/ | | -| approx_kl | 1.1078082e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | -0.000536 | -| n_updates | 19580 | -| policy_gradient_loss | 0.002 | -| std | 0.733 | -| value_loss | 2.36e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1960 | -| time_elapsed | 26118 | -| total_timesteps | 250880 | -| train/ | | -| approx_kl | 0.00048491033 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | 0.00634 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 19590 | -| policy_gradient_loss | 7.64e-05 | -| std | 0.733 | -| value_loss | 3.59e-08 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1961 | -| time_elapsed | 26123 | -| total_timesteps | 251008 | -| train/ | | -| approx_kl | 0.000105396844 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.11 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 19600 | -| policy_gradient_loss | 0.000298 | -| std | 0.731 | -| value_loss | 3.57e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1962 | -| time_elapsed | 26133 | -| total_timesteps | 251136 | -| train/ | | -| approx_kl | 0.015753835 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 19610 | -| policy_gradient_loss | -0.00652 | -| std | 0.728 | -| value_loss | 0.000855 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1963 | -| time_elapsed | 26138 | -| total_timesteps | 251264 | -| train/ | | -| approx_kl | 0.012227751 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -48.6 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 19620 | -| policy_gradient_loss | -0.00116 | -| std | 0.728 | -| value_loss | 2.44e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1964 | -| time_elapsed | 26142 | -| total_timesteps | 251392 | -| train/ | | -| approx_kl | 0.00096021174 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -0.856 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 19630 | -| policy_gradient_loss | -0.000262 | -| std | 0.728 | -| value_loss | 2.42e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1965 | -| time_elapsed | 26147 | -| total_timesteps | 251520 | -| train/ | | -| approx_kl | 0.0124076735 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 19640 | -| policy_gradient_loss | -0.00226 | -| std | 0.727 | -| value_loss | 1e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1966 | -| time_elapsed | 26151 | -| total_timesteps | 251648 | -| train/ | | -| approx_kl | 0.008155441 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -0.764 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 19650 | -| policy_gradient_loss | -0.00308 | -| std | 0.725 | -| value_loss | 3.14e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1967 | -| time_elapsed | 26155 | -| total_timesteps | 251776 | -| train/ | | -| approx_kl | 0.0011114432 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | 0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 19660 | -| policy_gradient_loss | -0.000417 | -| std | 0.723 | -| value_loss | 1.73e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1968 | -| time_elapsed | 26160 | -| total_timesteps | 251904 | -| train/ | | -| approx_kl | 0.009643506 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 19670 | -| policy_gradient_loss | -0.00315 | -| std | 0.722 | -| value_loss | 8.91e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1969 | -| time_elapsed | 26163 | -| total_timesteps | 252032 | -| train/ | | -| approx_kl | 0.007830234 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 19680 | -| policy_gradient_loss | -0.00524 | -| std | 0.722 | -| value_loss | 7.08e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1970 | -| time_elapsed | 26169 | -| total_timesteps | 252160 | -| train/ | | -| approx_kl | 5.0041825e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | 0.757 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 19690 | -| policy_gradient_loss | 0.00121 | -| std | 0.722 | -| value_loss | 0.00243 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1971 | -| time_elapsed | 26172 | -| total_timesteps | 252288 | -| train/ | | -| approx_kl | 0.012515025 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 19700 | -| policy_gradient_loss | -0.00458 | -| std | 0.722 | -| value_loss | 8.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1972 | -| time_elapsed | 26177 | -| total_timesteps | 252416 | -| train/ | | -| approx_kl | 0.006388204 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -37.8 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 19710 | -| policy_gradient_loss | -0.00134 | -| std | 0.723 | -| value_loss | 3.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1973 | -| time_elapsed | 26181 | -| total_timesteps | 252544 | -| train/ | | -| approx_kl | 0.017563647 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -24.5 | -| learning_rate | 0.0003 | -| loss | -0.00961 | -| n_updates | 19720 | -| policy_gradient_loss | -0.00564 | -| std | 0.724 | -| value_loss | 1.7e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1974 | -| time_elapsed | 26186 | -| total_timesteps | 252672 | -| train/ | | -| approx_kl | 0.0167258 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | -0.00675 | -| n_updates | 19730 | -| policy_gradient_loss | -0.00615 | -| std | 0.724 | -| value_loss | 4.04e-09 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1975 | -| time_elapsed | 26190 | -| total_timesteps | 252800 | -| train/ | | -| approx_kl | 0.0052061905 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.1 | -| explained_variance | -0.00479 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 19740 | -| policy_gradient_loss | -0.00272 | -| std | 0.723 | -| value_loss | 2.72e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1976 | -| time_elapsed | 26194 | -| total_timesteps | 252928 | -| train/ | | -| approx_kl | 2.1716114e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | -0.000955 | -| n_updates | 19750 | -| policy_gradient_loss | 0.00289 | -| std | 0.721 | -| value_loss | 2.65e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1977 | -| time_elapsed | 26199 | -| total_timesteps | 253056 | -| train/ | | -| approx_kl | 0.009449765 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | 0.025 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 19760 | -| policy_gradient_loss | -0.00229 | -| std | 0.721 | -| value_loss | 7.23e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1978 | -| time_elapsed | 26206 | -| total_timesteps | 253184 | -| train/ | | -| approx_kl | 0.0031697447 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | 0.552 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 19770 | -| policy_gradient_loss | -0.00246 | -| std | 0.72 | -| value_loss | 0.0183 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1979 | -| time_elapsed | 26211 | -| total_timesteps | 253312 | -| train/ | | -| approx_kl | 0.020304412 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -43.5 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 19780 | -| policy_gradient_loss | -0.00749 | -| std | 0.721 | -| value_loss | 1.23e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1980 | -| time_elapsed | 26214 | -| total_timesteps | 253440 | -| train/ | | -| approx_kl | 0.0131617 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -36.8 | -| learning_rate | 0.0003 | -| loss | 0.000724 | -| n_updates | 19790 | -| policy_gradient_loss | -0.00163 | -| std | 0.721 | -| value_loss | 4.21e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1981 | -| time_elapsed | 26217 | -| total_timesteps | 253568 | -| train/ | | -| approx_kl | 0.0052882954 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -16 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 19800 | -| policy_gradient_loss | -0.00438 | -| std | 0.72 | -| value_loss | 1.47e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1982 | -| time_elapsed | 26221 | -| total_timesteps | 253696 | -| train/ | | -| approx_kl | 0.0038809492 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.000864 | -| n_updates | 19810 | -| policy_gradient_loss | 0.000492 | -| std | 0.72 | -| value_loss | 2.02e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1983 | -| time_elapsed | 26225 | -| total_timesteps | 253824 | -| train/ | | -| approx_kl | 0.005839361 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 19820 | -| policy_gradient_loss | -0.00533 | -| std | 0.719 | -| value_loss | 1.35e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.63 | -| time/ | | -| fps | 9 | -| iterations | 1984 | -| time_elapsed | 26228 | -| total_timesteps | 253952 | -| train/ | | -| approx_kl | 2.6570633e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.000161 | -| n_updates | 19830 | -| policy_gradient_loss | 0.00185 | -| std | 0.718 | -| value_loss | 1.11e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1985 | -| time_elapsed | 26232 | -| total_timesteps | 254080 | -| train/ | | -| approx_kl | 0.003928271 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.09 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.000749 | -| n_updates | 19840 | -| policy_gradient_loss | -0.000602 | -| std | 0.716 | -| value_loss | 1.17e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1986 | -| time_elapsed | 26238 | -| total_timesteps | 254208 | -| train/ | | -| approx_kl | 0.0027518496 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 19850 | -| policy_gradient_loss | -0.00613 | -| std | 0.714 | -| value_loss | 0.00114 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1987 | -| time_elapsed | 26242 | -| total_timesteps | 254336 | -| train/ | | -| approx_kl | 4.474772e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -7.92 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 19860 | -| policy_gradient_loss | 0.000938 | -| std | 0.711 | -| value_loss | 3.08e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1988 | -| time_elapsed | 26247 | -| total_timesteps | 254464 | -| train/ | | -| approx_kl | 0.0044882316 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -3.18 | -| learning_rate | 0.0003 | -| loss | -0.000616 | -| n_updates | 19870 | -| policy_gradient_loss | -0.000418 | -| std | 0.711 | -| value_loss | 7.72e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1989 | -| time_elapsed | 26250 | -| total_timesteps | 254592 | -| train/ | | -| approx_kl | 0.007218177 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.000754 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 19880 | -| policy_gradient_loss | -0.002 | -| std | 0.71 | -| value_loss | 4.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1990 | -| time_elapsed | 26253 | -| total_timesteps | 254720 | -| train/ | | -| approx_kl | 0.011492432 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | -0.00876 | -| n_updates | 19890 | -| policy_gradient_loss | -0.00713 | -| std | 0.709 | -| value_loss | 2.75e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1991 | -| time_elapsed | 26257 | -| total_timesteps | 254848 | -| train/ | | -| approx_kl | 0.0079195015 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | -0.00748 | -| n_updates | 19900 | -| policy_gradient_loss | -0.00349 | -| std | 0.708 | -| value_loss | 2.24e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1992 | -| time_elapsed | 26262 | -| total_timesteps | 254976 | -| train/ | | -| approx_kl | 0.0003688326 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 19910 | -| policy_gradient_loss | 0.000451 | -| std | 0.708 | -| value_loss | 2.63e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1993 | -| time_elapsed | 26267 | -| total_timesteps | 255104 | -| train/ | | -| approx_kl | 0.0003120848 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.00188 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 19920 | -| policy_gradient_loss | 0.000728 | -| std | 0.708 | -| value_loss | 1.46e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1994 | -| time_elapsed | 26278 | -| total_timesteps | 255232 | -| train/ | | -| approx_kl | 0.00022514211 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.713 | -| learning_rate | 0.0003 | -| loss | 0.000916 | -| n_updates | 19930 | -| policy_gradient_loss | -0.000403 | -| std | 0.706 | -| value_loss | 0.00809 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1995 | -| time_elapsed | 26283 | -| total_timesteps | 255360 | -| train/ | | -| approx_kl | 0.021093886 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -31.7 | -| learning_rate | 0.0003 | -| loss | -0.0319 | -| n_updates | 19940 | -| policy_gradient_loss | -0.0168 | -| std | 0.705 | -| value_loss | 1.6e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1996 | -| time_elapsed | 26287 | -| total_timesteps | 255488 | -| train/ | | -| approx_kl | 0.00541745 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -29.1 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 19950 | -| policy_gradient_loss | 0.000818 | -| std | 0.704 | -| value_loss | 7.01e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1997 | -| time_elapsed | 26292 | -| total_timesteps | 255616 | -| train/ | | -| approx_kl | 5.5785757e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -28.7 | -| learning_rate | 0.0003 | -| loss | -4.59e-05 | -| n_updates | 19960 | -| policy_gradient_loss | 5.26e-05 | -| std | 0.705 | -| value_loss | 2.08e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1998 | -| time_elapsed | 26296 | -| total_timesteps | 255744 | -| train/ | | -| approx_kl | 0.0063073784 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -3.67 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 19970 | -| policy_gradient_loss | -0.00291 | -| std | 0.706 | -| value_loss | 1.24e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 9 | -| iterations | 1999 | -| time_elapsed | 26300 | -| total_timesteps | 255872 | -| train/ | | -| approx_kl | 0.000249058 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | 0.00096 | -| n_updates | 19980 | -| policy_gradient_loss | 0.00116 | -| std | 0.706 | -| value_loss | 5.3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2000 | -| time_elapsed | 26305 | -| total_timesteps | 256000 | -| train/ | | -| approx_kl | 0.001483216 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 19990 | -| policy_gradient_loss | -0.0027 | -| std | 0.706 | -| value_loss | 5.69e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2001 | -| time_elapsed | 26309 | -| total_timesteps | 256128 | -| train/ | | -| approx_kl | 0.016246991 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.0289 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 20000 | -| policy_gradient_loss | -0.0139 | -| std | 0.706 | -| value_loss | 9.55e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2002 | -| time_elapsed | 26319 | -| total_timesteps | 256256 | -| train/ | | -| approx_kl | 0.010647802 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.00803 | -| n_updates | 20010 | -| policy_gradient_loss | -0.00659 | -| std | 0.706 | -| value_loss | 0.00526 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2003 | -| time_elapsed | 26323 | -| total_timesteps | 256384 | -| train/ | | -| approx_kl | 0.002990455 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | -0.000172 | -| n_updates | 20020 | -| policy_gradient_loss | -0.000101 | -| std | 0.705 | -| value_loss | 6.37e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2004 | -| time_elapsed | 26327 | -| total_timesteps | 256512 | -| train/ | | -| approx_kl | 0.0109983925 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | -0.00791 | -| n_updates | 20030 | -| policy_gradient_loss | -0.00404 | -| std | 0.707 | -| value_loss | 1.35e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2005 | -| time_elapsed | 26331 | -| total_timesteps | 256640 | -| train/ | | -| approx_kl | 0.0014039758 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.0166 | -| learning_rate | 0.0003 | -| loss | 0.00099 | -| n_updates | 20040 | -| policy_gradient_loss | 0.000704 | -| std | 0.708 | -| value_loss | 9.87e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2006 | -| time_elapsed | 26336 | -| total_timesteps | 256768 | -| train/ | | -| approx_kl | 0.0047944984 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.482 | -| learning_rate | 0.0003 | -| loss | -0.00935 | -| n_updates | 20050 | -| policy_gradient_loss | -0.00369 | -| std | 0.709 | -| value_loss | 7.3e-08 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2007 | -| time_elapsed | 26341 | -| total_timesteps | 256896 | -| train/ | | -| approx_kl | 1.51935965e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.536 | -| learning_rate | 0.0003 | -| loss | 0.00023 | -| n_updates | 20060 | -| policy_gradient_loss | 0.00101 | -| std | 0.709 | -| value_loss | 8.81e-08 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2008 | -| time_elapsed | 26344 | -| total_timesteps | 257024 | -| train/ | | -| approx_kl | 0.00034787785 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.042 | -| learning_rate | 0.0003 | -| loss | 0.000248 | -| n_updates | 20070 | -| policy_gradient_loss | 0.000359 | -| std | 0.708 | -| value_loss | 4.66e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2009 | -| time_elapsed | 26353 | -| total_timesteps | 257152 | -| train/ | | -| approx_kl | 0.004336472 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | -0.00892 | -| n_updates | 20080 | -| policy_gradient_loss | -0.00506 | -| std | 0.706 | -| value_loss | 0.00271 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2010 | -| time_elapsed | 26358 | -| total_timesteps | 257280 | -| train/ | | -| approx_kl | 0.014665729 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 20090 | -| policy_gradient_loss | -0.0149 | -| std | 0.706 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2011 | -| time_elapsed | 26363 | -| total_timesteps | 257408 | -| train/ | | -| approx_kl | 0.0060596857 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -25.3 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 20100 | -| policy_gradient_loss | -0.00112 | -| std | 0.707 | -| value_loss | 8.03e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2012 | -| time_elapsed | 26366 | -| total_timesteps | 257536 | -| train/ | | -| approx_kl | 0.0024884795 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.531 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 20110 | -| policy_gradient_loss | -0.00674 | -| std | 0.707 | -| value_loss | 3.61e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2013 | -| time_elapsed | 26370 | -| total_timesteps | 257664 | -| train/ | | -| approx_kl | 0.0034338296 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.825 | -| learning_rate | 0.0003 | -| loss | -5.5e-06 | -| n_updates | 20120 | -| policy_gradient_loss | 5.74e-05 | -| std | 0.709 | -| value_loss | 2.67e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2014 | -| time_elapsed | 26373 | -| total_timesteps | 257792 | -| train/ | | -| approx_kl | 0.00014402298 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.0252 | -| learning_rate | 0.0003 | -| loss | -0.00041 | -| n_updates | 20130 | -| policy_gradient_loss | -0.000149 | -| std | 0.711 | -| value_loss | 1.47e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2015 | -| time_elapsed | 26377 | -| total_timesteps | 257920 | -| train/ | | -| approx_kl | 0.004281505 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.0885 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 20140 | -| policy_gradient_loss | -0.00768 | -| std | 0.713 | -| value_loss | 1.49e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2016 | -| time_elapsed | 26382 | -| total_timesteps | 258048 | -| train/ | | -| approx_kl | 3.5301782e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -6.76e-06 | -| n_updates | 20150 | -| policy_gradient_loss | 0.00202 | -| std | 0.714 | -| value_loss | 7.33e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2017 | -| time_elapsed | 26390 | -| total_timesteps | 258176 | -| train/ | | -| approx_kl | 0.0027154153 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | 0.00969 | -| n_updates | 20160 | -| policy_gradient_loss | 0.0037 | -| std | 0.713 | -| value_loss | 0.00381 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2018 | -| time_elapsed | 26394 | -| total_timesteps | 258304 | -| train/ | | -| approx_kl | 0.0020366372 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -23 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 20170 | -| policy_gradient_loss | -0.000707 | -| std | 0.713 | -| value_loss | 1.62e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2019 | -| time_elapsed | 26398 | -| total_timesteps | 258432 | -| train/ | | -| approx_kl | 0.0063974215 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -17.4 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 20180 | -| policy_gradient_loss | -0.00154 | -| std | 0.714 | -| value_loss | 2.84e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2020 | -| time_elapsed | 26402 | -| total_timesteps | 258560 | -| train/ | | -| approx_kl | 0.004774019 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.000839 | -| n_updates | 20190 | -| policy_gradient_loss | -0.000607 | -| std | 0.716 | -| value_loss | 1.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2021 | -| time_elapsed | 26407 | -| total_timesteps | 258688 | -| train/ | | -| approx_kl | 0.008317835 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 20200 | -| policy_gradient_loss | -0.00339 | -| std | 0.716 | -| value_loss | 1.61e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2022 | -| time_elapsed | 26410 | -| total_timesteps | 258816 | -| train/ | | -| approx_kl | 0.00054633664 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.000143 | -| n_updates | 20210 | -| policy_gradient_loss | 9.54e-05 | -| std | 0.716 | -| value_loss | 9.72e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2023 | -| time_elapsed | 26413 | -| total_timesteps | 258944 | -| train/ | | -| approx_kl | 0.002507118 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.0387 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 20220 | -| policy_gradient_loss | -0.00094 | -| std | 0.715 | -| value_loss | 8.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2024 | -| time_elapsed | 26417 | -| total_timesteps | 259072 | -| train/ | | -| approx_kl | 0.015431188 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.0319 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 20230 | -| policy_gradient_loss | -0.00993 | -| std | 0.714 | -| value_loss | 7.75e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2025 | -| time_elapsed | 26424 | -| total_timesteps | 259200 | -| train/ | | -| approx_kl | 0.0030609788 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.687 | -| learning_rate | 0.0003 | -| loss | 0.00432 | -| n_updates | 20240 | -| policy_gradient_loss | -0.000616 | -| std | 0.715 | -| value_loss | 0.0123 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2026 | -| time_elapsed | 26428 | -| total_timesteps | 259328 | -| train/ | | -| approx_kl | 0.0029140054 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -16.8 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 20250 | -| policy_gradient_loss | -0.00148 | -| std | 0.715 | -| value_loss | 5.8e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2027 | -| time_elapsed | 26433 | -| total_timesteps | 259456 | -| train/ | | -| approx_kl | 4.9836002e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 20260 | -| policy_gradient_loss | 0.00225 | -| std | 0.716 | -| value_loss | 1.03e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2028 | -| time_elapsed | 26436 | -| total_timesteps | 259584 | -| train/ | | -| approx_kl | 0.013981335 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -8.8 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 20270 | -| policy_gradient_loss | -0.00721 | -| std | 0.715 | -| value_loss | 4.64e-07 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2029 | -| time_elapsed | 26440 | -| total_timesteps | 259712 | -| train/ | | -| approx_kl | 0.000102274586 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -2.05 | -| learning_rate | 0.0003 | -| loss | -0.000945 | -| n_updates | 20280 | -| policy_gradient_loss | 0.000313 | -| std | 0.713 | -| value_loss | 2.03e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2030 | -| time_elapsed | 26445 | -| total_timesteps | 259840 | -| train/ | | -| approx_kl | 0.004799303 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.0513 | -| learning_rate | 0.0003 | -| loss | -0.000789 | -| n_updates | 20290 | -| policy_gradient_loss | -0.000743 | -| std | 0.711 | -| value_loss | 2.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2031 | -| time_elapsed | 26449 | -| total_timesteps | 259968 | -| train/ | | -| approx_kl | 0.0010704175 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | -0.000744 | -| n_updates | 20300 | -| policy_gradient_loss | -0.000327 | -| std | 0.71 | -| value_loss | 4.48e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2032 | -| time_elapsed | 26454 | -| total_timesteps | 260096 | -| train/ | | -| approx_kl | 0.001571314 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 20310 | -| policy_gradient_loss | -0.00104 | -| std | 0.709 | -| value_loss | 9.08e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2033 | -| time_elapsed | 26462 | -| total_timesteps | 260224 | -| train/ | | -| approx_kl | 0.00078648655 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.762 | -| learning_rate | 0.0003 | -| loss | -0.00078 | -| n_updates | 20320 | -| policy_gradient_loss | -0.00223 | -| std | 0.707 | -| value_loss | 0.00891 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2034 | -| time_elapsed | 26467 | -| total_timesteps | 260352 | -| train/ | | -| approx_kl | 0.007544404 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -8.75 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 20330 | -| policy_gradient_loss | -0.00646 | -| std | 0.705 | -| value_loss | 4.09e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2035 | -| time_elapsed | 26471 | -| total_timesteps | 260480 | -| train/ | | -| approx_kl | 3.6236364e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -4.36 | -| learning_rate | 0.0003 | -| loss | 0.000621 | -| n_updates | 20340 | -| policy_gradient_loss | 0.00168 | -| std | 0.705 | -| value_loss | 2.73e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2036 | -| time_elapsed | 26475 | -| total_timesteps | 260608 | -| train/ | | -| approx_kl | 0.0027058413 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -2.42 | -| learning_rate | 0.0003 | -| loss | 5.71e-05 | -| n_updates | 20350 | -| policy_gradient_loss | 4.54e-05 | -| std | 0.706 | -| value_loss | 1.6e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2037 | -| time_elapsed | 26480 | -| total_timesteps | 260736 | -| train/ | | -| approx_kl | 0.008353077 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 20360 | -| policy_gradient_loss | -0.00721 | -| std | 0.705 | -| value_loss | 7.45e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2038 | -| time_elapsed | 26485 | -| total_timesteps | 260864 | -| train/ | | -| approx_kl | 0.0009372318 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.000459 | -| n_updates | 20370 | -| policy_gradient_loss | 0.000303 | -| std | 0.703 | -| value_loss | 6.29e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2039 | -| time_elapsed | 26490 | -| total_timesteps | 260992 | -| train/ | | -| approx_kl | 0.004391244 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.00721 | -| n_updates | 20380 | -| policy_gradient_loss | -0.00282 | -| std | 0.703 | -| value_loss | 7.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2040 | -| time_elapsed | 26495 | -| total_timesteps | 261120 | -| train/ | | -| approx_kl | 0.016385552 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 20390 | -| policy_gradient_loss | -0.00855 | -| std | 0.704 | -| value_loss | 2.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2041 | -| time_elapsed | 26506 | -| total_timesteps | 261248 | -| train/ | | -| approx_kl | 0.009009117 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 20400 | -| policy_gradient_loss | -0.0139 | -| std | 0.704 | -| value_loss | 0.00574 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2042 | -| time_elapsed | 26510 | -| total_timesteps | 261376 | -| train/ | | -| approx_kl | 0.007425005 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -5.5 | -| learning_rate | 0.0003 | -| loss | -0.000581 | -| n_updates | 20410 | -| policy_gradient_loss | -0.000432 | -| std | 0.705 | -| value_loss | 5.53e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2043 | -| time_elapsed | 26515 | -| total_timesteps | 261504 | -| train/ | | -| approx_kl | 0.0023666006 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.853 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 20420 | -| policy_gradient_loss | -0.00166 | -| std | 0.705 | -| value_loss | 9.24e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2044 | -| time_elapsed | 26519 | -| total_timesteps | 261632 | -| train/ | | -| approx_kl | 0.0095937895 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -3.29 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 20430 | -| policy_gradient_loss | -0.00287 | -| std | 0.706 | -| value_loss | 2.81e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2045 | -| time_elapsed | 26523 | -| total_timesteps | 261760 | -| train/ | | -| approx_kl | 0.003880086 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.028 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 20440 | -| policy_gradient_loss | -0.00144 | -| std | 0.707 | -| value_loss | 3.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2046 | -| time_elapsed | 26527 | -| total_timesteps | 261888 | -| train/ | | -| approx_kl | 0.017991785 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 20450 | -| policy_gradient_loss | -0.011 | -| std | 0.708 | -| value_loss | 3.4e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2047 | -| time_elapsed | 26531 | -| total_timesteps | 262016 | -| train/ | | -| approx_kl | 0.00014200993 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 20460 | -| policy_gradient_loss | 0.000995 | -| std | 0.71 | -| value_loss | 2.83e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2048 | -| time_elapsed | 26542 | -| total_timesteps | 262144 | -| train/ | | -| approx_kl | 0.008523384 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 20470 | -| policy_gradient_loss | -0.00538 | -| std | 0.711 | -| value_loss | 0.00227 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2049 | -| time_elapsed | 26546 | -| total_timesteps | 262272 | -| train/ | | -| approx_kl | 0.0037927642 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -12.3 | -| learning_rate | 0.0003 | -| loss | -6.7e-05 | -| n_updates | 20480 | -| policy_gradient_loss | -0.000242 | -| std | 0.71 | -| value_loss | 5.46e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2050 | -| time_elapsed | 26550 | -| total_timesteps | 262400 | -| train/ | | -| approx_kl | 0.0014050086 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.08 | -| explained_variance | -11.6 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 20490 | -| policy_gradient_loss | -0.000643 | -| std | 0.709 | -| value_loss | 1.37e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2051 | -| time_elapsed | 26554 | -| total_timesteps | 262528 | -| train/ | | -| approx_kl | 0.00031983387 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -8.45 | -| learning_rate | 0.0003 | -| loss | -0.000501 | -| n_updates | 20500 | -| policy_gradient_loss | -0.00015 | -| std | 0.706 | -| value_loss | 2.62e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2052 | -| time_elapsed | 26558 | -| total_timesteps | 262656 | -| train/ | | -| approx_kl | 0.012853895 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -12.7 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 20510 | -| policy_gradient_loss | -0.00276 | -| std | 0.705 | -| value_loss | 2.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2053 | -| time_elapsed | 26562 | -| total_timesteps | 262784 | -| train/ | | -| approx_kl | 0.0045847287 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.721 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 20520 | -| policy_gradient_loss | -0.00763 | -| std | 0.705 | -| value_loss | 1.67e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2054 | -| time_elapsed | 26565 | -| total_timesteps | 262912 | -| train/ | | -| approx_kl | 0.014293859 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.771 | -| learning_rate | 0.0003 | -| loss | -0.0299 | -| n_updates | 20530 | -| policy_gradient_loss | -0.0162 | -| std | 0.705 | -| value_loss | 1.77e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2055 | -| time_elapsed | 26570 | -| total_timesteps | 263040 | -| train/ | | -| approx_kl | 0.00039242068 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.0633 | -| learning_rate | 0.0003 | -| loss | 0.00421 | -| n_updates | 20540 | -| policy_gradient_loss | 0.00481 | -| std | 0.705 | -| value_loss | 1.07e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2056 | -| time_elapsed | 26578 | -| total_timesteps | 263168 | -| train/ | | -| approx_kl | 0.02161154 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.713 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 20550 | -| policy_gradient_loss | -0.0105 | -| std | 0.706 | -| value_loss | 0.00225 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2057 | -| time_elapsed | 26582 | -| total_timesteps | 263296 | -| train/ | | -| approx_kl | 8.162996e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -19 | -| learning_rate | 0.0003 | -| loss | -4.99e-05 | -| n_updates | 20560 | -| policy_gradient_loss | 1.67e-06 | -| std | 0.705 | -| value_loss | 4.87e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2058 | -| time_elapsed | 26587 | -| total_timesteps | 263424 | -| train/ | | -| approx_kl | 0.005851737 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -25.4 | -| learning_rate | 0.0003 | -| loss | -0.00964 | -| n_updates | 20570 | -| policy_gradient_loss | -0.00408 | -| std | 0.703 | -| value_loss | 9.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2059 | -| time_elapsed | 26591 | -| total_timesteps | 263552 | -| train/ | | -| approx_kl | 0.015721785 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -2.79 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 20580 | -| policy_gradient_loss | -0.00394 | -| std | 0.702 | -| value_loss | 1.65e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2060 | -| time_elapsed | 26595 | -| total_timesteps | 263680 | -| train/ | | -| approx_kl | 0.0017750957 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.705 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 20590 | -| policy_gradient_loss | -0.00212 | -| std | 0.702 | -| value_loss | 4.4e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2061 | -| time_elapsed | 26597 | -| total_timesteps | 263808 | -| train/ | | -| approx_kl | 0.010792185 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 20600 | -| policy_gradient_loss | -0.00308 | -| std | 0.703 | -| value_loss | 8.36e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2062 | -| time_elapsed | 26602 | -| total_timesteps | 263936 | -| train/ | | -| approx_kl | 0.0006230059 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.00147 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 20610 | -| policy_gradient_loss | -0.000384 | -| std | 0.704 | -| value_loss | 7.25e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2063 | -| time_elapsed | 26606 | -| total_timesteps | 264064 | -| train/ | | -| approx_kl | 0.0017995341 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.00886 | -| learning_rate | 0.0003 | -| loss | -0.000479 | -| n_updates | 20620 | -| policy_gradient_loss | -0.000224 | -| std | 0.706 | -| value_loss | 8.97e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2064 | -| time_elapsed | 26611 | -| total_timesteps | 264192 | -| train/ | | -| approx_kl | 0.002091474 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 20630 | -| policy_gradient_loss | -0.0115 | -| std | 0.706 | -| value_loss | 0.0036 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2065 | -| time_elapsed | 26615 | -| total_timesteps | 264320 | -| train/ | | -| approx_kl | 0.12784652 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 20640 | -| policy_gradient_loss | 0.014 | -| std | 0.706 | -| value_loss | 3.53e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2066 | -| time_elapsed | 26618 | -| total_timesteps | 264448 | -| train/ | | -| approx_kl | 0.00045081787 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -8.52 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 20650 | -| policy_gradient_loss | -0.000126 | -| std | 0.707 | -| value_loss | 6.94e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2067 | -| time_elapsed | 26621 | -| total_timesteps | 264576 | -| train/ | | -| approx_kl | 0.01339703 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 20660 | -| policy_gradient_loss | -0.0079 | -| std | 0.707 | -| value_loss | 2.37e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2068 | -| time_elapsed | 26624 | -| total_timesteps | 264704 | -| train/ | | -| approx_kl | 0.00021099718 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.34 | -| learning_rate | 0.0003 | -| loss | -0.00412 | -| n_updates | 20670 | -| policy_gradient_loss | 0.000759 | -| std | 0.707 | -| value_loss | 2.46e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2069 | -| time_elapsed | 26627 | -| total_timesteps | 264832 | -| train/ | | -| approx_kl | 0.0115741035 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.00922 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 20680 | -| policy_gradient_loss | -0.00565 | -| std | 0.704 | -| value_loss | 1.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2070 | -| time_elapsed | 26631 | -| total_timesteps | 264960 | -| train/ | | -| approx_kl | 0.00010643015 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | -0.000306 | -| n_updates | 20690 | -| policy_gradient_loss | -9.37e-06 | -| std | 0.703 | -| value_loss | 1.01e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2071 | -| time_elapsed | 26635 | -| total_timesteps | 265088 | -| train/ | | -| approx_kl | 0.0018580081 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 20700 | -| policy_gradient_loss | -0.00149 | -| std | 0.703 | -| value_loss | 1.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2072 | -| time_elapsed | 26644 | -| total_timesteps | 265216 | -| train/ | | -| approx_kl | 0.018720888 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 20710 | -| policy_gradient_loss | -0.0099 | -| std | 0.703 | -| value_loss | 0.00148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2073 | -| time_elapsed | 26648 | -| total_timesteps | 265344 | -| train/ | | -| approx_kl | 0.010709232 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -22.2 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 20720 | -| policy_gradient_loss | -0.00226 | -| std | 0.702 | -| value_loss | 1.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2074 | -| time_elapsed | 26653 | -| total_timesteps | 265472 | -| train/ | | -| approx_kl | 0.011772965 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -1.07 | -| explained_variance | -30.8 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 20730 | -| policy_gradient_loss | -0.0037 | -| std | 0.702 | -| value_loss | 6.58e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2075 | -| time_elapsed | 26658 | -| total_timesteps | 265600 | -| train/ | | -| approx_kl | 0.00088518625 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -2.72 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 20740 | -| policy_gradient_loss | 1.93e-05 | -| std | 0.7 | -| value_loss | 7.34e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2076 | -| time_elapsed | 26662 | -| total_timesteps | 265728 | -| train/ | | -| approx_kl | 0.0024780398 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 20750 | -| policy_gradient_loss | -0.0013 | -| std | 0.697 | -| value_loss | 5.31e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2077 | -| time_elapsed | 26665 | -| total_timesteps | 265856 | -| train/ | | -| approx_kl | 3.8407743e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | 0.000147 | -| n_updates | 20760 | -| policy_gradient_loss | 0.000639 | -| std | 0.697 | -| value_loss | 3.8e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.67 | -| time/ | | -| fps | 9 | -| iterations | 2078 | -| time_elapsed | 26669 | -| total_timesteps | 265984 | -| train/ | | -| approx_kl | 0.00040239375 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | 0.000226 | -| n_updates | 20770 | -| policy_gradient_loss | 0.000186 | -| std | 0.698 | -| value_loss | 2.62e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2079 | -| time_elapsed | 26672 | -| total_timesteps | 266112 | -| train/ | | -| approx_kl | 0.005678189 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 20780 | -| policy_gradient_loss | -0.00334 | -| std | 0.698 | -| value_loss | 2.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2080 | -| time_elapsed | 26683 | -| total_timesteps | 266240 | -| train/ | | -| approx_kl | 0.008744473 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | 0.12 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 20790 | -| policy_gradient_loss | -0.00784 | -| std | 0.697 | -| value_loss | 0.00246 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2081 | -| time_elapsed | 26686 | -| total_timesteps | 266368 | -| train/ | | -| approx_kl | 0.0005117436 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -39.7 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 20800 | -| policy_gradient_loss | -0.000189 | -| std | 0.697 | -| value_loss | 3.16e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2082 | -| time_elapsed | 26691 | -| total_timesteps | 266496 | -| train/ | | -| approx_kl | 0.010643797 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -45 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 20810 | -| policy_gradient_loss | -0.00567 | -| std | 0.697 | -| value_loss | 8.39e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2083 | -| time_elapsed | 26695 | -| total_timesteps | 266624 | -| train/ | | -| approx_kl | 0.0033821505 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 20820 | -| policy_gradient_loss | -0.00284 | -| std | 0.696 | -| value_loss | 1.95e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2084 | -| time_elapsed | 26699 | -| total_timesteps | 266752 | -| train/ | | -| approx_kl | 2.3883767e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -6.32 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 20830 | -| policy_gradient_loss | 0.00298 | -| std | 0.696 | -| value_loss | 1.07e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.66 | -| time/ | | -| fps | 9 | -| iterations | 2085 | -| time_elapsed | 26702 | -| total_timesteps | 266880 | -| train/ | | -| approx_kl | 0.0006132652 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.06 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | 0.000402 | -| n_updates | 20840 | -| policy_gradient_loss | 0.000373 | -| std | 0.694 | -| value_loss | 2.26e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2086 | -| time_elapsed | 26707 | -| total_timesteps | 267008 | -| train/ | | -| approx_kl | 0.0031742696 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -0.0778 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 20850 | -| policy_gradient_loss | -0.00112 | -| std | 0.694 | -| value_loss | 1.6e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 9 | -| iterations | 2087 | -| time_elapsed | 26718 | -| total_timesteps | 267136 | -| train/ | | -| approx_kl | 0.021820629 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.788 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 20860 | -| policy_gradient_loss | -0.00704 | -| std | 0.694 | -| value_loss | 0.00512 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2088 | -| time_elapsed | 26721 | -| total_timesteps | 267264 | -| train/ | | -| approx_kl | 0.002187177 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -53.3 | -| learning_rate | 0.0003 | -| loss | -0.000235 | -| n_updates | 20870 | -| policy_gradient_loss | -0.000177 | -| std | 0.692 | -| value_loss | 0.000115 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2089 | -| time_elapsed | 26724 | -| total_timesteps | 267392 | -| train/ | | -| approx_kl | 0.003947564 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -39.1 | -| learning_rate | 0.0003 | -| loss | -0.00834 | -| n_updates | 20880 | -| policy_gradient_loss | -0.00299 | -| std | 0.69 | -| value_loss | 3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2090 | -| time_elapsed | 26728 | -| total_timesteps | 267520 | -| train/ | | -| approx_kl | 0.008882847 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -31.3 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 20890 | -| policy_gradient_loss | -0.00356 | -| std | 0.689 | -| value_loss | 2.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2091 | -| time_elapsed | 26731 | -| total_timesteps | 267648 | -| train/ | | -| approx_kl | 0.005852666 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -24.1 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 20900 | -| policy_gradient_loss | -0.00543 | -| std | 0.689 | -| value_loss | 1.74e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2092 | -| time_elapsed | 26734 | -| total_timesteps | 267776 | -| train/ | | -| approx_kl | 0.013575302 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 20910 | -| policy_gradient_loss | -0.00756 | -| std | 0.689 | -| value_loss | 1.68e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2093 | -| time_elapsed | 26737 | -| total_timesteps | 267904 | -| train/ | | -| approx_kl | 0.00082450174 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -1.29 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 20920 | -| policy_gradient_loss | 0.00135 | -| std | 0.69 | -| value_loss | 8.38e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2094 | -| time_elapsed | 26740 | -| total_timesteps | 268032 | -| train/ | | -| approx_kl | 0.0027699582 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.0299 | -| learning_rate | 0.0003 | -| loss | -0.00809 | -| n_updates | 20930 | -| policy_gradient_loss | -0.00228 | -| std | 0.691 | -| value_loss | 5.63e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2095 | -| time_elapsed | 26749 | -| total_timesteps | 268160 | -| train/ | | -| approx_kl | 0.012817103 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 20940 | -| policy_gradient_loss | -0.00356 | -| std | 0.69 | -| value_loss | 0.00472 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2096 | -| time_elapsed | 26753 | -| total_timesteps | 268288 | -| train/ | | -| approx_kl | 0.001693387 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | -0.00809 | -| n_updates | 20950 | -| policy_gradient_loss | -0.000847 | -| std | 0.69 | -| value_loss | 1.12e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2097 | -| time_elapsed | 26757 | -| total_timesteps | 268416 | -| train/ | | -| approx_kl | 0.00025033252 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 20960 | -| policy_gradient_loss | 0.000867 | -| std | 0.69 | -| value_loss | 2.64e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2098 | -| time_elapsed | 26761 | -| total_timesteps | 268544 | -| train/ | | -| approx_kl | 5.7639554e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.000626 | -| n_updates | 20970 | -| policy_gradient_loss | 0.000392 | -| std | 0.688 | -| value_loss | 6.23e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2099 | -| time_elapsed | 26765 | -| total_timesteps | 268672 | -| train/ | | -| approx_kl | 0.0019140812 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.348 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 20980 | -| policy_gradient_loss | -0.000403 | -| std | 0.687 | -| value_loss | 8.89e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2100 | -| time_elapsed | 26769 | -| total_timesteps | 268800 | -| train/ | | -| approx_kl | 0.00033555832 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 20990 | -| policy_gradient_loss | 0.000712 | -| std | 0.688 | -| value_loss | 7.39e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2101 | -| time_elapsed | 26773 | -| total_timesteps | 268928 | -| train/ | | -| approx_kl | 0.0020743348 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.000506 | -| n_updates | 21000 | -| policy_gradient_loss | 0.0004 | -| std | 0.69 | -| value_loss | 1.16e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2102 | -| time_elapsed | 26777 | -| total_timesteps | 269056 | -| train/ | | -| approx_kl | 0.0061004814 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.0312 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 21010 | -| policy_gradient_loss | -0.00616 | -| std | 0.691 | -| value_loss | 8.37e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2103 | -| time_elapsed | 26785 | -| total_timesteps | 269184 | -| train/ | | -| approx_kl | 0.0020002876 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.00914 | -| n_updates | 21020 | -| policy_gradient_loss | -0.0035 | -| std | 0.69 | -| value_loss | 0.00207 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2104 | -| time_elapsed | 26789 | -| total_timesteps | 269312 | -| train/ | | -| approx_kl | 0.00040823594 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -37.5 | -| learning_rate | 0.0003 | -| loss | -0.000332 | -| n_updates | 21030 | -| policy_gradient_loss | -0.000169 | -| std | 0.688 | -| value_loss | 1.32e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2105 | -| time_elapsed | 26794 | -| total_timesteps | 269440 | -| train/ | | -| approx_kl | 0.004299897 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -36.3 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 21040 | -| policy_gradient_loss | -0.00464 | -| std | 0.687 | -| value_loss | 3.92e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2106 | -| time_elapsed | 26799 | -| total_timesteps | 269568 | -| train/ | | -| approx_kl | 0.012500128 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 21050 | -| policy_gradient_loss | -0.00373 | -| std | 0.689 | -| value_loss | 1.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2107 | -| time_elapsed | 26804 | -| total_timesteps | 269696 | -| train/ | | -| approx_kl | 0.007868575 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 21060 | -| policy_gradient_loss | -0.00271 | -| std | 0.689 | -| value_loss | 9.46e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2108 | -| time_elapsed | 26807 | -| total_timesteps | 269824 | -| train/ | | -| approx_kl | 0.00078970054 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.00592 | -| learning_rate | 0.0003 | -| loss | 0.000592 | -| n_updates | 21070 | -| policy_gradient_loss | 0.00043 | -| std | 0.689 | -| value_loss | 8.05e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2109 | -| time_elapsed | 26811 | -| total_timesteps | 269952 | -| train/ | | -| approx_kl | 0.0075434963 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.0191 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 21080 | -| policy_gradient_loss | -0.00601 | -| std | 0.689 | -| value_loss | 7.39e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2110 | -| time_elapsed | 26815 | -| total_timesteps | 270080 | -| train/ | | -| approx_kl | 0.01345285 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0085 | -| n_updates | 21090 | -| policy_gradient_loss | -0.00684 | -| std | 0.689 | -| value_loss | 1.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2111 | -| time_elapsed | 26823 | -| total_timesteps | 270208 | -| train/ | | -| approx_kl | 0.012017272 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.251 | -| learning_rate | 0.0003 | -| loss | -0.0236 | -| n_updates | 21100 | -| policy_gradient_loss | -0.0148 | -| std | 0.689 | -| value_loss | 0.00312 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2112 | -| time_elapsed | 26829 | -| total_timesteps | 270336 | -| train/ | | -| approx_kl | 0.012444729 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.00934 | -| n_updates | 21110 | -| policy_gradient_loss | -0.00498 | -| std | 0.687 | -| value_loss | 4.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2113 | -| time_elapsed | 26833 | -| total_timesteps | 270464 | -| train/ | | -| approx_kl | 0.017116563 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -29.5 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 21120 | -| policy_gradient_loss | -0.0077 | -| std | 0.686 | -| value_loss | 1.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2114 | -| time_elapsed | 26838 | -| total_timesteps | 270592 | -| train/ | | -| approx_kl | 0.009591423 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 21130 | -| policy_gradient_loss | -0.00209 | -| std | 0.684 | -| value_loss | 1.56e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2115 | -| time_elapsed | 26841 | -| total_timesteps | 270720 | -| train/ | | -| approx_kl | 0.0023491113 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.333 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 21140 | -| policy_gradient_loss | -0.00218 | -| std | 0.68 | -| value_loss | 9.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2116 | -| time_elapsed | 26846 | -| total_timesteps | 270848 | -| train/ | | -| approx_kl | 0.010544015 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 21150 | -| policy_gradient_loss | -0.00881 | -| std | 0.678 | -| value_loss | 5.87e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2117 | -| time_elapsed | 26850 | -| total_timesteps | 270976 | -| train/ | | -| approx_kl | 2.6683789e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.000549 | -| n_updates | 21160 | -| policy_gradient_loss | 0.00262 | -| std | 0.676 | -| value_loss | 9.69e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2118 | -| time_elapsed | 26855 | -| total_timesteps | 271104 | -| train/ | | -| approx_kl | 0.0068053477 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 21170 | -| policy_gradient_loss | -0.00174 | -| std | 0.677 | -| value_loss | 6.86e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2119 | -| time_elapsed | 26864 | -| total_timesteps | 271232 | -| train/ | | -| approx_kl | 0.0030698064 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 21180 | -| policy_gradient_loss | -0.0059 | -| std | 0.678 | -| value_loss | 0.00301 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2120 | -| time_elapsed | 26869 | -| total_timesteps | 271360 | -| train/ | | -| approx_kl | 0.010241005 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 21190 | -| policy_gradient_loss | -0.00273 | -| std | 0.679 | -| value_loss | 3.29e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2121 | -| time_elapsed | 26873 | -| total_timesteps | 271488 | -| train/ | | -| approx_kl | 0.0054252497 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 21200 | -| policy_gradient_loss | -0.0017 | -| std | 0.68 | -| value_loss | 3.23e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2122 | -| time_elapsed | 26878 | -| total_timesteps | 271616 | -| train/ | | -| approx_kl | 0.0002505649 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 21210 | -| policy_gradient_loss | 0.000316 | -| std | 0.681 | -| value_loss | 2.25e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2123 | -| time_elapsed | 26883 | -| total_timesteps | 271744 | -| train/ | | -| approx_kl | 0.0002927375 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.00054 | -| n_updates | 21220 | -| policy_gradient_loss | 0.000529 | -| std | 0.68 | -| value_loss | 1.46e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2124 | -| time_elapsed | 26887 | -| total_timesteps | 271872 | -| train/ | | -| approx_kl | 0.0017810473 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 21230 | -| policy_gradient_loss | -0.000931 | -| std | 0.678 | -| value_loss | 1.31e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2125 | -| time_elapsed | 26891 | -| total_timesteps | 272000 | -| train/ | | -| approx_kl | 2.4451874e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.0197 | -| learning_rate | 0.0003 | -| loss | -4.44e-05 | -| n_updates | 21240 | -| policy_gradient_loss | 0.000539 | -| std | 0.678 | -| value_loss | 1.19e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2126 | -| time_elapsed | 26895 | -| total_timesteps | 272128 | -| train/ | | -| approx_kl | 0.0008805711 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.00483 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 21250 | -| policy_gradient_loss | -0.00154 | -| std | 0.678 | -| value_loss | 6.88e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2127 | -| time_elapsed | 26906 | -| total_timesteps | 272256 | -| train/ | | -| approx_kl | 0.00045802444 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.751 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 21260 | -| policy_gradient_loss | -0.00205 | -| std | 0.68 | -| value_loss | 0.00252 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2128 | -| time_elapsed | 26910 | -| total_timesteps | 272384 | -| train/ | | -| approx_kl | 0.0024447502 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -7.85 | -| learning_rate | 0.0003 | -| loss | -0.000837 | -| n_updates | 21270 | -| policy_gradient_loss | -0.000466 | -| std | 0.68 | -| value_loss | 2.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2129 | -| time_elapsed | 26914 | -| total_timesteps | 272512 | -| train/ | | -| approx_kl | 0.0021717884 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -8.84 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 21280 | -| policy_gradient_loss | -0.0015 | -| std | 0.679 | -| value_loss | 1.04e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2130 | -| time_elapsed | 26919 | -| total_timesteps | 272640 | -| train/ | | -| approx_kl | 0.0016485816 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | 0.000967 | -| n_updates | 21290 | -| policy_gradient_loss | 0.000655 | -| std | 0.679 | -| value_loss | 5.37e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2131 | -| time_elapsed | 26923 | -| total_timesteps | 272768 | -| train/ | | -| approx_kl | 0.0043865675 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.0074 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 21300 | -| policy_gradient_loss | -0.00442 | -| std | 0.679 | -| value_loss | 2.08e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2132 | -| time_elapsed | 26926 | -| total_timesteps | 272896 | -| train/ | | -| approx_kl | 2.8125476e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.000334 | -| n_updates | 21310 | -| policy_gradient_loss | 0.00146 | -| std | 0.68 | -| value_loss | 1.84e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2133 | -| time_elapsed | 26930 | -| total_timesteps | 273024 | -| train/ | | -| approx_kl | 0.0005631279 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 21320 | -| policy_gradient_loss | -0.000415 | -| std | 0.682 | -| value_loss | 1.19e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2134 | -| time_elapsed | 26939 | -| total_timesteps | 273152 | -| train/ | | -| approx_kl | 0.0041887397 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 21330 | -| policy_gradient_loss | -0.00758 | -| std | 0.684 | -| value_loss | 0.00208 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2135 | -| time_elapsed | 26944 | -| total_timesteps | 273280 | -| train/ | | -| approx_kl | 0.0065850625 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -39.2 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 21340 | -| policy_gradient_loss | -0.00168 | -| std | 0.685 | -| value_loss | 2.7e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2136 | -| time_elapsed | 26948 | -| total_timesteps | 273408 | -| train/ | | -| approx_kl | 0.00020688213 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -27.4 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 21350 | -| policy_gradient_loss | 0.000364 | -| std | 0.686 | -| value_loss | 5.61e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2137 | -| time_elapsed | 26952 | -| total_timesteps | 273536 | -| train/ | | -| approx_kl | 0.012756619 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 21360 | -| policy_gradient_loss | -0.00537 | -| std | 0.687 | -| value_loss | 5.37e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2138 | -| time_elapsed | 26956 | -| total_timesteps | 273664 | -| train/ | | -| approx_kl | 0.005842305 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 21370 | -| policy_gradient_loss | -0.00557 | -| std | 0.688 | -| value_loss | 3.08e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2139 | -| time_elapsed | 26961 | -| total_timesteps | 273792 | -| train/ | | -| approx_kl | 0.010860475 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 21380 | -| policy_gradient_loss | -0.00188 | -| std | 0.688 | -| value_loss | 5.12e-08 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2140 | -| time_elapsed | 26965 | -| total_timesteps | 273920 | -| train/ | | -| approx_kl | 1.11833215e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 21390 | -| policy_gradient_loss | -3.72e-05 | -| std | 0.69 | -| value_loss | 2.35e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2141 | -| time_elapsed | 26968 | -| total_timesteps | 274048 | -| train/ | | -| approx_kl | 0.007739023 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 21400 | -| policy_gradient_loss | -0.00767 | -| std | 0.691 | -| value_loss | 1.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2142 | -| time_elapsed | 26973 | -| total_timesteps | 274176 | -| train/ | | -| approx_kl | 0.0076183844 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.879 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 21410 | -| policy_gradient_loss | -0.00491 | -| std | 0.692 | -| value_loss | 0.00056 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2143 | -| time_elapsed | 26977 | -| total_timesteps | 274304 | -| train/ | | -| approx_kl | 0.00081322854 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -75 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 21420 | -| policy_gradient_loss | -0.00063 | -| std | 0.692 | -| value_loss | 3.13e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2144 | -| time_elapsed | 26983 | -| total_timesteps | 274432 | -| train/ | | -| approx_kl | 0.014135225 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -82.5 | -| learning_rate | 0.0003 | -| loss | -0.00797 | -| n_updates | 21430 | -| policy_gradient_loss | -0.00447 | -| std | 0.691 | -| value_loss | 7.46e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2145 | -| time_elapsed | 26987 | -| total_timesteps | 274560 | -| train/ | | -| approx_kl | 6.9779344e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -30.1 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 21440 | -| policy_gradient_loss | 0.00173 | -| std | 0.69 | -| value_loss | 6.88e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2146 | -| time_elapsed | 26990 | -| total_timesteps | 274688 | -| train/ | | -| approx_kl | 0.0003586486 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -38.8 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 21450 | -| policy_gradient_loss | 0.000109 | -| std | 0.69 | -| value_loss | 3.61e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2147 | -| time_elapsed | 26994 | -| total_timesteps | 274816 | -| train/ | | -| approx_kl | 0.013388837 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -11.5 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 21460 | -| policy_gradient_loss | -0.00626 | -| std | 0.689 | -| value_loss | 3.81e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.65 | -| time/ | | -| fps | 10 | -| iterations | 2148 | -| time_elapsed | 26998 | -| total_timesteps | 274944 | -| train/ | | -| approx_kl | 0.0011149091 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -0.67 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 21470 | -| policy_gradient_loss | -0.000791 | -| std | 0.687 | -| value_loss | 8.2e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2149 | -| time_elapsed | 27002 | -| total_timesteps | 275072 | -| train/ | | -| approx_kl | 0.007281483 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.0234 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 21480 | -| policy_gradient_loss | -0.00111 | -| std | 0.685 | -| value_loss | 4.67e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2150 | -| time_elapsed | 27010 | -| total_timesteps | 275200 | -| train/ | | -| approx_kl | 0.004890196 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 21490 | -| policy_gradient_loss | -0.00636 | -| std | 0.684 | -| value_loss | 0.00161 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2151 | -| time_elapsed | 27015 | -| total_timesteps | 275328 | -| train/ | | -| approx_kl | 0.00023804605 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -84.3 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 21500 | -| policy_gradient_loss | 0.000603 | -| std | 0.683 | -| value_loss | 8.25e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2152 | -| time_elapsed | 27018 | -| total_timesteps | 275456 | -| train/ | | -| approx_kl | 0.00017598085 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -69.8 | -| learning_rate | 0.0003 | -| loss | -0.001 | -| n_updates | 21510 | -| policy_gradient_loss | 0.000331 | -| std | 0.684 | -| value_loss | 2.32e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2153 | -| time_elapsed | 27022 | -| total_timesteps | 275584 | -| train/ | | -| approx_kl | 0.009730028 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 21520 | -| policy_gradient_loss | -0.0097 | -| std | 0.684 | -| value_loss | 5.3e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2154 | -| time_elapsed | 27025 | -| total_timesteps | 275712 | -| train/ | | -| approx_kl | 0.0070831515 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -3.18 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 21530 | -| policy_gradient_loss | -0.00654 | -| std | 0.683 | -| value_loss | 5.24e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2155 | -| time_elapsed | 27030 | -| total_timesteps | 275840 | -| train/ | | -| approx_kl | 0.00036336388 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.831 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 21540 | -| policy_gradient_loss | 0.000734 | -| std | 0.683 | -| value_loss | 1.84e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.64 | -| time/ | | -| fps | 10 | -| iterations | 2156 | -| time_elapsed | 27035 | -| total_timesteps | 275968 | -| train/ | | -| approx_kl | 0.011200653 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.000529 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 21550 | -| policy_gradient_loss | -0.00374 | -| std | 0.684 | -| value_loss | 1.65e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2157 | -| time_elapsed | 27039 | -| total_timesteps | 276096 | -| train/ | | -| approx_kl | 0.0062128287 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 21560 | -| policy_gradient_loss | -0.00158 | -| std | 0.687 | -| value_loss | 1.15e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2158 | -| time_elapsed | 27048 | -| total_timesteps | 276224 | -| train/ | | -| approx_kl | 0.011830019 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 21570 | -| policy_gradient_loss | -0.00787 | -| std | 0.69 | -| value_loss | 0.00105 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2159 | -| time_elapsed | 27053 | -| total_timesteps | 276352 | -| train/ | | -| approx_kl | 0.0033255778 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -88.7 | -| learning_rate | 0.0003 | -| loss | 6.89e-05 | -| n_updates | 21580 | -| policy_gradient_loss | 3.92e-05 | -| std | 0.69 | -| value_loss | 1.27e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2160 | -| time_elapsed | 27057 | -| total_timesteps | 276480 | -| train/ | | -| approx_kl | 9.604404e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -98.3 | -| learning_rate | 0.0003 | -| loss | -0.000429 | -| n_updates | 21590 | -| policy_gradient_loss | -0.000123 | -| std | 0.689 | -| value_loss | 2.37e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2161 | -| time_elapsed | 27061 | -| total_timesteps | 276608 | -| train/ | | -| approx_kl | 0.00079331873 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -3.59 | -| learning_rate | 0.0003 | -| loss | -0.000491 | -| n_updates | 21600 | -| policy_gradient_loss | -0.00026 | -| std | 0.687 | -| value_loss | 9.42e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2162 | -| time_elapsed | 27065 | -| total_timesteps | 276736 | -| train/ | | -| approx_kl | 0.00558906 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -95.1 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 21610 | -| policy_gradient_loss | -0.00316 | -| std | 0.686 | -| value_loss | 1.08e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2163 | -| time_elapsed | 27069 | -| total_timesteps | 276864 | -| train/ | | -| approx_kl | 4.89573e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | 0.000681 | -| n_updates | 21620 | -| policy_gradient_loss | 0.00155 | -| std | 0.686 | -| value_loss | 4.34e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.62 | -| time/ | | -| fps | 10 | -| iterations | 2164 | -| time_elapsed | 27073 | -| total_timesteps | 276992 | -| train/ | | -| approx_kl | 0.010265997 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 21630 | -| policy_gradient_loss | -0.00538 | -| std | 0.686 | -| value_loss | 1.13e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2165 | -| time_elapsed | 27077 | -| total_timesteps | 277120 | -| train/ | | -| approx_kl | 0.00019761035 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.0881 | -| learning_rate | 0.0003 | -| loss | 0.000205 | -| n_updates | 21640 | -| policy_gradient_loss | 0.000561 | -| std | 0.687 | -| value_loss | 3.35e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2166 | -| time_elapsed | 27087 | -| total_timesteps | 277248 | -| train/ | | -| approx_kl | 0.007997168 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -1.64 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 21650 | -| policy_gradient_loss | -0.0112 | -| std | 0.689 | -| value_loss | 0.00232 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2167 | -| time_elapsed | 27092 | -| total_timesteps | 277376 | -| train/ | | -| approx_kl | 8.465536e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -34.6 | -| learning_rate | 0.0003 | -| loss | -0.000864 | -| n_updates | 21660 | -| policy_gradient_loss | 0.000585 | -| std | 0.689 | -| value_loss | 6.15e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2168 | -| time_elapsed | 27096 | -| total_timesteps | 277504 | -| train/ | | -| approx_kl | 0.0069780424 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -1.05 | -| explained_variance | -87.9 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 21670 | -| policy_gradient_loss | -0.00128 | -| std | 0.688 | -| value_loss | 2.5e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2169 | -| time_elapsed | 27100 | -| total_timesteps | 277632 | -| train/ | | -| approx_kl | 0.00068803737 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 21680 | -| policy_gradient_loss | -0.000773 | -| std | 0.687 | -| value_loss | 1.44e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2170 | -| time_elapsed | 27105 | -| total_timesteps | 277760 | -| train/ | | -| approx_kl | 0.0065248613 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | -0.000961 | -| n_updates | 21690 | -| policy_gradient_loss | -0.00159 | -| std | 0.685 | -| value_loss | 1.05e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.6 | -| time/ | | -| fps | 10 | -| iterations | 2171 | -| time_elapsed | 27109 | -| total_timesteps | 277888 | -| train/ | | -| approx_kl | 0.0047403653 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 21700 | -| policy_gradient_loss | -0.00523 | -| std | 0.683 | -| value_loss | 5.91e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2172 | -| time_elapsed | 27114 | -| total_timesteps | 278016 | -| train/ | | -| approx_kl | 0.010074843 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.00971 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 21710 | -| policy_gradient_loss | -0.00184 | -| std | 0.682 | -| value_loss | 3.83e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2173 | -| time_elapsed | 27121 | -| total_timesteps | 278144 | -| train/ | | -| approx_kl | 0.0018636445 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.295 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 21720 | -| policy_gradient_loss | -0.00458 | -| std | 0.681 | -| value_loss | 0.00118 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2174 | -| time_elapsed | 27124 | -| total_timesteps | 278272 | -| train/ | | -| approx_kl | 0.00028957846 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -27.8 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 21730 | -| policy_gradient_loss | 0.000473 | -| std | 0.682 | -| value_loss | 2.11e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2175 | -| time_elapsed | 27128 | -| total_timesteps | 278400 | -| train/ | | -| approx_kl | 0.00032294914 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -27.6 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 21740 | -| policy_gradient_loss | 0.000252 | -| std | 0.682 | -| value_loss | 8.61e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2176 | -| time_elapsed | 27131 | -| total_timesteps | 278528 | -| train/ | | -| approx_kl | 0.00034041656 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 21750 | -| policy_gradient_loss | 0.000268 | -| std | 0.681 | -| value_loss | 1.41e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2177 | -| time_elapsed | 27134 | -| total_timesteps | 278656 | -| train/ | | -| approx_kl | 0.011683296 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.000562 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 21760 | -| policy_gradient_loss | -0.00291 | -| std | 0.679 | -| value_loss | 1.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2178 | -| time_elapsed | 27137 | -| total_timesteps | 278784 | -| train/ | | -| approx_kl | 0.011423545 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.00905 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 21770 | -| policy_gradient_loss | -0.00646 | -| std | 0.677 | -| value_loss | 8.35e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.57 | -| time/ | | -| fps | 10 | -| iterations | 2179 | -| time_elapsed | 27141 | -| total_timesteps | 278912 | -| train/ | | -| approx_kl | 0.0003151754 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 21780 | -| policy_gradient_loss | 0.000667 | -| std | 0.676 | -| value_loss | 8.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2180 | -| time_elapsed | 27145 | -| total_timesteps | 279040 | -| train/ | | -| approx_kl | 0.0004892871 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.235 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 21790 | -| policy_gradient_loss | 0.000666 | -| std | 0.675 | -| value_loss | 3.47e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2181 | -| time_elapsed | 27153 | -| total_timesteps | 279168 | -| train/ | | -| approx_kl | 0.02617403 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 21800 | -| policy_gradient_loss | -0.0141 | -| std | 0.674 | -| value_loss | 0.00431 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2182 | -| time_elapsed | 27157 | -| total_timesteps | 279296 | -| train/ | | -| approx_kl | 0.016143091 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -80.7 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 21810 | -| policy_gradient_loss | -0.00496 | -| std | 0.674 | -| value_loss | 3.79e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2183 | -| time_elapsed | 27161 | -| total_timesteps | 279424 | -| train/ | | -| approx_kl | 0.015386586 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -59.8 | -| learning_rate | 0.0003 | -| loss | -0.00971 | -| n_updates | 21820 | -| policy_gradient_loss | -0.00689 | -| std | 0.674 | -| value_loss | 1.38e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2184 | -| time_elapsed | 27165 | -| total_timesteps | 279552 | -| train/ | | -| approx_kl | 0.0027839788 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 21830 | -| policy_gradient_loss | -0.0015 | -| std | 0.673 | -| value_loss | 3.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2185 | -| time_elapsed | 27169 | -| total_timesteps | 279680 | -| train/ | | -| approx_kl | 0.0015466996 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 21840 | -| policy_gradient_loss | 0.000837 | -| std | 0.673 | -| value_loss | 1.57e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2186 | -| time_elapsed | 27171 | -| total_timesteps | 279808 | -| train/ | | -| approx_kl | 0.0044879075 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.842 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 21850 | -| policy_gradient_loss | -0.00112 | -| std | 0.672 | -| value_loss | 1.34e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2187 | -| time_elapsed | 27174 | -| total_timesteps | 279936 | -| train/ | | -| approx_kl | 8.875318e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | 0.00817 | -| learning_rate | 0.0003 | -| loss | -0.000403 | -| n_updates | 21860 | -| policy_gradient_loss | 0.000179 | -| std | 0.672 | -| value_loss | 1.12e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2188 | -| time_elapsed | 27177 | -| total_timesteps | 280064 | -| train/ | | -| approx_kl | 0.0026102224 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 21870 | -| policy_gradient_loss | -0.00198 | -| std | 0.672 | -| value_loss | 1.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2189 | -| time_elapsed | 27183 | -| total_timesteps | 280192 | -| train/ | | -| approx_kl | 0.003374754 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | 0.728 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 21880 | -| policy_gradient_loss | -0.0121 | -| std | 0.671 | -| value_loss | 0.00602 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2190 | -| time_elapsed | 27187 | -| total_timesteps | 280320 | -| train/ | | -| approx_kl | 0.006417856 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -69.6 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 21890 | -| policy_gradient_loss | -0.00498 | -| std | 0.671 | -| value_loss | 5.81e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2191 | -| time_elapsed | 27190 | -| total_timesteps | 280448 | -| train/ | | -| approx_kl | 0.00015471177 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -47 | -| learning_rate | 0.0003 | -| loss | 0.00043 | -| n_updates | 21900 | -| policy_gradient_loss | 0.00111 | -| std | 0.672 | -| value_loss | 1.72e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2192 | -| time_elapsed | 27193 | -| total_timesteps | 280576 | -| train/ | | -| approx_kl | 0.004341077 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.758 | -| learning_rate | 0.0003 | -| loss | -0.000897 | -| n_updates | 21910 | -| policy_gradient_loss | -0.000665 | -| std | 0.675 | -| value_loss | 3.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2193 | -| time_elapsed | 27197 | -| total_timesteps | 280704 | -| train/ | | -| approx_kl | 0.007725869 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -12.1 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 21920 | -| policy_gradient_loss | -0.00172 | -| std | 0.675 | -| value_loss | 6.3e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2194 | -| time_elapsed | 27200 | -| total_timesteps | 280832 | -| train/ | | -| approx_kl | 0.0005158223 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.713 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 21930 | -| policy_gradient_loss | 0.000265 | -| std | 0.675 | -| value_loss | 2.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.42 | -| time/ | | -| fps | 10 | -| iterations | 2195 | -| time_elapsed | 27203 | -| total_timesteps | 280960 | -| train/ | | -| approx_kl | 0.017699625 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.646 | -| learning_rate | 0.0003 | -| loss | -0.00879 | -| n_updates | 21940 | -| policy_gradient_loss | -0.00836 | -| std | 0.675 | -| value_loss | 6.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2196 | -| time_elapsed | 27206 | -| total_timesteps | 281088 | -| train/ | | -| approx_kl | 0.0068722884 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 21950 | -| policy_gradient_loss | -0.00157 | -| std | 0.674 | -| value_loss | 6.38e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2197 | -| time_elapsed | 27213 | -| total_timesteps | 281216 | -| train/ | | -| approx_kl | 0.0024029026 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | 0.491 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 21960 | -| policy_gradient_loss | -0.00723 | -| std | 0.674 | -| value_loss | 0.00185 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2198 | -| time_elapsed | 27218 | -| total_timesteps | 281344 | -| train/ | | -| approx_kl | 0.0014916197 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -54.8 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 21970 | -| policy_gradient_loss | -0.00054 | -| std | 0.674 | -| value_loss | 1.3e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2199 | -| time_elapsed | 27221 | -| total_timesteps | 281472 | -| train/ | | -| approx_kl | 0.0014131707 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -41.7 | -| learning_rate | 0.0003 | -| loss | 0.000673 | -| n_updates | 21980 | -| policy_gradient_loss | 0.000465 | -| std | 0.673 | -| value_loss | 1.73e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2200 | -| time_elapsed | 27225 | -| total_timesteps | 281600 | -| train/ | | -| approx_kl | 0.007971248 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 21990 | -| policy_gradient_loss | -0.00251 | -| std | 0.673 | -| value_loss | 1.55e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2201 | -| time_elapsed | 27229 | -| total_timesteps | 281728 | -| train/ | | -| approx_kl | 0.0006963182 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.626 | -| learning_rate | 0.0003 | -| loss | 0.00047 | -| n_updates | 22000 | -| policy_gradient_loss | 0.000356 | -| std | 0.674 | -| value_loss | 1.3e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2202 | -| time_elapsed | 27232 | -| total_timesteps | 281856 | -| train/ | | -| approx_kl | 0.012609659 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.0606 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 22010 | -| policy_gradient_loss | -0.0073 | -| std | 0.674 | -| value_loss | 1.63e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.15 | -| time/ | | -| fps | 10 | -| iterations | 2203 | -| time_elapsed | 27236 | -| total_timesteps | 281984 | -| train/ | | -| approx_kl | 0.00033254828 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | 0.000809 | -| n_updates | 22020 | -| policy_gradient_loss | 0.00104 | -| std | 0.674 | -| value_loss | 5.51e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2204 | -| time_elapsed | 27240 | -| total_timesteps | 282112 | -| train/ | | -| approx_kl | 0.00091488287 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | -0.000174 | -| n_updates | 22030 | -| policy_gradient_loss | -4.53e-06 | -| std | 0.676 | -| value_loss | 7.94e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2205 | -| time_elapsed | 27251 | -| total_timesteps | 282240 | -| train/ | | -| approx_kl | 0.0029476415 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.69 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 22040 | -| policy_gradient_loss | -0.00984 | -| std | 0.678 | -| value_loss | 0.00793 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2206 | -| time_elapsed | 27255 | -| total_timesteps | 282368 | -| train/ | | -| approx_kl | 0.0063311458 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -46.5 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 22050 | -| policy_gradient_loss | -0.00761 | -| std | 0.677 | -| value_loss | 7.89e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2207 | -| time_elapsed | 27259 | -| total_timesteps | 282496 | -| train/ | | -| approx_kl | 0.011703506 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -29.4 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 22060 | -| policy_gradient_loss | -0.000915 | -| std | 0.678 | -| value_loss | 2.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2208 | -| time_elapsed | 27263 | -| total_timesteps | 282624 | -| train/ | | -| approx_kl | 0.010692332 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.716 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 22070 | -| policy_gradient_loss | -0.00177 | -| std | 0.678 | -| value_loss | 4.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2209 | -| time_elapsed | 27267 | -| total_timesteps | 282752 | -| train/ | | -| approx_kl | 0.011700908 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -4.76 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 22080 | -| policy_gradient_loss | -0.00627 | -| std | 0.678 | -| value_loss | 2.17e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.14 | -| time/ | | -| fps | 10 | -| iterations | 2210 | -| time_elapsed | 27271 | -| total_timesteps | 282880 | -| train/ | | -| approx_kl | 0.01835812 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.0331 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 22090 | -| policy_gradient_loss | -0.00834 | -| std | 0.678 | -| value_loss | 9.72e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2211 | -| time_elapsed | 27275 | -| total_timesteps | 283008 | -| train/ | | -| approx_kl | 0.0031817947 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.0213 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 22100 | -| policy_gradient_loss | -0.00105 | -| std | 0.678 | -| value_loss | 1.96e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2212 | -| time_elapsed | 27286 | -| total_timesteps | 283136 | -| train/ | | -| approx_kl | 0.013178915 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 22110 | -| policy_gradient_loss | -0.0102 | -| std | 0.678 | -| value_loss | 0.00127 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2213 | -| time_elapsed | 27290 | -| total_timesteps | 283264 | -| train/ | | -| approx_kl | 0.0061659515 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -69.7 | -| learning_rate | 0.0003 | -| loss | -0.0051 | -| n_updates | 22120 | -| policy_gradient_loss | -0.00187 | -| std | 0.679 | -| value_loss | 4.56e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2214 | -| time_elapsed | 27294 | -| total_timesteps | 283392 | -| train/ | | -| approx_kl | 0.026517412 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -41.5 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 22130 | -| policy_gradient_loss | -0.00881 | -| std | 0.68 | -| value_loss | 8.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2215 | -| time_elapsed | 27298 | -| total_timesteps | 283520 | -| train/ | | -| approx_kl | 0.013051847 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -24.7 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 22140 | -| policy_gradient_loss | -0.00965 | -| std | 0.679 | -| value_loss | 8.53e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2216 | -| time_elapsed | 27303 | -| total_timesteps | 283648 | -| train/ | | -| approx_kl | 0.00011224812 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 22150 | -| policy_gradient_loss | 0.00211 | -| std | 0.679 | -| value_loss | 2.27e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2217 | -| time_elapsed | 27308 | -| total_timesteps | 283776 | -| train/ | | -| approx_kl | 0.00074519264 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 22160 | -| policy_gradient_loss | -0.000162 | -| std | 0.681 | -| value_loss | 1.56e-07 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2218 | -| time_elapsed | 27312 | -| total_timesteps | 283904 | -| train/ | | -| approx_kl | 1.14445575e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.534 | -| learning_rate | 0.0003 | -| loss | -0.00037 | -| n_updates | 22170 | -| policy_gradient_loss | 0.000401 | -| std | 0.683 | -| value_loss | 1.15e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2219 | -| time_elapsed | 27316 | -| total_timesteps | 284032 | -| train/ | | -| approx_kl | 0.007307679 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 22180 | -| policy_gradient_loss | -0.00117 | -| std | 0.686 | -| value_loss | 3.96e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2220 | -| time_elapsed | 27325 | -| total_timesteps | 284160 | -| train/ | | -| approx_kl | 0.00277784 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | -0.00772 | -| n_updates | 22190 | -| policy_gradient_loss | -0.00659 | -| std | 0.685 | -| value_loss | 0.00473 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2221 | -| time_elapsed | 27329 | -| total_timesteps | 284288 | -| train/ | | -| approx_kl | 0.006632399 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -39.7 | -| learning_rate | 0.0003 | -| loss | -0.00655 | -| n_updates | 22200 | -| policy_gradient_loss | -0.00256 | -| std | 0.684 | -| value_loss | 1.87e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2222 | -| time_elapsed | 27333 | -| total_timesteps | 284416 | -| train/ | | -| approx_kl | 8.1025064e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -31.5 | -| learning_rate | 0.0003 | -| loss | -7.41e-05 | -| n_updates | 22210 | -| policy_gradient_loss | 0.00154 | -| std | 0.684 | -| value_loss | 1.45e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2223 | -| time_elapsed | 27337 | -| total_timesteps | 284544 | -| train/ | | -| approx_kl | 0.00081416266 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -21.6 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 22220 | -| policy_gradient_loss | 6.79e-06 | -| std | 0.683 | -| value_loss | 3.58e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2224 | -| time_elapsed | 27341 | -| total_timesteps | 284672 | -| train/ | | -| approx_kl | 0.0005587614 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.04 | -| explained_variance | -7.66 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 22230 | -| policy_gradient_loss | 0.000307 | -| std | 0.682 | -| value_loss | 6.76e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2225 | -| time_elapsed | 27346 | -| total_timesteps | 284800 | -| train/ | | -| approx_kl | 0.00018354924 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | -0.000894 | -| n_updates | 22240 | -| policy_gradient_loss | 0.000291 | -| std | 0.68 | -| value_loss | 2.07e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 10 | -| iterations | 2226 | -| time_elapsed | 27350 | -| total_timesteps | 284928 | -| train/ | | -| approx_kl | 0.01093182 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 22250 | -| policy_gradient_loss | -0.00221 | -| std | 0.679 | -| value_loss | 7.31e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2227 | -| time_elapsed | 27354 | -| total_timesteps | 285056 | -| train/ | | -| approx_kl | 0.007640279 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.637 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 22260 | -| policy_gradient_loss | -0.00352 | -| std | 0.679 | -| value_loss | 9.12e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2228 | -| time_elapsed | 27363 | -| total_timesteps | 285184 | -| train/ | | -| approx_kl | 0.029161597 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -0.577 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 22270 | -| policy_gradient_loss | -0.0173 | -| std | 0.679 | -| value_loss | 0.00411 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2229 | -| time_elapsed | 27367 | -| total_timesteps | 285312 | -| train/ | | -| approx_kl | 0.00052576326 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -41.4 | -| learning_rate | 0.0003 | -| loss | -2.92e-05 | -| n_updates | 22280 | -| policy_gradient_loss | -1.89e-05 | -| std | 0.678 | -| value_loss | 2.96e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2230 | -| time_elapsed | 27370 | -| total_timesteps | 285440 | -| train/ | | -| approx_kl | 0.0005049794 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -48.3 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 22290 | -| policy_gradient_loss | -0.000238 | -| std | 0.676 | -| value_loss | 3.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2231 | -| time_elapsed | 27374 | -| total_timesteps | 285568 | -| train/ | | -| approx_kl | 0.004159592 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -1.03 | -| explained_variance | -62 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 22300 | -| policy_gradient_loss | -0.00181 | -| std | 0.675 | -| value_loss | 5.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2232 | -| time_elapsed | 27378 | -| total_timesteps | 285696 | -| train/ | | -| approx_kl | 0.004674538 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -61.8 | -| learning_rate | 0.0003 | -| loss | 0.000972 | -| n_updates | 22310 | -| policy_gradient_loss | 0.000613 | -| std | 0.674 | -| value_loss | 5.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2233 | -| time_elapsed | 27382 | -| total_timesteps | 285824 | -| train/ | | -| approx_kl | 0.0022968813 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -31.7 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 22320 | -| policy_gradient_loss | -0.000826 | -| std | 0.672 | -| value_loss | 4.28e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2234 | -| time_elapsed | 27387 | -| total_timesteps | 285952 | -| train/ | | -| approx_kl | 0.0059013157 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -23.5 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 22330 | -| policy_gradient_loss | -0.000671 | -| std | 0.67 | -| value_loss | 3.74e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2235 | -| time_elapsed | 27391 | -| total_timesteps | 286080 | -| train/ | | -| approx_kl | 0.00617031 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -7.99 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 22340 | -| policy_gradient_loss | -0.000896 | -| std | 0.67 | -| value_loss | 1.58e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2236 | -| time_elapsed | 27400 | -| total_timesteps | 286208 | -| train/ | | -| approx_kl | 0.02352585 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 22350 | -| policy_gradient_loss | -0.0132 | -| std | 0.67 | -| value_loss | 0.000926 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2237 | -| time_elapsed | 27404 | -| total_timesteps | 286336 | -| train/ | | -| approx_kl | 0.0071216244 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -41.9 | -| learning_rate | 0.0003 | -| loss | -0.000217 | -| n_updates | 22360 | -| policy_gradient_loss | -0.000197 | -| std | 0.67 | -| value_loss | 3.65e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2238 | -| time_elapsed | 27409 | -| total_timesteps | 286464 | -| train/ | | -| approx_kl | 0.007537981 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -46.2 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 22370 | -| policy_gradient_loss | -0.00127 | -| std | 0.67 | -| value_loss | 8.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2239 | -| time_elapsed | 27413 | -| total_timesteps | 286592 | -| train/ | | -| approx_kl | 0.013117526 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 22380 | -| policy_gradient_loss | -0.00318 | -| std | 0.67 | -| value_loss | 1.07e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2240 | -| time_elapsed | 27417 | -| total_timesteps | 286720 | -| train/ | | -| approx_kl | 0.00070565054 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -14.5 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 22390 | -| policy_gradient_loss | 0.000363 | -| std | 0.671 | -| value_loss | 1.91e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2241 | -| time_elapsed | 27420 | -| total_timesteps | 286848 | -| train/ | | -| approx_kl | 0.000582288 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 22400 | -| policy_gradient_loss | 0.000731 | -| std | 0.671 | -| value_loss | 3.02e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 10 | -| iterations | 2242 | -| time_elapsed | 27424 | -| total_timesteps | 286976 | -| train/ | | -| approx_kl | 0.009313364 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.712 | -| learning_rate | 0.0003 | -| loss | -0.000752 | -| n_updates | 22410 | -| policy_gradient_loss | -0.00116 | -| std | 0.67 | -| value_loss | 2.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2243 | -| time_elapsed | 27428 | -| total_timesteps | 287104 | -| train/ | | -| approx_kl | 0.014164735 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -0.0981 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 22420 | -| policy_gradient_loss | -0.00797 | -| std | 0.67 | -| value_loss | 2.86e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2244 | -| time_elapsed | 27438 | -| total_timesteps | 287232 | -| train/ | | -| approx_kl | 0.0073241466 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | 0.743 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 22430 | -| policy_gradient_loss | -0.00474 | -| std | 0.67 | -| value_loss | 0.0036 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2245 | -| time_elapsed | 27442 | -| total_timesteps | 287360 | -| train/ | | -| approx_kl | 0.004750955 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -35.2 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 22440 | -| policy_gradient_loss | -0.00154 | -| std | 0.668 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2246 | -| time_elapsed | 27447 | -| total_timesteps | 287488 | -| train/ | | -| approx_kl | 0.0018404676 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.02 | -| explained_variance | -35.3 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 22450 | -| policy_gradient_loss | 0.00101 | -| std | 0.667 | -| value_loss | 2.39e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2247 | -| time_elapsed | 27452 | -| total_timesteps | 287616 | -| train/ | | -| approx_kl | 0.011365954 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 22460 | -| policy_gradient_loss | -0.00555 | -| std | 0.667 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2248 | -| time_elapsed | 27455 | -| total_timesteps | 287744 | -| train/ | | -| approx_kl | 0.0031131497 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | -0.00989 | -| n_updates | 22470 | -| policy_gradient_loss | -0.00225 | -| std | 0.667 | -| value_loss | 1.52e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.88 | -| time/ | | -| fps | 10 | -| iterations | 2249 | -| time_elapsed | 27459 | -| total_timesteps | 287872 | -| train/ | | -| approx_kl | 0.016667161 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.00896 | -| learning_rate | 0.0003 | -| loss | -0.000671 | -| n_updates | 22480 | -| policy_gradient_loss | -0.00231 | -| std | 0.666 | -| value_loss | 2.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2250 | -| time_elapsed | 27464 | -| total_timesteps | 288000 | -| train/ | | -| approx_kl | 0.008535385 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | 0.0135 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 22490 | -| policy_gradient_loss | -0.00717 | -| std | 0.665 | -| value_loss | 1.2e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2251 | -| time_elapsed | 27468 | -| total_timesteps | 288128 | -| train/ | | -| approx_kl | 1.0547228e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | 0.00812 | -| learning_rate | 0.0003 | -| loss | 0.000153 | -| n_updates | 22500 | -| policy_gradient_loss | 0.0011 | -| std | 0.664 | -| value_loss | 7.91e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2252 | -| time_elapsed | 27477 | -| total_timesteps | 288256 | -| train/ | | -| approx_kl | 0.012971548 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | 0.695 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 22510 | -| policy_gradient_loss | -0.0109 | -| std | 0.663 | -| value_loss | 0.00184 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2253 | -| time_elapsed | 27481 | -| total_timesteps | 288384 | -| train/ | | -| approx_kl | 0.0050480887 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -76.3 | -| learning_rate | 0.0003 | -| loss | -0.00506 | -| n_updates | 22520 | -| policy_gradient_loss | -0.0016 | -| std | 0.662 | -| value_loss | 2.22e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2254 | -| time_elapsed | 27485 | -| total_timesteps | 288512 | -| train/ | | -| approx_kl | 6.3268e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -80.1 | -| learning_rate | 0.0003 | -| loss | -0.000805 | -| n_updates | 22530 | -| policy_gradient_loss | 0.00128 | -| std | 0.662 | -| value_loss | 4.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2255 | -| time_elapsed | 27489 | -| total_timesteps | 288640 | -| train/ | | -| approx_kl | 0.010774936 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 22540 | -| policy_gradient_loss | -0.00165 | -| std | 0.66 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2256 | -| time_elapsed | 27492 | -| total_timesteps | 288768 | -| train/ | | -| approx_kl | 0.0015857052 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1 | -| explained_variance | -4.61 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 22550 | -| policy_gradient_loss | -0.000535 | -| std | 0.658 | -| value_loss | 1e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 10 | -| iterations | 2257 | -| time_elapsed | 27495 | -| total_timesteps | 288896 | -| train/ | | -| approx_kl | 0.011787016 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.999 | -| explained_variance | 0.00339 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 22560 | -| policy_gradient_loss | -0.00684 | -| std | 0.656 | -| value_loss | 9.46e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2258 | -| time_elapsed | 27498 | -| total_timesteps | 289024 | -| train/ | | -| approx_kl | 0.00046863127 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.998 | -| explained_variance | 0.00129 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 22570 | -| policy_gradient_loss | 0.000575 | -| std | 0.656 | -| value_loss | 8.67e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2259 | -| time_elapsed | 27505 | -| total_timesteps | 289152 | -| train/ | | -| approx_kl | 0.00078420946 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.998 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 22580 | -| policy_gradient_loss | -0.00891 | -| std | 0.656 | -| value_loss | 0.00178 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2260 | -| time_elapsed | 27509 | -| total_timesteps | 289280 | -| train/ | | -| approx_kl | 0.0042426973 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.999 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 22590 | -| policy_gradient_loss | -0.00187 | -| std | 0.658 | -| value_loss | 1.06e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2261 | -| time_elapsed | 27513 | -| total_timesteps | 289408 | -| train/ | | -| approx_kl | 2.2950582e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1 | -| explained_variance | -6.62 | -| learning_rate | 0.0003 | -| loss | -0.000388 | -| n_updates | 22600 | -| policy_gradient_loss | 0.000771 | -| std | 0.659 | -| value_loss | 3.59e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2262 | -| time_elapsed | 27516 | -| total_timesteps | 289536 | -| train/ | | -| approx_kl | 0.0008589234 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1 | -| explained_variance | -0.478 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 22610 | -| policy_gradient_loss | -0.000188 | -| std | 0.661 | -| value_loss | 2.66e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2263 | -| time_elapsed | 27521 | -| total_timesteps | 289664 | -| train/ | | -| approx_kl | 0.0020503742 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.49 | -| learning_rate | 0.0003 | -| loss | 0.000774 | -| n_updates | 22620 | -| policy_gradient_loss | 0.000505 | -| std | 0.662 | -| value_loss | 2.16e-08 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2264 | -| time_elapsed | 27525 | -| total_timesteps | 289792 | -| train/ | | -| approx_kl | 0.000110452995 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 22630 | -| policy_gradient_loss | -0.00011 | -| std | 0.663 | -| value_loss | 2.42e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 10 | -| iterations | 2265 | -| time_elapsed | 27529 | -| total_timesteps | 289920 | -| train/ | | -| approx_kl | 0.004669424 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 22640 | -| policy_gradient_loss | -0.0033 | -| std | 0.665 | -| value_loss | 2.33e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2266 | -| time_elapsed | 27533 | -| total_timesteps | 290048 | -| train/ | | -| approx_kl | 0.011206113 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -6.4e-06 | -| n_updates | 22650 | -| policy_gradient_loss | -0.00116 | -| std | 0.666 | -| value_loss | 7.73e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2267 | -| time_elapsed | 27540 | -| total_timesteps | 290176 | -| train/ | | -| approx_kl | 0.0026231175 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | 0.733 | -| learning_rate | 0.0003 | -| loss | -0.0253 | -| n_updates | 22660 | -| policy_gradient_loss | -0.014 | -| std | 0.666 | -| value_loss | 0.000742 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2268 | -| time_elapsed | 27544 | -| total_timesteps | 290304 | -| train/ | | -| approx_kl | 0.00011581881 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -59.6 | -| learning_rate | 0.0003 | -| loss | -0.00026 | -| n_updates | 22670 | -| policy_gradient_loss | -5.9e-05 | -| std | 0.665 | -| value_loss | 3.47e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2269 | -| time_elapsed | 27548 | -| total_timesteps | 290432 | -| train/ | | -| approx_kl | 0.0055534984 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.00686 | -| n_updates | 22680 | -| policy_gradient_loss | -0.00237 | -| std | 0.665 | -| value_loss | 1.46e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2270 | -| time_elapsed | 27552 | -| total_timesteps | 290560 | -| train/ | | -| approx_kl | 0.009273128 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.0604 | -| learning_rate | 0.0003 | -| loss | -0.000442 | -| n_updates | 22690 | -| policy_gradient_loss | -0.00102 | -| std | 0.664 | -| value_loss | 8.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2271 | -| time_elapsed | 27557 | -| total_timesteps | 290688 | -| train/ | | -| approx_kl | 0.007710195 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.495 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 22700 | -| policy_gradient_loss | -0.00529 | -| std | 0.663 | -| value_loss | 7.39e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2272 | -| time_elapsed | 27561 | -| total_timesteps | 290816 | -| train/ | | -| approx_kl | 0.00045040436 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1.01 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 22710 | -| policy_gradient_loss | 0.000898 | -| std | 0.661 | -| value_loss | 8.8e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 10 | -| iterations | 2273 | -| time_elapsed | 27565 | -| total_timesteps | 290944 | -| train/ | | -| approx_kl | 0.0010665432 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -1 | -| explained_variance | -0.54 | -| learning_rate | 0.0003 | -| loss | 0.000427 | -| n_updates | 22720 | -| policy_gradient_loss | 0.00046 | -| std | 0.66 | -| value_loss | 2.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2274 | -| time_elapsed | 27569 | -| total_timesteps | 291072 | -| train/ | | -| approx_kl | 0.005465259 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -1 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | -0.00867 | -| n_updates | 22730 | -| policy_gradient_loss | -0.00361 | -| std | 0.657 | -| value_loss | 2.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2275 | -| time_elapsed | 27576 | -| total_timesteps | 291200 | -| train/ | | -| approx_kl | 0.003407032 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.997 | -| explained_variance | 0.604 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 22740 | -| policy_gradient_loss | -0.0088 | -| std | 0.654 | -| value_loss | 0.00593 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2276 | -| time_elapsed | 27581 | -| total_timesteps | 291328 | -| train/ | | -| approx_kl | 0.00059503294 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.991 | -| explained_variance | -98.4 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 22750 | -| policy_gradient_loss | -0.000681 | -| std | 0.649 | -| value_loss | 2.68e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2277 | -| time_elapsed | 27586 | -| total_timesteps | 291456 | -| train/ | | -| approx_kl | 0.00898039 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.985 | -| explained_variance | -91.9 | -| learning_rate | 0.0003 | -| loss | -0.00574 | -| n_updates | 22760 | -| policy_gradient_loss | -0.00384 | -| std | 0.647 | -| value_loss | 4.78e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2278 | -| time_elapsed | 27590 | -| total_timesteps | 291584 | -| train/ | | -| approx_kl | 0.0010311799 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.983 | -| explained_variance | -25.3 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 22770 | -| policy_gradient_loss | -0.000428 | -| std | 0.647 | -| value_loss | 8.21e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2279 | -| time_elapsed | 27594 | -| total_timesteps | 291712 | -| train/ | | -| approx_kl | 0.012929896 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.982 | -| explained_variance | -23.2 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 22780 | -| policy_gradient_loss | -0.0131 | -| std | 0.645 | -| value_loss | 6.37e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2280 | -| time_elapsed | 27598 | -| total_timesteps | 291840 | -| train/ | | -| approx_kl | 0.011762806 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | -0.561 | -| learning_rate | 0.0003 | -| loss | -0.00661 | -| n_updates | 22790 | -| policy_gradient_loss | -0.00364 | -| std | 0.645 | -| value_loss | 1.79e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 10 | -| iterations | 2281 | -| time_elapsed | 27602 | -| total_timesteps | 291968 | -| train/ | | -| approx_kl | 0.008952615 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.000754 | -| n_updates | 22800 | -| policy_gradient_loss | -0.000805 | -| std | 0.645 | -| value_loss | 1.14e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2282 | -| time_elapsed | 27607 | -| total_timesteps | 292096 | -| train/ | | -| approx_kl | 0.0004825429 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.98 | -| explained_variance | -0.000142 | -| learning_rate | 0.0003 | -| loss | -0.000436 | -| n_updates | 22810 | -| policy_gradient_loss | -0.000171 | -| std | 0.645 | -| value_loss | 5.2e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2283 | -| time_elapsed | 27617 | -| total_timesteps | 292224 | -| train/ | | -| approx_kl | 0.0023549625 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | 0.373 | -| learning_rate | 0.0003 | -| loss | -0.00849 | -| n_updates | 22820 | -| policy_gradient_loss | -0.00662 | -| std | 0.645 | -| value_loss | 0.00145 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2284 | -| time_elapsed | 27622 | -| total_timesteps | 292352 | -| train/ | | -| approx_kl | 0.015643153 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | -185 | -| learning_rate | 0.0003 | -| loss | -0.00954 | -| n_updates | 22830 | -| policy_gradient_loss | -0.0053 | -| std | 0.645 | -| value_loss | 1.78e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2285 | -| time_elapsed | 27625 | -| total_timesteps | 292480 | -| train/ | | -| approx_kl | 2.7520582e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.98 | -| explained_variance | -217 | -| learning_rate | 0.0003 | -| loss | 5.27e-06 | -| n_updates | 22840 | -| policy_gradient_loss | 0.00226 | -| std | 0.645 | -| value_loss | 3.85e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2286 | -| time_elapsed | 27629 | -| total_timesteps | 292608 | -| train/ | | -| approx_kl | 0.017315798 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | -0.98 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 22850 | -| policy_gradient_loss | -0.0122 | -| std | 0.645 | -| value_loss | 3.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2287 | -| time_elapsed | 27632 | -| total_timesteps | 292736 | -| train/ | | -| approx_kl | 0.011582409 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | -131 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 22860 | -| policy_gradient_loss | -0.00374 | -| std | 0.645 | -| value_loss | 1.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2288 | -| time_elapsed | 27636 | -| total_timesteps | 292864 | -| train/ | | -| approx_kl | 0.022720648 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | -0.982 | -| explained_variance | -4.86 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 22870 | -| policy_gradient_loss | -0.00534 | -| std | 0.647 | -| value_loss | 2.68e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 10 | -| iterations | 2289 | -| time_elapsed | 27641 | -| total_timesteps | 292992 | -| train/ | | -| approx_kl | 0.0060077645 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.983 | -| explained_variance | -0.0692 | -| learning_rate | 0.0003 | -| loss | -0.000595 | -| n_updates | 22880 | -| policy_gradient_loss | -0.000578 | -| std | 0.646 | -| value_loss | 5.46e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2290 | -| time_elapsed | 27645 | -| total_timesteps | 293120 | -| train/ | | -| approx_kl | 0.0074238777 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.982 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 22890 | -| policy_gradient_loss | -0.00618 | -| std | 0.646 | -| value_loss | 5.57e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2291 | -| time_elapsed | 27657 | -| total_timesteps | 293248 | -| train/ | | -| approx_kl | 0.0048691994 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.982 | -| explained_variance | 0.672 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 22900 | -| policy_gradient_loss | -0.00305 | -| std | 0.646 | -| value_loss | 0.00621 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2292 | -| time_elapsed | 27661 | -| total_timesteps | 293376 | -| train/ | | -| approx_kl | 0.0072795227 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | -237 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 22910 | -| policy_gradient_loss | -0.0023 | -| std | 0.646 | -| value_loss | 1.23e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2293 | -| time_elapsed | 27664 | -| total_timesteps | 293504 | -| train/ | | -| approx_kl | 0.0058475407 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.981 | -| explained_variance | -245 | -| learning_rate | 0.0003 | -| loss | 0.000511 | -| n_updates | 22920 | -| policy_gradient_loss | 0.000174 | -| std | 0.645 | -| value_loss | 2.33e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2294 | -| time_elapsed | 27669 | -| total_timesteps | 293632 | -| train/ | | -| approx_kl | 0.0031862378 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.98 | -| explained_variance | -34.4 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 22930 | -| policy_gradient_loss | -0.000669 | -| std | 0.645 | -| value_loss | 3.6e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2295 | -| time_elapsed | 27672 | -| total_timesteps | 293760 | -| train/ | | -| approx_kl | 0.017049203 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.98 | -| explained_variance | -62.5 | -| learning_rate | 0.0003 | -| loss | -0.00879 | -| n_updates | 22940 | -| policy_gradient_loss | -0.00481 | -| std | 0.644 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2296 | -| time_elapsed | 27676 | -| total_timesteps | 293888 | -| train/ | | -| approx_kl | 0.003103639 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.978 | -| explained_variance | -0.0757 | -| learning_rate | 0.0003 | -| loss | 0.000882 | -| n_updates | 22950 | -| policy_gradient_loss | 0.000549 | -| std | 0.643 | -| value_loss | 1.29e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2297 | -| time_elapsed | 27681 | -| total_timesteps | 294016 | -| train/ | | -| approx_kl | 0.0074802465 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.976 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | -0.00516 | -| n_updates | 22960 | -| policy_gradient_loss | -0.00236 | -| std | 0.641 | -| value_loss | 1.89e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2298 | -| time_elapsed | 27692 | -| total_timesteps | 294144 | -| train/ | | -| approx_kl | 0.0018406059 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.972 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | -0.000602 | -| n_updates | 22970 | -| policy_gradient_loss | -0.000745 | -| std | 0.638 | -| value_loss | 0.00426 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2299 | -| time_elapsed | 27696 | -| total_timesteps | 294272 | -| train/ | | -| approx_kl | 3.579608e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.97 | -| explained_variance | -174 | -| learning_rate | 0.0003 | -| loss | 4.78e-05 | -| n_updates | 22980 | -| policy_gradient_loss | 3.91e-05 | -| std | 0.638 | -| value_loss | 4.24e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2300 | -| time_elapsed | 27700 | -| total_timesteps | 294400 | -| train/ | | -| approx_kl | 0.0010151889 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.97 | -| explained_variance | -183 | -| learning_rate | 0.0003 | -| loss | -0.000621 | -| n_updates | 22990 | -| policy_gradient_loss | -0.000255 | -| std | 0.638 | -| value_loss | 6.46e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2301 | -| time_elapsed | 27704 | -| total_timesteps | 294528 | -| train/ | | -| approx_kl | 0.0084409285 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.97 | -| explained_variance | -22.3 | -| learning_rate | 0.0003 | -| loss | -0.00736 | -| n_updates | 23000 | -| policy_gradient_loss | -0.00516 | -| std | 0.639 | -| value_loss | 3.59e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2302 | -| time_elapsed | 27708 | -| total_timesteps | 294656 | -| train/ | | -| approx_kl | 0.005934557 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.97 | -| explained_variance | -14.6 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 23010 | -| policy_gradient_loss | -0.0028 | -| std | 0.638 | -| value_loss | 9.35e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2303 | -| time_elapsed | 27713 | -| total_timesteps | 294784 | -| train/ | | -| approx_kl | 0.0084695285 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.967 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 23020 | -| policy_gradient_loss | -0.00119 | -| std | 0.635 | -| value_loss | 3.06e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 10 | -| iterations | 2304 | -| time_elapsed | 27717 | -| total_timesteps | 294912 | -| train/ | | -| approx_kl | 0.009501755 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.964 | -| explained_variance | -0.571 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 23030 | -| policy_gradient_loss | -0.00483 | -| std | 0.634 | -| value_loss | 3.13e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2305 | -| time_elapsed | 27722 | -| total_timesteps | 295040 | -| train/ | | -| approx_kl | 0.019676123 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.963 | -| explained_variance | 0.0126 | -| learning_rate | 0.0003 | -| loss | -0.000775 | -| n_updates | 23040 | -| policy_gradient_loss | -0.00325 | -| std | 0.633 | -| value_loss | 1.93e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2306 | -| time_elapsed | 27731 | -| total_timesteps | 295168 | -| train/ | | -| approx_kl | 0.0006868858 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | 0.751 | -| learning_rate | 0.0003 | -| loss | -0.0094 | -| n_updates | 23050 | -| policy_gradient_loss | -0.006 | -| std | 0.633 | -| value_loss | 0.00359 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2307 | -| time_elapsed | 27736 | -| total_timesteps | 295296 | -| train/ | | -| approx_kl | 0.0023835094 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 23060 | -| policy_gradient_loss | -0.000764 | -| std | 0.631 | -| value_loss | 1.97e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2308 | -| time_elapsed | 27739 | -| total_timesteps | 295424 | -| train/ | | -| approx_kl | 0.020776033 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.958 | -| explained_variance | -92.4 | -| learning_rate | 0.0003 | -| loss | -0.0057 | -| n_updates | 23070 | -| policy_gradient_loss | -0.00378 | -| std | 0.629 | -| value_loss | 1.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2309 | -| time_elapsed | 27742 | -| total_timesteps | 295552 | -| train/ | | -| approx_kl | 0.002126082 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -677 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 23080 | -| policy_gradient_loss | -0.000534 | -| std | 0.628 | -| value_loss | 2.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2310 | -| time_elapsed | 27746 | -| total_timesteps | 295680 | -| train/ | | -| approx_kl | 0.014747999 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | -200 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 23090 | -| policy_gradient_loss | -0.00271 | -| std | 0.628 | -| value_loss | 1.76e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2311 | -| time_elapsed | 27751 | -| total_timesteps | 295808 | -| train/ | | -| approx_kl | 0.008701934 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | -26.6 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 23100 | -| policy_gradient_loss | -0.00885 | -| std | 0.628 | -| value_loss | 4.94e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2312 | -| time_elapsed | 27755 | -| total_timesteps | 295936 | -| train/ | | -| approx_kl | 0.017714292 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | -6.56 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 23110 | -| policy_gradient_loss | -0.00478 | -| std | 0.628 | -| value_loss | 1.97e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2313 | -| time_elapsed | 27759 | -| total_timesteps | 296064 | -| train/ | | -| approx_kl | 0.0003037795 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | -0.0898 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 23120 | -| policy_gradient_loss | -6.38e-05 | -| std | 0.628 | -| value_loss | 3.84e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2314 | -| time_elapsed | 27766 | -| total_timesteps | 296192 | -| train/ | | -| approx_kl | 0.009653957 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 23130 | -| policy_gradient_loss | -0.00895 | -| std | 0.629 | -| value_loss | 0.000656 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2315 | -| time_elapsed | 27770 | -| total_timesteps | 296320 | -| train/ | | -| approx_kl | 0.00012060325 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -182 | -| learning_rate | 0.0003 | -| loss | 0.00026 | -| n_updates | 23140 | -| policy_gradient_loss | 0.000302 | -| std | 0.629 | -| value_loss | 5.76e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2316 | -| time_elapsed | 27774 | -| total_timesteps | 296448 | -| train/ | | -| approx_kl | 0.0064220326 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -165 | -| learning_rate | 0.0003 | -| loss | -0.027 | -| n_updates | 23150 | -| policy_gradient_loss | -0.00973 | -| std | 0.629 | -| value_loss | 6.48e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2317 | -| time_elapsed | 27779 | -| total_timesteps | 296576 | -| train/ | | -| approx_kl | 0.0222211 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -26.5 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 23160 | -| policy_gradient_loss | -0.00832 | -| std | 0.629 | -| value_loss | 1.86e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2318 | -| time_elapsed | 27785 | -| total_timesteps | 296704 | -| train/ | | -| approx_kl | 0.0046164747 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -5.05 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 23170 | -| policy_gradient_loss | -0.000608 | -| std | 0.629 | -| value_loss | 5.01e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2319 | -| time_elapsed | 27788 | -| total_timesteps | 296832 | -| train/ | | -| approx_kl | 0.00019314932 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.956 | -| explained_variance | -0.0998 | -| learning_rate | 0.0003 | -| loss | 7.29e-06 | -| n_updates | 23180 | -| policy_gradient_loss | 4.35e-05 | -| std | 0.629 | -| value_loss | 1.35e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2320 | -| time_elapsed | 27792 | -| total_timesteps | 296960 | -| train/ | | -| approx_kl | 0.010177258 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.00718 | -| n_updates | 23190 | -| policy_gradient_loss | -0.00371 | -| std | 0.628 | -| value_loss | 7.34e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2321 | -| time_elapsed | 27797 | -| total_timesteps | 297088 | -| train/ | | -| approx_kl | 9.614276e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | -0.00159 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 23200 | -| policy_gradient_loss | 0.000328 | -| std | 0.629 | -| value_loss | 9.42e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2322 | -| time_elapsed | 27805 | -| total_timesteps | 297216 | -| train/ | | -| approx_kl | 0.0013366027 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.956 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 23210 | -| policy_gradient_loss | -0.00816 | -| std | 0.63 | -| value_loss | 0.00285 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2323 | -| time_elapsed | 27809 | -| total_timesteps | 297344 | -| train/ | | -| approx_kl | 0.00016667554 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.957 | -| explained_variance | -190 | -| learning_rate | 0.0003 | -| loss | -9.14e-05 | -| n_updates | 23220 | -| policy_gradient_loss | -4.3e-05 | -| std | 0.631 | -| value_loss | 3.82e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2324 | -| time_elapsed | 27813 | -| total_timesteps | 297472 | -| train/ | | -| approx_kl | 1.9301893e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.958 | -| explained_variance | -151 | -| learning_rate | 0.0003 | -| loss | -9.19e-05 | -| n_updates | 23230 | -| policy_gradient_loss | -9.15e-06 | -| std | 0.63 | -| value_loss | 5e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2325 | -| time_elapsed | 27816 | -| total_timesteps | 297600 | -| train/ | | -| approx_kl | 0.0058158636 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.957 | -| explained_variance | -46.8 | -| learning_rate | 0.0003 | -| loss | -0.00831 | -| n_updates | 23240 | -| policy_gradient_loss | -0.00306 | -| std | 0.63 | -| value_loss | 6.24e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2326 | -| time_elapsed | 27821 | -| total_timesteps | 297728 | -| train/ | | -| approx_kl | 0.026492998 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.957 | -| explained_variance | -16.4 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 23250 | -| policy_gradient_loss | -0.00433 | -| std | 0.631 | -| value_loss | 1.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2327 | -| time_elapsed | 27825 | -| total_timesteps | 297856 | -| train/ | | -| approx_kl | 0.007956138 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.958 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 23260 | -| policy_gradient_loss | 0.000878 | -| std | 0.631 | -| value_loss | 4.83e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2328 | -| time_elapsed | 27829 | -| total_timesteps | 297984 | -| train/ | | -| approx_kl | 0.0037629118 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | -0.366 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 23270 | -| policy_gradient_loss | -0.002 | -| std | 0.631 | -| value_loss | 2.19e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2329 | -| time_elapsed | 27833 | -| total_timesteps | 298112 | -| train/ | | -| approx_kl | 0.02389835 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | 0.0097 | -| learning_rate | 0.0003 | -| loss | -0.00434 | -| n_updates | 23280 | -| policy_gradient_loss | -0.00603 | -| std | 0.631 | -| value_loss | 1.96e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2330 | -| time_elapsed | 27841 | -| total_timesteps | 298240 | -| train/ | | -| approx_kl | 0.000956967 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 23290 | -| policy_gradient_loss | -0.00549 | -| std | 0.631 | -| value_loss | 0.00247 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2331 | -| time_elapsed | 27845 | -| total_timesteps | 298368 | -| train/ | | -| approx_kl | 0.004780202 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.96 | -| explained_variance | -340 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 23300 | -| policy_gradient_loss | -0.00383 | -| std | 0.632 | -| value_loss | 2.25e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2332 | -| time_elapsed | 27850 | -| total_timesteps | 298496 | -| train/ | | -| approx_kl | 0.0030136062 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -303 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 23310 | -| policy_gradient_loss | 0.000885 | -| std | 0.633 | -| value_loss | 6.11e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2333 | -| time_elapsed | 27853 | -| total_timesteps | 298624 | -| train/ | | -| approx_kl | 0.007248938 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -5.17 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 23320 | -| policy_gradient_loss | -0.00151 | -| std | 0.633 | -| value_loss | 7.06e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2334 | -| time_elapsed | 27858 | -| total_timesteps | 298752 | -| train/ | | -| approx_kl | 0.0036891655 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -20.1 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 23330 | -| policy_gradient_loss | -0.00129 | -| std | 0.633 | -| value_loss | 9.75e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 10 | -| iterations | 2335 | -| time_elapsed | 27862 | -| total_timesteps | 298880 | -| train/ | | -| approx_kl | 0.012795432 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 23340 | -| policy_gradient_loss | -0.0026 | -| std | 0.633 | -| value_loss | 1.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2336 | -| time_elapsed | 27866 | -| total_timesteps | 299008 | -| train/ | | -| approx_kl | 0.011506649 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.963 | -| explained_variance | 0.0129 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 23350 | -| policy_gradient_loss | -0.00399 | -| std | 0.635 | -| value_loss | 1.02e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2337 | -| time_elapsed | 27876 | -| total_timesteps | 299136 | -| train/ | | -| approx_kl | 0.0021642665 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.965 | -| explained_variance | 0.796 | -| learning_rate | 0.0003 | -| loss | -0.0266 | -| n_updates | 23360 | -| policy_gradient_loss | -0.0126 | -| std | 0.635 | -| value_loss | 0.00152 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2338 | -| time_elapsed | 27879 | -| total_timesteps | 299264 | -| train/ | | -| approx_kl | 0.014255807 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.965 | -| explained_variance | 0.0302 | -| learning_rate | 0.0003 | -| loss | -0.000143 | -| n_updates | 23370 | -| policy_gradient_loss | -0.00193 | -| std | 0.634 | -| value_loss | 0.00333 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2339 | -| time_elapsed | 27883 | -| total_timesteps | 299392 | -| train/ | | -| approx_kl | 0.006624409 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.963 | -| explained_variance | -64.4 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 23380 | -| policy_gradient_loss | -0.00154 | -| std | 0.633 | -| value_loss | 6.41e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2340 | -| time_elapsed | 27888 | -| total_timesteps | 299520 | -| train/ | | -| approx_kl | 0.0016690509 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -34.6 | -| learning_rate | 0.0003 | -| loss | -0.00529 | -| n_updates | 23390 | -| policy_gradient_loss | -0.000336 | -| std | 0.632 | -| value_loss | 2.16e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2341 | -| time_elapsed | 27892 | -| total_timesteps | 299648 | -| train/ | | -| approx_kl | 0.0003843815 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.96 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 23400 | -| policy_gradient_loss | 0.000941 | -| std | 0.631 | -| value_loss | 2.82e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2342 | -| time_elapsed | 27896 | -| total_timesteps | 299776 | -| train/ | | -| approx_kl | 0.00063425465 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.958 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 23410 | -| policy_gradient_loss | 0.000681 | -| std | 0.631 | -| value_loss | 1.79e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2343 | -| time_elapsed | 27899 | -| total_timesteps | 299904 | -| train/ | | -| approx_kl | 0.0005857886 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 23420 | -| policy_gradient_loss | 0.000643 | -| std | 0.631 | -| value_loss | 1.35e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2344 | -| time_elapsed | 27903 | -| total_timesteps | 300032 | -| train/ | | -| approx_kl | 0.003959052 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.958 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.000456 | -| n_updates | 23430 | -| policy_gradient_loss | 0.000184 | -| std | 0.63 | -| value_loss | 5.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2345 | -| time_elapsed | 27911 | -| total_timesteps | 300160 | -| train/ | | -| approx_kl | 0.005958897 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.956 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 23440 | -| policy_gradient_loss | -0.00609 | -| std | 0.629 | -| value_loss | 0.00105 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2346 | -| time_elapsed | 27915 | -| total_timesteps | 300288 | -| train/ | | -| approx_kl | 0.0109890085 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 3.95e-05 | -| n_updates | 23450 | -| policy_gradient_loss | -0.00122 | -| std | 0.629 | -| value_loss | 9.39e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2347 | -| time_elapsed | 27919 | -| total_timesteps | 300416 | -| train/ | | -| approx_kl | 0.0020231674 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.956 | -| explained_variance | -0.0042 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 23460 | -| policy_gradient_loss | -0.000561 | -| std | 0.629 | -| value_loss | 1.38e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2348 | -| time_elapsed | 27923 | -| total_timesteps | 300544 | -| train/ | | -| approx_kl | 0.00018740539 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -0.0857 | -| learning_rate | 0.0003 | -| loss | -0.0007 | -| n_updates | 23470 | -| policy_gradient_loss | 7.26e-05 | -| std | 0.628 | -| value_loss | 2.16e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2349 | -| time_elapsed | 27928 | -| total_timesteps | 300672 | -| train/ | | -| approx_kl | 0.002500464 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.953 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 23480 | -| policy_gradient_loss | -0.00148 | -| std | 0.627 | -| value_loss | 2.64e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2350 | -| time_elapsed | 27933 | -| total_timesteps | 300800 | -| train/ | | -| approx_kl | 0.02804799 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.951 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 23490 | -| policy_gradient_loss | -0.0114 | -| std | 0.626 | -| value_loss | 4.38e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 10 | -| iterations | 2351 | -| time_elapsed | 27937 | -| total_timesteps | 300928 | -| train/ | | -| approx_kl | 0.0014784129 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.949 | -| explained_variance | 0.0172 | -| learning_rate | 0.0003 | -| loss | 0.00918 | -| n_updates | 23500 | -| policy_gradient_loss | -0.0012 | -| std | 0.625 | -| value_loss | 0.0468 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2352 | -| time_elapsed | 27941 | -| total_timesteps | 301056 | -| train/ | | -| approx_kl | 0.0017338339 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.948 | -| explained_variance | 0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 23510 | -| policy_gradient_loss | 0.000714 | -| std | 0.624 | -| value_loss | 0.0518 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2353 | -| time_elapsed | 27948 | -| total_timesteps | 301184 | -| train/ | | -| approx_kl | 0.00030072848 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.946 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.411 | -| n_updates | 23520 | -| policy_gradient_loss | -0.000245 | -| std | 0.623 | -| value_loss | 1.18 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2354 | -| time_elapsed | 27953 | -| total_timesteps | 301312 | -| train/ | | -| approx_kl | 0.0067835315 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | 0.0051 | -| n_updates | 23530 | -| policy_gradient_loss | -0.0015 | -| std | 0.623 | -| value_loss | 0.0347 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2355 | -| time_elapsed | 27957 | -| total_timesteps | 301440 | -| train/ | | -| approx_kl | 0.007901569 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | 0.00108 | -| learning_rate | 0.0003 | -| loss | 0.073 | -| n_updates | 23540 | -| policy_gradient_loss | -0.00264 | -| std | 0.622 | -| value_loss | 0.196 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2356 | -| time_elapsed | 27961 | -| total_timesteps | 301568 | -| train/ | | -| approx_kl | 0.0144727295 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.944 | -| explained_variance | 0.00361 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 23550 | -| policy_gradient_loss | -0.00555 | -| std | 0.621 | -| value_loss | 0.0577 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2357 | -| time_elapsed | 27966 | -| total_timesteps | 301696 | -| train/ | | -| approx_kl | 0.0076498333 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.943 | -| explained_variance | 0.000678 | -| learning_rate | 0.0003 | -| loss | 0.00858 | -| n_updates | 23560 | -| policy_gradient_loss | -0.00546 | -| std | 0.622 | -| value_loss | 0.0394 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2358 | -| time_elapsed | 27969 | -| total_timesteps | 301824 | -| train/ | | -| approx_kl | 0.0072167814 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.944 | -| explained_variance | -0.000893 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 23570 | -| policy_gradient_loss | -0.00294 | -| std | 0.623 | -| value_loss | 0.349 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 10 | -| iterations | 2359 | -| time_elapsed | 27973 | -| total_timesteps | 301952 | -| train/ | | -| approx_kl | 0.0044691204 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | 0.0019 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 23580 | -| policy_gradient_loss | -0.00202 | -| std | 0.622 | -| value_loss | 0.0248 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2360 | -| time_elapsed | 27977 | -| total_timesteps | 302080 | -| train/ | | -| approx_kl | 0.00041170185 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.944 | -| explained_variance | -0.0082 | -| learning_rate | 0.0003 | -| loss | 0.00516 | -| n_updates | 23590 | -| policy_gradient_loss | 0.000902 | -| std | 0.622 | -| value_loss | 0.0171 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2361 | -| time_elapsed | 27984 | -| total_timesteps | 302208 | -| train/ | | -| approx_kl | 0.015002735 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | 0.019 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 23600 | -| policy_gradient_loss | -0.0109 | -| std | 0.622 | -| value_loss | 0.037 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2362 | -| time_elapsed | 27987 | -| total_timesteps | 302336 | -| train/ | | -| approx_kl | 0.020846922 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | 0.00289 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 23610 | -| policy_gradient_loss | -0.00719 | -| std | 0.622 | -| value_loss | 0.00753 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2363 | -| time_elapsed | 27991 | -| total_timesteps | 302464 | -| train/ | | -| approx_kl | 0.013104123 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 23620 | -| policy_gradient_loss | -0.00608 | -| std | 0.622 | -| value_loss | 0.0136 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2364 | -| time_elapsed | 27996 | -| total_timesteps | 302592 | -| train/ | | -| approx_kl | 0.0009845698 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.946 | -| explained_variance | 0.00166 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 23630 | -| policy_gradient_loss | -0.000786 | -| std | 0.625 | -| value_loss | 0.0625 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2365 | -| time_elapsed | 27999 | -| total_timesteps | 302720 | -| train/ | | -| approx_kl | 0.015921004 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.95 | -| explained_variance | 0.00285 | -| learning_rate | 0.0003 | -| loss | 0.0932 | -| n_updates | 23640 | -| policy_gradient_loss | -0.00794 | -| std | 0.627 | -| value_loss | 0.227 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2366 | -| time_elapsed | 28002 | -| total_timesteps | 302848 | -| train/ | | -| approx_kl | 0.0034395857 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.952 | -| explained_variance | 0.00129 | -| learning_rate | 0.0003 | -| loss | 0.225 | -| n_updates | 23650 | -| policy_gradient_loss | -0.00149 | -| std | 0.628 | -| value_loss | 0.477 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.11 | -| time/ | | -| fps | 10 | -| iterations | 2367 | -| time_elapsed | 28006 | -| total_timesteps | 302976 | -| train/ | | -| approx_kl | 0.00585668 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.954 | -| explained_variance | 0.00432 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 23660 | -| policy_gradient_loss | -0.000335 | -| std | 0.629 | -| value_loss | 0.0251 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2368 | -| time_elapsed | 28010 | -| total_timesteps | 303104 | -| train/ | | -| approx_kl | 0.0076591643 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.957 | -| explained_variance | 0.00378 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 23670 | -| policy_gradient_loss | -0.00217 | -| std | 0.631 | -| value_loss | 0.029 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2369 | -| time_elapsed | 28018 | -| total_timesteps | 303232 | -| train/ | | -| approx_kl | 0.0010064628 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.958 | -| explained_variance | 0.0043 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 23680 | -| policy_gradient_loss | -0.000188 | -| std | 0.631 | -| value_loss | 0.109 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2370 | -| time_elapsed | 28023 | -| total_timesteps | 303360 | -| train/ | | -| approx_kl | 0.0011530414 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | -0.000974 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 23690 | -| policy_gradient_loss | 0.000639 | -| std | 0.631 | -| value_loss | 0.00952 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2371 | -| time_elapsed | 28028 | -| total_timesteps | 303488 | -| train/ | | -| approx_kl | 0.0043649236 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | 0.00121 | -| learning_rate | 0.0003 | -| loss | 0.00805 | -| n_updates | 23700 | -| policy_gradient_loss | -0.000874 | -| std | 0.632 | -| value_loss | 0.0189 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2372 | -| time_elapsed | 28032 | -| total_timesteps | 303616 | -| train/ | | -| approx_kl | 0.016234914 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 23710 | -| policy_gradient_loss | -0.00407 | -| std | 0.631 | -| value_loss | 0.00796 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2373 | -| time_elapsed | 28037 | -| total_timesteps | 303744 | -| train/ | | -| approx_kl | 0.00066638016 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | -0.000604 | -| learning_rate | 0.0003 | -| loss | -9.88e-05 | -| n_updates | 23720 | -| policy_gradient_loss | -0.000119 | -| std | 0.631 | -| value_loss | 0.00717 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.26 | -| time/ | | -| fps | 10 | -| iterations | 2374 | -| time_elapsed | 28041 | -| total_timesteps | 303872 | -| train/ | | -| approx_kl | 0.018389933 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | 0.0271 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 23730 | -| policy_gradient_loss | -0.00451 | -| std | 0.632 | -| value_loss | 0.00293 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2375 | -| time_elapsed | 28044 | -| total_timesteps | 304000 | -| train/ | | -| approx_kl | 0.0030878126 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.96 | -| explained_variance | -0.00458 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 23740 | -| policy_gradient_loss | -0.00361 | -| std | 0.633 | -| value_loss | 0.0742 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2376 | -| time_elapsed | 28047 | -| total_timesteps | 304128 | -| train/ | | -| approx_kl | 0.0035166754 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | 0.00419 | -| learning_rate | 0.0003 | -| loss | 0.923 | -| n_updates | 23750 | -| policy_gradient_loss | 0.00187 | -| std | 0.633 | -| value_loss | 2.11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2377 | -| time_elapsed | 28057 | -| total_timesteps | 304256 | -| train/ | | -| approx_kl | 0.0069793155 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.00446 | -| n_updates | 23760 | -| policy_gradient_loss | -0.00331 | -| std | 0.633 | -| value_loss | 0.0187 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2378 | -| time_elapsed | 28061 | -| total_timesteps | 304384 | -| train/ | | -| approx_kl | 0.012509776 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.963 | -| explained_variance | 0.00322 | -| learning_rate | 0.0003 | -| loss | 0.00811 | -| n_updates | 23770 | -| policy_gradient_loss | -0.00283 | -| std | 0.634 | -| value_loss | 0.0207 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2379 | -| time_elapsed | 28064 | -| total_timesteps | 304512 | -| train/ | | -| approx_kl | 0.009762214 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.963 | -| explained_variance | 0.00411 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 23780 | -| policy_gradient_loss | -0.00239 | -| std | 0.634 | -| value_loss | 0.0148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2380 | -| time_elapsed | 28067 | -| total_timesteps | 304640 | -| train/ | | -| approx_kl | 0.008441328 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.964 | -| explained_variance | -0.00111 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 23790 | -| policy_gradient_loss | -0.00255 | -| std | 0.634 | -| value_loss | 0.0108 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2381 | -| time_elapsed | 28070 | -| total_timesteps | 304768 | -| train/ | | -| approx_kl | 0.0065960446 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.964 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 23800 | -| policy_gradient_loss | -0.00183 | -| std | 0.635 | -| value_loss | 0.00618 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2382 | -| time_elapsed | 28074 | -| total_timesteps | 304896 | -| train/ | | -| approx_kl | 0.019136718 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -0.965 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 23810 | -| policy_gradient_loss | -0.0125 | -| std | 0.636 | -| value_loss | 0.00419 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2383 | -| time_elapsed | 28078 | -| total_timesteps | 305024 | -| train/ | | -| approx_kl | 0.0083161965 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.967 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00038 | -| n_updates | 23820 | -| policy_gradient_loss | -0.00127 | -| std | 0.636 | -| value_loss | 0.00309 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2384 | -| time_elapsed | 28088 | -| total_timesteps | 305152 | -| train/ | | -| approx_kl | 0.0015905246 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.968 | -| explained_variance | 0.187 | -| learning_rate | 0.0003 | -| loss | -0.000409 | -| n_updates | 23830 | -| policy_gradient_loss | -0.00312 | -| std | 0.638 | -| value_loss | 0.017 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2385 | -| time_elapsed | 28093 | -| total_timesteps | 305280 | -| train/ | | -| approx_kl | 0.0009021475 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.971 | -| explained_variance | -0.368 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 23840 | -| policy_gradient_loss | -0.000206 | -| std | 0.639 | -| value_loss | 0.00292 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2386 | -| time_elapsed | 28097 | -| total_timesteps | 305408 | -| train/ | | -| approx_kl | 0.00035944395 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.972 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 23850 | -| policy_gradient_loss | 0.00102 | -| std | 0.64 | -| value_loss | 0.00108 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2387 | -| time_elapsed | 28102 | -| total_timesteps | 305536 | -| train/ | | -| approx_kl | 0.00054678996 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.973 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 23860 | -| policy_gradient_loss | 0.000565 | -| std | 0.64 | -| value_loss | 0.00057 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2388 | -| time_elapsed | 28106 | -| total_timesteps | 305664 | -| train/ | | -| approx_kl | 0.011425282 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.974 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 23870 | -| policy_gradient_loss | -0.00266 | -| std | 0.642 | -| value_loss | 0.000179 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2389 | -| time_elapsed | 28111 | -| total_timesteps | 305792 | -| train/ | | -| approx_kl | 0.0059573287 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.976 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 23880 | -| policy_gradient_loss | -0.00223 | -| std | 0.642 | -| value_loss | 0.000136 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2390 | -| time_elapsed | 28116 | -| total_timesteps | 305920 | -| train/ | | -| approx_kl | 0.011411888 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.976 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 23890 | -| policy_gradient_loss | -0.00544 | -| std | 0.642 | -| value_loss | 0.000208 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2391 | -| time_elapsed | 28119 | -| total_timesteps | 306048 | -| train/ | | -| approx_kl | 0.0017215468 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.976 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 23900 | -| policy_gradient_loss | -0.000498 | -| std | 0.642 | -| value_loss | 4.14e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2392 | -| time_elapsed | 28126 | -| total_timesteps | 306176 | -| train/ | | -| approx_kl | 0.017545253 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.976 | -| explained_variance | 0.468 | -| learning_rate | 0.0003 | -| loss | 0.0041 | -| n_updates | 23910 | -| policy_gradient_loss | -0.00122 | -| std | 0.642 | -| value_loss | 0.0109 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2393 | -| time_elapsed | 28129 | -| total_timesteps | 306304 | -| train/ | | -| approx_kl | 0.0031327303 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.975 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 23920 | -| policy_gradient_loss | -0.00105 | -| std | 0.642 | -| value_loss | 3.08e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2394 | -| time_elapsed | 28134 | -| total_timesteps | 306432 | -| train/ | | -| approx_kl | 0.0024694328 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.975 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | 0.000315 | -| n_updates | 23930 | -| policy_gradient_loss | 0.000247 | -| std | 0.64 | -| value_loss | 2.82e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2395 | -| time_elapsed | 28139 | -| total_timesteps | 306560 | -| train/ | | -| approx_kl | 0.007208091 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.972 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 23940 | -| policy_gradient_loss | -0.00803 | -| std | 0.639 | -| value_loss | 2.38e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2396 | -| time_elapsed | 28143 | -| total_timesteps | 306688 | -| train/ | | -| approx_kl | 9.820005e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.97 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.00082 | -| n_updates | 23950 | -| policy_gradient_loss | 0.000835 | -| std | 0.638 | -| value_loss | 1.91e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2397 | -| time_elapsed | 28147 | -| total_timesteps | 306816 | -| train/ | | -| approx_kl | 0.00084553915 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.968 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.000402 | -| n_updates | 23960 | -| policy_gradient_loss | 0.000424 | -| std | 0.636 | -| value_loss | 1.29e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.46 | -| time/ | | -| fps | 10 | -| iterations | 2398 | -| time_elapsed | 28151 | -| total_timesteps | 306944 | -| train/ | | -| approx_kl | 0.0057593063 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.965 | -| explained_variance | -0.00762 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 23970 | -| policy_gradient_loss | -0.00459 | -| std | 0.634 | -| value_loss | 1.07e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2399 | -| time_elapsed | 28155 | -| total_timesteps | 307072 | -| train/ | | -| approx_kl | 0.00087720715 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.000988 | -| n_updates | 23980 | -| policy_gradient_loss | 0.000946 | -| std | 0.632 | -| value_loss | 6.74e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2400 | -| time_elapsed | 28163 | -| total_timesteps | 307200 | -| train/ | | -| approx_kl | 0.0008539164 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.96 | -| explained_variance | 0.69 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 23990 | -| policy_gradient_loss | -0.00948 | -| std | 0.632 | -| value_loss | 0.00131 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2401 | -| time_elapsed | 28169 | -| total_timesteps | 307328 | -| train/ | | -| approx_kl | 0.004641237 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.96 | -| explained_variance | 0.0177 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 24000 | -| policy_gradient_loss | -0.0013 | -| std | 0.633 | -| value_loss | 5.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2402 | -| time_elapsed | 28173 | -| total_timesteps | 307456 | -| train/ | | -| approx_kl | 0.001826806 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.000754 | -| n_updates | 24010 | -| policy_gradient_loss | -0.000357 | -| std | 0.633 | -| value_loss | 3.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2403 | -| time_elapsed | 28177 | -| total_timesteps | 307584 | -| train/ | | -| approx_kl | 0.013992233 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 24020 | -| policy_gradient_loss | -0.00678 | -| std | 0.633 | -| value_loss | 3.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2404 | -| time_elapsed | 28181 | -| total_timesteps | 307712 | -| train/ | | -| approx_kl | 0.001275805 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -0.00222 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 24030 | -| policy_gradient_loss | -0.000357 | -| std | 0.633 | -| value_loss | 3.25e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2405 | -| time_elapsed | 28186 | -| total_timesteps | 307840 | -| train/ | | -| approx_kl | 0.00023311912 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.961 | -| explained_variance | -0.00893 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 24040 | -| policy_gradient_loss | 0.000615 | -| std | 0.633 | -| value_loss | 2.6e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.43 | -| time/ | | -| fps | 10 | -| iterations | 2406 | -| time_elapsed | 28190 | -| total_timesteps | 307968 | -| train/ | | -| approx_kl | 0.0022943853 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.0003 | -| n_updates | 24050 | -| policy_gradient_loss | 9.63e-05 | -| std | 0.633 | -| value_loss | 2.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2407 | -| time_elapsed | 28195 | -| total_timesteps | 308096 | -| train/ | | -| approx_kl | 0.0034796605 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | -0.00869 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 24060 | -| policy_gradient_loss | -0.000711 | -| std | 0.633 | -| value_loss | 1.92e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2408 | -| time_elapsed | 28204 | -| total_timesteps | 308224 | -| train/ | | -| approx_kl | 0.008134058 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | 0.613 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 24070 | -| policy_gradient_loss | -0.0119 | -| std | 0.633 | -| value_loss | 0.0034 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2409 | -| time_elapsed | 28207 | -| total_timesteps | 308352 | -| train/ | | -| approx_kl | 0.0009901649 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.962 | -| explained_variance | -0.0065 | -| learning_rate | 0.0003 | -| loss | 0.000589 | -| n_updates | 24080 | -| policy_gradient_loss | 0.000503 | -| std | 0.632 | -| value_loss | 2.03e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2410 | -| time_elapsed | 28212 | -| total_timesteps | 308480 | -| train/ | | -| approx_kl | 0.012188396 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.96 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 24090 | -| policy_gradient_loss | -0.00547 | -| std | 0.632 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2411 | -| time_elapsed | 28215 | -| total_timesteps | 308608 | -| train/ | | -| approx_kl | 0.013020073 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.959 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 24100 | -| policy_gradient_loss | -0.00633 | -| std | 0.631 | -| value_loss | 8.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2412 | -| time_elapsed | 28218 | -| total_timesteps | 308736 | -| train/ | | -| approx_kl | 0.011511089 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.957 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 24110 | -| policy_gradient_loss | -0.00272 | -| std | 0.63 | -| value_loss | 5.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2413 | -| time_elapsed | 28223 | -| total_timesteps | 308864 | -| train/ | | -| approx_kl | 0.012491915 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.956 | -| explained_variance | 0.000156 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 24120 | -| policy_gradient_loss | -0.00848 | -| std | 0.629 | -| value_loss | 6.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2414 | -| time_elapsed | 28226 | -| total_timesteps | 308992 | -| train/ | | -| approx_kl | 0.001546771 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | -0.0905 | -| learning_rate | 0.0003 | -| loss | 0.000446 | -| n_updates | 24130 | -| policy_gradient_loss | 0.000358 | -| std | 0.63 | -| value_loss | 3.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2415 | -| time_elapsed | 28230 | -| total_timesteps | 309120 | -| train/ | | -| approx_kl | 0.007503208 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.956 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 24140 | -| policy_gradient_loss | -0.00237 | -| std | 0.629 | -| value_loss | 2.83e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2416 | -| time_elapsed | 28242 | -| total_timesteps | 309248 | -| train/ | | -| approx_kl | 0.03848577 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.955 | -| explained_variance | 0.591 | -| learning_rate | 0.0003 | -| loss | -0.0292 | -| n_updates | 24150 | -| policy_gradient_loss | -0.0209 | -| std | 0.628 | -| value_loss | 0.000824 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2417 | -| time_elapsed | 28246 | -| total_timesteps | 309376 | -| train/ | | -| approx_kl | 0.02101479 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.953 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 24160 | -| policy_gradient_loss | -0.0113 | -| std | 0.627 | -| value_loss | 1.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2418 | -| time_elapsed | 28250 | -| total_timesteps | 309504 | -| train/ | | -| approx_kl | 0.009440273 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.952 | -| explained_variance | -12.3 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 24170 | -| policy_gradient_loss | -0.00198 | -| std | 0.627 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2419 | -| time_elapsed | 28254 | -| total_timesteps | 309632 | -| train/ | | -| approx_kl | 0.0011184455 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.952 | -| explained_variance | -1.83 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 24180 | -| policy_gradient_loss | -0.000358 | -| std | 0.626 | -| value_loss | 3.65e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2420 | -| time_elapsed | 28256 | -| total_timesteps | 309760 | -| train/ | | -| approx_kl | 0.0020913251 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.951 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.00443 | -| n_updates | 24190 | -| policy_gradient_loss | -0.00099 | -| std | 0.625 | -| value_loss | 2.96e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.41 | -| time/ | | -| fps | 10 | -| iterations | 2421 | -| time_elapsed | 28260 | -| total_timesteps | 309888 | -| train/ | | -| approx_kl | 0.00021294947 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.949 | -| explained_variance | 0.0152 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 24200 | -| policy_gradient_loss | 0.000675 | -| std | 0.625 | -| value_loss | 1.99e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2422 | -| time_elapsed | 28265 | -| total_timesteps | 310016 | -| train/ | | -| approx_kl | 0.01737142 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.948 | -| explained_variance | -0.00598 | -| learning_rate | 0.0003 | -| loss | -0.00448 | -| n_updates | 24210 | -| policy_gradient_loss | -0.00473 | -| std | 0.624 | -| value_loss | 1.74e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2423 | -| time_elapsed | 28274 | -| total_timesteps | 310144 | -| train/ | | -| approx_kl | 0.027214311 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.946 | -| explained_variance | 0.709 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 24220 | -| policy_gradient_loss | -0.0149 | -| std | 0.623 | -| value_loss | 0.000968 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2424 | -| time_elapsed | 28279 | -| total_timesteps | 310272 | -| train/ | | -| approx_kl | 0.015058154 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | -0.795 | -| learning_rate | 0.0003 | -| loss | 0.000509 | -| n_updates | 24230 | -| policy_gradient_loss | -0.00199 | -| std | 0.623 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2425 | -| time_elapsed | 28283 | -| total_timesteps | 310400 | -| train/ | | -| approx_kl | 0.007308513 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | -23.5 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 24240 | -| policy_gradient_loss | -0.00274 | -| std | 0.622 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2426 | -| time_elapsed | 28287 | -| total_timesteps | 310528 | -| train/ | | -| approx_kl | 0.010797648 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.945 | -| explained_variance | -4.17 | -| learning_rate | 0.0003 | -| loss | -0.000856 | -| n_updates | 24250 | -| policy_gradient_loss | -0.000934 | -| std | 0.624 | -| value_loss | 3.37e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2427 | -| time_elapsed | 28290 | -| total_timesteps | 310656 | -| train/ | | -| approx_kl | 0.008189044 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.947 | -| explained_variance | -0.886 | -| learning_rate | 0.0003 | -| loss | -0.00541 | -| n_updates | 24260 | -| policy_gradient_loss | -0.00367 | -| std | 0.624 | -| value_loss | 2.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2428 | -| time_elapsed | 28294 | -| total_timesteps | 310784 | -| train/ | | -| approx_kl | 0.011053614 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.947 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 24270 | -| policy_gradient_loss | -0.00228 | -| std | 0.624 | -| value_loss | 8.69e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2429 | -| time_elapsed | 28299 | -| total_timesteps | 310912 | -| train/ | | -| approx_kl | 0.0014191847 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.946 | -| explained_variance | -0.00544 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 24280 | -| policy_gradient_loss | -0.000687 | -| std | 0.621 | -| value_loss | 7.12e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2430 | -| time_elapsed | 28303 | -| total_timesteps | 311040 | -| train/ | | -| approx_kl | 0.002538724 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.941 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | -0.00946 | -| n_updates | 24290 | -| policy_gradient_loss | -0.00228 | -| std | 0.619 | -| value_loss | 8.23e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2431 | -| time_elapsed | 28310 | -| total_timesteps | 311168 | -| train/ | | -| approx_kl | 0.007480326 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.938 | -| explained_variance | 0.608 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 24300 | -| policy_gradient_loss | -0.00707 | -| std | 0.618 | -| value_loss | 0.00444 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2432 | -| time_elapsed | 28315 | -| total_timesteps | 311296 | -| train/ | | -| approx_kl | 0.010502175 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.936 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.00907 | -| n_updates | 24310 | -| policy_gradient_loss | -0.00562 | -| std | 0.616 | -| value_loss | 3.02e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2433 | -| time_elapsed | 28319 | -| total_timesteps | 311424 | -| train/ | | -| approx_kl | 0.0017318313 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.933 | -| explained_variance | -17.4 | -| learning_rate | 0.0003 | -| loss | -5.63e-06 | -| n_updates | 24320 | -| policy_gradient_loss | -5e-06 | -| std | 0.615 | -| value_loss | 3.23e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 10 | -| iterations | 2434 | -| time_elapsed | 28323 | -| total_timesteps | 311552 | -| train/ | | -| approx_kl | 0.0060034124 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.932 | -| explained_variance | -6.34 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 24330 | -| policy_gradient_loss | -0.00212 | -| std | 0.614 | -| value_loss | 1.37e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2435 | -| time_elapsed | 28326 | -| total_timesteps | 311680 | -| train/ | | -| approx_kl | 4.8244838e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.931 | -| explained_variance | -0.539 | -| learning_rate | 0.0003 | -| loss | -0.000141 | -| n_updates | 24340 | -| policy_gradient_loss | 0.000951 | -| std | 0.613 | -| value_loss | 6.18e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2436 | -| time_elapsed | 28331 | -| total_timesteps | 311808 | -| train/ | | -| approx_kl | 0.019495968 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.929 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 24350 | -| policy_gradient_loss | -0.00641 | -| std | 0.612 | -| value_loss | 5.69e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2437 | -| time_elapsed | 28336 | -| total_timesteps | 311936 | -| train/ | | -| approx_kl | 5.2677933e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.928 | -| explained_variance | 0.0145 | -| learning_rate | 0.0003 | -| loss | -0.000532 | -| n_updates | 24360 | -| policy_gradient_loss | -6.96e-05 | -| std | 0.613 | -| value_loss | 1.63e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2438 | -| time_elapsed | 28340 | -| total_timesteps | 312064 | -| train/ | | -| approx_kl | 0.0046639116 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.931 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 24370 | -| policy_gradient_loss | -0.00357 | -| std | 0.614 | -| value_loss | 1.94e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2439 | -| time_elapsed | 28346 | -| total_timesteps | 312192 | -| train/ | | -| approx_kl | 0.02353133 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.932 | -| explained_variance | 0.6 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 24380 | -| policy_gradient_loss | -0.00965 | -| std | 0.614 | -| value_loss | 0.00526 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2440 | -| time_elapsed | 28349 | -| total_timesteps | 312320 | -| train/ | | -| approx_kl | 0.010998144 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.931 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 24390 | -| policy_gradient_loss | -0.00229 | -| std | 0.613 | -| value_loss | 3.15e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2441 | -| time_elapsed | 28352 | -| total_timesteps | 312448 | -| train/ | | -| approx_kl | 0.0035823763 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.928 | -| explained_variance | -9.72 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 24400 | -| policy_gradient_loss | -0.00149 | -| std | 0.61 | -| value_loss | 1.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2442 | -| time_elapsed | 28356 | -| total_timesteps | 312576 | -| train/ | | -| approx_kl | 0.013748355 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.923 | -| explained_variance | -2.41 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 24410 | -| policy_gradient_loss | -0.00229 | -| std | 0.608 | -| value_loss | 8.09e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2443 | -| time_elapsed | 28360 | -| total_timesteps | 312704 | -| train/ | | -| approx_kl | 0.0037686725 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.919 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 24420 | -| policy_gradient_loss | -0.0011 | -| std | 0.605 | -| value_loss | 2.54e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2444 | -| time_elapsed | 28362 | -| total_timesteps | 312832 | -| train/ | | -| approx_kl | 0.00043100282 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.916 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | -0.000999 | -| n_updates | 24430 | -| policy_gradient_loss | 5.16e-05 | -| std | 0.604 | -| value_loss | 1.37e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2445 | -| time_elapsed | 28366 | -| total_timesteps | 312960 | -| train/ | | -| approx_kl | 0.008904508 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.913 | -| explained_variance | -0.283 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 24440 | -| policy_gradient_loss | -0.00134 | -| std | 0.602 | -| value_loss | 7.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2446 | -| time_elapsed | 28370 | -| total_timesteps | 313088 | -| train/ | | -| approx_kl | 0.00305775 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.909 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 24450 | -| policy_gradient_loss | -0.000866 | -| std | 0.599 | -| value_loss | 3.3e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2447 | -| time_elapsed | 28378 | -| total_timesteps | 313216 | -| train/ | | -| approx_kl | 0.036979467 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.905 | -| explained_variance | 0.367 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 24460 | -| policy_gradient_loss | -0.00698 | -| std | 0.597 | -| value_loss | 0.00386 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2448 | -| time_elapsed | 28382 | -| total_timesteps | 313344 | -| train/ | | -| approx_kl | 0.0040324377 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.903 | -| explained_variance | -1.76 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 24470 | -| policy_gradient_loss | -0.00271 | -| std | 0.597 | -| value_loss | 8.69e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2449 | -| time_elapsed | 28387 | -| total_timesteps | 313472 | -| train/ | | -| approx_kl | 0.0076288832 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.903 | -| explained_variance | 0.0116 | -| learning_rate | 0.0003 | -| loss | 0.000281 | -| n_updates | 24480 | -| policy_gradient_loss | -0.000122 | -| std | 0.596 | -| value_loss | 3.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2450 | -| time_elapsed | 28391 | -| total_timesteps | 313600 | -| train/ | | -| approx_kl | 0.010832587 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.902 | -| explained_variance | 0.0039 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 24490 | -| policy_gradient_loss | -0.00689 | -| std | 0.596 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2451 | -| time_elapsed | 28395 | -| total_timesteps | 313728 | -| train/ | | -| approx_kl | 0.012038132 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.902 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.007 | -| n_updates | 24500 | -| policy_gradient_loss | -0.00598 | -| std | 0.596 | -| value_loss | 1.37e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2452 | -| time_elapsed | 28399 | -| total_timesteps | 313856 | -| train/ | | -| approx_kl | 0.00023833802 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.9 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.00032 | -| n_updates | 24510 | -| policy_gradient_loss | -0.00012 | -| std | 0.594 | -| value_loss | 8.84e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 11 | -| iterations | 2453 | -| time_elapsed | 28403 | -| total_timesteps | 313984 | -| train/ | | -| approx_kl | 0.007905302 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.897 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 24520 | -| policy_gradient_loss | -0.00271 | -| std | 0.593 | -| value_loss | 8.31e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2454 | -| time_elapsed | 28406 | -| total_timesteps | 314112 | -| train/ | | -| approx_kl | 0.00038302923 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.895 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.000839 | -| n_updates | 24530 | -| policy_gradient_loss | 0.000119 | -| std | 0.592 | -| value_loss | 6.98e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2455 | -| time_elapsed | 28417 | -| total_timesteps | 314240 | -| train/ | | -| approx_kl | 0.003653935 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.894 | -| explained_variance | 0.372 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 24540 | -| policy_gradient_loss | -0.00314 | -| std | 0.592 | -| value_loss | 0.00461 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2456 | -| time_elapsed | 28423 | -| total_timesteps | 314368 | -| train/ | | -| approx_kl | 0.00031431834 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.895 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 24550 | -| policy_gradient_loss | 0.000961 | -| std | 0.592 | -| value_loss | 0.000103 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2457 | -| time_elapsed | 28426 | -| total_timesteps | 314496 | -| train/ | | -| approx_kl | 0.0004302913 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.895 | -| explained_variance | 0.0146 | -| learning_rate | 0.0003 | -| loss | -0.0074 | -| n_updates | 24560 | -| policy_gradient_loss | 0.00101 | -| std | 0.593 | -| value_loss | 8.54e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2458 | -| time_elapsed | 28431 | -| total_timesteps | 314624 | -| train/ | | -| approx_kl | 0.0036487018 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.896 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.000123 | -| n_updates | 24570 | -| policy_gradient_loss | 3.28e-05 | -| std | 0.592 | -| value_loss | 2.29e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2459 | -| time_elapsed | 28436 | -| total_timesteps | 314752 | -| train/ | | -| approx_kl | 0.005103264 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.894 | -| explained_variance | -0.0732 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 24580 | -| policy_gradient_loss | -0.00261 | -| std | 0.591 | -| value_loss | 2.23e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 11 | -| iterations | 2460 | -| time_elapsed | 28440 | -| total_timesteps | 314880 | -| train/ | | -| approx_kl | 0.009763488 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.892 | -| explained_variance | -0.00223 | -| learning_rate | 0.0003 | -| loss | -2.67e-06 | -| n_updates | 24590 | -| policy_gradient_loss | -0.000864 | -| std | 0.59 | -| value_loss | 1.34e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2461 | -| time_elapsed | 28445 | -| total_timesteps | 315008 | -| train/ | | -| approx_kl | 0.0047170185 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.00329 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 24600 | -| policy_gradient_loss | -0.00118 | -| std | 0.59 | -| value_loss | 1.05e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2462 | -| time_elapsed | 28457 | -| total_timesteps | 315136 | -| train/ | | -| approx_kl | 0.019174322 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.529 | -| learning_rate | 0.0003 | -| loss | -0.0276 | -| n_updates | 24610 | -| policy_gradient_loss | -0.0174 | -| std | 0.59 | -| value_loss | 0.00116 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2463 | -| time_elapsed | 28462 | -| total_timesteps | 315264 | -| train/ | | -| approx_kl | 0.008130223 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | 0.326 | -| learning_rate | 0.0003 | -| loss | -0.0086 | -| n_updates | 24620 | -| policy_gradient_loss | -0.00335 | -| std | 0.59 | -| value_loss | 1.97e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2464 | -| time_elapsed | 28467 | -| total_timesteps | 315392 | -| train/ | | -| approx_kl | 0.00041161804 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.000915 | -| n_updates | 24630 | -| policy_gradient_loss | 0.00112 | -| std | 0.59 | -| value_loss | 3.71e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2465 | -| time_elapsed | 28471 | -| total_timesteps | 315520 | -| train/ | | -| approx_kl | 0.00070068915 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 24640 | -| policy_gradient_loss | -8.35e-05 | -| std | 0.59 | -| value_loss | 3.55e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2466 | -| time_elapsed | 28475 | -| total_timesteps | 315648 | -| train/ | | -| approx_kl | 0.00011152518 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 24650 | -| policy_gradient_loss | 0.00025 | -| std | 0.589 | -| value_loss | 3.76e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2467 | -| time_elapsed | 28479 | -| total_timesteps | 315776 | -| train/ | | -| approx_kl | 0.016606329 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.888 | -| explained_variance | -0.0887 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 24660 | -| policy_gradient_loss | -0.00862 | -| std | 0.587 | -| value_loss | 4.83e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2468 | -| time_elapsed | 28483 | -| total_timesteps | 315904 | -| train/ | | -| approx_kl | 1.762691e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | 3.43e-05 | -| n_updates | 24670 | -| policy_gradient_loss | 0.000173 | -| std | 0.585 | -| value_loss | 1.94e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2469 | -| time_elapsed | 28487 | -| total_timesteps | 316032 | -| train/ | | -| approx_kl | 0.009063511 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 24680 | -| policy_gradient_loss | -0.00215 | -| std | 0.585 | -| value_loss | 1.82e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2470 | -| time_elapsed | 28497 | -| total_timesteps | 316160 | -| train/ | | -| approx_kl | 0.0013119732 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | 0.605 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 24690 | -| policy_gradient_loss | -0.0107 | -| std | 0.584 | -| value_loss | 0.00403 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2471 | -| time_elapsed | 28502 | -| total_timesteps | 316288 | -| train/ | | -| approx_kl | 0.0052559073 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 24700 | -| policy_gradient_loss | -0.00207 | -| std | 0.585 | -| value_loss | 1.29e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2472 | -| time_elapsed | 28507 | -| total_timesteps | 316416 | -| train/ | | -| approx_kl | 2.4006004e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.000719 | -| n_updates | 24710 | -| policy_gradient_loss | 0.00183 | -| std | 0.585 | -| value_loss | 1.25e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2473 | -| time_elapsed | 28511 | -| total_timesteps | 316544 | -| train/ | | -| approx_kl | 0.013954621 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 24720 | -| policy_gradient_loss | -0.00305 | -| std | 0.586 | -| value_loss | 5.69e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2474 | -| time_elapsed | 28517 | -| total_timesteps | 316672 | -| train/ | | -| approx_kl | 0.00021140394 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.00174 | -| learning_rate | 0.0003 | -| loss | -0.000344 | -| n_updates | 24730 | -| policy_gradient_loss | -6.88e-05 | -| std | 0.587 | -| value_loss | 4.86e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2475 | -| time_elapsed | 28520 | -| total_timesteps | 316800 | -| train/ | | -| approx_kl | 0.0035951668 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | -0.00784 | -| n_updates | 24740 | -| policy_gradient_loss | -0.00247 | -| std | 0.586 | -| value_loss | 5.5e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2476 | -| time_elapsed | 28525 | -| total_timesteps | 316928 | -| train/ | | -| approx_kl | 0.009868617 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -0.00321 | -| learning_rate | 0.0003 | -| loss | -0.000648 | -| n_updates | 24750 | -| policy_gradient_loss | -0.00113 | -| std | 0.585 | -| value_loss | 3.58e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2477 | -| time_elapsed | 28530 | -| total_timesteps | 317056 | -| train/ | | -| approx_kl | 0.0032681823 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 24760 | -| policy_gradient_loss | -0.000847 | -| std | 0.586 | -| value_loss | 3.27e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2478 | -| time_elapsed | 28538 | -| total_timesteps | 317184 | -| train/ | | -| approx_kl | 0.00026181177 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | 0.531 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 24770 | -| policy_gradient_loss | -0.000523 | -| std | 0.587 | -| value_loss | 0.00791 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2479 | -| time_elapsed | 28542 | -| total_timesteps | 317312 | -| train/ | | -| approx_kl | 0.005811033 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.887 | -| explained_variance | -4.97 | -| learning_rate | 0.0003 | -| loss | -0.00586 | -| n_updates | 24780 | -| policy_gradient_loss | -0.00211 | -| std | 0.588 | -| value_loss | 1.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2480 | -| time_elapsed | 28547 | -| total_timesteps | 317440 | -| train/ | | -| approx_kl | 0.022353001 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | -5.98 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 24790 | -| policy_gradient_loss | -0.00302 | -| std | 0.589 | -| value_loss | 5.96e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2481 | -| time_elapsed | 28551 | -| total_timesteps | 317568 | -| train/ | | -| approx_kl | 0.0003456911 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.89 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00068 | -| n_updates | 24800 | -| policy_gradient_loss | 0.000108 | -| std | 0.59 | -| value_loss | 3.28e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2482 | -| time_elapsed | 28556 | -| total_timesteps | 317696 | -| train/ | | -| approx_kl | 1.3932819e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.89 | -| explained_variance | -0.391 | -| learning_rate | 0.0003 | -| loss | -0.000402 | -| n_updates | 24810 | -| policy_gradient_loss | 0.000122 | -| std | 0.588 | -| value_loss | 2.17e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2483 | -| time_elapsed | 28559 | -| total_timesteps | 317824 | -| train/ | | -| approx_kl | 0.013237927 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.00828 | -| n_updates | 24820 | -| policy_gradient_loss | -0.00528 | -| std | 0.586 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2484 | -| time_elapsed | 28562 | -| total_timesteps | 317952 | -| train/ | | -| approx_kl | 0.0021752052 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -0.00665 | -| learning_rate | 0.0003 | -| loss | -0.00704 | -| n_updates | 24830 | -| policy_gradient_loss | -0.00147 | -| std | 0.585 | -| value_loss | 6.94e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2485 | -| time_elapsed | 28565 | -| total_timesteps | 318080 | -| train/ | | -| approx_kl | 0.020809181 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | 0.00461 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 24840 | -| policy_gradient_loss | -0.0127 | -| std | 0.585 | -| value_loss | 6.17e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2486 | -| time_elapsed | 28573 | -| total_timesteps | 318208 | -| train/ | | -| approx_kl | 0.0010451165 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 24850 | -| policy_gradient_loss | -0.00563 | -| std | 0.585 | -| value_loss | 0.000665 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2487 | -| time_elapsed | 28577 | -| total_timesteps | 318336 | -| train/ | | -| approx_kl | 0.012380714 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -41.5 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 24860 | -| policy_gradient_loss | -0.00687 | -| std | 0.585 | -| value_loss | 4.27e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2488 | -| time_elapsed | 28580 | -| total_timesteps | 318464 | -| train/ | | -| approx_kl | 0.0031626811 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -39.5 | -| learning_rate | 0.0003 | -| loss | -0.00784 | -| n_updates | 24870 | -| policy_gradient_loss | -0.00232 | -| std | 0.585 | -| value_loss | 1.62e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2489 | -| time_elapsed | 28584 | -| total_timesteps | 318592 | -| train/ | | -| approx_kl | 0.021632945 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -4.28 | -| learning_rate | 0.0003 | -| loss | -0.00718 | -| n_updates | 24880 | -| policy_gradient_loss | -0.00691 | -| std | 0.585 | -| value_loss | 1.93e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2490 | -| time_elapsed | 28588 | -| total_timesteps | 318720 | -| train/ | | -| approx_kl | 0.005267488 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 24890 | -| policy_gradient_loss | -0.00232 | -| std | 0.584 | -| value_loss | 1.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2491 | -| time_elapsed | 28592 | -| total_timesteps | 318848 | -| train/ | | -| approx_kl | 0.014803062 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.881 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | -0.000756 | -| n_updates | 24900 | -| policy_gradient_loss | -0.00278 | -| std | 0.584 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.38 | -| time/ | | -| fps | 11 | -| iterations | 2492 | -| time_elapsed | 28597 | -| total_timesteps | 318976 | -| train/ | | -| approx_kl | 0.0004503657 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | -0.000663 | -| n_updates | 24910 | -| policy_gradient_loss | -0.000265 | -| std | 0.586 | -| value_loss | 9.33e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2493 | -| time_elapsed | 28602 | -| total_timesteps | 319104 | -| train/ | | -| approx_kl | 0.0009862597 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.000749 | -| n_updates | 24920 | -| policy_gradient_loss | -0.000147 | -| std | 0.586 | -| value_loss | 1.05e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2494 | -| time_elapsed | 28610 | -| total_timesteps | 319232 | -| train/ | | -| approx_kl | 0.0066991546 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | 0.531 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 24930 | -| policy_gradient_loss | -0.0113 | -| std | 0.586 | -| value_loss | 0.000671 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2495 | -| time_elapsed | 28614 | -| total_timesteps | 319360 | -| train/ | | -| approx_kl | 0.0019071545 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -66.2 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 24940 | -| policy_gradient_loss | -0.000818 | -| std | 0.586 | -| value_loss | 5.5e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2496 | -| time_elapsed | 28618 | -| total_timesteps | 319488 | -| train/ | | -| approx_kl | 0.00017452496 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -118 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 24950 | -| policy_gradient_loss | 0.000569 | -| std | 0.586 | -| value_loss | 3.17e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2497 | -| time_elapsed | 28623 | -| total_timesteps | 319616 | -| train/ | | -| approx_kl | 0.013080869 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -37.2 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 24960 | -| policy_gradient_loss | -0.00647 | -| std | 0.586 | -| value_loss | 2.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2498 | -| time_elapsed | 28627 | -| total_timesteps | 319744 | -| train/ | | -| approx_kl | 7.439405e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -3.82 | -| learning_rate | 0.0003 | -| loss | -0.000199 | -| n_updates | 24970 | -| policy_gradient_loss | -8.14e-05 | -| std | 0.587 | -| value_loss | 4.57e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2499 | -| time_elapsed | 28631 | -| total_timesteps | 319872 | -| train/ | | -| approx_kl | 0.0071602697 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.887 | -| explained_variance | -0.69 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 24980 | -| policy_gradient_loss | -0.003 | -| std | 0.588 | -| value_loss | 3.23e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2500 | -| time_elapsed | 28635 | -| total_timesteps | 320000 | -| train/ | | -| approx_kl | 0.013093976 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.89 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 24990 | -| policy_gradient_loss | -0.00609 | -| std | 0.59 | -| value_loss | 2.93e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2501 | -| time_elapsed | 28639 | -| total_timesteps | 320128 | -| train/ | | -| approx_kl | 0.013705795 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.00218 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 25000 | -| policy_gradient_loss | -0.0101 | -| std | 0.59 | -| value_loss | 8.72e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2502 | -| time_elapsed | 28647 | -| total_timesteps | 320256 | -| train/ | | -| approx_kl | 0.0091395015 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | 0.706 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 25010 | -| policy_gradient_loss | -0.00657 | -| std | 0.59 | -| value_loss | 0.000799 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2503 | -| time_elapsed | 28651 | -| total_timesteps | 320384 | -| train/ | | -| approx_kl | 0.0039467067 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -2.74 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 25020 | -| policy_gradient_loss | -0.00689 | -| std | 0.59 | -| value_loss | 8.89e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2504 | -| time_elapsed | 28656 | -| total_timesteps | 320512 | -| train/ | | -| approx_kl | 0.0021549864 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.893 | -| explained_variance | -5.86 | -| learning_rate | 0.0003 | -| loss | -0.000921 | -| n_updates | 25030 | -| policy_gradient_loss | -0.000383 | -| std | 0.592 | -| value_loss | 2.23e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2505 | -| time_elapsed | 28660 | -| total_timesteps | 320640 | -| train/ | | -| approx_kl | 0.0051406063 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.896 | -| explained_variance | -0.656 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 25040 | -| policy_gradient_loss | -0.000995 | -| std | 0.594 | -| value_loss | 6.2e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2506 | -| time_elapsed | 28664 | -| total_timesteps | 320768 | -| train/ | | -| approx_kl | 0.021482043 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.899 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 25050 | -| policy_gradient_loss | -0.0133 | -| std | 0.595 | -| value_loss | 5.97e-08 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2507 | -| time_elapsed | 28669 | -| total_timesteps | 320896 | -| train/ | | -| approx_kl | 0.000109646004 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.898 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.000839 | -| n_updates | 25060 | -| policy_gradient_loss | 0.000565 | -| std | 0.593 | -| value_loss | 3.26e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2508 | -| time_elapsed | 28673 | -| total_timesteps | 321024 | -| train/ | | -| approx_kl | 0.005814662 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.896 | -| explained_variance | -0.0844 | -| learning_rate | 0.0003 | -| loss | -0.000479 | -| n_updates | 25070 | -| policy_gradient_loss | -0.000412 | -| std | 0.592 | -| value_loss | 3.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2509 | -| time_elapsed | 28681 | -| total_timesteps | 321152 | -| train/ | | -| approx_kl | 0.002589006 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.895 | -| explained_variance | 0.647 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 25080 | -| policy_gradient_loss | -0.00415 | -| std | 0.592 | -| value_loss | 0.00285 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2510 | -| time_elapsed | 28686 | -| total_timesteps | 321280 | -| train/ | | -| approx_kl | 0.0027633028 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.894 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 25090 | -| policy_gradient_loss | -0.000766 | -| std | 0.592 | -| value_loss | 1.69e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2511 | -| time_elapsed | 28690 | -| total_timesteps | 321408 | -| train/ | | -| approx_kl | 0.0007505007 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.893 | -| explained_variance | -0.756 | -| learning_rate | 0.0003 | -| loss | 0.000376 | -| n_updates | 25100 | -| policy_gradient_loss | 0.000586 | -| std | 0.59 | -| value_loss | 5.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2512 | -| time_elapsed | 28694 | -| total_timesteps | 321536 | -| train/ | | -| approx_kl | 0.004200857 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.434 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 25110 | -| policy_gradient_loss | -0.00115 | -| std | 0.589 | -| value_loss | 3.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2513 | -| time_elapsed | 28697 | -| total_timesteps | 321664 | -| train/ | | -| approx_kl | 0.020609936 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.89 | -| explained_variance | -0.248 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 25120 | -| policy_gradient_loss | -0.00943 | -| std | 0.589 | -| value_loss | 2.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2514 | -| time_elapsed | 28701 | -| total_timesteps | 321792 | -| train/ | | -| approx_kl | 0.008207649 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.888 | -| explained_variance | 0.00796 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 25130 | -| policy_gradient_loss | -0.0019 | -| std | 0.587 | -| value_loss | 9.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2515 | -| time_elapsed | 28706 | -| total_timesteps | 321920 | -| train/ | | -| approx_kl | 0.016360758 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 25140 | -| policy_gradient_loss | -0.00802 | -| std | 0.586 | -| value_loss | 9.63e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2516 | -| time_elapsed | 28710 | -| total_timesteps | 322048 | -| train/ | | -| approx_kl | 0.016954722 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.00818 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 25150 | -| policy_gradient_loss | -0.00956 | -| std | 0.587 | -| value_loss | 6.3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2517 | -| time_elapsed | 28718 | -| total_timesteps | 322176 | -| train/ | | -| approx_kl | 0.017924715 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | 0.536 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 25160 | -| policy_gradient_loss | -0.00356 | -| std | 0.586 | -| value_loss | 0.00749 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2518 | -| time_elapsed | 28722 | -| total_timesteps | 322304 | -| train/ | | -| approx_kl | 0.0020562448 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -65 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 25170 | -| policy_gradient_loss | -0.00218 | -| std | 0.585 | -| value_loss | 5.58e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2519 | -| time_elapsed | 28727 | -| total_timesteps | 322432 | -| train/ | | -| approx_kl | 0.00016587833 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -61.3 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 25180 | -| policy_gradient_loss | 0.000985 | -| std | 0.585 | -| value_loss | 2.23e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2520 | -| time_elapsed | 28731 | -| total_timesteps | 322560 | -| train/ | | -| approx_kl | 0.00057908776 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -8.67 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 25190 | -| policy_gradient_loss | 0.000483 | -| std | 0.585 | -| value_loss | 2.86e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2521 | -| time_elapsed | 28735 | -| total_timesteps | 322688 | -| train/ | | -| approx_kl | 6.9185626e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | -0.000141 | -| n_updates | 25200 | -| policy_gradient_loss | 0.000515 | -| std | 0.585 | -| value_loss | 8.42e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2522 | -| time_elapsed | 28739 | -| total_timesteps | 322816 | -| train/ | | -| approx_kl | 0.001388846 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | 0.0023 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 25210 | -| policy_gradient_loss | -0.00101 | -| std | 0.585 | -| value_loss | 9.68e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.36 | -| time/ | | -| fps | 11 | -| iterations | 2523 | -| time_elapsed | 28744 | -| total_timesteps | 322944 | -| train/ | | -| approx_kl | 0.0002444554 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | 0.00834 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 25220 | -| policy_gradient_loss | 0.000617 | -| std | 0.586 | -| value_loss | 5.34e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2524 | -| time_elapsed | 28747 | -| total_timesteps | 323072 | -| train/ | | -| approx_kl | 0.00051981746 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.00673 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 25230 | -| policy_gradient_loss | 0.000192 | -| std | 0.587 | -| value_loss | 4.5e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2525 | -| time_elapsed | 28754 | -| total_timesteps | 323200 | -| train/ | | -| approx_kl | 0.011757317 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.887 | -| explained_variance | 0.291 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 25240 | -| policy_gradient_loss | -0.00573 | -| std | 0.588 | -| value_loss | 0.000912 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2526 | -| time_elapsed | 28759 | -| total_timesteps | 323328 | -| train/ | | -| approx_kl | 7.862458e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | -94.5 | -| learning_rate | 0.0003 | -| loss | 0.000212 | -| n_updates | 25250 | -| policy_gradient_loss | 0.000255 | -| std | 0.589 | -| value_loss | 7.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2527 | -| time_elapsed | 28762 | -| total_timesteps | 323456 | -| train/ | | -| approx_kl | 0.006121204 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.89 | -| explained_variance | -124 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 25260 | -| policy_gradient_loss | -0.00272 | -| std | 0.59 | -| value_loss | 3.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2528 | -| time_elapsed | 28766 | -| total_timesteps | 323584 | -| train/ | | -| approx_kl | 0.01609056 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -23.7 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 25270 | -| policy_gradient_loss | -0.00808 | -| std | 0.59 | -| value_loss | 2.89e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2529 | -| time_elapsed | 28770 | -| total_timesteps | 323712 | -| train/ | | -| approx_kl | 0.0001946881 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.892 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 25280 | -| policy_gradient_loss | 0.00296 | -| std | 0.59 | -| value_loss | 5.83e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2530 | -| time_elapsed | 28774 | -| total_timesteps | 323840 | -| train/ | | -| approx_kl | 0.0013074749 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.892 | -| explained_variance | -0.336 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 25290 | -| policy_gradient_loss | -0.00106 | -| std | 0.591 | -| value_loss | 4.94e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2531 | -| time_elapsed | 28779 | -| total_timesteps | 323968 | -| train/ | | -| approx_kl | 0.0003564246 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.893 | -| explained_variance | -0.325 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 25300 | -| policy_gradient_loss | 0.00075 | -| std | 0.591 | -| value_loss | 1.95e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2532 | -| time_elapsed | 28783 | -| total_timesteps | 324096 | -| train/ | | -| approx_kl | 0.00059744576 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.894 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 25310 | -| policy_gradient_loss | 0.000257 | -| std | 0.592 | -| value_loss | 1.61e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2533 | -| time_elapsed | 28793 | -| total_timesteps | 324224 | -| train/ | | -| approx_kl | 0.018225837 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.895 | -| explained_variance | 0.501 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 25320 | -| policy_gradient_loss | -0.0146 | -| std | 0.592 | -| value_loss | 0.000618 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2534 | -| time_elapsed | 28797 | -| total_timesteps | 324352 | -| train/ | | -| approx_kl | 0.00417222 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.894 | -| explained_variance | -33.8 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 25330 | -| policy_gradient_loss | -0.00296 | -| std | 0.592 | -| value_loss | 4.79e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2535 | -| time_elapsed | 28801 | -| total_timesteps | 324480 | -| train/ | | -| approx_kl | 0.02132687 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | -0.894 | -| explained_variance | -62.2 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 25340 | -| policy_gradient_loss | -0.00265 | -| std | 0.591 | -| value_loss | 2.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2536 | -| time_elapsed | 28805 | -| total_timesteps | 324608 | -| train/ | | -| approx_kl | 0.0005200233 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.893 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.000961 | -| n_updates | 25350 | -| policy_gradient_loss | -6.89e-06 | -| std | 0.591 | -| value_loss | 4.56e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2537 | -| time_elapsed | 28808 | -| total_timesteps | 324736 | -| train/ | | -| approx_kl | 0.0022154797 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.892 | -| explained_variance | -2.63 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 25360 | -| policy_gradient_loss | -0.000342 | -| std | 0.59 | -| value_loss | 8.22e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2538 | -| time_elapsed | 28812 | -| total_timesteps | 324864 | -| train/ | | -| approx_kl | 0.019351946 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | -0.427 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 25370 | -| policy_gradient_loss | -0.00675 | -| std | 0.589 | -| value_loss | 5.83e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.37 | -| time/ | | -| fps | 11 | -| iterations | 2539 | -| time_elapsed | 28815 | -| total_timesteps | 324992 | -| train/ | | -| approx_kl | 0.010390732 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | -0.00444 | -| n_updates | 25380 | -| policy_gradient_loss | -0.00327 | -| std | 0.589 | -| value_loss | 2.2e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2540 | -| time_elapsed | 28820 | -| total_timesteps | 325120 | -| train/ | | -| approx_kl | 5.6892866e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 5.26e-05 | -| n_updates | 25390 | -| policy_gradient_loss | 0.0001 | -| std | 0.589 | -| value_loss | 2.13e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2541 | -| time_elapsed | 28830 | -| total_timesteps | 325248 | -| train/ | | -| approx_kl | 0.0008022385 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.891 | -| explained_variance | 0.653 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 25400 | -| policy_gradient_loss | -0.0111 | -| std | 0.59 | -| value_loss | 0.00494 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2542 | -| time_elapsed | 28835 | -| total_timesteps | 325376 | -| train/ | | -| approx_kl | 0.010685945 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.89 | -| explained_variance | -183 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 25410 | -| policy_gradient_loss | -0.00407 | -| std | 0.589 | -| value_loss | 1.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2543 | -| time_elapsed | 28838 | -| total_timesteps | 325504 | -| train/ | | -| approx_kl | 0.009860183 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.888 | -| explained_variance | -187 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 25420 | -| policy_gradient_loss | -0.000548 | -| std | 0.587 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2544 | -| time_elapsed | 28841 | -| total_timesteps | 325632 | -| train/ | | -| approx_kl | 0.0046996167 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.887 | -| explained_variance | -157 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 25430 | -| policy_gradient_loss | -0.00105 | -| std | 0.588 | -| value_loss | 8.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2545 | -| time_elapsed | 28845 | -| total_timesteps | 325760 | -| train/ | | -| approx_kl | 0.021101497 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.888 | -| explained_variance | -106 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 25440 | -| policy_gradient_loss | -0.0096 | -| std | 0.588 | -| value_loss | 3.35e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 11 | -| iterations | 2546 | -| time_elapsed | 28849 | -| total_timesteps | 325888 | -| train/ | | -| approx_kl | 0.0008094129 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | 0.000121 | -| n_updates | 25450 | -| policy_gradient_loss | 7.78e-05 | -| std | 0.589 | -| value_loss | 1.98e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2547 | -| time_elapsed | 28853 | -| total_timesteps | 326016 | -| train/ | | -| approx_kl | 0.007942988 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | -0.311 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 25460 | -| policy_gradient_loss | -0.00242 | -| std | 0.589 | -| value_loss | 1.38e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2548 | -| time_elapsed | 28863 | -| total_timesteps | 326144 | -| train/ | | -| approx_kl | 0.0015282712 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.889 | -| explained_variance | 0.792 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 25470 | -| policy_gradient_loss | -0.00597 | -| std | 0.588 | -| value_loss | 0.00151 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2549 | -| time_elapsed | 28867 | -| total_timesteps | 326272 | -| train/ | | -| approx_kl | 0.009612709 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.888 | -| explained_variance | 0.269 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 25480 | -| policy_gradient_loss | -0.0103 | -| std | 0.588 | -| value_loss | 6.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2550 | -| time_elapsed | 28871 | -| total_timesteps | 326400 | -| train/ | | -| approx_kl | 0.025356114 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.887 | -| explained_variance | -190 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 25490 | -| policy_gradient_loss | -0.0115 | -| std | 0.587 | -| value_loss | 3.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2551 | -| time_elapsed | 28875 | -| total_timesteps | 326528 | -| train/ | | -| approx_kl | 0.003911844 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -68.6 | -| learning_rate | 0.0003 | -| loss | -0.00848 | -| n_updates | 25500 | -| policy_gradient_loss | -0.00257 | -| std | 0.587 | -| value_loss | 7.1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2552 | -| time_elapsed | 28880 | -| total_timesteps | 326656 | -| train/ | | -| approx_kl | 0.022638455 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -4.37 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 25510 | -| policy_gradient_loss | -0.00397 | -| std | 0.587 | -| value_loss | 8.27e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2553 | -| time_elapsed | 28884 | -| total_timesteps | 326784 | -| train/ | | -| approx_kl | 0.008615494 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -0.000904 | -| n_updates | 25520 | -| policy_gradient_loss | -0.00242 | -| std | 0.586 | -| value_loss | 3.75e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2554 | -| time_elapsed | 28888 | -| total_timesteps | 326912 | -| train/ | | -| approx_kl | 0.006111257 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 25530 | -| policy_gradient_loss | -0.0019 | -| std | 0.586 | -| value_loss | 2.08e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2555 | -| time_elapsed | 28892 | -| total_timesteps | 327040 | -| train/ | | -| approx_kl | 0.008718063 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 25540 | -| policy_gradient_loss | -0.00152 | -| std | 0.586 | -| value_loss | 2.08e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2556 | -| time_elapsed | 28901 | -| total_timesteps | 327168 | -| train/ | | -| approx_kl | 0.0060593607 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | 0.778 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 25550 | -| policy_gradient_loss | -0.00991 | -| std | 0.585 | -| value_loss | 0.000404 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2557 | -| time_elapsed | 28905 | -| total_timesteps | 327296 | -| train/ | | -| approx_kl | 0.012165221 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 25560 | -| policy_gradient_loss | -0.00476 | -| std | 0.585 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2558 | -| time_elapsed | 28910 | -| total_timesteps | 327424 | -| train/ | | -| approx_kl | 0.017946383 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -15.1 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 25570 | -| policy_gradient_loss | -0.00201 | -| std | 0.584 | -| value_loss | 5.77e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2559 | -| time_elapsed | 28914 | -| total_timesteps | 327552 | -| train/ | | -| approx_kl | 0.0066944715 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.88 | -| explained_variance | -2.75 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 25580 | -| policy_gradient_loss | -0.00246 | -| std | 0.583 | -| value_loss | 1.87e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2560 | -| time_elapsed | 28918 | -| total_timesteps | 327680 | -| train/ | | -| approx_kl | 7.261988e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.879 | -| explained_variance | -0.472 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 25590 | -| policy_gradient_loss | 0.00279 | -| std | 0.583 | -| value_loss | 1.66e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2561 | -| time_elapsed | 28921 | -| total_timesteps | 327808 | -| train/ | | -| approx_kl | 0.013364689 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.878 | -| explained_variance | 0.00292 | -| learning_rate | 0.0003 | -| loss | -0.00391 | -| n_updates | 25600 | -| policy_gradient_loss | -0.00479 | -| std | 0.582 | -| value_loss | 4.83e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2562 | -| time_elapsed | 28925 | -| total_timesteps | 327936 | -| train/ | | -| approx_kl | 0.0063778833 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.878 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 25610 | -| policy_gradient_loss | -0.00234 | -| std | 0.582 | -| value_loss | 4.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2563 | -| time_elapsed | 28929 | -| total_timesteps | 328064 | -| train/ | | -| approx_kl | 0.012550885 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.879 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 25620 | -| policy_gradient_loss | -0.0034 | -| std | 0.584 | -| value_loss | 4.85e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2564 | -| time_elapsed | 28935 | -| total_timesteps | 328192 | -| train/ | | -| approx_kl | 0.00043922197 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | 0.537 | -| learning_rate | 0.0003 | -| loss | 0.00348 | -| n_updates | 25630 | -| policy_gradient_loss | -0.000162 | -| std | 0.585 | -| value_loss | 0.00814 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2565 | -| time_elapsed | 28938 | -| total_timesteps | 328320 | -| train/ | | -| approx_kl | 0.007023297 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -48.5 | -| learning_rate | 0.0003 | -| loss | -0.00826 | -| n_updates | 25640 | -| policy_gradient_loss | -0.00336 | -| std | 0.585 | -| value_loss | 9.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2566 | -| time_elapsed | 28941 | -| total_timesteps | 328448 | -| train/ | | -| approx_kl | 0.023374597 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -34.6 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 25650 | -| policy_gradient_loss | -0.00371 | -| std | 0.585 | -| value_loss | 3.69e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2567 | -| time_elapsed | 28945 | -| total_timesteps | 328576 | -| train/ | | -| approx_kl | 0.00042594853 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 25660 | -| policy_gradient_loss | 0.000358 | -| std | 0.586 | -| value_loss | 4.25e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2568 | -| time_elapsed | 28948 | -| total_timesteps | 328704 | -| train/ | | -| approx_kl | 0.00033170427 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.884 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 25670 | -| policy_gradient_loss | 0.000339 | -| std | 0.586 | -| value_loss | 3.1e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2569 | -| time_elapsed | 28952 | -| total_timesteps | 328832 | -| train/ | | -| approx_kl | 0.006422776 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.000444 | -| n_updates | 25680 | -| policy_gradient_loss | -0.000724 | -| std | 0.587 | -| value_loss | 3.24e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2570 | -| time_elapsed | 28955 | -| total_timesteps | 328960 | -| train/ | | -| approx_kl | 0.00078665745 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | -0.000668 | -| n_updates | 25690 | -| policy_gradient_loss | -0.000231 | -| std | 0.587 | -| value_loss | 1.09e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2571 | -| time_elapsed | 28958 | -| total_timesteps | 329088 | -| train/ | | -| approx_kl | 0.0021245296 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.886 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | -0.00577 | -| n_updates | 25700 | -| policy_gradient_loss | -0.0016 | -| std | 0.586 | -| value_loss | 5.47e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2572 | -| time_elapsed | 28965 | -| total_timesteps | 329216 | -| train/ | | -| approx_kl | 0.0042376784 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.885 | -| explained_variance | 0.637 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 25710 | -| policy_gradient_loss | -0.009 | -| std | 0.586 | -| value_loss | 0.00661 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2573 | -| time_elapsed | 28968 | -| total_timesteps | 329344 | -| train/ | | -| approx_kl | 0.008966963 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.883 | -| explained_variance | -199 | -| learning_rate | 0.0003 | -| loss | -0.00942 | -| n_updates | 25720 | -| policy_gradient_loss | -0.00579 | -| std | 0.585 | -| value_loss | 2.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2574 | -| time_elapsed | 28972 | -| total_timesteps | 329472 | -| train/ | | -| approx_kl | 0.018685836 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -186 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 25730 | -| policy_gradient_loss | -0.00726 | -| std | 0.585 | -| value_loss | 1.64e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2575 | -| time_elapsed | 28975 | -| total_timesteps | 329600 | -| train/ | | -| approx_kl | 2.0632986e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | -0.000586 | -| n_updates | 25740 | -| policy_gradient_loss | 0.00185 | -| std | 0.584 | -| value_loss | 1.79e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2576 | -| time_elapsed | 28978 | -| total_timesteps | 329728 | -| train/ | | -| approx_kl | 0.018460153 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -11.7 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 25750 | -| policy_gradient_loss | -0.00395 | -| std | 0.584 | -| value_loss | 1.93e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2577 | -| time_elapsed | 28981 | -| total_timesteps | 329856 | -| train/ | | -| approx_kl | 0.005863629 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.882 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | -0.000567 | -| n_updates | 25760 | -| policy_gradient_loss | -0.000363 | -| std | 0.584 | -| value_loss | 7.92e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2578 | -| time_elapsed | 28985 | -| total_timesteps | 329984 | -| train/ | | -| approx_kl | 0.0038588464 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.88 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 25770 | -| policy_gradient_loss | -0.000626 | -| std | 0.583 | -| value_loss | 2.8e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2579 | -| time_elapsed | 28989 | -| total_timesteps | 330112 | -| train/ | | -| approx_kl | 0.011758732 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.877 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | -0.00783 | -| n_updates | 25780 | -| policy_gradient_loss | -0.00496 | -| std | 0.581 | -| value_loss | 1.52e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2580 | -| time_elapsed | 28999 | -| total_timesteps | 330240 | -| train/ | | -| approx_kl | 0.005507751 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.873 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 25790 | -| policy_gradient_loss | -0.0115 | -| std | 0.578 | -| value_loss | 0.000555 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2581 | -| time_elapsed | 29003 | -| total_timesteps | 330368 | -| train/ | | -| approx_kl | 0.017662754 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.871 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 25800 | -| policy_gradient_loss | -0.00812 | -| std | 0.578 | -| value_loss | 6.48e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2582 | -| time_elapsed | 29007 | -| total_timesteps | 330496 | -| train/ | | -| approx_kl | 0.00011555059 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.871 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.000964 | -| n_updates | 25810 | -| policy_gradient_loss | 0.000527 | -| std | 0.578 | -| value_loss | 1.51e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2583 | -| time_elapsed | 29011 | -| total_timesteps | 330624 | -| train/ | | -| approx_kl | 0.0004316545 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.87 | -| explained_variance | -2.93 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 25820 | -| policy_gradient_loss | 0.000287 | -| std | 0.577 | -| value_loss | 6.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2584 | -| time_elapsed | 29014 | -| total_timesteps | 330752 | -| train/ | | -| approx_kl | 0.008763848 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.869 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | 0.0006 | -| n_updates | 25830 | -| policy_gradient_loss | -0.000958 | -| std | 0.577 | -| value_loss | 3.26e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2585 | -| time_elapsed | 29018 | -| total_timesteps | 330880 | -| train/ | | -| approx_kl | 0.0060403505 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.868 | -| explained_variance | -0.464 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 25840 | -| policy_gradient_loss | -0.00154 | -| std | 0.576 | -| value_loss | 9.29e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2586 | -| time_elapsed | 29021 | -| total_timesteps | 331008 | -| train/ | | -| approx_kl | 0.000838259 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.868 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.00017 | -| n_updates | 25850 | -| policy_gradient_loss | 0.000105 | -| std | 0.576 | -| value_loss | 4.38e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2587 | -| time_elapsed | 29030 | -| total_timesteps | 331136 | -| train/ | | -| approx_kl | 0.00036068144 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.868 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 25860 | -| policy_gradient_loss | -0.00561 | -| std | 0.577 | -| value_loss | 0.00138 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2588 | -| time_elapsed | 29034 | -| total_timesteps | 331264 | -| train/ | | -| approx_kl | 0.0063679544 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.869 | -| explained_variance | -1.49 | -| learning_rate | 0.0003 | -| loss | -0.00721 | -| n_updates | 25870 | -| policy_gradient_loss | -0.00298 | -| std | 0.577 | -| value_loss | 9.04e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2589 | -| time_elapsed | 29037 | -| total_timesteps | 331392 | -| train/ | | -| approx_kl | 3.9245933e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.87 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.000134 | -| n_updates | 25880 | -| policy_gradient_loss | 0.00107 | -| std | 0.577 | -| value_loss | 6.6e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2590 | -| time_elapsed | 29041 | -| total_timesteps | 331520 | -| train/ | | -| approx_kl | 5.511567e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.869 | -| explained_variance | -2.99 | -| learning_rate | 0.0003 | -| loss | -0.000218 | -| n_updates | 25890 | -| policy_gradient_loss | 0.000308 | -| std | 0.576 | -| value_loss | 2.23e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2591 | -| time_elapsed | 29045 | -| total_timesteps | 331648 | -| train/ | | -| approx_kl | 0.0004884994 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.866 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.000878 | -| n_updates | 25900 | -| policy_gradient_loss | -6.02e-05 | -| std | 0.575 | -| value_loss | 7.64e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2592 | -| time_elapsed | 29049 | -| total_timesteps | 331776 | -| train/ | | -| approx_kl | 0.0056880172 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.866 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 25910 | -| policy_gradient_loss | -0.000611 | -| std | 0.576 | -| value_loss | 4.97e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 11 | -| iterations | 2593 | -| time_elapsed | 29054 | -| total_timesteps | 331904 | -| train/ | | -| approx_kl | 0.001255384 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.869 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00084 | -| n_updates | 25920 | -| policy_gradient_loss | -0.000372 | -| std | 0.578 | -| value_loss | 2.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2594 | -| time_elapsed | 29058 | -| total_timesteps | 332032 | -| train/ | | -| approx_kl | 0.009425213 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.871 | -| explained_variance | -0.0791 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 25930 | -| policy_gradient_loss | -0.00344 | -| std | 0.578 | -| value_loss | 1.36e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2595 | -| time_elapsed | 29067 | -| total_timesteps | 332160 | -| train/ | | -| approx_kl | 0.0023335703 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.871 | -| explained_variance | 0.638 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 25940 | -| policy_gradient_loss | -0.00237 | -| std | 0.577 | -| value_loss | 0.00578 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2596 | -| time_elapsed | 29070 | -| total_timesteps | 332288 | -| train/ | | -| approx_kl | 0.0060276403 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.869 | -| explained_variance | -179 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 25950 | -| policy_gradient_loss | -0.00557 | -| std | 0.576 | -| value_loss | 1.82e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2597 | -| time_elapsed | 29074 | -| total_timesteps | 332416 | -| train/ | | -| approx_kl | 2.5238842e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.868 | -| explained_variance | -160 | -| learning_rate | 0.0003 | -| loss | 6.86e-05 | -| n_updates | 25960 | -| policy_gradient_loss | 0.0016 | -| std | 0.576 | -| value_loss | 7.5e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2598 | -| time_elapsed | 29078 | -| total_timesteps | 332544 | -| train/ | | -| approx_kl | 0.017204333 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.867 | -| explained_variance | -30.7 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 25970 | -| policy_gradient_loss | -0.012 | -| std | 0.576 | -| value_loss | 5.44e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2599 | -| time_elapsed | 29081 | -| total_timesteps | 332672 | -| train/ | | -| approx_kl | 0.0061625885 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.866 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 25980 | -| policy_gradient_loss | -0.00113 | -| std | 0.575 | -| value_loss | 1.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2600 | -| time_elapsed | 29084 | -| total_timesteps | 332800 | -| train/ | | -| approx_kl | 0.003266896 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.865 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 25990 | -| policy_gradient_loss | -0.00105 | -| std | 0.574 | -| value_loss | 6.24e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 11 | -| iterations | 2601 | -| time_elapsed | 29087 | -| total_timesteps | 332928 | -| train/ | | -| approx_kl | 0.008535424 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.863 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.000971 | -| n_updates | 26000 | -| policy_gradient_loss | -0.00178 | -| std | 0.573 | -| value_loss | 3.18e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2602 | -| time_elapsed | 29089 | -| total_timesteps | 333056 | -| train/ | | -| approx_kl | 0.0022974014 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 26010 | -| policy_gradient_loss | -0.00139 | -| std | 0.569 | -| value_loss | 3.75e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2603 | -| time_elapsed | 29096 | -| total_timesteps | 333184 | -| train/ | | -| approx_kl | 0.0007214376 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.852 | -| explained_variance | 0.624 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 26020 | -| policy_gradient_loss | -0.0051 | -| std | 0.566 | -| value_loss | 0.0055 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2604 | -| time_elapsed | 29100 | -| total_timesteps | 333312 | -| train/ | | -| approx_kl | 0.005163266 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.848 | -| explained_variance | -3.38 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 26030 | -| policy_gradient_loss | -0.00562 | -| std | 0.564 | -| value_loss | 2.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2605 | -| time_elapsed | 29104 | -| total_timesteps | 333440 | -| train/ | | -| approx_kl | 0.0004056117 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -1.53 | -| learning_rate | 0.0003 | -| loss | 0.000597 | -| n_updates | 26040 | -| policy_gradient_loss | 0.000524 | -| std | 0.563 | -| value_loss | 9.83e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2606 | -| time_elapsed | 29108 | -| total_timesteps | 333568 | -| train/ | | -| approx_kl | 0.000528435 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.844 | -| explained_variance | -0.258 | -| learning_rate | 0.0003 | -| loss | -0.00072 | -| n_updates | 26050 | -| policy_gradient_loss | -0.0002 | -| std | 0.562 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2607 | -| time_elapsed | 29111 | -| total_timesteps | 333696 | -| train/ | | -| approx_kl | 0.015122355 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 26060 | -| policy_gradient_loss | -0.0079 | -| std | 0.562 | -| value_loss | 3.3e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2608 | -| time_elapsed | 29115 | -| total_timesteps | 333824 | -| train/ | | -| approx_kl | 0.0019624282 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | 0.00162 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 26070 | -| policy_gradient_loss | -0.0017 | -| std | 0.561 | -| value_loss | 1.66e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2609 | -| time_elapsed | 29119 | -| total_timesteps | 333952 | -| train/ | | -| approx_kl | 0.01320341 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 26080 | -| policy_gradient_loss | -0.00262 | -| std | 0.561 | -| value_loss | 1.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2610 | -| time_elapsed | 29123 | -| total_timesteps | 334080 | -| train/ | | -| approx_kl | 0.007336096 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 26090 | -| policy_gradient_loss | -0.0057 | -| std | 0.56 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2611 | -| time_elapsed | 29131 | -| total_timesteps | 334208 | -| train/ | | -| approx_kl | 0.007900592 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.839 | -| explained_variance | 0.618 | -| learning_rate | 0.0003 | -| loss | -0.00808 | -| n_updates | 26100 | -| policy_gradient_loss | -0.00521 | -| std | 0.56 | -| value_loss | 0.00671 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2612 | -| time_elapsed | 29135 | -| total_timesteps | 334336 | -| train/ | | -| approx_kl | 0.0127429385 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -16.7 | -| learning_rate | 0.0003 | -| loss | -0.00941 | -| n_updates | 26110 | -| policy_gradient_loss | -0.00575 | -| std | 0.559 | -| value_loss | 3.84e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2613 | -| time_elapsed | 29139 | -| total_timesteps | 334464 | -| train/ | | -| approx_kl | 0.016897166 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.007 | -| n_updates | 26120 | -| policy_gradient_loss | -0.00426 | -| std | 0.558 | -| value_loss | 1.39e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2614 | -| time_elapsed | 29144 | -| total_timesteps | 334592 | -| train/ | | -| approx_kl | 0.0004894468 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.52 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 26130 | -| policy_gradient_loss | 0.000319 | -| std | 0.559 | -| value_loss | 3.94e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2615 | -| time_elapsed | 29147 | -| total_timesteps | 334720 | -| train/ | | -| approx_kl | 0.000407106 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00839 | -| n_updates | 26140 | -| policy_gradient_loss | 0.00159 | -| std | 0.559 | -| value_loss | 5.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2616 | -| time_elapsed | 29150 | -| total_timesteps | 334848 | -| train/ | | -| approx_kl | 0.020801922 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 26150 | -| policy_gradient_loss | -0.0157 | -| std | 0.559 | -| value_loss | 2.64e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2617 | -| time_elapsed | 29154 | -| total_timesteps | 334976 | -| train/ | | -| approx_kl | 0.0019890328 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.0044 | -| n_updates | 26160 | -| policy_gradient_loss | -0.00111 | -| std | 0.56 | -| value_loss | 1.43e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2618 | -| time_elapsed | 29157 | -| total_timesteps | 335104 | -| train/ | | -| approx_kl | 0.00014871941 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 26170 | -| policy_gradient_loss | 0.00252 | -| std | 0.561 | -| value_loss | 1.04e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2619 | -| time_elapsed | 29165 | -| total_timesteps | 335232 | -| train/ | | -| approx_kl | 0.004634006 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 26180 | -| policy_gradient_loss | -0.00361 | -| std | 0.56 | -| value_loss | 0.00127 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2620 | -| time_elapsed | 29168 | -| total_timesteps | 335360 | -| train/ | | -| approx_kl | 0.012598085 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -20.8 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 26190 | -| policy_gradient_loss | -0.00834 | -| std | 0.56 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2621 | -| time_elapsed | 29172 | -| total_timesteps | 335488 | -| train/ | | -| approx_kl | 0.012272014 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | 0.00244 | -| n_updates | 26200 | -| policy_gradient_loss | -0.00057 | -| std | 0.562 | -| value_loss | 8.03e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2622 | -| time_elapsed | 29175 | -| total_timesteps | 335616 | -| train/ | | -| approx_kl | 0.00083901896 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.844 | -| explained_variance | -15.8 | -| learning_rate | 0.0003 | -| loss | -0.000298 | -| n_updates | 26210 | -| policy_gradient_loss | -0.000127 | -| std | 0.563 | -| value_loss | 2.83e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2623 | -| time_elapsed | 29177 | -| total_timesteps | 335744 | -| train/ | | -| approx_kl | 0.011069873 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 26220 | -| policy_gradient_loss | -0.00493 | -| std | 0.563 | -| value_loss | 4.66e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2624 | -| time_elapsed | 29180 | -| total_timesteps | 335872 | -| train/ | | -| approx_kl | 0.018193021 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -0.0848 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 26230 | -| policy_gradient_loss | -0.0132 | -| std | 0.563 | -| value_loss | 3.28e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2625 | -| time_elapsed | 29184 | -| total_timesteps | 336000 | -| train/ | | -| approx_kl | 0.000579871 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.000386 | -| n_updates | 26240 | -| policy_gradient_loss | 0.000284 | -| std | 0.563 | -| value_loss | 3.29e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2626 | -| time_elapsed | 29187 | -| total_timesteps | 336128 | -| train/ | | -| approx_kl | 0.00026100525 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -0.000127 | -| learning_rate | 0.0003 | -| loss | -0.000133 | -| n_updates | 26250 | -| policy_gradient_loss | -5.73e-05 | -| std | 0.563 | -| value_loss | 1.52e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2627 | -| time_elapsed | 29195 | -| total_timesteps | 336256 | -| train/ | | -| approx_kl | 0.0070509054 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.846 | -| explained_variance | -3.86 | -| learning_rate | 0.0003 | -| loss | -0.00765 | -| n_updates | 26260 | -| policy_gradient_loss | -0.00434 | -| std | 0.565 | -| value_loss | 0.00219 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2628 | -| time_elapsed | 29198 | -| total_timesteps | 336384 | -| train/ | | -| approx_kl | 0.001091799 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.849 | -| explained_variance | -222 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 26270 | -| policy_gradient_loss | -0.00107 | -| std | 0.566 | -| value_loss | 2.22e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2629 | -| time_elapsed | 29202 | -| total_timesteps | 336512 | -| train/ | | -| approx_kl | 0.0002736468 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.851 | -| explained_variance | -119 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 26280 | -| policy_gradient_loss | 0.000421 | -| std | 0.567 | -| value_loss | 4.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2630 | -| time_elapsed | 29206 | -| total_timesteps | 336640 | -| train/ | | -| approx_kl | 0.011051535 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.851 | -| explained_variance | -41 | -| learning_rate | 0.0003 | -| loss | -0.000848 | -| n_updates | 26290 | -| policy_gradient_loss | -0.000623 | -| std | 0.567 | -| value_loss | 5.24e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2631 | -| time_elapsed | 29209 | -| total_timesteps | 336768 | -| train/ | | -| approx_kl | 0.0024338407 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.852 | -| explained_variance | -0.67 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 26300 | -| policy_gradient_loss | -0.0011 | -| std | 0.568 | -| value_loss | 8.48e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2632 | -| time_elapsed | 29213 | -| total_timesteps | 336896 | -| train/ | | -| approx_kl | 0.004477908 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.855 | -| explained_variance | -0.078 | -| learning_rate | 0.0003 | -| loss | 0.000216 | -| n_updates | 26310 | -| policy_gradient_loss | -0.000111 | -| std | 0.57 | -| value_loss | 4.99e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2633 | -| time_elapsed | 29216 | -| total_timesteps | 337024 | -| train/ | | -| approx_kl | 0.0001973852 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.856 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | -0.000177 | -| n_updates | 26320 | -| policy_gradient_loss | -6.54e-05 | -| std | 0.569 | -| value_loss | 2.61e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2634 | -| time_elapsed | 29224 | -| total_timesteps | 337152 | -| train/ | | -| approx_kl | 0.0010943445 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.855 | -| explained_variance | 0.667 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 26330 | -| policy_gradient_loss | -0.00246 | -| std | 0.568 | -| value_loss | 0.00602 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2635 | -| time_elapsed | 29227 | -| total_timesteps | 337280 | -| train/ | | -| approx_kl | 0.010204184 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.852 | -| explained_variance | -79.4 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 26340 | -| policy_gradient_loss | -0.00386 | -| std | 0.567 | -| value_loss | 2.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2636 | -| time_elapsed | 29232 | -| total_timesteps | 337408 | -| train/ | | -| approx_kl | 0.010337242 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.852 | -| explained_variance | -240 | -| learning_rate | 0.0003 | -| loss | -0.00561 | -| n_updates | 26350 | -| policy_gradient_loss | -0.00246 | -| std | 0.567 | -| value_loss | 8.14e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2637 | -| time_elapsed | 29237 | -| total_timesteps | 337536 | -| train/ | | -| approx_kl | 0.02229481 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.851 | -| explained_variance | -63.3 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 26360 | -| policy_gradient_loss | -0.0117 | -| std | 0.566 | -| value_loss | 2.56e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2638 | -| time_elapsed | 29240 | -| total_timesteps | 337664 | -| train/ | | -| approx_kl | 0.0035556185 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.85 | -| explained_variance | -0.0874 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 26370 | -| policy_gradient_loss | -0.00139 | -| std | 0.566 | -| value_loss | 2.51e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2639 | -| time_elapsed | 29243 | -| total_timesteps | 337792 | -| train/ | | -| approx_kl | 0.0012281807 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.848 | -| explained_variance | -0.736 | -| learning_rate | 0.0003 | -| loss | 0.000433 | -| n_updates | 26380 | -| policy_gradient_loss | 0.000549 | -| std | 0.564 | -| value_loss | 3.5e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.94 | -| time/ | | -| fps | 11 | -| iterations | 2640 | -| time_elapsed | 29246 | -| total_timesteps | 337920 | -| train/ | | -| approx_kl | 0.004368767 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | -0.00952 | -| n_updates | 26390 | -| policy_gradient_loss | -0.00336 | -| std | 0.562 | -| value_loss | 2.21e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2641 | -| time_elapsed | 29250 | -| total_timesteps | 338048 | -| train/ | | -| approx_kl | 3.298861e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | 0.00657 | -| learning_rate | 0.0003 | -| loss | -0.000619 | -| n_updates | 26400 | -| policy_gradient_loss | 0.00131 | -| std | 0.561 | -| value_loss | 9.66e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2642 | -| time_elapsed | 29256 | -| total_timesteps | 338176 | -| train/ | | -| approx_kl | 0.0024902518 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 26410 | -| policy_gradient_loss | -0.0028 | -| std | 0.559 | -| value_loss | 0.0018 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2643 | -| time_elapsed | 29260 | -| total_timesteps | 338304 | -| train/ | | -| approx_kl | 0.004905084 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 26420 | -| policy_gradient_loss | -0.00375 | -| std | 0.559 | -| value_loss | 1.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2644 | -| time_elapsed | 29264 | -| total_timesteps | 338432 | -| train/ | | -| approx_kl | 0.017953146 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -94.2 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 26430 | -| policy_gradient_loss | -0.0113 | -| std | 0.559 | -| value_loss | 5.27e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2645 | -| time_elapsed | 29267 | -| total_timesteps | 338560 | -| train/ | | -| approx_kl | 0.0003286628 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -8 | -| learning_rate | 0.0003 | -| loss | -0.000222 | -| n_updates | 26440 | -| policy_gradient_loss | -7.81e-05 | -| std | 0.56 | -| value_loss | 3.2e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2646 | -| time_elapsed | 29272 | -| total_timesteps | 338688 | -| train/ | | -| approx_kl | 0.01085349 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 26450 | -| policy_gradient_loss | -0.00379 | -| std | 0.561 | -| value_loss | 1.38e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2647 | -| time_elapsed | 29276 | -| total_timesteps | 338816 | -| train/ | | -| approx_kl | 0.01976089 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | -0.458 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 26460 | -| policy_gradient_loss | -0.0116 | -| std | 0.561 | -| value_loss | 8.21e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2648 | -| time_elapsed | 29280 | -| total_timesteps | 338944 | -| train/ | | -| approx_kl | 0.015493228 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 26470 | -| policy_gradient_loss | -0.00395 | -| std | 0.562 | -| value_loss | 8.4e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2649 | -| time_elapsed | 29283 | -| total_timesteps | 339072 | -| train/ | | -| approx_kl | 0.007624488 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.843 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 26480 | -| policy_gradient_loss | -0.00202 | -| std | 0.563 | -| value_loss | 3.55e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2650 | -| time_elapsed | 29289 | -| total_timesteps | 339200 | -| train/ | | -| approx_kl | 0.011914983 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.844 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 26490 | -| policy_gradient_loss | -0.00845 | -| std | 0.563 | -| value_loss | 0.00258 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2651 | -| time_elapsed | 29291 | -| total_timesteps | 339328 | -| train/ | | -| approx_kl | 0.02083198 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -96.1 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 26500 | -| policy_gradient_loss | -0.0124 | -| std | 0.564 | -| value_loss | 1.76e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2652 | -| time_elapsed | 29295 | -| total_timesteps | 339456 | -| train/ | | -| approx_kl | 0.007652811 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.847 | -| explained_variance | -210 | -| learning_rate | 0.0003 | -| loss | -0.000726 | -| n_updates | 26510 | -| policy_gradient_loss | -0.0011 | -| std | 0.565 | -| value_loss | 5.7e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2653 | -| time_elapsed | 29298 | -| total_timesteps | 339584 | -| train/ | | -| approx_kl | 0.0064109135 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.849 | -| explained_variance | -32.5 | -| learning_rate | 0.0003 | -| loss | -0.00949 | -| n_updates | 26520 | -| policy_gradient_loss | -0.00475 | -| std | 0.566 | -| value_loss | 1.55e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2654 | -| time_elapsed | 29302 | -| total_timesteps | 339712 | -| train/ | | -| approx_kl | 0.01684188 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.851 | -| explained_variance | 0.00343 | -| learning_rate | 0.0003 | -| loss | 0.00315 | -| n_updates | 26530 | -| policy_gradient_loss | -0.00104 | -| std | 0.567 | -| value_loss | 3.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2655 | -| time_elapsed | 29306 | -| total_timesteps | 339840 | -| train/ | | -| approx_kl | 0.010514434 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.853 | -| explained_variance | -0.546 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 26540 | -| policy_gradient_loss | -0.00287 | -| std | 0.568 | -| value_loss | 1.05e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2656 | -| time_elapsed | 29310 | -| total_timesteps | 339968 | -| train/ | | -| approx_kl | 6.7252666e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.853 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.000223 | -| n_updates | 26550 | -| policy_gradient_loss | 0.000134 | -| std | 0.567 | -| value_loss | 5.25e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2657 | -| time_elapsed | 29314 | -| total_timesteps | 340096 | -| train/ | | -| approx_kl | 0.00046893395 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.852 | -| explained_variance | 0.00775 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 26560 | -| policy_gradient_loss | 0.00011 | -| std | 0.568 | -| value_loss | 0.00221 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2658 | -| time_elapsed | 29320 | -| total_timesteps | 340224 | -| train/ | | -| approx_kl | 0.007919464 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.854 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.059 | -| n_updates | 26570 | -| policy_gradient_loss | -0.00346 | -| std | 0.569 | -| value_loss | 0.185 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2659 | -| time_elapsed | 29321 | -| total_timesteps | 340352 | -| train/ | | -| approx_kl | 0.018192206 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.855 | -| explained_variance | 0.00342 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 26580 | -| policy_gradient_loss | -0.00688 | -| std | 0.57 | -| value_loss | 0.336 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2660 | -| time_elapsed | 29325 | -| total_timesteps | 340480 | -| train/ | | -| approx_kl | 0.010877917 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.00151 | -| learning_rate | 0.0003 | -| loss | 0.0767 | -| n_updates | 26590 | -| policy_gradient_loss | -0.00341 | -| std | 0.57 | -| value_loss | 0.173 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2661 | -| time_elapsed | 29327 | -| total_timesteps | 340608 | -| train/ | | -| approx_kl | 0.0030198863 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | -0.0009 | -| learning_rate | 0.0003 | -| loss | 0.26 | -| n_updates | 26600 | -| policy_gradient_loss | -0.00108 | -| std | 0.57 | -| value_loss | 0.54 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2662 | -| time_elapsed | 29331 | -| total_timesteps | 340736 | -| train/ | | -| approx_kl | 0.018574057 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | -0.00347 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 26610 | -| policy_gradient_loss | -0.0078 | -| std | 0.57 | -| value_loss | 0.0482 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2663 | -| time_elapsed | 29334 | -| total_timesteps | 340864 | -| train/ | | -| approx_kl | 0.012866519 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | -0.00438 | -| learning_rate | 0.0003 | -| loss | -0.000814 | -| n_updates | 26620 | -| policy_gradient_loss | -0.00635 | -| std | 0.57 | -| value_loss | 0.0346 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.95 | -| time/ | | -| fps | 11 | -| iterations | 2664 | -| time_elapsed | 29338 | -| total_timesteps | 340992 | -| train/ | | -| approx_kl | 0.008826596 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.00534 | -| n_updates | 26630 | -| policy_gradient_loss | -0.00189 | -| std | 0.572 | -| value_loss | 0.0129 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2665 | -| time_elapsed | 29341 | -| total_timesteps | 341120 | -| train/ | | -| approx_kl | 0.0073745395 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.86 | -| explained_variance | 0.00231 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 26640 | -| policy_gradient_loss | -0.00358 | -| std | 0.572 | -| value_loss | 0.473 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2666 | -| time_elapsed | 29350 | -| total_timesteps | 341248 | -| train/ | | -| approx_kl | 0.0033712792 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.86 | -| explained_variance | 0.00301 | -| learning_rate | 0.0003 | -| loss | 0.0674 | -| n_updates | 26650 | -| policy_gradient_loss | 0.000626 | -| std | 0.572 | -| value_loss | 0.195 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2667 | -| time_elapsed | 29353 | -| total_timesteps | 341376 | -| train/ | | -| approx_kl | 0.009758158 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.86 | -| explained_variance | -0.000118 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 26660 | -| policy_gradient_loss | -0.00549 | -| std | 0.572 | -| value_loss | 0.0179 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2668 | -| time_elapsed | 29357 | -| total_timesteps | 341504 | -| train/ | | -| approx_kl | 4.7240406e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | 0.000187 | -| learning_rate | 0.0003 | -| loss | 0.00309 | -| n_updates | 26670 | -| policy_gradient_loss | 0.00195 | -| std | 0.571 | -| value_loss | 0.0198 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2669 | -| time_elapsed | 29360 | -| total_timesteps | 341632 | -| train/ | | -| approx_kl | 0.014167389 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | 0.00134 | -| learning_rate | 0.0003 | -| loss | 0.00187 | -| n_updates | 26680 | -| policy_gradient_loss | -0.00267 | -| std | 0.571 | -| value_loss | 0.00909 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2670 | -| time_elapsed | 29364 | -| total_timesteps | 341760 | -| train/ | | -| approx_kl | 0.009507846 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | -0.00187 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 26690 | -| policy_gradient_loss | -0.00735 | -| std | 0.571 | -| value_loss | 0.0162 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 11 | -| iterations | 2671 | -| time_elapsed | 29367 | -| total_timesteps | 341888 | -| train/ | | -| approx_kl | 0.00040524662 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | -0.0022 | -| learning_rate | 0.0003 | -| loss | -0.000919 | -| n_updates | 26700 | -| policy_gradient_loss | 0.000617 | -| std | 0.571 | -| value_loss | 0.00933 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2672 | -| time_elapsed | 29371 | -| total_timesteps | 342016 | -| train/ | | -| approx_kl | 0.0006380649 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 26710 | -| policy_gradient_loss | 0.000384 | -| std | 0.571 | -| value_loss | 0.00569 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2673 | -| time_elapsed | 29381 | -| total_timesteps | 342144 | -| train/ | | -| approx_kl | 0.00011562486 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | 0.105 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 26720 | -| policy_gradient_loss | -0.000563 | -| std | 0.571 | -| value_loss | 0.0437 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2674 | -| time_elapsed | 29385 | -| total_timesteps | 342272 | -| train/ | | -| approx_kl | 0.0015732287 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 26730 | -| policy_gradient_loss | -0.000373 | -| std | 0.57 | -| value_loss | 0.00346 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2675 | -| time_elapsed | 29388 | -| total_timesteps | 342400 | -| train/ | | -| approx_kl | 0.0015839571 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.0063 | -| learning_rate | 0.0003 | -| loss | 0.00118 | -| n_updates | 26740 | -| policy_gradient_loss | 0.000705 | -| std | 0.57 | -| value_loss | 0.00121 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2676 | -| time_elapsed | 29391 | -| total_timesteps | 342528 | -| train/ | | -| approx_kl | 0.0070789875 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 26750 | -| policy_gradient_loss | -0.00288 | -| std | 0.571 | -| value_loss | 0.0019 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2677 | -| time_elapsed | 29394 | -| total_timesteps | 342656 | -| train/ | | -| approx_kl | 0.015380662 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | -0.0892 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 26760 | -| policy_gradient_loss | -0.0093 | -| std | 0.571 | -| value_loss | 0.000816 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2678 | -| time_elapsed | 29397 | -| total_timesteps | 342784 | -| train/ | | -| approx_kl | 0.00011177454 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | -0.082 | -| learning_rate | 0.0003 | -| loss | 0.000309 | -| n_updates | 26770 | -| policy_gradient_loss | 0.000292 | -| std | 0.571 | -| value_loss | 0.000777 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.1 | -| time/ | | -| fps | 11 | -| iterations | 2679 | -| time_elapsed | 29400 | -| total_timesteps | 342912 | -| train/ | | -| approx_kl | 0.008937091 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.86 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 26780 | -| policy_gradient_loss | -0.00204 | -| std | 0.572 | -| value_loss | 0.000858 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2680 | -| time_elapsed | 29404 | -| total_timesteps | 343040 | -| train/ | | -| approx_kl | 0.00013296236 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.86 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -6.77e-05 | -| n_updates | 26790 | -| policy_gradient_loss | -4.77e-05 | -| std | 0.572 | -| value_loss | 0.000312 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2681 | -| time_elapsed | 29411 | -| total_timesteps | 343168 | -| train/ | | -| approx_kl | 0.000488858 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.862 | -| explained_variance | 0.718 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 26800 | -| policy_gradient_loss | -0.00182 | -| std | 0.574 | -| value_loss | 0.00229 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2682 | -| time_elapsed | 29415 | -| total_timesteps | 343296 | -| train/ | | -| approx_kl | 0.006480113 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.866 | -| explained_variance | -0.0516 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 26810 | -| policy_gradient_loss | -0.00303 | -| std | 0.575 | -| value_loss | 0.000349 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2683 | -| time_elapsed | 29417 | -| total_timesteps | 343424 | -| train/ | | -| approx_kl | 0.0020542603 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.866 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 26820 | -| policy_gradient_loss | -0.00103 | -| std | 0.575 | -| value_loss | 0.000237 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2684 | -| time_elapsed | 29421 | -| total_timesteps | 343552 | -| train/ | | -| approx_kl | 0.008602693 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.866 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 0.000472 | -| n_updates | 26830 | -| policy_gradient_loss | -0.000418 | -| std | 0.575 | -| value_loss | 7.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2685 | -| time_elapsed | 29425 | -| total_timesteps | 343680 | -| train/ | | -| approx_kl | 0.004667489 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.865 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.00487 | -| n_updates | 26840 | -| policy_gradient_loss | -0.00204 | -| std | 0.575 | -| value_loss | 6.94e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2686 | -| time_elapsed | 29428 | -| total_timesteps | 343808 | -| train/ | | -| approx_kl | 0.009318189 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.867 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.000383 | -| n_updates | 26850 | -| policy_gradient_loss | -0.0012 | -| std | 0.577 | -| value_loss | 5.85e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2687 | -| time_elapsed | 29431 | -| total_timesteps | 343936 | -| train/ | | -| approx_kl | 0.0074950764 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.87 | -| explained_variance | -0.000906 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 26860 | -| policy_gradient_loss | -0.00441 | -| std | 0.578 | -| value_loss | 6.66e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2688 | -| time_elapsed | 29435 | -| total_timesteps | 344064 | -| train/ | | -| approx_kl | 0.008501331 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.872 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.000592 | -| n_updates | 26870 | -| policy_gradient_loss | -0.000935 | -| std | 0.579 | -| value_loss | 3.8e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2689 | -| time_elapsed | 29441 | -| total_timesteps | 344192 | -| train/ | | -| approx_kl | 0.00079833204 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.873 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 26880 | -| policy_gradient_loss | -0.000698 | -| std | 0.579 | -| value_loss | 0.000843 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2690 | -| time_elapsed | 29445 | -| total_timesteps | 344320 | -| train/ | | -| approx_kl | 0.0030704096 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.872 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 26890 | -| policy_gradient_loss | -0.000776 | -| std | 0.579 | -| value_loss | 2.5e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2691 | -| time_elapsed | 29448 | -| total_timesteps | 344448 | -| train/ | | -| approx_kl | 0.01210144 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -0.871 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 26900 | -| policy_gradient_loss | -0.00237 | -| std | 0.577 | -| value_loss | 2.25e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2692 | -| time_elapsed | 29452 | -| total_timesteps | 344576 | -| train/ | | -| approx_kl | 0.007577234 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.869 | -| explained_variance | -0.00675 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 26910 | -| policy_gradient_loss | -0.00214 | -| std | 0.577 | -| value_loss | 1.96e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2693 | -| time_elapsed | 29455 | -| total_timesteps | 344704 | -| train/ | | -| approx_kl | 0.0008482381 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.868 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 26920 | -| policy_gradient_loss | -0.000304 | -| std | 0.576 | -| value_loss | 1.84e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2694 | -| time_elapsed | 29459 | -| total_timesteps | 344832 | -| train/ | | -| approx_kl | 0.00096768234 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.865 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 26930 | -| policy_gradient_loss | -8.66e-05 | -| std | 0.574 | -| value_loss | 1.66e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2695 | -| time_elapsed | 29462 | -| total_timesteps | 344960 | -| train/ | | -| approx_kl | 0.00076993345 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.863 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.000285 | -| n_updates | 26940 | -| policy_gradient_loss | 0.000443 | -| std | 0.572 | -| value_loss | 1.13e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2696 | -| time_elapsed | 29465 | -| total_timesteps | 345088 | -| train/ | | -| approx_kl | 0.0077546425 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.859 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 26950 | -| policy_gradient_loss | -0.00146 | -| std | 0.57 | -| value_loss | 9.75e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2697 | -| time_elapsed | 29473 | -| total_timesteps | 345216 | -| train/ | | -| approx_kl | 0.00084746815 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 26960 | -| policy_gradient_loss | -0.0081 | -| std | 0.569 | -| value_loss | 0.000309 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2698 | -| time_elapsed | 29477 | -| total_timesteps | 345344 | -| train/ | | -| approx_kl | 0.009328388 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.856 | -| explained_variance | 0.0202 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 26970 | -| policy_gradient_loss | -0.00267 | -| std | 0.57 | -| value_loss | 1.02e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2699 | -| time_elapsed | 29482 | -| total_timesteps | 345472 | -| train/ | | -| approx_kl | 0.017220017 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 26980 | -| policy_gradient_loss | -0.00813 | -| std | 0.57 | -| value_loss | 6.72e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2700 | -| time_elapsed | 29487 | -| total_timesteps | 345600 | -| train/ | | -| approx_kl | 0.0052270247 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.0182 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 26990 | -| policy_gradient_loss | -0.00114 | -| std | 0.57 | -| value_loss | 4.2e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2701 | -| time_elapsed | 29491 | -| total_timesteps | 345728 | -| train/ | | -| approx_kl | 0.0032177656 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | -0.00581 | -| n_updates | 27000 | -| policy_gradient_loss | -0.00164 | -| std | 0.571 | -| value_loss | 3.81e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2702 | -| time_elapsed | 29494 | -| total_timesteps | 345856 | -| train/ | | -| approx_kl | 0.01726634 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 27010 | -| policy_gradient_loss | -0.00427 | -| std | 0.571 | -| value_loss | 3.2e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2703 | -| time_elapsed | 29499 | -| total_timesteps | 345984 | -| train/ | | -| approx_kl | 2.5774352e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.858 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -1.99e-05 | -| n_updates | 27020 | -| policy_gradient_loss | 6.47e-05 | -| std | 0.571 | -| value_loss | 2.6e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2704 | -| time_elapsed | 29502 | -| total_timesteps | 346112 | -| train/ | | -| approx_kl | 0.01059977 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | -0.0081 | -| n_updates | 27030 | -| policy_gradient_loss | -0.0042 | -| std | 0.57 | -| value_loss | 2.09e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2705 | -| time_elapsed | 29510 | -| total_timesteps | 346240 | -| train/ | | -| approx_kl | 0.0073023792 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 27040 | -| policy_gradient_loss | -0.00585 | -| std | 0.57 | -| value_loss | 0.00197 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2706 | -| time_elapsed | 29514 | -| total_timesteps | 346368 | -| train/ | | -| approx_kl | 0.009100011 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.856 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 27050 | -| policy_gradient_loss | -0.00318 | -| std | 0.57 | -| value_loss | 2.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2707 | -| time_elapsed | 29518 | -| total_timesteps | 346496 | -| train/ | | -| approx_kl | 0.012315835 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.856 | -| explained_variance | 0.0215 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 27060 | -| policy_gradient_loss | -0.00215 | -| std | 0.57 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2708 | -| time_elapsed | 29521 | -| total_timesteps | 346624 | -| train/ | | -| approx_kl | 0.009351989 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.857 | -| explained_variance | 0.00333 | -| learning_rate | 0.0003 | -| loss | -0.00972 | -| n_updates | 27070 | -| policy_gradient_loss | -0.00553 | -| std | 0.57 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2709 | -| time_elapsed | 29524 | -| total_timesteps | 346752 | -| train/ | | -| approx_kl | 0.0019190621 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.856 | -| explained_variance | -0.0801 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 27080 | -| policy_gradient_loss | -0.000816 | -| std | 0.568 | -| value_loss | 7.71e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2710 | -| time_elapsed | 29528 | -| total_timesteps | 346880 | -| train/ | | -| approx_kl | 0.013759184 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.853 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.000377 | -| n_updates | 27090 | -| policy_gradient_loss | -0.00202 | -| std | 0.567 | -| value_loss | 5.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2711 | -| time_elapsed | 29532 | -| total_timesteps | 347008 | -| train/ | | -| approx_kl | 0.009857967 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.85 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 27100 | -| policy_gradient_loss | -0.00271 | -| std | 0.566 | -| value_loss | 5.31e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2712 | -| time_elapsed | 29541 | -| total_timesteps | 347136 | -| train/ | | -| approx_kl | 0.0022481594 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.848 | -| explained_variance | 0.777 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 27110 | -| policy_gradient_loss | -0.00485 | -| std | 0.563 | -| value_loss | 0.00157 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2713 | -| time_elapsed | 29545 | -| total_timesteps | 347264 | -| train/ | | -| approx_kl | 0.009103399 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.843 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 27120 | -| policy_gradient_loss | -0.00537 | -| std | 0.561 | -| value_loss | 2.2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2714 | -| time_elapsed | 29548 | -| total_timesteps | 347392 | -| train/ | | -| approx_kl | 0.010567727 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 27130 | -| policy_gradient_loss | -0.00226 | -| std | 0.56 | -| value_loss | 1.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2715 | -| time_elapsed | 29551 | -| total_timesteps | 347520 | -| train/ | | -| approx_kl | 0.010346304 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -0.0081 | -| learning_rate | 0.0003 | -| loss | -0.00878 | -| n_updates | 27140 | -| policy_gradient_loss | -0.00508 | -| std | 0.559 | -| value_loss | 6.58e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2716 | -| time_elapsed | 29555 | -| total_timesteps | 347648 | -| train/ | | -| approx_kl | 0.00036508823 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.000766 | -| n_updates | 27150 | -| policy_gradient_loss | 6.88e-05 | -| std | 0.559 | -| value_loss | 5.98e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2717 | -| time_elapsed | 29557 | -| total_timesteps | 347776 | -| train/ | | -| approx_kl | 0.0076715164 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 27160 | -| policy_gradient_loss | -0.00112 | -| std | 0.558 | -| value_loss | 5.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2718 | -| time_elapsed | 29560 | -| total_timesteps | 347904 | -| train/ | | -| approx_kl | 0.00863189 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.833 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 27170 | -| policy_gradient_loss | -0.0022 | -| std | 0.556 | -| value_loss | 5.12e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2719 | -| time_elapsed | 29564 | -| total_timesteps | 348032 | -| train/ | | -| approx_kl | 8.433778e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.83 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.000266 | -| n_updates | 27180 | -| policy_gradient_loss | 0.00018 | -| std | 0.554 | -| value_loss | 4.65e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2720 | -| time_elapsed | 29571 | -| total_timesteps | 348160 | -| train/ | | -| approx_kl | 0.0017334651 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.827 | -| explained_variance | -0.0818 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 27190 | -| policy_gradient_loss | -0.0078 | -| std | 0.553 | -| value_loss | 0.00128 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2721 | -| time_elapsed | 29574 | -| total_timesteps | 348288 | -| train/ | | -| approx_kl | 0.0020199048 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.827 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 27200 | -| policy_gradient_loss | -0.00107 | -| std | 0.555 | -| value_loss | 9.04e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2722 | -| time_elapsed | 29577 | -| total_timesteps | 348416 | -| train/ | | -| approx_kl | 0.0013957683 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.833 | -| explained_variance | -12.9 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 27210 | -| policy_gradient_loss | -0.000839 | -| std | 0.558 | -| value_loss | 5.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2723 | -| time_elapsed | 29579 | -| total_timesteps | 348544 | -| train/ | | -| approx_kl | 0.0002741709 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.896 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 27220 | -| policy_gradient_loss | 0.00108 | -| std | 0.559 | -| value_loss | 3.31e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2724 | -| time_elapsed | 29582 | -| total_timesteps | 348672 | -| train/ | | -| approx_kl | 0.013346504 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 27230 | -| policy_gradient_loss | -0.00282 | -| std | 0.56 | -| value_loss | 1.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2725 | -| time_elapsed | 29585 | -| total_timesteps | 348800 | -| train/ | | -| approx_kl | 0.010029705 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | 0.0173 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 27240 | -| policy_gradient_loss | -0.00182 | -| std | 0.559 | -| value_loss | 1.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2726 | -| time_elapsed | 29589 | -| total_timesteps | 348928 | -| train/ | | -| approx_kl | 0.002142909 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.00385 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 27250 | -| policy_gradient_loss | -0.00213 | -| std | 0.558 | -| value_loss | 1.07e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2727 | -| time_elapsed | 29593 | -| total_timesteps | 349056 | -| train/ | | -| approx_kl | 0.00021177297 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 27260 | -| policy_gradient_loss | 0.000714 | -| std | 0.558 | -| value_loss | 6.58e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2728 | -| time_elapsed | 29600 | -| total_timesteps | 349184 | -| train/ | | -| approx_kl | 0.0007454909 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.834 | -| explained_variance | 0.81 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 27270 | -| policy_gradient_loss | 4.66e-05 | -| std | 0.557 | -| value_loss | 0.00178 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2729 | -| time_elapsed | 29604 | -| total_timesteps | 349312 | -| train/ | | -| approx_kl | 0.008711171 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.834 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 27280 | -| policy_gradient_loss | -2.86e-05 | -| std | 0.558 | -| value_loss | 1.21e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2730 | -| time_elapsed | 29608 | -| total_timesteps | 349440 | -| train/ | | -| approx_kl | 0.0061622444 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.835 | -| explained_variance | 0.00654 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 27290 | -| policy_gradient_loss | -0.00276 | -| std | 0.558 | -| value_loss | 2.91e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2731 | -| time_elapsed | 29611 | -| total_timesteps | 349568 | -| train/ | | -| approx_kl | 6.189104e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | -0.000384 | -| n_updates | 27300 | -| policy_gradient_loss | 0.00205 | -| std | 0.558 | -| value_loss | 2.38e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2732 | -| time_elapsed | 29615 | -| total_timesteps | 349696 | -| train/ | | -| approx_kl | 0.00093865325 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.0999 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 27310 | -| policy_gradient_loss | 1.66e-05 | -| std | 0.558 | -| value_loss | 1.8e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2733 | -| time_elapsed | 29618 | -| total_timesteps | 349824 | -| train/ | | -| approx_kl | 0.008752133 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | -0.000371 | -| n_updates | 27320 | -| policy_gradient_loss | -0.000603 | -| std | 0.558 | -| value_loss | 1.51e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 11 | -| iterations | 2734 | -| time_elapsed | 29624 | -| total_timesteps | 349952 | -| train/ | | -| approx_kl | 0.0070625227 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 27330 | -| policy_gradient_loss | -0.00402 | -| std | 0.559 | -| value_loss | 1.44e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2735 | -| time_elapsed | 29628 | -| total_timesteps | 350080 | -| train/ | | -| approx_kl | 0.0035798273 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.00126 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 27340 | -| policy_gradient_loss | -0.00349 | -| std | 0.559 | -| value_loss | 1.77e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2736 | -| time_elapsed | 29634 | -| total_timesteps | 350208 | -| train/ | | -| approx_kl | 0.004177765 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | 0.661 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 27350 | -| policy_gradient_loss | -0.00316 | -| std | 0.559 | -| value_loss | 0.0061 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2737 | -| time_elapsed | 29638 | -| total_timesteps | 350336 | -| train/ | | -| approx_kl | 0.0047442485 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.502 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 27360 | -| policy_gradient_loss | -0.00401 | -| std | 0.559 | -| value_loss | 3.88e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2738 | -| time_elapsed | 29641 | -| total_timesteps | 350464 | -| train/ | | -| approx_kl | 5.4511707e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 27370 | -| policy_gradient_loss | 0.00261 | -| std | 0.559 | -| value_loss | 1.57e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2739 | -| time_elapsed | 29644 | -| total_timesteps | 350592 | -| train/ | | -| approx_kl | 0.0007860358 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 27380 | -| policy_gradient_loss | 7.51e-05 | -| std | 0.56 | -| value_loss | 2.27e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2740 | -| time_elapsed | 29648 | -| total_timesteps | 350720 | -| train/ | | -| approx_kl | 0.0004073372 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.839 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 27390 | -| policy_gradient_loss | 0.000328 | -| std | 0.56 | -| value_loss | 1.2e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2741 | -| time_elapsed | 29652 | -| total_timesteps | 350848 | -| train/ | | -| approx_kl | 0.0005245097 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 27400 | -| policy_gradient_loss | 0.000515 | -| std | 0.561 | -| value_loss | 9.14e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2742 | -| time_elapsed | 29655 | -| total_timesteps | 350976 | -| train/ | | -| approx_kl | 0.020067228 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 27410 | -| policy_gradient_loss | -0.0116 | -| std | 0.561 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2743 | -| time_elapsed | 29658 | -| total_timesteps | 351104 | -| train/ | | -| approx_kl | 0.0021395348 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | -0.000382 | -| n_updates | 27420 | -| policy_gradient_loss | -0.000187 | -| std | 0.561 | -| value_loss | 6.42e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2744 | -| time_elapsed | 29667 | -| total_timesteps | 351232 | -| train/ | | -| approx_kl | 0.010500778 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | 0.212 | -| learning_rate | 0.0003 | -| loss | 0.00573 | -| n_updates | 27430 | -| policy_gradient_loss | -0.00638 | -| std | 0.561 | -| value_loss | 0.0335 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2745 | -| time_elapsed | 29670 | -| total_timesteps | 351360 | -| train/ | | -| approx_kl | 0.0028415502 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | 0.101 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 27440 | -| policy_gradient_loss | -0.00336 | -| std | 0.562 | -| value_loss | 0.0026 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2746 | -| time_elapsed | 29674 | -| total_timesteps | 351488 | -| train/ | | -| approx_kl | 0.016000375 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.843 | -| explained_variance | -0.0933 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 27450 | -| policy_gradient_loss | -0.00578 | -| std | 0.562 | -| value_loss | 0.000937 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2747 | -| time_elapsed | 29677 | -| total_timesteps | 351616 | -| train/ | | -| approx_kl | 0.0066385446 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | -18.7 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 27460 | -| policy_gradient_loss | -0.00293 | -| std | 0.562 | -| value_loss | 2.12e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2748 | -| time_elapsed | 29681 | -| total_timesteps | 351744 | -| train/ | | -| approx_kl | 0.0019042995 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 27470 | -| policy_gradient_loss | 0.000957 | -| std | 0.562 | -| value_loss | 3.85e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 11 | -| iterations | 2749 | -| time_elapsed | 29684 | -| total_timesteps | 351872 | -| train/ | | -| approx_kl | 0.001301996 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 27480 | -| policy_gradient_loss | -0.0004 | -| std | 0.56 | -| value_loss | 3.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2750 | -| time_elapsed | 29688 | -| total_timesteps | 352000 | -| train/ | | -| approx_kl | 0.0045777615 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.839 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.001 | -| n_updates | 27490 | -| policy_gradient_loss | -0.000592 | -| std | 0.559 | -| value_loss | 2.46e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2751 | -| time_elapsed | 29692 | -| total_timesteps | 352128 | -| train/ | | -| approx_kl | 0.002386549 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 27500 | -| policy_gradient_loss | -0.00109 | -| std | 0.56 | -| value_loss | 5.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2752 | -| time_elapsed | 29700 | -| total_timesteps | 352256 | -| train/ | | -| approx_kl | 0.01391063 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.84 | -| explained_variance | 0.626 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 27510 | -| policy_gradient_loss | -0.00373 | -| std | 0.561 | -| value_loss | 0.00705 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2753 | -| time_elapsed | 29703 | -| total_timesteps | 352384 | -| train/ | | -| approx_kl | 0.008813545 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | -0.582 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 27520 | -| policy_gradient_loss | -0.00402 | -| std | 0.562 | -| value_loss | 1.43e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2754 | -| time_elapsed | 29707 | -| total_timesteps | 352512 | -| train/ | | -| approx_kl | 0.0011244963 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | 0.000407 | -| n_updates | 27530 | -| policy_gradient_loss | 0.000367 | -| std | 0.56 | -| value_loss | 3.37e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2755 | -| time_elapsed | 29710 | -| total_timesteps | 352640 | -| train/ | | -| approx_kl | 0.0059614964 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.839 | -| explained_variance | -0.625 | -| learning_rate | 0.0003 | -| loss | -0.00766 | -| n_updates | 27540 | -| policy_gradient_loss | -0.00302 | -| std | 0.559 | -| value_loss | 2.96e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2756 | -| time_elapsed | 29713 | -| total_timesteps | 352768 | -| train/ | | -| approx_kl | 6.8650115e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.000278 | -| n_updates | 27550 | -| policy_gradient_loss | 0.000631 | -| std | 0.558 | -| value_loss | 1.27e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2757 | -| time_elapsed | 29716 | -| total_timesteps | 352896 | -| train/ | | -| approx_kl | 0.00024604402 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -7.75e-05 | -| n_updates | 27560 | -| policy_gradient_loss | 0.000121 | -| std | 0.559 | -| value_loss | 1.3e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2758 | -| time_elapsed | 29720 | -| total_timesteps | 353024 | -| train/ | | -| approx_kl | 0.0073579485 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.839 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 27570 | -| policy_gradient_loss | -0.00862 | -| std | 0.561 | -| value_loss | 1.6e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2759 | -| time_elapsed | 29726 | -| total_timesteps | 353152 | -| train/ | | -| approx_kl | 0.009409494 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.841 | -| explained_variance | 0.564 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 27580 | -| policy_gradient_loss | -0.00867 | -| std | 0.562 | -| value_loss | 0.00571 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2760 | -| time_elapsed | 29729 | -| total_timesteps | 353280 | -| train/ | | -| approx_kl | 0.010418939 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.843 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 27590 | -| policy_gradient_loss | -0.00282 | -| std | 0.563 | -| value_loss | 2.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2761 | -| time_elapsed | 29730 | -| total_timesteps | 353408 | -| train/ | | -| approx_kl | 0.009935463 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.844 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 27600 | -| policy_gradient_loss | -0.00336 | -| std | 0.562 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2762 | -| time_elapsed | 29733 | -| total_timesteps | 353536 | -| train/ | | -| approx_kl | 0.0027171285 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.844 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 27610 | -| policy_gradient_loss | -0.00165 | -| std | 0.563 | -| value_loss | 1.55e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2763 | -| time_elapsed | 29735 | -| total_timesteps | 353664 | -| train/ | | -| approx_kl | 0.00013533421 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.846 | -| explained_variance | 0.013 | -| learning_rate | 0.0003 | -| loss | -0.00067 | -| n_updates | 27620 | -| policy_gradient_loss | 0.000726 | -| std | 0.564 | -| value_loss | 1.39e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2764 | -| time_elapsed | 29738 | -| total_timesteps | 353792 | -| train/ | | -| approx_kl | 0.0029619597 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.845 | -| explained_variance | -0.00723 | -| learning_rate | 0.0003 | -| loss | 0.000265 | -| n_updates | 27630 | -| policy_gradient_loss | 0.000139 | -| std | 0.563 | -| value_loss | 1.29e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2765 | -| time_elapsed | 29741 | -| total_timesteps | 353920 | -| train/ | | -| approx_kl | 0.010198191 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.844 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 27640 | -| policy_gradient_loss | -0.00496 | -| std | 0.562 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2766 | -| time_elapsed | 29743 | -| total_timesteps | 354048 | -| train/ | | -| approx_kl | 0.016325805 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.842 | -| explained_variance | 0.014 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 27650 | -| policy_gradient_loss | -0.0109 | -| std | 0.561 | -| value_loss | 1.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2767 | -| time_elapsed | 29748 | -| total_timesteps | 354176 | -| train/ | | -| approx_kl | 0.001428419 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.839 | -| explained_variance | 0.444 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 27660 | -| policy_gradient_loss | -0.00975 | -| std | 0.56 | -| value_loss | 0.0013 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2768 | -| time_elapsed | 29751 | -| total_timesteps | 354304 | -| train/ | | -| approx_kl | 0.0063876845 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.838 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 27670 | -| policy_gradient_loss | -0.00146 | -| std | 0.559 | -| value_loss | 2.11e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2769 | -| time_elapsed | 29753 | -| total_timesteps | 354432 | -| train/ | | -| approx_kl | 0.0010858614 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -83.2 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 27680 | -| policy_gradient_loss | 4.68e-05 | -| std | 0.558 | -| value_loss | 6.97e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2770 | -| time_elapsed | 29757 | -| total_timesteps | 354560 | -| train/ | | -| approx_kl | 0.0006397357 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -13.4 | -| learning_rate | 0.0003 | -| loss | -0.00487 | -| n_updates | 27690 | -| policy_gradient_loss | 0.00138 | -| std | 0.559 | -| value_loss | 1.9e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2771 | -| time_elapsed | 29759 | -| total_timesteps | 354688 | -| train/ | | -| approx_kl | 0.035370458 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -10.3 | -| learning_rate | 0.0003 | -| loss | -0.0284 | -| n_updates | 27700 | -| policy_gradient_loss | -0.0186 | -| std | 0.559 | -| value_loss | 3.28e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2772 | -| time_elapsed | 29761 | -| total_timesteps | 354816 | -| train/ | | -| approx_kl | 0.00011486816 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -0.997 | -| learning_rate | 0.0003 | -| loss | 0.000138 | -| n_updates | 27710 | -| policy_gradient_loss | 0.000622 | -| std | 0.558 | -| value_loss | 1.11e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2773 | -| time_elapsed | 29765 | -| total_timesteps | 354944 | -| train/ | | -| approx_kl | 0.015187973 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.834 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 27720 | -| policy_gradient_loss | -0.0043 | -| std | 0.557 | -| value_loss | 1.22e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2774 | -| time_elapsed | 29769 | -| total_timesteps | 355072 | -| train/ | | -| approx_kl | 0.0052651432 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.835 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 27730 | -| policy_gradient_loss | -0.00112 | -| std | 0.558 | -| value_loss | 7.36e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2775 | -| time_elapsed | 29774 | -| total_timesteps | 355200 | -| train/ | | -| approx_kl | 0.008090281 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | 0.52 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 27740 | -| policy_gradient_loss | -0.0132 | -| std | 0.559 | -| value_loss | 0.00854 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2776 | -| time_elapsed | 29778 | -| total_timesteps | 355328 | -| train/ | | -| approx_kl | 0.009356493 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.837 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | -0.000946 | -| n_updates | 27750 | -| policy_gradient_loss | -0.00124 | -| std | 0.559 | -| value_loss | 8.81e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2777 | -| time_elapsed | 29782 | -| total_timesteps | 355456 | -| train/ | | -| approx_kl | 0.00038982066 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.836 | -| explained_variance | -42.9 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 27760 | -| policy_gradient_loss | -0.00014 | -| std | 0.557 | -| value_loss | 1.48e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2778 | -| time_elapsed | 29786 | -| total_timesteps | 355584 | -| train/ | | -| approx_kl | 0.011557908 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.833 | -| explained_variance | -17.3 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 27770 | -| policy_gradient_loss | -0.00321 | -| std | 0.556 | -| value_loss | 1.4e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2779 | -| time_elapsed | 29789 | -| total_timesteps | 355712 | -| train/ | | -| approx_kl | 0.00188802 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.83 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 27780 | -| policy_gradient_loss | -0.000455 | -| std | 0.554 | -| value_loss | 2.82e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2780 | -| time_elapsed | 29792 | -| total_timesteps | 355840 | -| train/ | | -| approx_kl | 0.0026593667 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.828 | -| explained_variance | 0.015 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 27790 | -| policy_gradient_loss | -0.000562 | -| std | 0.554 | -| value_loss | 5.91e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2781 | -| time_elapsed | 29795 | -| total_timesteps | 355968 | -| train/ | | -| approx_kl | 1.9325176e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.827 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000219 | -| n_updates | 27800 | -| policy_gradient_loss | 0.000816 | -| std | 0.553 | -| value_loss | 6.61e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2782 | -| time_elapsed | 29799 | -| total_timesteps | 356096 | -| train/ | | -| approx_kl | 0.0006584469 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.827 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.000378 | -| n_updates | 27810 | -| policy_gradient_loss | 0.000323 | -| std | 0.554 | -| value_loss | 4.72e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2783 | -| time_elapsed | 29808 | -| total_timesteps | 356224 | -| train/ | | -| approx_kl | 0.0015015232 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.828 | -| explained_variance | 0.767 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 27820 | -| policy_gradient_loss | -0.00798 | -| std | 0.554 | -| value_loss | 0.00113 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2784 | -| time_elapsed | 29812 | -| total_timesteps | 356352 | -| train/ | | -| approx_kl | 0.0026838414 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.83 | -| explained_variance | -5.05 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 27830 | -| policy_gradient_loss | -0.00447 | -| std | 0.555 | -| value_loss | 4.81e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2785 | -| time_elapsed | 29815 | -| total_timesteps | 356480 | -| train/ | | -| approx_kl | 0.00018352875 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.831 | -| explained_variance | -15.7 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 27840 | -| policy_gradient_loss | 0.00185 | -| std | 0.555 | -| value_loss | 1.09e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2786 | -| time_elapsed | 29819 | -| total_timesteps | 356608 | -| train/ | | -| approx_kl | 0.021718223 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.831 | -| explained_variance | -44 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 27850 | -| policy_gradient_loss | -0.00572 | -| std | 0.555 | -| value_loss | 4.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2787 | -| time_elapsed | 29823 | -| total_timesteps | 356736 | -| train/ | | -| approx_kl | 0.015319299 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.829 | -| explained_variance | -2.54 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 27860 | -| policy_gradient_loss | -0.00893 | -| std | 0.555 | -| value_loss | 1.21e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2788 | -| time_elapsed | 29827 | -| total_timesteps | 356864 | -| train/ | | -| approx_kl | 0.00035648956 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.829 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 27870 | -| policy_gradient_loss | 0.000505 | -| std | 0.554 | -| value_loss | 2.18e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 11 | -| iterations | 2789 | -| time_elapsed | 29831 | -| total_timesteps | 356992 | -| train/ | | -| approx_kl | 0.00071645994 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.827 | -| explained_variance | -0.0825 | -| learning_rate | 0.0003 | -| loss | -0.00532 | -| n_updates | 27880 | -| policy_gradient_loss | 0.000517 | -| std | 0.553 | -| value_loss | 2.77e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2790 | -| time_elapsed | 29834 | -| total_timesteps | 357120 | -| train/ | | -| approx_kl | 0.0008167899 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.825 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.000586 | -| n_updates | 27890 | -| policy_gradient_loss | 0.000535 | -| std | 0.551 | -| value_loss | 9.74e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2791 | -| time_elapsed | 29843 | -| total_timesteps | 357248 | -| train/ | | -| approx_kl | 0.004368783 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.823 | -| explained_variance | -4.42 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 27900 | -| policy_gradient_loss | -0.00724 | -| std | 0.551 | -| value_loss | 0.00237 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2792 | -| time_elapsed | 29846 | -| total_timesteps | 357376 | -| train/ | | -| approx_kl | 0.012885597 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.822 | -| explained_variance | -21.5 | -| learning_rate | 0.0003 | -| loss | -0.0063 | -| n_updates | 27910 | -| policy_gradient_loss | -0.00379 | -| std | 0.55 | -| value_loss | 2.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2793 | -| time_elapsed | 29849 | -| total_timesteps | 357504 | -| train/ | | -| approx_kl | 0.000987533 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.82 | -| explained_variance | -43.3 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 27920 | -| policy_gradient_loss | -0.000234 | -| std | 0.549 | -| value_loss | 1.07e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2794 | -| time_elapsed | 29852 | -| total_timesteps | 357632 | -| train/ | | -| approx_kl | 0.01976261 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.818 | -| explained_variance | -7.33 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 27930 | -| policy_gradient_loss | -0.012 | -| std | 0.548 | -| value_loss | 4.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2795 | -| time_elapsed | 29854 | -| total_timesteps | 357760 | -| train/ | | -| approx_kl | 0.01214269 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.817 | -| explained_variance | -0.891 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 27940 | -| policy_gradient_loss | -0.00405 | -| std | 0.547 | -| value_loss | 2.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2796 | -| time_elapsed | 29856 | -| total_timesteps | 357888 | -| train/ | | -| approx_kl | 0.007153781 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.814 | -| explained_variance | -0.36 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 27950 | -| policy_gradient_loss | -0.00183 | -| std | 0.545 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2797 | -| time_elapsed | 29859 | -| total_timesteps | 358016 | -| train/ | | -| approx_kl | 0.005490384 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.811 | -| explained_variance | -0.458 | -| learning_rate | 0.0003 | -| loss | -0.00345 | -| n_updates | 27960 | -| policy_gradient_loss | -0.00141 | -| std | 0.544 | -| value_loss | 3.29e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2798 | -| time_elapsed | 29867 | -| total_timesteps | 358144 | -| train/ | | -| approx_kl | 0.0061127525 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.81 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 27970 | -| policy_gradient_loss | -0.00527 | -| std | 0.543 | -| value_loss | 0.00176 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2799 | -| time_elapsed | 29871 | -| total_timesteps | 358272 | -| train/ | | -| approx_kl | 0.0056226505 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.808 | -| explained_variance | -0.527 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 27980 | -| policy_gradient_loss | -0.00125 | -| std | 0.542 | -| value_loss | 2.59e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2800 | -| time_elapsed | 29875 | -| total_timesteps | 358400 | -| train/ | | -| approx_kl | 0.022304887 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.806 | -| explained_variance | -7.24 | -| learning_rate | 0.0003 | -| loss | -0.0258 | -| n_updates | 27990 | -| policy_gradient_loss | -0.0165 | -| std | 0.541 | -| value_loss | 9.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 11 | -| iterations | 2801 | -| time_elapsed | 29879 | -| total_timesteps | 358528 | -| train/ | | -| approx_kl | 0.007824683 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.804 | -| explained_variance | -0.92 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 28000 | -| policy_gradient_loss | -0.00127 | -| std | 0.539 | -| value_loss | 3.77e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2802 | -| time_elapsed | 29883 | -| total_timesteps | 358656 | -| train/ | | -| approx_kl | 0.0070874332 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.8 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 28010 | -| policy_gradient_loss | -0.00868 | -| std | 0.538 | -| value_loss | 2.72e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2803 | -| time_elapsed | 29886 | -| total_timesteps | 358784 | -| train/ | | -| approx_kl | 0.013372957 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | -0.797 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.000863 | -| n_updates | 28020 | -| policy_gradient_loss | -0.000744 | -| std | 0.536 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2804 | -| time_elapsed | 29890 | -| total_timesteps | 358912 | -| train/ | | -| approx_kl | 0.011346397 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.795 | -| explained_variance | -0.00397 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 28030 | -| policy_gradient_loss | -0.00657 | -| std | 0.535 | -| value_loss | 1.15e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2805 | -| time_elapsed | 29894 | -| total_timesteps | 359040 | -| train/ | | -| approx_kl | 0.0027899141 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.793 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.000301 | -| n_updates | 28040 | -| policy_gradient_loss | -0.000249 | -| std | 0.534 | -| value_loss | 1.09e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2806 | -| time_elapsed | 29901 | -| total_timesteps | 359168 | -| train/ | | -| approx_kl | 7.825461e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.792 | -| explained_variance | 0.129 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 28050 | -| policy_gradient_loss | -0.00173 | -| std | 0.534 | -| value_loss | 0.00106 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2807 | -| time_elapsed | 29903 | -| total_timesteps | 359296 | -| train/ | | -| approx_kl | 0.0007131314 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.792 | -| explained_variance | -16.2 | -| learning_rate | 0.0003 | -| loss | -0.000591 | -| n_updates | 28060 | -| policy_gradient_loss | -0.000196 | -| std | 0.534 | -| value_loss | 3.27e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2808 | -| time_elapsed | 29907 | -| total_timesteps | 359424 | -| train/ | | -| approx_kl | 0.016192978 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.791 | -| explained_variance | -14.5 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 28070 | -| policy_gradient_loss | -0.00336 | -| std | 0.533 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2809 | -| time_elapsed | 29909 | -| total_timesteps | 359552 | -| train/ | | -| approx_kl | 0.035540946 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | -0.789 | -| explained_variance | -2.08 | -| learning_rate | 0.0003 | -| loss | -0.0374 | -| n_updates | 28080 | -| policy_gradient_loss | -0.0254 | -| std | 0.532 | -| value_loss | 3.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2810 | -| time_elapsed | 29911 | -| total_timesteps | 359680 | -| train/ | | -| approx_kl | 0.013284646 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.789 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 28090 | -| policy_gradient_loss | -0.00191 | -| std | 0.533 | -| value_loss | 1.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2811 | -| time_elapsed | 29914 | -| total_timesteps | 359808 | -| train/ | | -| approx_kl | 0.011087048 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.789 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.000744 | -| n_updates | 28100 | -| policy_gradient_loss | -0.00145 | -| std | 0.533 | -| value_loss | 1.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2812 | -| time_elapsed | 29916 | -| total_timesteps | 359936 | -| train/ | | -| approx_kl | 0.011184014 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.789 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.00437 | -| n_updates | 28110 | -| policy_gradient_loss | -0.00286 | -| std | 0.533 | -| value_loss | 1.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2813 | -| time_elapsed | 29918 | -| total_timesteps | 360064 | -| train/ | | -| approx_kl | 0.006949598 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.79 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | -0.0008 | -| n_updates | 28120 | -| policy_gradient_loss | -0.000924 | -| std | 0.533 | -| value_loss | 1.33e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2814 | -| time_elapsed | 29923 | -| total_timesteps | 360192 | -| train/ | | -| approx_kl | 0.00052575185 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.789 | -| explained_variance | 0.727 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 28130 | -| policy_gradient_loss | -0.00442 | -| std | 0.532 | -| value_loss | 0.000467 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2815 | -| time_elapsed | 29927 | -| total_timesteps | 360320 | -| train/ | | -| approx_kl | 0.012400851 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.789 | -| explained_variance | -56.4 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 28140 | -| policy_gradient_loss | -0.00498 | -| std | 0.532 | -| value_loss | 3.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2816 | -| time_elapsed | 29930 | -| total_timesteps | 360448 | -| train/ | | -| approx_kl | 0.009412718 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.787 | -| explained_variance | -59.5 | -| learning_rate | 0.0003 | -| loss | 0.000327 | -| n_updates | 28150 | -| policy_gradient_loss | -3.75e-05 | -| std | 0.531 | -| value_loss | 1.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2817 | -| time_elapsed | 29933 | -| total_timesteps | 360576 | -| train/ | | -| approx_kl | 0.010155256 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.784 | -| explained_variance | -9.8 | -| learning_rate | 0.0003 | -| loss | -0.00544 | -| n_updates | 28160 | -| policy_gradient_loss | -0.00225 | -| std | 0.529 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2818 | -| time_elapsed | 29937 | -| total_timesteps | 360704 | -| train/ | | -| approx_kl | 0.022210062 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.782 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 28170 | -| policy_gradient_loss | -0.00632 | -| std | 0.529 | -| value_loss | 9.49e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2819 | -| time_elapsed | 29940 | -| total_timesteps | 360832 | -| train/ | | -| approx_kl | 0.0059375125 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.781 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.0096 | -| n_updates | 28180 | -| policy_gradient_loss | -0.00372 | -| std | 0.528 | -| value_loss | 6.59e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2820 | -| time_elapsed | 29944 | -| total_timesteps | 360960 | -| train/ | | -| approx_kl | 0.00015928899 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.78 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 28190 | -| policy_gradient_loss | 0.00139 | -| std | 0.528 | -| value_loss | 2.34e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2821 | -| time_elapsed | 29949 | -| total_timesteps | 361088 | -| train/ | | -| approx_kl | 0.00077155954 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.78 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 28200 | -| policy_gradient_loss | 0.000661 | -| std | 0.528 | -| value_loss | 3.37e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2822 | -| time_elapsed | 29956 | -| total_timesteps | 361216 | -| train/ | | -| approx_kl | 7.134676e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.779 | -| explained_variance | 0.485 | -| learning_rate | 0.0003 | -| loss | 0.00493 | -| n_updates | 28210 | -| policy_gradient_loss | -0.000423 | -| std | 0.527 | -| value_loss | 0.0177 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2823 | -| time_elapsed | 29960 | -| total_timesteps | 361344 | -| train/ | | -| approx_kl | 0.00066469517 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.778 | -| explained_variance | -5.67 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 28220 | -| policy_gradient_loss | 9.69e-06 | -| std | 0.527 | -| value_loss | 3e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2824 | -| time_elapsed | 29963 | -| total_timesteps | 361472 | -| train/ | | -| approx_kl | 0.0013840401 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.777 | -| explained_variance | -76.2 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 28230 | -| policy_gradient_loss | -0.000215 | -| std | 0.526 | -| value_loss | 7.01e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2825 | -| time_elapsed | 29966 | -| total_timesteps | 361600 | -| train/ | | -| approx_kl | 0.00045005465 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.777 | -| explained_variance | -3.02 | -| learning_rate | 0.0003 | -| loss | -0.00231 | -| n_updates | 28240 | -| policy_gradient_loss | 0.000787 | -| std | 0.526 | -| value_loss | 4.58e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2826 | -| time_elapsed | 29970 | -| total_timesteps | 361728 | -| train/ | | -| approx_kl | 0.00023595477 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.776 | -| explained_variance | -0.913 | -| learning_rate | 0.0003 | -| loss | -0.00074 | -| n_updates | 28250 | -| policy_gradient_loss | 0.000313 | -| std | 0.525 | -| value_loss | 2.03e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2827 | -| time_elapsed | 29974 | -| total_timesteps | 361856 | -| train/ | | -| approx_kl | 0.011404892 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.774 | -| explained_variance | -0.258 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 28260 | -| policy_gradient_loss | -0.00167 | -| std | 0.524 | -| value_loss | 1.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.85 | -| time/ | | -| fps | 12 | -| iterations | 2828 | -| time_elapsed | 29977 | -| total_timesteps | 361984 | -| train/ | | -| approx_kl | 0.008741733 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.773 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 28270 | -| policy_gradient_loss | -0.00582 | -| std | 0.524 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2829 | -| time_elapsed | 29981 | -| total_timesteps | 362112 | -| train/ | | -| approx_kl | 0.0032007701 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.773 | -| explained_variance | -0.00374 | -| learning_rate | 0.0003 | -| loss | 7.14e-05 | -| n_updates | 28280 | -| policy_gradient_loss | 8.03e-05 | -| std | 0.525 | -| value_loss | 5.34e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2830 | -| time_elapsed | 29990 | -| total_timesteps | 362240 | -| train/ | | -| approx_kl | 0.0009817143 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.776 | -| explained_variance | 0.539 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 28290 | -| policy_gradient_loss | -0.00412 | -| std | 0.526 | -| value_loss | 0.011 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2831 | -| time_elapsed | 29995 | -| total_timesteps | 362368 | -| train/ | | -| approx_kl | 0.013187148 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.778 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 28300 | -| policy_gradient_loss | -0.00562 | -| std | 0.526 | -| value_loss | 0.000131 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2832 | -| time_elapsed | 29999 | -| total_timesteps | 362496 | -| train/ | | -| approx_kl | 0.0061907955 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.777 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 28310 | -| policy_gradient_loss | -0.00229 | -| std | 0.526 | -| value_loss | 3.54e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2833 | -| time_elapsed | 30002 | -| total_timesteps | 362624 | -| train/ | | -| approx_kl | 0.015160972 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.776 | -| explained_variance | -0.542 | -| learning_rate | 0.0003 | -| loss | -0.00036 | -| n_updates | 28320 | -| policy_gradient_loss | -0.00194 | -| std | 0.526 | -| value_loss | 2.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2834 | -| time_elapsed | 30005 | -| total_timesteps | 362752 | -| train/ | | -| approx_kl | 0.012996259 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.775 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | -0.03 | -| n_updates | 28330 | -| policy_gradient_loss | -0.0143 | -| std | 0.525 | -| value_loss | 2.12e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.86 | -| time/ | | -| fps | 12 | -| iterations | 2835 | -| time_elapsed | 30008 | -| total_timesteps | 362880 | -| train/ | | -| approx_kl | 0.0060282676 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.774 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.000518 | -| n_updates | 28340 | -| policy_gradient_loss | 0.00022 | -| std | 0.524 | -| value_loss | 4.82e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2836 | -| time_elapsed | 30011 | -| total_timesteps | 363008 | -| train/ | | -| approx_kl | 0.00907424 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.772 | -| explained_variance | 0.00916 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 28350 | -| policy_gradient_loss | -0.00226 | -| std | 0.523 | -| value_loss | 1.84e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2837 | -| time_elapsed | 30019 | -| total_timesteps | 363136 | -| train/ | | -| approx_kl | 0.0006258583 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.77 | -| explained_variance | 0.558 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 28360 | -| policy_gradient_loss | -0.00438 | -| std | 0.522 | -| value_loss | 0.00114 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2838 | -| time_elapsed | 30023 | -| total_timesteps | 363264 | -| train/ | | -| approx_kl | 0.00953719 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.769 | -| explained_variance | 0.376 | -| learning_rate | 0.0003 | -| loss | -0.00918 | -| n_updates | 28370 | -| policy_gradient_loss | -0.00523 | -| std | 0.522 | -| value_loss | 2.38e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2839 | -| time_elapsed | 30027 | -| total_timesteps | 363392 | -| train/ | | -| approx_kl | 0.0012036334 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.768 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 28380 | -| policy_gradient_loss | -0.000415 | -| std | 0.522 | -| value_loss | 1.24e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2840 | -| time_elapsed | 30030 | -| total_timesteps | 363520 | -| train/ | | -| approx_kl | 0.00029721973 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.768 | -| explained_variance | 0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 28390 | -| policy_gradient_loss | 0.000413 | -| std | 0.521 | -| value_loss | 7.04e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2841 | -| time_elapsed | 30033 | -| total_timesteps | 363648 | -| train/ | | -| approx_kl | 0.018142888 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.766 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 28400 | -| policy_gradient_loss | -0.00651 | -| std | 0.52 | -| value_loss | 8.52e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2842 | -| time_elapsed | 30036 | -| total_timesteps | 363776 | -| train/ | | -| approx_kl | 0.01116039 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.765 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | -0.0245 | -| n_updates | 28410 | -| policy_gradient_loss | -0.0138 | -| std | 0.52 | -| value_loss | 4.36e-07 | ----------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2843 | -| time_elapsed | 30040 | -| total_timesteps | 363904 | -| train/ | | -| approx_kl | 0.000111970585 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.764 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 3.13e-05 | -| n_updates | 28420 | -| policy_gradient_loss | 0.000431 | -| std | 0.519 | -| value_loss | 4.38e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2844 | -| time_elapsed | 30043 | -| total_timesteps | 364032 | -| train/ | | -| approx_kl | 0.015611882 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.761 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 28430 | -| policy_gradient_loss | -0.0151 | -| std | 0.517 | -| value_loss | 7.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2845 | -| time_elapsed | 30051 | -| total_timesteps | 364160 | -| train/ | | -| approx_kl | 0.018419744 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.759 | -| explained_variance | 0.682 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 28440 | -| policy_gradient_loss | -0.0057 | -| std | 0.516 | -| value_loss | 0.0058 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2846 | -| time_elapsed | 30055 | -| total_timesteps | 364288 | -| train/ | | -| approx_kl | 0.018017482 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.757 | -| explained_variance | 0.099 | -| learning_rate | 0.0003 | -| loss | -0.00918 | -| n_updates | 28450 | -| policy_gradient_loss | -0.00725 | -| std | 0.515 | -| value_loss | 3.65e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2847 | -| time_elapsed | 30058 | -| total_timesteps | 364416 | -| train/ | | -| approx_kl | 0.01671274 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.755 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.000651 | -| n_updates | 28460 | -| policy_gradient_loss | -0.00203 | -| std | 0.514 | -| value_loss | 4.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2848 | -| time_elapsed | 30061 | -| total_timesteps | 364544 | -| train/ | | -| approx_kl | 0.005055161 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.754 | -| explained_variance | -0.766 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 28470 | -| policy_gradient_loss | -0.00291 | -| std | 0.514 | -| value_loss | 1.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2849 | -| time_elapsed | 30066 | -| total_timesteps | 364672 | -| train/ | | -| approx_kl | 0.0007282214 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.754 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 28480 | -| policy_gradient_loss | 0.000133 | -| std | 0.514 | -| value_loss | 8.87e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2850 | -| time_elapsed | 30069 | -| total_timesteps | 364800 | -| train/ | | -| approx_kl | 0.0004496572 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.753 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 28490 | -| policy_gradient_loss | 0.000447 | -| std | 0.513 | -| value_loss | 8.87e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2851 | -| time_elapsed | 30073 | -| total_timesteps | 364928 | -| train/ | | -| approx_kl | 0.02021212 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.751 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 28500 | -| policy_gradient_loss | -0.00702 | -| std | 0.512 | -| value_loss | 8.04e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2852 | -| time_elapsed | 30077 | -| total_timesteps | 365056 | -| train/ | | -| approx_kl | 0.0090771355 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.749 | -| explained_variance | 0.0159 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 28510 | -| policy_gradient_loss | -0.00803 | -| std | 0.511 | -| value_loss | 4.19e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2853 | -| time_elapsed | 30082 | -| total_timesteps | 365184 | -| train/ | | -| approx_kl | 0.0029314638 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.748 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 28520 | -| policy_gradient_loss | -0.00409 | -| std | 0.51 | -| value_loss | 0.00137 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2854 | -| time_elapsed | 30086 | -| total_timesteps | 365312 | -| train/ | | -| approx_kl | 0.0060767634 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.746 | -| explained_variance | -1.58 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 28530 | -| policy_gradient_loss | -0.00392 | -| std | 0.51 | -| value_loss | 1.63e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2855 | -| time_elapsed | 30089 | -| total_timesteps | 365440 | -| train/ | | -| approx_kl | 0.014764853 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.745 | -| explained_variance | 0.00775 | -| learning_rate | 0.0003 | -| loss | -0.000899 | -| n_updates | 28540 | -| policy_gradient_loss | -0.00306 | -| std | 0.51 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2856 | -| time_elapsed | 30093 | -| total_timesteps | 365568 | -| train/ | | -| approx_kl | 0.0018611739 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.744 | -| explained_variance | 0.00939 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 28550 | -| policy_gradient_loss | -0.000509 | -| std | 0.508 | -| value_loss | 2.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2857 | -| time_elapsed | 30096 | -| total_timesteps | 365696 | -| train/ | | -| approx_kl | 0.005664857 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.74 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 28560 | -| policy_gradient_loss | -0.00376 | -| std | 0.507 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2858 | -| time_elapsed | 30100 | -| total_timesteps | 365824 | -| train/ | | -| approx_kl | 8.089631e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.739 | -| explained_variance | -0.0921 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 28570 | -| policy_gradient_loss | 0.0018 | -| std | 0.506 | -| value_loss | 6.32e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.87 | -| time/ | | -| fps | 12 | -| iterations | 2859 | -| time_elapsed | 30103 | -| total_timesteps | 365952 | -| train/ | | -| approx_kl | 0.0010066417 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.738 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 28580 | -| policy_gradient_loss | 0.000107 | -| std | 0.506 | -| value_loss | 3.77e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2860 | -| time_elapsed | 30107 | -| total_timesteps | 366080 | -| train/ | | -| approx_kl | 0.006111343 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.737 | -| explained_variance | -0.0764 | -| learning_rate | 0.0003 | -| loss | 0.000291 | -| n_updates | 28590 | -| policy_gradient_loss | 2.78e-05 | -| std | 0.505 | -| value_loss | 4.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2861 | -| time_elapsed | 30115 | -| total_timesteps | 366208 | -| train/ | | -| approx_kl | 0.007015613 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.736 | -| explained_variance | 0.745 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 28600 | -| policy_gradient_loss | -0.00138 | -| std | 0.504 | -| value_loss | 0.00424 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2862 | -| time_elapsed | 30120 | -| total_timesteps | 366336 | -| train/ | | -| approx_kl | 0.013452214 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.734 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00888 | -| n_updates | 28610 | -| policy_gradient_loss | -0.00758 | -| std | 0.504 | -| value_loss | 2.21e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2863 | -| time_elapsed | 30123 | -| total_timesteps | 366464 | -| train/ | | -| approx_kl | 0.012381309 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.734 | -| explained_variance | -3.88 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 28620 | -| policy_gradient_loss | -0.00965 | -| std | 0.504 | -| value_loss | 1.56e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2864 | -| time_elapsed | 30128 | -| total_timesteps | 366592 | -| train/ | | -| approx_kl | 0.008068746 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.735 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | 0.000887 | -| n_updates | 28630 | -| policy_gradient_loss | 0.000327 | -| std | 0.504 | -| value_loss | 2.71e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2865 | -| time_elapsed | 30131 | -| total_timesteps | 366720 | -| train/ | | -| approx_kl | 0.0061684325 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.735 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 28640 | -| policy_gradient_loss | -0.0033 | -| std | 0.505 | -| value_loss | 2.29e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2866 | -| time_elapsed | 30134 | -| total_timesteps | 366848 | -| train/ | | -| approx_kl | 0.03089683 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.735 | -| explained_variance | 0.00971 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 28650 | -| policy_gradient_loss | -0.0167 | -| std | 0.505 | -| value_loss | 8.35e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2867 | -| time_elapsed | 30138 | -| total_timesteps | 366976 | -| train/ | | -| approx_kl | 0.00048004533 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.734 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | -0.000329 | -| n_updates | 28660 | -| policy_gradient_loss | -0.000133 | -| std | 0.503 | -| value_loss | 1.05e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2868 | -| time_elapsed | 30141 | -| total_timesteps | 367104 | -| train/ | | -| approx_kl | 0.010393663 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.731 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 28670 | -| policy_gradient_loss | -0.00583 | -| std | 0.502 | -| value_loss | 6.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2869 | -| time_elapsed | 30151 | -| total_timesteps | 367232 | -| train/ | | -| approx_kl | 0.0076581175 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.728 | -| explained_variance | 0.81 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 28680 | -| policy_gradient_loss | -0.00387 | -| std | 0.5 | -| value_loss | 0.00153 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2870 | -| time_elapsed | 30154 | -| total_timesteps | 367360 | -| train/ | | -| approx_kl | 0.0006317261 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.724 | -| explained_variance | -0.712 | -| learning_rate | 0.0003 | -| loss | -0.000572 | -| n_updates | 28690 | -| policy_gradient_loss | -0.000215 | -| std | 0.498 | -| value_loss | 7.2e-06 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2871 | -| time_elapsed | 30157 | -| total_timesteps | 367488 | -| train/ | | -| approx_kl | 0.000101448735 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.721 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.000588 | -| n_updates | 28700 | -| policy_gradient_loss | -0.000217 | -| std | 0.496 | -| value_loss | 5.02e-06 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2872 | -| time_elapsed | 30161 | -| total_timesteps | 367616 | -| train/ | | -| approx_kl | 0.0043988423 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.716 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 28710 | -| policy_gradient_loss | -0.00111 | -| std | 0.494 | -| value_loss | 1.66e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2873 | -| time_elapsed | 30164 | -| total_timesteps | 367744 | -| train/ | | -| approx_kl | 0.0020356134 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.712 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 28720 | -| policy_gradient_loss | -0.00112 | -| std | 0.492 | -| value_loss | 1.38e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2874 | -| time_elapsed | 30168 | -| total_timesteps | 367872 | -| train/ | | -| approx_kl | 0.00020455336 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.71 | -| explained_variance | 0.00735 | -| learning_rate | 0.0003 | -| loss | -0.000889 | -| n_updates | 28730 | -| policy_gradient_loss | 0.000427 | -| std | 0.491 | -| value_loss | 7.69e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2875 | -| time_elapsed | 30171 | -| total_timesteps | 368000 | -| train/ | | -| approx_kl | 0.00011194078 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.706 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 28740 | -| policy_gradient_loss | -0.0005 | -| std | 0.488 | -| value_loss | 2.74e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2876 | -| time_elapsed | 30176 | -| total_timesteps | 368128 | -| train/ | | -| approx_kl | 0.013915893 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.699 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 28750 | -| policy_gradient_loss | -0.00393 | -| std | 0.485 | -| value_loss | 1.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2877 | -| time_elapsed | 30184 | -| total_timesteps | 368256 | -| train/ | | -| approx_kl | 0.001522725 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.695 | -| explained_variance | 0.665 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 28760 | -| policy_gradient_loss | -0.00643 | -| std | 0.485 | -| value_loss | 0.00376 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2878 | -| time_elapsed | 30188 | -| total_timesteps | 368384 | -| train/ | | -| approx_kl | 0.009146866 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.695 | -| explained_variance | -3.71 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 28770 | -| policy_gradient_loss | -0.00374 | -| std | 0.484 | -| value_loss | 3.07e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2879 | -| time_elapsed | 30191 | -| total_timesteps | 368512 | -| train/ | | -| approx_kl | 5.6913123e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.694 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 28780 | -| policy_gradient_loss | 0.00357 | -| std | 0.484 | -| value_loss | 3.22e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2880 | -| time_elapsed | 30194 | -| total_timesteps | 368640 | -| train/ | | -| approx_kl | 0.013555813 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.694 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 28790 | -| policy_gradient_loss | -0.000612 | -| std | 0.484 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2881 | -| time_elapsed | 30197 | -| total_timesteps | 368768 | -| train/ | | -| approx_kl | 0.0058304183 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.694 | -| explained_variance | 0.021 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 28800 | -| policy_gradient_loss | -0.00118 | -| std | 0.484 | -| value_loss | 8.46e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2882 | -| time_elapsed | 30201 | -| total_timesteps | 368896 | -| train/ | | -| approx_kl | 0.0013168191 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.693 | -| explained_variance | -0.0804 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 28810 | -| policy_gradient_loss | -0.000309 | -| std | 0.484 | -| value_loss | 4.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2883 | -| time_elapsed | 30204 | -| total_timesteps | 369024 | -| train/ | | -| approx_kl | 0.013351088 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.694 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 28820 | -| policy_gradient_loss | -0.00361 | -| std | 0.484 | -| value_loss | 2.47e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2884 | -| time_elapsed | 30212 | -| total_timesteps | 369152 | -| train/ | | -| approx_kl | 0.0013356451 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.692 | -| explained_variance | 0.632 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 28830 | -| policy_gradient_loss | -0.0102 | -| std | 0.483 | -| value_loss | 0.00261 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2885 | -| time_elapsed | 30216 | -| total_timesteps | 369280 | -| train/ | | -| approx_kl | 0.0076805046 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.691 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00773 | -| n_updates | 28840 | -| policy_gradient_loss | -0.00381 | -| std | 0.483 | -| value_loss | 6.98e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2886 | -| time_elapsed | 30218 | -| total_timesteps | 369408 | -| train/ | | -| approx_kl | 0.0030328599 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.69 | -| explained_variance | -83.5 | -| learning_rate | 0.0003 | -| loss | -0.00773 | -| n_updates | 28850 | -| policy_gradient_loss | -0.00176 | -| std | 0.482 | -| value_loss | 6.21e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2887 | -| time_elapsed | 30222 | -| total_timesteps | 369536 | -| train/ | | -| approx_kl | 0.00020182994 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.689 | -| explained_variance | -0.317 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 28860 | -| policy_gradient_loss | 0.0013 | -| std | 0.482 | -| value_loss | 8.45e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2888 | -| time_elapsed | 30224 | -| total_timesteps | 369664 | -| train/ | | -| approx_kl | 0.024509242 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | -0.688 | -| explained_variance | -0.0862 | -| learning_rate | 0.0003 | -| loss | -0.00793 | -| n_updates | 28870 | -| policy_gradient_loss | -0.00769 | -| std | 0.482 | -| value_loss | 3.62e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2889 | -| time_elapsed | 30228 | -| total_timesteps | 369792 | -| train/ | | -| approx_kl | 0.007911539 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.688 | -| explained_variance | -0.849 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 28880 | -| policy_gradient_loss | -0.00145 | -| std | 0.481 | -| value_loss | 1.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2890 | -| time_elapsed | 30231 | -| total_timesteps | 369920 | -| train/ | | -| approx_kl | 0.0085194735 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.686 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | -0.00076 | -| n_updates | 28890 | -| policy_gradient_loss | -0.00102 | -| std | 0.479 | -| value_loss | 3.01e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2891 | -| time_elapsed | 30236 | -| total_timesteps | 370048 | -| train/ | | -| approx_kl | 0.008511282 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.682 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 28900 | -| policy_gradient_loss | -0.0019 | -| std | 0.478 | -| value_loss | 2.43e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2892 | -| time_elapsed | 30242 | -| total_timesteps | 370176 | -| train/ | | -| approx_kl | 0.0060941367 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.681 | -| explained_variance | -0.437 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 28910 | -| policy_gradient_loss | -0.00346 | -| std | 0.478 | -| value_loss | 0.00177 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2893 | -| time_elapsed | 30246 | -| total_timesteps | 370304 | -| train/ | | -| approx_kl | 0.00018690946 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.682 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 28920 | -| policy_gradient_loss | 0.00215 | -| std | 0.479 | -| value_loss | 4.61e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2894 | -| time_elapsed | 30249 | -| total_timesteps | 370432 | -| train/ | | -| approx_kl | 0.0125044715 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.682 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 28930 | -| policy_gradient_loss | -0.000992 | -| std | 0.478 | -| value_loss | 1.89e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2895 | -| time_elapsed | 30251 | -| total_timesteps | 370560 | -| train/ | | -| approx_kl | 0.008596292 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.681 | -| explained_variance | -53.1 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 28940 | -| policy_gradient_loss | -0.00805 | -| std | 0.478 | -| value_loss | 1.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2896 | -| time_elapsed | 30254 | -| total_timesteps | 370688 | -| train/ | | -| approx_kl | 0.018652005 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.681 | -| explained_variance | -5.2 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 28950 | -| policy_gradient_loss | -0.005 | -| std | 0.478 | -| value_loss | 7.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2897 | -| time_elapsed | 30257 | -| total_timesteps | 370816 | -| train/ | | -| approx_kl | 0.007989073 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.68 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 28960 | -| policy_gradient_loss | -0.00827 | -| std | 0.477 | -| value_loss | 4.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2898 | -| time_elapsed | 30260 | -| total_timesteps | 370944 | -| train/ | | -| approx_kl | 0.020783842 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.68 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 28970 | -| policy_gradient_loss | -0.00485 | -| std | 0.478 | -| value_loss | 5.11e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2899 | -| time_elapsed | 30264 | -| total_timesteps | 371072 | -| train/ | | -| approx_kl | 0.0072892504 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.681 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 28980 | -| policy_gradient_loss | -0.00736 | -| std | 0.479 | -| value_loss | 2.73e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2900 | -| time_elapsed | 30270 | -| total_timesteps | 371200 | -| train/ | | -| approx_kl | 0.008895357 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.683 | -| explained_variance | 0.578 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 28990 | -| policy_gradient_loss | -0.0126 | -| std | 0.479 | -| value_loss | 0.00147 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2901 | -| time_elapsed | 30273 | -| total_timesteps | 371328 | -| train/ | | -| approx_kl | 0.004216817 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.683 | -| explained_variance | -15.6 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 29000 | -| policy_gradient_loss | -0.000963 | -| std | 0.479 | -| value_loss | 7.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2902 | -| time_elapsed | 30276 | -| total_timesteps | 371456 | -| train/ | | -| approx_kl | 0.012001417 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.682 | -| explained_variance | -54.9 | -| learning_rate | 0.0003 | -| loss | -0.000649 | -| n_updates | 29010 | -| policy_gradient_loss | -0.00093 | -| std | 0.478 | -| value_loss | 3.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2903 | -| time_elapsed | 30278 | -| total_timesteps | 371584 | -| train/ | | -| approx_kl | 0.01315907 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.679 | -| explained_variance | -10.2 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 29020 | -| policy_gradient_loss | -0.00642 | -| std | 0.477 | -| value_loss | 1.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2904 | -| time_elapsed | 30282 | -| total_timesteps | 371712 | -| train/ | | -| approx_kl | 0.007758582 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.678 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.000655 | -| n_updates | 29030 | -| policy_gradient_loss | -0.000918 | -| std | 0.476 | -| value_loss | 2.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2905 | -| time_elapsed | 30285 | -| total_timesteps | 371840 | -| train/ | | -| approx_kl | 0.00723256 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.675 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | -0.0044 | -| n_updates | 29040 | -| policy_gradient_loss | -0.00161 | -| std | 0.475 | -| value_loss | 1.49e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2906 | -| time_elapsed | 30288 | -| total_timesteps | 371968 | -| train/ | | -| approx_kl | 0.00014054636 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.675 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 29050 | -| policy_gradient_loss | 0.00112 | -| std | 0.475 | -| value_loss | 1.66e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2907 | -| time_elapsed | 30291 | -| total_timesteps | 372096 | -| train/ | | -| approx_kl | 0.006962959 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.674 | -| explained_variance | -0.0061 | -| learning_rate | 0.0003 | -| loss | -0.000433 | -| n_updates | 29060 | -| policy_gradient_loss | -0.000627 | -| std | 0.475 | -| value_loss | 1.1e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2908 | -| time_elapsed | 30299 | -| total_timesteps | 372224 | -| train/ | | -| approx_kl | 0.0013358514 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.674 | -| explained_variance | 0.619 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 29070 | -| policy_gradient_loss | -0.00695 | -| std | 0.475 | -| value_loss | 0.00757 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2909 | -| time_elapsed | 30302 | -| total_timesteps | 372352 | -| train/ | | -| approx_kl | 0.0071491534 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.674 | -| explained_variance | 0.146 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 29080 | -| policy_gradient_loss | -0.00106 | -| std | 0.474 | -| value_loss | 4.73e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2910 | -| time_elapsed | 30306 | -| total_timesteps | 372480 | -| train/ | | -| approx_kl | 0.0081584845 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.673 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.00362 | -| n_updates | 29090 | -| policy_gradient_loss | -0.00164 | -| std | 0.474 | -| value_loss | 2.12e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2911 | -| time_elapsed | 30309 | -| total_timesteps | 372608 | -| train/ | | -| approx_kl | 0.014261037 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.672 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.000632 | -| n_updates | 29100 | -| policy_gradient_loss | -0.00209 | -| std | 0.473 | -| value_loss | 8.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2912 | -| time_elapsed | 30311 | -| total_timesteps | 372736 | -| train/ | | -| approx_kl | 0.005993095 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.671 | -| explained_variance | 0.00601 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 29110 | -| policy_gradient_loss | -0.00331 | -| std | 0.473 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2913 | -| time_elapsed | 30315 | -| total_timesteps | 372864 | -| train/ | | -| approx_kl | 0.013568748 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | -0.67 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 29120 | -| policy_gradient_loss | -0.00687 | -| std | 0.472 | -| value_loss | 9.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2914 | -| time_elapsed | 30318 | -| total_timesteps | 372992 | -| train/ | | -| approx_kl | 0.016185211 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 29130 | -| policy_gradient_loss | -0.00692 | -| std | 0.472 | -| value_loss | 1.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2915 | -| time_elapsed | 30321 | -| total_timesteps | 373120 | -| train/ | | -| approx_kl | 0.015433252 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.668 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | -0.00072 | -| n_updates | 29140 | -| policy_gradient_loss | -0.00324 | -| std | 0.472 | -| value_loss | 1.29e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2916 | -| time_elapsed | 30329 | -| total_timesteps | 373248 | -| train/ | | -| approx_kl | 0.00029624836 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | 0.727 | -| learning_rate | 0.0003 | -| loss | -0.000682 | -| n_updates | 29150 | -| policy_gradient_loss | -0.000768 | -| std | 0.473 | -| value_loss | 0.00278 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2917 | -| time_elapsed | 30332 | -| total_timesteps | 373376 | -| train/ | | -| approx_kl | 0.0062311525 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | -5.58 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 29160 | -| policy_gradient_loss | -0.00217 | -| std | 0.473 | -| value_loss | 2.11e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2918 | -| time_elapsed | 30336 | -| total_timesteps | 373504 | -| train/ | | -| approx_kl | 0.02183736 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.67 | -| explained_variance | -7.88 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 29170 | -| policy_gradient_loss | -0.00329 | -| std | 0.472 | -| value_loss | 3.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2919 | -| time_elapsed | 30340 | -| total_timesteps | 373632 | -| train/ | | -| approx_kl | 0.010641006 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.668 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 29180 | -| policy_gradient_loss | -0.00467 | -| std | 0.472 | -| value_loss | 1.08e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2920 | -| time_elapsed | 30344 | -| total_timesteps | 373760 | -| train/ | | -| approx_kl | 0.0076677743 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | 0.00775 | -| learning_rate | 0.0003 | -| loss | -0.00056 | -| n_updates | 29190 | -| policy_gradient_loss | -0.00134 | -| std | 0.471 | -| value_loss | 1.72e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.88 | -| time/ | | -| fps | 12 | -| iterations | 2921 | -| time_elapsed | 30348 | -| total_timesteps | 373888 | -| train/ | | -| approx_kl | 0.010420866 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 29200 | -| policy_gradient_loss | -0.00345 | -| std | 0.472 | -| value_loss | 1.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2922 | -| time_elapsed | 30351 | -| total_timesteps | 374016 | -| train/ | | -| approx_kl | 0.013484895 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.668 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 29210 | -| policy_gradient_loss | -0.00227 | -| std | 0.472 | -| value_loss | 2.98e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2923 | -| time_elapsed | 30360 | -| total_timesteps | 374144 | -| train/ | | -| approx_kl | 0.0025887075 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | 0.55 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 29220 | -| policy_gradient_loss | -0.00691 | -| std | 0.471 | -| value_loss | 0.00903 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2924 | -| time_elapsed | 30364 | -| total_timesteps | 374272 | -| train/ | | -| approx_kl | 0.01178571 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.666 | -| explained_variance | 0.251 | -| learning_rate | 0.0003 | -| loss | -0.00515 | -| n_updates | 29230 | -| policy_gradient_loss | -0.00309 | -| std | 0.471 | -| value_loss | 7.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2925 | -| time_elapsed | 30367 | -| total_timesteps | 374400 | -| train/ | | -| approx_kl | 0.005258777 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.665 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 29240 | -| policy_gradient_loss | -0.000966 | -| std | 0.471 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2926 | -| time_elapsed | 30369 | -| total_timesteps | 374528 | -| train/ | | -| approx_kl | 0.012688762 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.666 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 29250 | -| policy_gradient_loss | -0.00364 | -| std | 0.471 | -| value_loss | 5.55e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2927 | -| time_elapsed | 30373 | -| total_timesteps | 374656 | -| train/ | | -| approx_kl | 0.0109975105 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.666 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.0086 | -| n_updates | 29260 | -| policy_gradient_loss | -0.00427 | -| std | 0.471 | -| value_loss | 3.18e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2928 | -| time_elapsed | 30375 | -| total_timesteps | 374784 | -| train/ | | -| approx_kl | 0.0012454523 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -6.5e-05 | -| n_updates | 29270 | -| policy_gradient_loss | 0.000118 | -| std | 0.472 | -| value_loss | 3.29e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.89 | -| time/ | | -| fps | 12 | -| iterations | 2929 | -| time_elapsed | 30379 | -| total_timesteps | 374912 | -| train/ | | -| approx_kl | 0.011489729 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.67 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.00943 | -| n_updates | 29280 | -| policy_gradient_loss | -0.00398 | -| std | 0.473 | -| value_loss | 3.78e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2930 | -| time_elapsed | 30382 | -| total_timesteps | 375040 | -| train/ | | -| approx_kl | 0.0019318995 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.671 | -| explained_variance | -0.000293 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 29290 | -| policy_gradient_loss | -0.000447 | -| std | 0.474 | -| value_loss | 1.92e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2931 | -| time_elapsed | 30389 | -| total_timesteps | 375168 | -| train/ | | -| approx_kl | 0.011930339 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.672 | -| explained_variance | 0.606 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 29300 | -| policy_gradient_loss | -0.0126 | -| std | 0.474 | -| value_loss | 0.00585 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2932 | -| time_elapsed | 30393 | -| total_timesteps | 375296 | -| train/ | | -| approx_kl | 0.0056655286 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.672 | -| explained_variance | -0.453 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 29310 | -| policy_gradient_loss | -0.000495 | -| std | 0.473 | -| value_loss | 1.58e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2933 | -| time_elapsed | 30396 | -| total_timesteps | 375424 | -| train/ | | -| approx_kl | 0.014091583 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.67 | -| explained_variance | -8.08 | -| learning_rate | 0.0003 | -| loss | -0.0256 | -| n_updates | 29320 | -| policy_gradient_loss | -0.0127 | -| std | 0.473 | -| value_loss | 2.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2934 | -| time_elapsed | 30398 | -| total_timesteps | 375552 | -| train/ | | -| approx_kl | 0.005579819 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.67 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 29330 | -| policy_gradient_loss | -0.00492 | -| std | 0.473 | -| value_loss | 5.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2935 | -| time_elapsed | 30400 | -| total_timesteps | 375680 | -| train/ | | -| approx_kl | 0.011148962 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.67 | -| explained_variance | -0.625 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 29340 | -| policy_gradient_loss | 0.0005 | -| std | 0.473 | -| value_loss | 1.15e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2936 | -| time_elapsed | 30403 | -| total_timesteps | 375808 | -| train/ | | -| approx_kl | 0.0068672914 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.668 | -| explained_variance | -0.0804 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 29350 | -| policy_gradient_loss | -0.00275 | -| std | 0.472 | -| value_loss | 7.93e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2937 | -| time_elapsed | 30405 | -| total_timesteps | 375936 | -| train/ | | -| approx_kl | 0.005484282 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.666 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 29360 | -| policy_gradient_loss | -0.00123 | -| std | 0.47 | -| value_loss | 7.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2938 | -| time_elapsed | 30408 | -| total_timesteps | 376064 | -| train/ | | -| approx_kl | 0.017982285 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.663 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 29370 | -| policy_gradient_loss | -0.00376 | -| std | 0.469 | -| value_loss | 1.42e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2939 | -| time_elapsed | 30415 | -| total_timesteps | 376192 | -| train/ | | -| approx_kl | 0.0019969244 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.662 | -| explained_variance | 0.636 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 29380 | -| policy_gradient_loss | -0.0054 | -| std | 0.469 | -| value_loss | 0.00137 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2940 | -| time_elapsed | 30419 | -| total_timesteps | 376320 | -| train/ | | -| approx_kl | 0.001267452 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.662 | -| explained_variance | -13.4 | -| learning_rate | 0.0003 | -| loss | -1.77e-05 | -| n_updates | 29390 | -| policy_gradient_loss | -5.05e-06 | -| std | 0.469 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2941 | -| time_elapsed | 30422 | -| total_timesteps | 376448 | -| train/ | | -| approx_kl | 0.011319982 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.661 | -| explained_variance | -35.6 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 29400 | -| policy_gradient_loss | -0.00301 | -| std | 0.468 | -| value_loss | 5.9e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2942 | -| time_elapsed | 30426 | -| total_timesteps | 376576 | -| train/ | | -| approx_kl | 0.0018600638 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.658 | -| explained_variance | -5.17 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 29410 | -| policy_gradient_loss | -0.000239 | -| std | 0.467 | -| value_loss | 1.05e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2943 | -| time_elapsed | 30430 | -| total_timesteps | 376704 | -| train/ | | -| approx_kl | 0.018643318 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | -0.657 | -| explained_variance | -0.323 | -| learning_rate | 0.0003 | -| loss | 0.00023 | -| n_updates | 29420 | -| policy_gradient_loss | -0.00186 | -| std | 0.467 | -| value_loss | 2.53e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2944 | -| time_elapsed | 30433 | -| total_timesteps | 376832 | -| train/ | | -| approx_kl | 0.00507031 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.657 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 29430 | -| policy_gradient_loss | -0.000914 | -| std | 0.467 | -| value_loss | 2.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2945 | -| time_elapsed | 30437 | -| total_timesteps | 376960 | -| train/ | | -| approx_kl | 0.022092845 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.659 | -| explained_variance | 0.00442 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 29440 | -| policy_gradient_loss | -0.00773 | -| std | 0.468 | -| value_loss | 2.55e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2946 | -| time_elapsed | 30441 | -| total_timesteps | 377088 | -| train/ | | -| approx_kl | 0.0051732315 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.66 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 29450 | -| policy_gradient_loss | -0.000772 | -| std | 0.468 | -| value_loss | 1.47e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2947 | -| time_elapsed | 30450 | -| total_timesteps | 377216 | -| train/ | | -| approx_kl | 0.008264355 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.66 | -| explained_variance | 0.602 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 29460 | -| policy_gradient_loss | -0.00421 | -| std | 0.468 | -| value_loss | 0.00754 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2948 | -| time_elapsed | 30454 | -| total_timesteps | 377344 | -| train/ | | -| approx_kl | 0.0001091226 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.659 | -| explained_variance | -8.09 | -| learning_rate | 0.0003 | -| loss | -0.000118 | -| n_updates | 29470 | -| policy_gradient_loss | -1.09e-05 | -| std | 0.468 | -| value_loss | 2.66e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2949 | -| time_elapsed | 30457 | -| total_timesteps | 377472 | -| train/ | | -| approx_kl | 0.0069274562 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.658 | -| explained_variance | -5.1 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 29480 | -| policy_gradient_loss | -0.00315 | -| std | 0.467 | -| value_loss | 1.32e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2950 | -| time_elapsed | 30459 | -| total_timesteps | 377600 | -| train/ | | -| approx_kl | 0.02215557 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.657 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 29490 | -| policy_gradient_loss | -0.0112 | -| std | 0.466 | -| value_loss | 5.22e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2951 | -| time_elapsed | 30464 | -| total_timesteps | 377728 | -| train/ | | -| approx_kl | 0.0065653874 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.655 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 29500 | -| policy_gradient_loss | -0.00159 | -| std | 0.465 | -| value_loss | 5.83e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2952 | -| time_elapsed | 30467 | -| total_timesteps | 377856 | -| train/ | | -| approx_kl | 0.01115683 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.654 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 29510 | -| policy_gradient_loss | -0.0121 | -| std | 0.465 | -| value_loss | 1.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.9 | -| time/ | | -| fps | 12 | -| iterations | 2953 | -| time_elapsed | 30471 | -| total_timesteps | 377984 | -| train/ | | -| approx_kl | 0.018441789 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | -0.654 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 29520 | -| policy_gradient_loss | -0.00513 | -| std | 0.465 | -| value_loss | 4.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2954 | -| time_elapsed | 30474 | -| total_timesteps | 378112 | -| train/ | | -| approx_kl | 0.009512694 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.654 | -| explained_variance | 3.15e-05 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 29530 | -| policy_gradient_loss | -0.00278 | -| std | 0.466 | -| value_loss | 2.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2955 | -| time_elapsed | 30484 | -| total_timesteps | 378240 | -| train/ | | -| approx_kl | 0.018641705 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.656 | -| explained_variance | 0.681 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 29540 | -| policy_gradient_loss | -0.00144 | -| std | 0.466 | -| value_loss | 0.00344 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2956 | -| time_elapsed | 30487 | -| total_timesteps | 378368 | -| train/ | | -| approx_kl | 0.0011405139 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.656 | -| explained_variance | -27.6 | -| learning_rate | 0.0003 | -| loss | -8.86e-05 | -| n_updates | 29550 | -| policy_gradient_loss | -4.56e-05 | -| std | 0.467 | -| value_loss | 2.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2957 | -| time_elapsed | 30492 | -| total_timesteps | 378496 | -| train/ | | -| approx_kl | 0.012393278 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.657 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 29560 | -| policy_gradient_loss | -0.0034 | -| std | 0.467 | -| value_loss | 4.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2958 | -| time_elapsed | 30496 | -| total_timesteps | 378624 | -| train/ | | -| approx_kl | 0.016383277 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.658 | -| explained_variance | -0.792 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 29570 | -| policy_gradient_loss | -0.00189 | -| std | 0.468 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2959 | -| time_elapsed | 30498 | -| total_timesteps | 378752 | -| train/ | | -| approx_kl | 0.007635549 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.659 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 29580 | -| policy_gradient_loss | -0.0019 | -| std | 0.468 | -| value_loss | 6.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2960 | -| time_elapsed | 30501 | -| total_timesteps | 378880 | -| train/ | | -| approx_kl | 0.007981591 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.661 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.000503 | -| n_updates | 29590 | -| policy_gradient_loss | -0.000721 | -| std | 0.469 | -| value_loss | 5.36e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2961 | -| time_elapsed | 30504 | -| total_timesteps | 379008 | -| train/ | | -| approx_kl | 2.1241838e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.664 | -| explained_variance | 0.00765 | -| learning_rate | 0.0003 | -| loss | -0.000396 | -| n_updates | 29600 | -| policy_gradient_loss | -0.000177 | -| std | 0.471 | -| value_loss | 3.15e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2962 | -| time_elapsed | 30513 | -| total_timesteps | 379136 | -| train/ | | -| approx_kl | 0.0039016781 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | 0.677 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 29610 | -| policy_gradient_loss | -0.00621 | -| std | 0.472 | -| value_loss | 0.00119 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2963 | -| time_elapsed | 30516 | -| total_timesteps | 379264 | -| train/ | | -| approx_kl | 0.0007407067 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.0003 | -| n_updates | 29620 | -| policy_gradient_loss | 0.000216 | -| std | 0.472 | -| value_loss | 1.31e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2964 | -| time_elapsed | 30520 | -| total_timesteps | 379392 | -| train/ | | -| approx_kl | 0.0065424917 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | -46 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 29630 | -| policy_gradient_loss | -0.000933 | -| std | 0.472 | -| value_loss | 2.55e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2965 | -| time_elapsed | 30524 | -| total_timesteps | 379520 | -| train/ | | -| approx_kl | 0.00062648486 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | -24.4 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 29640 | -| policy_gradient_loss | -0.0001 | -| std | 0.473 | -| value_loss | 1.94e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2966 | -| time_elapsed | 30528 | -| total_timesteps | 379648 | -| train/ | | -| approx_kl | 0.01559836 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.671 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 29650 | -| policy_gradient_loss | -0.00397 | -| std | 0.474 | -| value_loss | 5.59e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2967 | -| time_elapsed | 30532 | -| total_timesteps | 379776 | -| train/ | | -| approx_kl | 0.005605975 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.672 | -| explained_variance | 0.0081 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 29660 | -| policy_gradient_loss | -0.00359 | -| std | 0.474 | -| value_loss | 2.93e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2968 | -| time_elapsed | 30536 | -| total_timesteps | 379904 | -| train/ | | -| approx_kl | 3.896421e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.673 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | -0.000181 | -| n_updates | 29670 | -| policy_gradient_loss | 0.00138 | -| std | 0.475 | -| value_loss | 3.49e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2969 | -| time_elapsed | 30538 | -| total_timesteps | 380032 | -| train/ | | -| approx_kl | 0.00084026274 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.674 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 29680 | -| policy_gradient_loss | -1.14e-05 | -| std | 0.475 | -| value_loss | 1.1e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2970 | -| time_elapsed | 30545 | -| total_timesteps | 380160 | -| train/ | | -| approx_kl | 0.0032353848 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.675 | -| explained_variance | 0.603 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 29690 | -| policy_gradient_loss | -0.00222 | -| std | 0.475 | -| value_loss | 0.00735 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2971 | -| time_elapsed | 30550 | -| total_timesteps | 380288 | -| train/ | | -| approx_kl | 0.0034494447 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.673 | -| explained_variance | 0.229 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 29700 | -| policy_gradient_loss | -0.00069 | -| std | 0.474 | -| value_loss | 1.95e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2972 | -| time_elapsed | 30554 | -| total_timesteps | 380416 | -| train/ | | -| approx_kl | 0.0036755754 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.671 | -| explained_variance | -20.9 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 29710 | -| policy_gradient_loss | -0.00218 | -| std | 0.472 | -| value_loss | 2.91e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2973 | -| time_elapsed | 30557 | -| total_timesteps | 380544 | -| train/ | | -| approx_kl | 0.025407627 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.668 | -| explained_variance | -2.89 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 29720 | -| policy_gradient_loss | -0.00562 | -| std | 0.471 | -| value_loss | 6.58e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2974 | -| time_elapsed | 30561 | -| total_timesteps | 380672 | -| train/ | | -| approx_kl | 0.015681362 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | -0.704 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 29730 | -| policy_gradient_loss | -0.00357 | -| std | 0.471 | -| value_loss | 3.59e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2975 | -| time_elapsed | 30565 | -| total_timesteps | 380800 | -| train/ | | -| approx_kl | 0.0044138245 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.000558 | -| n_updates | 29740 | -| policy_gradient_loss | -0.000683 | -| std | 0.472 | -| value_loss | 2.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.92 | -| time/ | | -| fps | 12 | -| iterations | 2976 | -| time_elapsed | 30568 | -| total_timesteps | 380928 | -| train/ | | -| approx_kl | 0.003233932 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.668 | -| explained_variance | 0.00168 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 29750 | -| policy_gradient_loss | -0.00154 | -| std | 0.472 | -| value_loss | 1.85e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2977 | -| time_elapsed | 30573 | -| total_timesteps | 381056 | -| train/ | | -| approx_kl | 0.0038987978 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.669 | -| explained_variance | -0.0942 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 29760 | -| policy_gradient_loss | 0.000487 | -| std | 0.472 | -| value_loss | 2.18e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2978 | -| time_elapsed | 30579 | -| total_timesteps | 381184 | -| train/ | | -| approx_kl | 0.00067642424 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.667 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | -0.00414 | -| n_updates | 29770 | -| policy_gradient_loss | -0.00269 | -| std | 0.471 | -| value_loss | 0.00479 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2979 | -| time_elapsed | 30581 | -| total_timesteps | 381312 | -| train/ | | -| approx_kl | 0.005271434 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.664 | -| explained_variance | 0.0314 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 29780 | -| policy_gradient_loss | -0.00163 | -| std | 0.468 | -| value_loss | 1.83e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2980 | -| time_elapsed | 30584 | -| total_timesteps | 381440 | -| train/ | | -| approx_kl | 0.006618253 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.658 | -| explained_variance | 0.0267 | -| learning_rate | 0.0003 | -| loss | -0.000301 | -| n_updates | 29790 | -| policy_gradient_loss | -0.000747 | -| std | 0.467 | -| value_loss | 5.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2981 | -| time_elapsed | 30587 | -| total_timesteps | 381568 | -| train/ | | -| approx_kl | 0.005367124 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.656 | -| explained_variance | 0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0548 | -| n_updates | 29800 | -| policy_gradient_loss | -0.00182 | -| std | 0.466 | -| value_loss | 0.142 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2982 | -| time_elapsed | 30591 | -| total_timesteps | 381696 | -| train/ | | -| approx_kl | 0.008705151 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.655 | -| explained_variance | -0.0782 | -| learning_rate | 0.0003 | -| loss | 0.00698 | -| n_updates | 29810 | -| policy_gradient_loss | 0.00048 | -| std | 0.466 | -| value_loss | 0.015 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2983 | -| time_elapsed | 30595 | -| total_timesteps | 381824 | -| train/ | | -| approx_kl | 0.014083677 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.655 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.00767 | -| n_updates | 29820 | -| policy_gradient_loss | -0.00585 | -| std | 0.466 | -| value_loss | 0.00598 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 12 | -| iterations | 2984 | -| time_elapsed | 30599 | -| total_timesteps | 381952 | -| train/ | | -| approx_kl | 0.004921659 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.656 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 29830 | -| policy_gradient_loss | -0.0035 | -| std | 0.466 | -| value_loss | 0.00197 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2985 | -| time_elapsed | 30603 | -| total_timesteps | 382080 | -| train/ | | -| approx_kl | 0.015743779 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.654 | -| explained_variance | -0.0658 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 29840 | -| policy_gradient_loss | -0.0042 | -| std | 0.465 | -| value_loss | 0.00105 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2986 | -| time_elapsed | 30609 | -| total_timesteps | 382208 | -| train/ | | -| approx_kl | 0.010788517 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.654 | -| explained_variance | 0.45 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 29850 | -| policy_gradient_loss | -0.00711 | -| std | 0.465 | -| value_loss | 0.00423 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2987 | -| time_elapsed | 30612 | -| total_timesteps | 382336 | -| train/ | | -| approx_kl | 0.00013458403 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.653 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.000757 | -| n_updates | 29860 | -| policy_gradient_loss | -1.82e-05 | -| std | 0.464 | -| value_loss | 0.000269 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2988 | -| time_elapsed | 30615 | -| total_timesteps | 382464 | -| train/ | | -| approx_kl | 0.009018475 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.649 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 29870 | -| policy_gradient_loss | -0.00203 | -| std | 0.462 | -| value_loss | 0.000325 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2989 | -| time_elapsed | 30620 | -| total_timesteps | 382592 | -| train/ | | -| approx_kl | 0.0055140257 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.646 | -| explained_variance | -0.0628 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 29880 | -| policy_gradient_loss | -0.00118 | -| std | 0.461 | -| value_loss | 0.000137 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2990 | -| time_elapsed | 30623 | -| total_timesteps | 382720 | -| train/ | | -| approx_kl | 0.0050338577 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.644 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 29890 | -| policy_gradient_loss | -0.000734 | -| std | 0.46 | -| value_loss | 0.00012 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2991 | -| time_elapsed | 30627 | -| total_timesteps | 382848 | -| train/ | | -| approx_kl | 0.0033765337 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.643 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 29900 | -| policy_gradient_loss | -0.00143 | -| std | 0.46 | -| value_loss | 0.000109 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.98 | -| time/ | | -| fps | 12 | -| iterations | 2992 | -| time_elapsed | 30631 | -| total_timesteps | 382976 | -| train/ | | -| approx_kl | 0.0007647865 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.643 | -| explained_variance | -0.0804 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 29910 | -| policy_gradient_loss | 8.48e-05 | -| std | 0.46 | -| value_loss | 3.27e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2993 | -| time_elapsed | 30635 | -| total_timesteps | 383104 | -| train/ | | -| approx_kl | 0.01548933 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.642 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 29920 | -| policy_gradient_loss | -0.0108 | -| std | 0.46 | -| value_loss | 2.1e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2994 | -| time_elapsed | 30643 | -| total_timesteps | 383232 | -| train/ | | -| approx_kl | 0.007653989 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.642 | -| explained_variance | 0.602 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 29930 | -| policy_gradient_loss | -0.00317 | -| std | 0.46 | -| value_loss | 0.00443 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2995 | -| time_elapsed | 30647 | -| total_timesteps | 383360 | -| train/ | | -| approx_kl | 0.0026627767 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.642 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.817 | -| n_updates | 29940 | -| policy_gradient_loss | 0.00147 | -| std | 0.46 | -| value_loss | 2.07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2996 | -| time_elapsed | 30650 | -| total_timesteps | 383488 | -| train/ | | -| approx_kl | 0.0060554827 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 29950 | -| policy_gradient_loss | -0.00222 | -| std | 0.459 | -| value_loss | 0.0437 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2997 | -| time_elapsed | 30654 | -| total_timesteps | 383616 | -| train/ | | -| approx_kl | 0.017274138 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | -0.000354 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 29960 | -| policy_gradient_loss | -0.00594 | -| std | 0.459 | -| value_loss | 0.00685 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2998 | -| time_elapsed | 30658 | -| total_timesteps | 383744 | -| train/ | | -| approx_kl | 0.0056785527 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | 0.00142 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 29970 | -| policy_gradient_loss | -0.00477 | -| std | 0.459 | -| value_loss | 0.269 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 12 | -| iterations | 2999 | -| time_elapsed | 30661 | -| total_timesteps | 383872 | -| train/ | | -| approx_kl | 0.019457057 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | 0.00267 | -| learning_rate | 0.0003 | -| loss | 0.0992 | -| n_updates | 29980 | -| policy_gradient_loss | -0.0105 | -| std | 0.459 | -| value_loss | 0.272 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3000 | -| time_elapsed | 30665 | -| total_timesteps | 384000 | -| train/ | | -| approx_kl | 0.0040950896 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | 0.00147 | -| learning_rate | 0.0003 | -| loss | 0.73 | -| n_updates | 29990 | -| policy_gradient_loss | -0.00276 | -| std | 0.46 | -| value_loss | 1.83 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3001 | -| time_elapsed | 30667 | -| total_timesteps | 384128 | -| train/ | | -| approx_kl | 0.0007539191 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.642 | -| explained_variance | -0.00183 | -| learning_rate | 0.0003 | -| loss | 0.096 | -| n_updates | 30000 | -| policy_gradient_loss | -4.73e-05 | -| std | 0.46 | -| value_loss | 0.207 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3002 | -| time_elapsed | 30674 | -| total_timesteps | 384256 | -| train/ | | -| approx_kl | 0.081290096 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | 0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 30010 | -| policy_gradient_loss | -0.00561 | -| std | 0.459 | -| value_loss | 0.0188 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3003 | -| time_elapsed | 30678 | -| total_timesteps | 384384 | -| train/ | | -| approx_kl | 0.00014891056 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | 0.00135 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 30020 | -| policy_gradient_loss | 0.000369 | -| std | 0.458 | -| value_loss | 0.017 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3004 | -| time_elapsed | 30681 | -| total_timesteps | 384512 | -| train/ | | -| approx_kl | 0.0028792592 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.638 | -| explained_variance | 0.000515 | -| learning_rate | 0.0003 | -| loss | -0.000934 | -| n_updates | 30030 | -| policy_gradient_loss | -0.000786 | -| std | 0.458 | -| value_loss | 0.00769 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3005 | -| time_elapsed | 30684 | -| total_timesteps | 384640 | -| train/ | | -| approx_kl | 0.00061336625 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | 0.00253 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 30040 | -| policy_gradient_loss | 0.000547 | -| std | 0.459 | -| value_loss | 0.0907 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3006 | -| time_elapsed | 30688 | -| total_timesteps | 384768 | -| train/ | | -| approx_kl | 0.0070056026 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | 0.00129 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 30050 | -| policy_gradient_loss | -0.00191 | -| std | 0.459 | -| value_loss | 0.0856 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.29 | -| time/ | | -| fps | 12 | -| iterations | 3007 | -| time_elapsed | 30690 | -| total_timesteps | 384896 | -| train/ | | -| approx_kl | 0.004582934 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | 0.00378 | -| learning_rate | 0.0003 | -| loss | 0.00232 | -| n_updates | 30060 | -| policy_gradient_loss | -0.00156 | -| std | 0.46 | -| value_loss | 0.00996 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3008 | -| time_elapsed | 30693 | -| total_timesteps | 385024 | -| train/ | | -| approx_kl | 0.0015009607 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.642 | -| explained_variance | 0.000634 | -| learning_rate | 0.0003 | -| loss | 0.00222 | -| n_updates | 30070 | -| policy_gradient_loss | -0.000887 | -| std | 0.459 | -| value_loss | 0.0245 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3009 | -| time_elapsed | 30702 | -| total_timesteps | 385152 | -| train/ | | -| approx_kl | 6.556767e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.641 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.052 | -| n_updates | 30080 | -| policy_gradient_loss | 0.000645 | -| std | 0.459 | -| value_loss | 0.128 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3010 | -| time_elapsed | 30705 | -| total_timesteps | 385280 | -| train/ | | -| approx_kl | 0.0010792695 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | -0.000802 | -| learning_rate | 0.0003 | -| loss | -0.000917 | -| n_updates | 30090 | -| policy_gradient_loss | -8.45e-05 | -| std | 0.459 | -| value_loss | 0.00755 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3011 | -| time_elapsed | 30709 | -| total_timesteps | 385408 | -| train/ | | -| approx_kl | 0.0011544486 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | 0.00286 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 30100 | -| policy_gradient_loss | 0.00104 | -| std | 0.459 | -| value_loss | 0.434 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3012 | -| time_elapsed | 30713 | -| total_timesteps | 385536 | -| train/ | | -| approx_kl | 0.0035758377 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.64 | -| explained_variance | 0.00319 | -| learning_rate | 0.0003 | -| loss | 0.0807 | -| n_updates | 30110 | -| policy_gradient_loss | -0.00132 | -| std | 0.459 | -| value_loss | 0.205 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3013 | -| time_elapsed | 30717 | -| total_timesteps | 385664 | -| train/ | | -| approx_kl | 0.00017137919 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.639 | -| explained_variance | 0.00242 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 30120 | -| policy_gradient_loss | 0.00168 | -| std | 0.458 | -| value_loss | 0.0387 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3014 | -| time_elapsed | 30720 | -| total_timesteps | 385792 | -| train/ | | -| approx_kl | 0.0154976975 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.638 | -| explained_variance | 0.00254 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 30130 | -| policy_gradient_loss | -0.00533 | -| std | 0.458 | -| value_loss | 0.259 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.39 | -| time/ | | -| fps | 12 | -| iterations | 3015 | -| time_elapsed | 30724 | -| total_timesteps | 385920 | -| train/ | | -| approx_kl | 0.00841174 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.636 | -| explained_variance | 0.00248 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 30140 | -| policy_gradient_loss | -0.00484 | -| std | 0.457 | -| value_loss | 0.0237 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3016 | -| time_elapsed | 30728 | -| total_timesteps | 386048 | -| train/ | | -| approx_kl | 0.014512943 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.634 | -| explained_variance | 2.61e-05 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 30150 | -| policy_gradient_loss | -0.0083 | -| std | 0.456 | -| value_loss | 0.0325 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3017 | -| time_elapsed | 30734 | -| total_timesteps | 386176 | -| train/ | | -| approx_kl | 0.0019697794 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.632 | -| explained_variance | 0.00254 | -| learning_rate | 0.0003 | -| loss | 0.328 | -| n_updates | 30160 | -| policy_gradient_loss | -0.00143 | -| std | 0.455 | -| value_loss | 0.676 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3018 | -| time_elapsed | 30737 | -| total_timesteps | 386304 | -| train/ | | -| approx_kl | 0.0012130667 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.63 | -| explained_variance | 0.00014 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 30170 | -| policy_gradient_loss | -0.000382 | -| std | 0.454 | -| value_loss | 0.0417 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3019 | -| time_elapsed | 30740 | -| total_timesteps | 386432 | -| train/ | | -| approx_kl | 0.0006044335 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.63 | -| explained_variance | -5.29e-05 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 30180 | -| policy_gradient_loss | 3.05e-05 | -| std | 0.454 | -| value_loss | 0.0252 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3020 | -| time_elapsed | 30743 | -| total_timesteps | 386560 | -| train/ | | -| approx_kl | 0.0118358135 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -0.631 | -| explained_variance | -0.000314 | -| learning_rate | 0.0003 | -| loss | 0.00322 | -| n_updates | 30190 | -| policy_gradient_loss | -0.0014 | -| std | 0.455 | -| value_loss | 0.0204 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3021 | -| time_elapsed | 30746 | -| total_timesteps | 386688 | -| train/ | | -| approx_kl | 0.0015617386 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.00109 | -| learning_rate | 0.0003 | -| loss | 0.000882 | -| n_updates | 30200 | -| policy_gradient_loss | -0.000287 | -| std | 0.456 | -| value_loss | 0.0143 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3022 | -| time_elapsed | 30749 | -| total_timesteps | 386816 | -| train/ | | -| approx_kl | 0.003988897 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.634 | -| explained_variance | -0.00469 | -| learning_rate | 0.0003 | -| loss | -0.00897 | -| n_updates | 30210 | -| policy_gradient_loss | -0.0028 | -| std | 0.456 | -| value_loss | 0.0103 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3023 | -| time_elapsed | 30753 | -| total_timesteps | 386944 | -| train/ | | -| approx_kl | 0.0133386515 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.634 | -| explained_variance | -0.00899 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 30220 | -| policy_gradient_loss | -0.00285 | -| std | 0.456 | -| value_loss | 0.00661 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3024 | -| time_elapsed | 30756 | -| total_timesteps | 387072 | -| train/ | | -| approx_kl | 0.008519346 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.634 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 30230 | -| policy_gradient_loss | -0.0031 | -| std | 0.456 | -| value_loss | 0.00386 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3025 | -| time_elapsed | 30762 | -| total_timesteps | 387200 | -| train/ | | -| approx_kl | 0.00018948037 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | 0.122 | -| learning_rate | 0.0003 | -| loss | 0.00315 | -| n_updates | 30240 | -| policy_gradient_loss | -0.000244 | -| std | 0.456 | -| value_loss | 0.0214 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3026 | -| time_elapsed | 30766 | -| total_timesteps | 387328 | -| train/ | | -| approx_kl | 0.018507639 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.364 | -| learning_rate | 0.0003 | -| loss | -0.00746 | -| n_updates | 30250 | -| policy_gradient_loss | -0.0065 | -| std | 0.456 | -| value_loss | 0.00121 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3027 | -| time_elapsed | 30768 | -| total_timesteps | 387456 | -| train/ | | -| approx_kl | 0.006091969 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.000942 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 30260 | -| policy_gradient_loss | -0.00123 | -| std | 0.456 | -| value_loss | 0.00112 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3028 | -| time_elapsed | 30772 | -| total_timesteps | 387584 | -| train/ | | -| approx_kl | 0.021413622 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 30270 | -| policy_gradient_loss | -0.00601 | -| std | 0.456 | -| value_loss | 0.00203 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3029 | -| time_elapsed | 30774 | -| total_timesteps | 387712 | -| train/ | | -| approx_kl | 0.009580957 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 30280 | -| policy_gradient_loss | -0.00404 | -| std | 0.456 | -| value_loss | 0.000536 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3030 | -| time_elapsed | 30778 | -| total_timesteps | 387840 | -| train/ | | -| approx_kl | 0.0005405573 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.000604 | -| n_updates | 30290 | -| policy_gradient_loss | 0.000481 | -| std | 0.456 | -| value_loss | 0.000341 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 12 | -| iterations | 3031 | -| time_elapsed | 30782 | -| total_timesteps | 387968 | -| train/ | | -| approx_kl | 0.011759346 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.634 | -| explained_variance | -0.0056 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 30300 | -| policy_gradient_loss | -0.00862 | -| std | 0.456 | -| value_loss | 0.000506 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3032 | -| time_elapsed | 30787 | -| total_timesteps | 388096 | -| train/ | | -| approx_kl | 0.00012946734 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.633 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 30310 | -| policy_gradient_loss | 2.95e-05 | -| std | 0.454 | -| value_loss | 0.00018 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3033 | -| time_elapsed | 30795 | -| total_timesteps | 388224 | -| train/ | | -| approx_kl | 0.0057391394 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.628 | -| explained_variance | 0.587 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 30320 | -| policy_gradient_loss | -0.00437 | -| std | 0.453 | -| value_loss | 0.00454 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3034 | -| time_elapsed | 30798 | -| total_timesteps | 388352 | -| train/ | | -| approx_kl | 0.008604272 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.626 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.000464 | -| n_updates | 30330 | -| policy_gradient_loss | -0.00113 | -| std | 0.452 | -| value_loss | 0.000129 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3035 | -| time_elapsed | 30801 | -| total_timesteps | 388480 | -| train/ | | -| approx_kl | 0.0074765747 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.624 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 30340 | -| policy_gradient_loss | -0.00503 | -| std | 0.451 | -| value_loss | 9.51e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3036 | -| time_elapsed | 30804 | -| total_timesteps | 388608 | -| train/ | | -| approx_kl | 4.0705083e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.622 | -| explained_variance | -0.0944 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 30350 | -| policy_gradient_loss | 0.00273 | -| std | 0.45 | -| value_loss | 0.000107 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3037 | -| time_elapsed | 30807 | -| total_timesteps | 388736 | -| train/ | | -| approx_kl | 0.019236924 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 30360 | -| policy_gradient_loss | -0.00742 | -| std | 0.45 | -| value_loss | 2.71e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3038 | -| time_elapsed | 30810 | -| total_timesteps | 388864 | -| train/ | | -| approx_kl | 0.0052646454 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00915 | -| n_updates | 30370 | -| policy_gradient_loss | -0.00331 | -| std | 0.45 | -| value_loss | 3.53e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3039 | -| time_elapsed | 30813 | -| total_timesteps | 388992 | -| train/ | | -| approx_kl | 6.9281086e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 30380 | -| policy_gradient_loss | 0.00486 | -| std | 0.45 | -| value_loss | 4.59e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3040 | -| time_elapsed | 30816 | -| total_timesteps | 389120 | -| train/ | | -| approx_kl | 0.00083015254 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 30390 | -| policy_gradient_loss | 8.97e-05 | -| std | 0.45 | -| value_loss | 1.57e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3041 | -| time_elapsed | 30826 | -| total_timesteps | 389248 | -| train/ | | -| approx_kl | 0.027866697 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 30400 | -| policy_gradient_loss | -0.00547 | -| std | 0.448 | -| value_loss | 0.00184 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3042 | -| time_elapsed | 30830 | -| total_timesteps | 389376 | -| train/ | | -| approx_kl | 0.0021527598 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.614 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 30410 | -| policy_gradient_loss | -0.000402 | -| std | 0.447 | -| value_loss | 1.03e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3043 | -| time_elapsed | 30833 | -| total_timesteps | 389504 | -| train/ | | -| approx_kl | 0.014492296 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.612 | -| explained_variance | -0.082 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 30420 | -| policy_gradient_loss | -0.000297 | -| std | 0.446 | -| value_loss | 9.01e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3044 | -| time_elapsed | 30836 | -| total_timesteps | 389632 | -| train/ | | -| approx_kl | 0.00011001341 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.611 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | -0.0002 | -| n_updates | 30430 | -| policy_gradient_loss | -8.08e-05 | -| std | 0.445 | -| value_loss | 8.22e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3045 | -| time_elapsed | 30839 | -| total_timesteps | 389760 | -| train/ | | -| approx_kl | 0.008837107 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -0.00658 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 30440 | -| policy_gradient_loss | -0.00173 | -| std | 0.443 | -| value_loss | 7.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.6 | -| time/ | | -| fps | 12 | -| iterations | 3046 | -| time_elapsed | 30843 | -| total_timesteps | 389888 | -| train/ | | -| approx_kl | 0.012313975 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 30450 | -| policy_gradient_loss | -0.00598 | -| std | 0.441 | -| value_loss | 6.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3047 | -| time_elapsed | 30847 | -| total_timesteps | 390016 | -| train/ | | -| approx_kl | 0.015137153 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.00932 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 30460 | -| policy_gradient_loss | -0.0101 | -| std | 0.44 | -| value_loss | 1.52e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3048 | -| time_elapsed | 30856 | -| total_timesteps | 390144 | -| train/ | | -| approx_kl | 0.0008327225 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.589 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 30470 | -| policy_gradient_loss | -0.00805 | -| std | 0.44 | -| value_loss | 0.00612 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3049 | -| time_elapsed | 30859 | -| total_timesteps | 390272 | -| train/ | | -| approx_kl | 2.4595065e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.0415 | -| learning_rate | 0.0003 | -| loss | 7.82e-06 | -| n_updates | 30480 | -| policy_gradient_loss | 6.26e-06 | -| std | 0.44 | -| value_loss | 6.83e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3050 | -| time_elapsed | 30863 | -| total_timesteps | 390400 | -| train/ | | -| approx_kl | 0.00963252 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00507 | -| n_updates | 30490 | -| policy_gradient_loss | -0.00512 | -| std | 0.44 | -| value_loss | 0.00645 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3051 | -| time_elapsed | 30866 | -| total_timesteps | 390528 | -| train/ | | -| approx_kl | 0.002605986 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.00657 | -| learning_rate | 0.0003 | -| loss | -0.000636 | -| n_updates | 30500 | -| policy_gradient_loss | -0.000547 | -| std | 0.441 | -| value_loss | 0.000589 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3052 | -| time_elapsed | 30868 | -| total_timesteps | 390656 | -| train/ | | -| approx_kl | 0.0038675454 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.00883 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 30510 | -| policy_gradient_loss | -0.000197 | -| std | 0.441 | -| value_loss | 0.00477 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3053 | -| time_elapsed | 30872 | -| total_timesteps | 390784 | -| train/ | | -| approx_kl | 0.00900842 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 30520 | -| policy_gradient_loss | -0.00215 | -| std | 0.44 | -| value_loss | 0.000193 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 12 | -| iterations | 3054 | -| time_elapsed | 30875 | -| total_timesteps | 390912 | -| train/ | | -| approx_kl | 0.011334955 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -1.09e-05 | -| n_updates | 30530 | -| policy_gradient_loss | -0.00109 | -| std | 0.439 | -| value_loss | 0.000139 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3055 | -| time_elapsed | 30879 | -| total_timesteps | 391040 | -| train/ | | -| approx_kl | 0.015539376 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 30540 | -| policy_gradient_loss | -0.0107 | -| std | 0.439 | -| value_loss | 0.00029 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3056 | -| time_elapsed | 30885 | -| total_timesteps | 391168 | -| train/ | | -| approx_kl | 0.012335367 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | 0.685 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 30550 | -| policy_gradient_loss | -0.00681 | -| std | 0.439 | -| value_loss | 0.0014 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3057 | -| time_elapsed | 30889 | -| total_timesteps | 391296 | -| train/ | | -| approx_kl | 0.00024041673 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.000368 | -| n_updates | 30560 | -| policy_gradient_loss | -3.7e-05 | -| std | 0.438 | -| value_loss | 7.06e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3058 | -| time_elapsed | 30892 | -| total_timesteps | 391424 | -| train/ | | -| approx_kl | 0.016391808 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.000263 | -| n_updates | 30570 | -| policy_gradient_loss | -0.00225 | -| std | 0.437 | -| value_loss | 0.000311 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3059 | -| time_elapsed | 30896 | -| total_timesteps | 391552 | -| train/ | | -| approx_kl | 0.0074657695 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | 0.0156 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 30580 | -| policy_gradient_loss | -0.000566 | -| std | 0.437 | -| value_loss | 0.00594 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3060 | -| time_elapsed | 30899 | -| total_timesteps | 391680 | -| train/ | | -| approx_kl | 0.011433063 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 30590 | -| policy_gradient_loss | -0.00342 | -| std | 0.437 | -| value_loss | 0.0392 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3061 | -| time_elapsed | 30903 | -| total_timesteps | 391808 | -| train/ | | -| approx_kl | 0.0074075824 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0762 | -| n_updates | 30600 | -| policy_gradient_loss | -0.00151 | -| std | 0.438 | -| value_loss | 0.229 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 12 | -| iterations | 3062 | -| time_elapsed | 30907 | -| total_timesteps | 391936 | -| train/ | | -| approx_kl | 0.004946591 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.00354 | -| learning_rate | 0.0003 | -| loss | 0.0458 | -| n_updates | 30610 | -| policy_gradient_loss | -0.00132 | -| std | 0.439 | -| value_loss | 0.105 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3063 | -| time_elapsed | 30909 | -| total_timesteps | 392064 | -| train/ | | -| approx_kl | 0.0093076695 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | 0.00063 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 30620 | -| policy_gradient_loss | -0.00122 | -| std | 0.441 | -| value_loss | 0.00945 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3064 | -| time_elapsed | 30914 | -| total_timesteps | 392192 | -| train/ | | -| approx_kl | 0.007946785 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 30630 | -| policy_gradient_loss | -0.00251 | -| std | 0.442 | -| value_loss | 0.0795 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3065 | -| time_elapsed | 30917 | -| total_timesteps | 392320 | -| train/ | | -| approx_kl | 0.0008852391 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.0007 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 30640 | -| policy_gradient_loss | -1e-05 | -| std | 0.44 | -| value_loss | 0.00717 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3066 | -| time_elapsed | 30921 | -| total_timesteps | 392448 | -| train/ | | -| approx_kl | 0.013569573 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.000407 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 30650 | -| policy_gradient_loss | 0.00135 | -| std | 0.44 | -| value_loss | 0.00644 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3067 | -| time_elapsed | 30925 | -| total_timesteps | 392576 | -| train/ | | -| approx_kl | 0.029523186 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.00362 | -| learning_rate | 0.0003 | -| loss | 0.00562 | -| n_updates | 30660 | -| policy_gradient_loss | -0.0127 | -| std | 0.44 | -| value_loss | 0.0407 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3068 | -| time_elapsed | 30928 | -| total_timesteps | 392704 | -| train/ | | -| approx_kl | 0.024287166 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.00212 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 30670 | -| policy_gradient_loss | -0.0102 | -| std | 0.439 | -| value_loss | 0.00997 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3069 | -| time_elapsed | 30931 | -| total_timesteps | 392832 | -| train/ | | -| approx_kl | 0.007846225 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -0.0026 | -| learning_rate | 0.0003 | -| loss | 0.00118 | -| n_updates | 30680 | -| policy_gradient_loss | -0.00055 | -| std | 0.439 | -| value_loss | 0.00327 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 12 | -| iterations | 3070 | -| time_elapsed | 30934 | -| total_timesteps | 392960 | -| train/ | | -| approx_kl | 0.016436366 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | 0.00151 | -| learning_rate | 0.0003 | -| loss | -0.00645 | -| n_updates | 30690 | -| policy_gradient_loss | -0.00691 | -| std | 0.439 | -| value_loss | 0.000971 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3071 | -| time_elapsed | 30938 | -| total_timesteps | 393088 | -| train/ | | -| approx_kl | 0.014096474 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.00626 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 30700 | -| policy_gradient_loss | -0.00135 | -| std | 0.441 | -| value_loss | 0.0019 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3072 | -| time_elapsed | 30944 | -| total_timesteps | 393216 | -| train/ | | -| approx_kl | 0.049241956 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | 0.00963 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 30710 | -| policy_gradient_loss | -0.00206 | -| std | 0.441 | -| value_loss | 0.346 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3073 | -| time_elapsed | 30952 | -| total_timesteps | 393344 | -| train/ | | -| approx_kl | 0.013130484 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | 0.00173 | -| learning_rate | 0.0003 | -| loss | 2.6 | -| n_updates | 30720 | -| policy_gradient_loss | -0.0108 | -| std | 0.441 | -| value_loss | 5.51 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3074 | -| time_elapsed | 30958 | -| total_timesteps | 393472 | -| train/ | | -| approx_kl | 0.024986133 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | 0.00252 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 30730 | -| policy_gradient_loss | -0.0131 | -| std | 0.441 | -| value_loss | 0.066 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3075 | -| time_elapsed | 30962 | -| total_timesteps | 393600 | -| train/ | | -| approx_kl | 0.011850854 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | 2.87e-05 | -| learning_rate | 0.0003 | -| loss | 0.0087 | -| n_updates | 30740 | -| policy_gradient_loss | -0.0023 | -| std | 0.44 | -| value_loss | 0.0264 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3076 | -| time_elapsed | 30966 | -| total_timesteps | 393728 | -| train/ | | -| approx_kl | 3.359653e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.0013 | -| learning_rate | 0.0003 | -| loss | 0.00384 | -| n_updates | 30750 | -| policy_gradient_loss | 2.88e-05 | -| std | 0.44 | -| value_loss | 0.0157 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3077 | -| time_elapsed | 30970 | -| total_timesteps | 393856 | -| train/ | | -| approx_kl | 0.0071793837 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | 0.00218 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 30760 | -| policy_gradient_loss | -0.0011 | -| std | 0.439 | -| value_loss | 0.0415 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 12 | -| iterations | 3078 | -| time_elapsed | 30974 | -| total_timesteps | 393984 | -| train/ | | -| approx_kl | 0.013991067 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | 0.00702 | -| learning_rate | 0.0003 | -| loss | -0.000381 | -| n_updates | 30770 | -| policy_gradient_loss | -0.00212 | -| std | 0.437 | -| value_loss | 0.007 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3079 | -| time_elapsed | 30976 | -| total_timesteps | 394112 | -| train/ | | -| approx_kl | 0.01762839 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.00158 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 30780 | -| policy_gradient_loss | -0.013 | -| std | 0.437 | -| value_loss | 0.123 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3080 | -| time_elapsed | 30984 | -| total_timesteps | 394240 | -| train/ | | -| approx_kl | 0.016003612 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 30790 | -| policy_gradient_loss | -0.00723 | -| std | 0.437 | -| value_loss | 0.0665 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3081 | -| time_elapsed | 30987 | -| total_timesteps | 394368 | -| train/ | | -| approx_kl | 0.008122332 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.000375 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 30800 | -| policy_gradient_loss | -0.00554 | -| std | 0.437 | -| value_loss | 0.018 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3082 | -| time_elapsed | 30990 | -| total_timesteps | 394496 | -| train/ | | -| approx_kl | 0.0027743054 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.000438 | -| learning_rate | 0.0003 | -| loss | 0.00444 | -| n_updates | 30810 | -| policy_gradient_loss | 0.00103 | -| std | 0.438 | -| value_loss | 0.0141 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3083 | -| time_elapsed | 30993 | -| total_timesteps | 394624 | -| train/ | | -| approx_kl | 0.013356036 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.0016 | -| learning_rate | 0.0003 | -| loss | 0.00393 | -| n_updates | 30820 | -| policy_gradient_loss | -0.000164 | -| std | 0.438 | -| value_loss | 0.0108 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3084 | -| time_elapsed | 30997 | -| total_timesteps | 394752 | -| train/ | | -| approx_kl | 0.0132958945 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.00408 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 30830 | -| policy_gradient_loss | -0.00457 | -| std | 0.438 | -| value_loss | 0.00859 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3085 | -| time_elapsed | 31000 | -| total_timesteps | 394880 | -| train/ | | -| approx_kl | 0.00026435964 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.00791 | -| learning_rate | 0.0003 | -| loss | 0.000616 | -| n_updates | 30840 | -| policy_gradient_loss | -5.89e-05 | -| std | 0.438 | -| value_loss | 0.00443 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3086 | -| time_elapsed | 31004 | -| total_timesteps | 395008 | -| train/ | | -| approx_kl | 0.010169579 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 30850 | -| policy_gradient_loss | -0.00409 | -| std | 0.437 | -| value_loss | 0.00252 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3087 | -| time_elapsed | 31014 | -| total_timesteps | 395136 | -| train/ | | -| approx_kl | 0.012857002 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.189 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 30860 | -| policy_gradient_loss | -0.00751 | -| std | 0.437 | -| value_loss | 0.0144 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3088 | -| time_elapsed | 31018 | -| total_timesteps | 395264 | -| train/ | | -| approx_kl | 0.02605962 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 30870 | -| policy_gradient_loss | -0.0109 | -| std | 0.437 | -| value_loss | 0.000529 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3089 | -| time_elapsed | 31021 | -| total_timesteps | 395392 | -| train/ | | -| approx_kl | 0.011557091 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | 0.0182 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 30880 | -| policy_gradient_loss | -0.00179 | -| std | 0.437 | -| value_loss | 0.00047 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3090 | -| time_elapsed | 31024 | -| total_timesteps | 395520 | -| train/ | | -| approx_kl | 0.0066019427 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.0489 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 30890 | -| policy_gradient_loss | -0.00166 | -| std | 0.438 | -| value_loss | 0.000395 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3091 | -| time_elapsed | 31028 | -| total_timesteps | 395648 | -| train/ | | -| approx_kl | 0.015801508 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | 0.0089 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 30900 | -| policy_gradient_loss | -0.00473 | -| std | 0.438 | -| value_loss | 0.0834 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3092 | -| time_elapsed | 31031 | -| total_timesteps | 395776 | -| train/ | | -| approx_kl | 0.00645471 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00072 | -| n_updates | 30910 | -| policy_gradient_loss | -0.00147 | -| std | 0.435 | -| value_loss | 0.00376 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.1 | -| time/ | | -| fps | 12 | -| iterations | 3093 | -| time_elapsed | 31034 | -| total_timesteps | 395904 | -| train/ | | -| approx_kl | 0.013760779 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | 0.00542 | -| learning_rate | 0.0003 | -| loss | -0.000405 | -| n_updates | 30920 | -| policy_gradient_loss | -0.00164 | -| std | 0.434 | -| value_loss | 0.00186 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3094 | -| time_elapsed | 31038 | -| total_timesteps | 396032 | -| train/ | | -| approx_kl | 0.019153692 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 30930 | -| policy_gradient_loss | -0.00656 | -| std | 0.433 | -| value_loss | 0.000905 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3095 | -| time_elapsed | 31047 | -| total_timesteps | 396160 | -| train/ | | -| approx_kl | 0.010024645 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | 0.246 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 30940 | -| policy_gradient_loss | -0.0065 | -| std | 0.433 | -| value_loss | 0.0164 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3096 | -| time_elapsed | 31051 | -| total_timesteps | 396288 | -| train/ | | -| approx_kl | 0.022863243 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 30950 | -| policy_gradient_loss | -0.00969 | -| std | 0.433 | -| value_loss | 0.000325 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3097 | -| time_elapsed | 31054 | -| total_timesteps | 396416 | -| train/ | | -| approx_kl | 0.014851181 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 30960 | -| policy_gradient_loss | -0.00581 | -| std | 0.433 | -| value_loss | 0.00025 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3098 | -| time_elapsed | 31058 | -| total_timesteps | 396544 | -| train/ | | -| approx_kl | 0.010452842 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 30970 | -| policy_gradient_loss | -0.00307 | -| std | 0.432 | -| value_loss | 0.000128 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3099 | -| time_elapsed | 31061 | -| total_timesteps | 396672 | -| train/ | | -| approx_kl | 0.017080719 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.0917 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 30980 | -| policy_gradient_loss | -0.0117 | -| std | 0.431 | -| value_loss | 0.000169 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3100 | -| time_elapsed | 31065 | -| total_timesteps | 396800 | -| train/ | | -| approx_kl | 0.0014643795 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.0816 | -| learning_rate | 0.0003 | -| loss | -6.18e-05 | -| n_updates | 30990 | -| policy_gradient_loss | -1.54e-05 | -| std | 0.432 | -| value_loss | 6.96e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.12 | -| time/ | | -| fps | 12 | -| iterations | 3101 | -| time_elapsed | 31067 | -| total_timesteps | 396928 | -| train/ | | -| approx_kl | 4.945323e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.00594 | -| learning_rate | 0.0003 | -| loss | -7.48e-05 | -| n_updates | 31000 | -| policy_gradient_loss | 3.02e-06 | -| std | 0.431 | -| value_loss | 5.84e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3102 | -| time_elapsed | 31071 | -| total_timesteps | 397056 | -| train/ | | -| approx_kl | 0.0010152792 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | -0.000578 | -| n_updates | 31010 | -| policy_gradient_loss | -0.000244 | -| std | 0.43 | -| value_loss | 5.07e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3103 | -| time_elapsed | 31078 | -| total_timesteps | 397184 | -| train/ | | -| approx_kl | 0.002430627 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.574 | -| explained_variance | 0.516 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 31020 | -| policy_gradient_loss | -0.00892 | -| std | 0.429 | -| value_loss | 0.00606 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3104 | -| time_elapsed | 31081 | -| total_timesteps | 397312 | -| train/ | | -| approx_kl | 0.01574713 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 31030 | -| policy_gradient_loss | -0.00916 | -| std | 0.429 | -| value_loss | 5.02e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3105 | -| time_elapsed | 31084 | -| total_timesteps | 397440 | -| train/ | | -| approx_kl | 0.015620769 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 31040 | -| policy_gradient_loss | -0.00251 | -| std | 0.429 | -| value_loss | 4.61e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3106 | -| time_elapsed | 31087 | -| total_timesteps | 397568 | -| train/ | | -| approx_kl | 0.034811623 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 31050 | -| policy_gradient_loss | -0.0139 | -| std | 0.429 | -| value_loss | 6.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3107 | -| time_elapsed | 31090 | -| total_timesteps | 397696 | -| train/ | | -| approx_kl | 0.00561896 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 31060 | -| policy_gradient_loss | -0.001 | -| std | 0.43 | -| value_loss | 3.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3108 | -| time_elapsed | 31093 | -| total_timesteps | 397824 | -| train/ | | -| approx_kl | 0.010476426 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 31070 | -| policy_gradient_loss | -0.00275 | -| std | 0.431 | -| value_loss | 3.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3109 | -| time_elapsed | 31095 | -| total_timesteps | 397952 | -| train/ | | -| approx_kl | 0.005883646 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.578 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 31080 | -| policy_gradient_loss | -0.00156 | -| std | 0.431 | -| value_loss | 1.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3110 | -| time_elapsed | 31098 | -| total_timesteps | 398080 | -| train/ | | -| approx_kl | 0.010246141 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.578 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | -0.00932 | -| n_updates | 31090 | -| policy_gradient_loss | -0.00306 | -| std | 0.431 | -| value_loss | 1.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3111 | -| time_elapsed | 31107 | -| total_timesteps | 398208 | -| train/ | | -| approx_kl | 0.011216837 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.578 | -| explained_variance | 0.572 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 31100 | -| policy_gradient_loss | -0.00665 | -| std | 0.431 | -| value_loss | 0.00443 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3112 | -| time_elapsed | 31111 | -| total_timesteps | 398336 | -| train/ | | -| approx_kl | 0.019870928 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -3.02 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 31110 | -| policy_gradient_loss | -0.00358 | -| std | 0.431 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3113 | -| time_elapsed | 31115 | -| total_timesteps | 398464 | -| train/ | | -| approx_kl | 0.019032106 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 31120 | -| policy_gradient_loss | -0.00262 | -| std | 0.43 | -| value_loss | 2.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3114 | -| time_elapsed | 31119 | -| total_timesteps | 398592 | -| train/ | | -| approx_kl | 0.013672826 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 31130 | -| policy_gradient_loss | -0.00202 | -| std | 0.428 | -| value_loss | 1.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3115 | -| time_elapsed | 31123 | -| total_timesteps | 398720 | -| train/ | | -| approx_kl | 0.01668883 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | -0.435 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 31140 | -| policy_gradient_loss | -0.00249 | -| std | 0.427 | -| value_loss | 2.55e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3116 | -| time_elapsed | 31127 | -| total_timesteps | 398848 | -| train/ | | -| approx_kl | 0.025480108 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | -0.568 | -| explained_variance | -0.0993 | -| learning_rate | 0.0003 | -| loss | 0.00065 | -| n_updates | 31150 | -| policy_gradient_loss | -0.00258 | -| std | 0.427 | -| value_loss | 2.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3117 | -| time_elapsed | 31129 | -| total_timesteps | 398976 | -| train/ | | -| approx_kl | 0.017497208 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.567 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 31160 | -| policy_gradient_loss | -0.00396 | -| std | 0.427 | -| value_loss | 6.34e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3118 | -| time_elapsed | 31131 | -| total_timesteps | 399104 | -| train/ | | -| approx_kl | 5.3110998e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.568 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | -0.000774 | -| n_updates | 31170 | -| policy_gradient_loss | -0.00015 | -| std | 0.428 | -| value_loss | 4.74e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3119 | -| time_elapsed | 31139 | -| total_timesteps | 399232 | -| train/ | | -| approx_kl | 0.010439439 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | 0.571 | -| learning_rate | 0.0003 | -| loss | -0.000895 | -| n_updates | 31180 | -| policy_gradient_loss | -0.00251 | -| std | 0.429 | -| value_loss | 0.00461 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3120 | -| time_elapsed | 31144 | -| total_timesteps | 399360 | -| train/ | | -| approx_kl | 0.03971854 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -89.6 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 31190 | -| policy_gradient_loss | -0.0104 | -| std | 0.429 | -| value_loss | 3.53e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3121 | -| time_elapsed | 31147 | -| total_timesteps | 399488 | -| train/ | | -| approx_kl | 3.9755832e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -30.2 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 31200 | -| policy_gradient_loss | 0.00151 | -| std | 0.429 | -| value_loss | 1.04e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3122 | -| time_elapsed | 31152 | -| total_timesteps | 399616 | -| train/ | | -| approx_kl | 0.015791982 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 31210 | -| policy_gradient_loss | -0.0062 | -| std | 0.429 | -| value_loss | 4.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3123 | -| time_elapsed | 31155 | -| total_timesteps | 399744 | -| train/ | | -| approx_kl | 0.008685704 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -4.16 | -| learning_rate | 0.0003 | -| loss | -0.000986 | -| n_updates | 31220 | -| policy_gradient_loss | -0.00111 | -| std | 0.428 | -| value_loss | 2.23e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3124 | -| time_elapsed | 31159 | -| total_timesteps | 399872 | -| train/ | | -| approx_kl | 0.0161827 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | -0.568 | -| explained_variance | -0.749 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 31230 | -| policy_gradient_loss | -0.000202 | -| std | 0.426 | -| value_loss | 1.35e-10 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3125 | -| time_elapsed | 31163 | -| total_timesteps | 400000 | -| train/ | | -| approx_kl | 0.0011143223 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | -0.000568 | -| n_updates | 31240 | -| policy_gradient_loss | -0.000125 | -| std | 0.426 | -| value_loss | 2.55e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3126 | -| time_elapsed | 31167 | -| total_timesteps | 400128 | -| train/ | | -| approx_kl | 0.013613844 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.565 | -| explained_variance | -0.0052 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 31250 | -| policy_gradient_loss | -0.00392 | -| std | 0.425 | -| value_loss | 1.72e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3127 | -| time_elapsed | 31174 | -| total_timesteps | 400256 | -| train/ | | -| approx_kl | 0.0041864715 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.563 | -| explained_variance | 0.471 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 31260 | -| policy_gradient_loss | -0.00327 | -| std | 0.424 | -| value_loss | 0.0102 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3128 | -| time_elapsed | 31178 | -| total_timesteps | 400384 | -| train/ | | -| approx_kl | 0.020994052 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.561 | -| explained_variance | -146 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 31270 | -| policy_gradient_loss | -0.00936 | -| std | 0.424 | -| value_loss | 2.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3129 | -| time_elapsed | 31182 | -| total_timesteps | 400512 | -| train/ | | -| approx_kl | 0.03612271 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | -0.561 | -| explained_variance | -116 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 31280 | -| policy_gradient_loss | -0.00353 | -| std | 0.424 | -| value_loss | 1.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3130 | -| time_elapsed | 31185 | -| total_timesteps | 400640 | -| train/ | | -| approx_kl | 0.023631018 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.561 | -| explained_variance | -28.1 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 31290 | -| policy_gradient_loss | -0.00377 | -| std | 0.424 | -| value_loss | 1.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3131 | -| time_elapsed | 31189 | -| total_timesteps | 400768 | -| train/ | | -| approx_kl | 0.006152869 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.562 | -| explained_variance | -3.24 | -| learning_rate | 0.0003 | -| loss | -0.00866 | -| n_updates | 31300 | -| policy_gradient_loss | -0.00137 | -| std | 0.425 | -| value_loss | 1.78e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.13 | -| time/ | | -| fps | 12 | -| iterations | 3132 | -| time_elapsed | 31194 | -| total_timesteps | 400896 | -| train/ | | -| approx_kl | 0.007427942 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.564 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | 2.06e-05 | -| n_updates | 31310 | -| policy_gradient_loss | 0.00015 | -| std | 0.426 | -| value_loss | 6.68e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3133 | -| time_elapsed | 31197 | -| total_timesteps | 401024 | -| train/ | | -| approx_kl | 0.009183551 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | 0.0041 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 31320 | -| policy_gradient_loss | -0.00196 | -| std | 0.426 | -| value_loss | 7.06e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3134 | -| time_elapsed | 31205 | -| total_timesteps | 401152 | -| train/ | | -| approx_kl | 0.014607335 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.567 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 31330 | -| policy_gradient_loss | -0.00669 | -| std | 0.427 | -| value_loss | 0.00109 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3135 | -| time_elapsed | 31210 | -| total_timesteps | 401280 | -| train/ | | -| approx_kl | 0.013576401 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.567 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | 0.000234 | -| n_updates | 31340 | -| policy_gradient_loss | -0.00115 | -| std | 0.426 | -| value_loss | 3.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3136 | -| time_elapsed | 31214 | -| total_timesteps | 401408 | -| train/ | | -| approx_kl | 0.03710567 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -0.435 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 31350 | -| policy_gradient_loss | -0.0162 | -| std | 0.426 | -| value_loss | 3.81e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3137 | -| time_elapsed | 31216 | -| total_timesteps | 401536 | -| train/ | | -| approx_kl | 0.018140199 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -0.531 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 31360 | -| policy_gradient_loss | -0.00803 | -| std | 0.426 | -| value_loss | 1.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3138 | -| time_elapsed | 31219 | -| total_timesteps | 401664 | -| train/ | | -| approx_kl | 0.015853845 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -0.0987 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 31370 | -| policy_gradient_loss | -0.00482 | -| std | 0.426 | -| value_loss | 1.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3139 | -| time_elapsed | 31222 | -| total_timesteps | 401792 | -| train/ | | -| approx_kl | 0.009378377 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 31380 | -| policy_gradient_loss | -0.00104 | -| std | 0.426 | -| value_loss | 4.71e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 3.03 | -| time/ | | -| fps | 12 | -| iterations | 3140 | -| time_elapsed | 31226 | -| total_timesteps | 401920 | -| train/ | | -| approx_kl | 0.0057297964 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.565 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | -0.000857 | -| n_updates | 31390 | -| policy_gradient_loss | -0.000335 | -| std | 0.426 | -| value_loss | 3.36e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3141 | -| time_elapsed | 31229 | -| total_timesteps | 402048 | -| train/ | | -| approx_kl | 0.01581992 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.564 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 31400 | -| policy_gradient_loss | -0.00418 | -| std | 0.425 | -| value_loss | 4.75e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3142 | -| time_elapsed | 31236 | -| total_timesteps | 402176 | -| train/ | | -| approx_kl | 0.012435216 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.563 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 31410 | -| policy_gradient_loss | -0.009 | -| std | 0.425 | -| value_loss | 0.000631 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3143 | -| time_elapsed | 31239 | -| total_timesteps | 402304 | -| train/ | | -| approx_kl | 0.021924365 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.562 | -| explained_variance | -0.0874 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 31420 | -| policy_gradient_loss | -0.00356 | -| std | 0.425 | -| value_loss | 6.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3144 | -| time_elapsed | 31243 | -| total_timesteps | 402432 | -| train/ | | -| approx_kl | 0.016430218 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | -0.563 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 31430 | -| policy_gradient_loss | -0.00401 | -| std | 0.425 | -| value_loss | 4.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3145 | -| time_elapsed | 31247 | -| total_timesteps | 402560 | -| train/ | | -| approx_kl | 0.015716614 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.564 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 31440 | -| policy_gradient_loss | -0.00333 | -| std | 0.426 | -| value_loss | 9.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3146 | -| time_elapsed | 31251 | -| total_timesteps | 402688 | -| train/ | | -| approx_kl | 0.015666913 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.565 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 31450 | -| policy_gradient_loss | -0.00611 | -| std | 0.426 | -| value_loss | 1.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3147 | -| time_elapsed | 31254 | -| total_timesteps | 402816 | -| train/ | | -| approx_kl | 0.022400755 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | -0.000875 | -| n_updates | 31460 | -| policy_gradient_loss | -0.00208 | -| std | 0.427 | -| value_loss | 4.74e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.83 | -| time/ | | -| fps | 12 | -| iterations | 3148 | -| time_elapsed | 31257 | -| total_timesteps | 402944 | -| train/ | | -| approx_kl | 0.0072905906 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.568 | -| explained_variance | -0.00745 | -| learning_rate | 0.0003 | -| loss | -0.000982 | -| n_updates | 31470 | -| policy_gradient_loss | -0.000687 | -| std | 0.427 | -| value_loss | 3.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3149 | -| time_elapsed | 31260 | -| total_timesteps | 403072 | -| train/ | | -| approx_kl | 0.018136382 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.569 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 31480 | -| policy_gradient_loss | -0.00984 | -| std | 0.428 | -| value_loss | 7.99e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3150 | -| time_elapsed | 31266 | -| total_timesteps | 403200 | -| train/ | | -| approx_kl | 0.01313487 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.569 | -| explained_variance | 0.592 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 31490 | -| policy_gradient_loss | -0.00357 | -| std | 0.427 | -| value_loss | 0.00423 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3151 | -| time_elapsed | 31270 | -| total_timesteps | 403328 | -| train/ | | -| approx_kl | 0.01516818 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.567 | -| explained_variance | -2.26 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 31500 | -| policy_gradient_loss | -0.00325 | -| std | 0.426 | -| value_loss | 9.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3152 | -| time_elapsed | 31273 | -| total_timesteps | 403456 | -| train/ | | -| approx_kl | 0.016366348 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.566 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 31510 | -| policy_gradient_loss | -0.00338 | -| std | 0.426 | -| value_loss | 7.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3153 | -| time_elapsed | 31276 | -| total_timesteps | 403584 | -| train/ | | -| approx_kl | 0.0065352535 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.568 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.000457 | -| n_updates | 31520 | -| policy_gradient_loss | -0.000381 | -| std | 0.427 | -| value_loss | 2.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3154 | -| time_elapsed | 31279 | -| total_timesteps | 403712 | -| train/ | | -| approx_kl | 0.018779106 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | 0.00687 | -| learning_rate | 0.0003 | -| loss | -0.00681 | -| n_updates | 31530 | -| policy_gradient_loss | -0.00546 | -| std | 0.429 | -| value_loss | 2.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3155 | -| time_elapsed | 31283 | -| total_timesteps | 403840 | -| train/ | | -| approx_kl | 0.017453687 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -0.083 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 31540 | -| policy_gradient_loss | -0.00924 | -| std | 0.429 | -| value_loss | 1.29e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 12 | -| iterations | 3156 | -| time_elapsed | 31285 | -| total_timesteps | 403968 | -| train/ | | -| approx_kl | 0.01744455 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.0961 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 31550 | -| policy_gradient_loss | -0.00735 | -| std | 0.429 | -| value_loss | 6e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3157 | -| time_elapsed | 31289 | -| total_timesteps | 404096 | -| train/ | | -| approx_kl | 0.010636444 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | 0.000657 | -| n_updates | 31560 | -| policy_gradient_loss | -0.000844 | -| std | 0.429 | -| value_loss | 4.77e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3158 | -| time_elapsed | 31296 | -| total_timesteps | 404224 | -| train/ | | -| approx_kl | 0.0060866103 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | 0.493 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 31570 | -| policy_gradient_loss | -0.00287 | -| std | 0.429 | -| value_loss | 0.00933 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3159 | -| time_elapsed | 31300 | -| total_timesteps | 404352 | -| train/ | | -| approx_kl | 0.013498128 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -61.5 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 31580 | -| policy_gradient_loss | -0.00194 | -| std | 0.428 | -| value_loss | 3.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3160 | -| time_elapsed | 31303 | -| total_timesteps | 404480 | -| train/ | | -| approx_kl | 0.031837963 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | -47.4 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 31590 | -| policy_gradient_loss | -0.00859 | -| std | 0.428 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3161 | -| time_elapsed | 31306 | -| total_timesteps | 404608 | -| train/ | | -| approx_kl | 0.0039734757 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.569 | -| explained_variance | -7.03 | -| learning_rate | 0.0003 | -| loss | -0.000333 | -| n_updates | 31600 | -| policy_gradient_loss | -0.000287 | -| std | 0.427 | -| value_loss | 1.65e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3162 | -| time_elapsed | 31309 | -| total_timesteps | 404736 | -| train/ | | -| approx_kl | 0.01546544 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.569 | -| explained_variance | -0.499 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 31610 | -| policy_gradient_loss | -0.00456 | -| std | 0.428 | -| value_loss | 6.25e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3163 | -| time_elapsed | 31313 | -| total_timesteps | 404864 | -| train/ | | -| approx_kl | 0.0074373055 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.569 | -| explained_variance | 0.00656 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 31620 | -| policy_gradient_loss | -0.00224 | -| std | 0.428 | -| value_loss | 7.34e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 12 | -| iterations | 3164 | -| time_elapsed | 31317 | -| total_timesteps | 404992 | -| train/ | | -| approx_kl | 0.0127665475 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 31630 | -| policy_gradient_loss | -0.00354 | -| std | 0.428 | -| value_loss | 3.82e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3165 | -| time_elapsed | 31319 | -| total_timesteps | 405120 | -| train/ | | -| approx_kl | 0.0066132406 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | -0.0831 | -| learning_rate | 0.0003 | -| loss | -0.000936 | -| n_updates | 31640 | -| policy_gradient_loss | -0.000679 | -| std | 0.428 | -| value_loss | 2.11e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3166 | -| time_elapsed | 31329 | -| total_timesteps | 405248 | -| train/ | | -| approx_kl | 0.016542481 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | 0.617 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 31650 | -| policy_gradient_loss | -0.00421 | -| std | 0.428 | -| value_loss | 0.00377 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3167 | -| time_elapsed | 31333 | -| total_timesteps | 405376 | -| train/ | | -| approx_kl | 0.024584835 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | -1.75 | -| learning_rate | 0.0003 | -| loss | -0.00762 | -| n_updates | 31660 | -| policy_gradient_loss | -0.00647 | -| std | 0.428 | -| value_loss | 6.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3168 | -| time_elapsed | 31336 | -| total_timesteps | 405504 | -| train/ | | -| approx_kl | 0.002915916 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.57 | -| explained_variance | -0.544 | -| learning_rate | 0.0003 | -| loss | -0.000598 | -| n_updates | 31670 | -| policy_gradient_loss | -0.000223 | -| std | 0.428 | -| value_loss | 1.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3169 | -| time_elapsed | 31340 | -| total_timesteps | 405632 | -| train/ | | -| approx_kl | 0.015950158 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 31680 | -| policy_gradient_loss | -0.00574 | -| std | 0.428 | -| value_loss | 2.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3170 | -| time_elapsed | 31343 | -| total_timesteps | 405760 | -| train/ | | -| approx_kl | 0.017302461 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -0.244 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 31690 | -| policy_gradient_loss | -0.00604 | -| std | 0.428 | -| value_loss | 6.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3171 | -| time_elapsed | 31347 | -| total_timesteps | 405888 | -| train/ | | -| approx_kl | 0.011813768 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -0.0574 | -| learning_rate | 0.0003 | -| loss | 0.000603 | -| n_updates | 31700 | -| policy_gradient_loss | -6.01e-05 | -| std | 0.428 | -| value_loss | 9.31e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3172 | -| time_elapsed | 31351 | -| total_timesteps | 406016 | -| train/ | | -| approx_kl | 0.021429786 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 31710 | -| policy_gradient_loss | -0.00714 | -| std | 0.428 | -| value_loss | 6.99e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3173 | -| time_elapsed | 31361 | -| total_timesteps | 406144 | -| train/ | | -| approx_kl | 0.0051717106 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | 0.665 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 31720 | -| policy_gradient_loss | -0.00154 | -| std | 0.429 | -| value_loss | 0.00254 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3174 | -| time_elapsed | 31364 | -| total_timesteps | 406272 | -| train/ | | -| approx_kl | 0.0131032225 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | -0.000619 | -| n_updates | 31730 | -| policy_gradient_loss | -0.00106 | -| std | 0.429 | -| value_loss | 6.53e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3175 | -| time_elapsed | 31368 | -| total_timesteps | 406400 | -| train/ | | -| approx_kl | 0.00854997 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -6.64 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 31740 | -| policy_gradient_loss | -0.000737 | -| std | 0.429 | -| value_loss | 3.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3176 | -| time_elapsed | 31371 | -| total_timesteps | 406528 | -| train/ | | -| approx_kl | 0.015390214 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -0.807 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 31750 | -| policy_gradient_loss | -0.00565 | -| std | 0.429 | -| value_loss | 2.18e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3177 | -| time_elapsed | 31376 | -| total_timesteps | 406656 | -| train/ | | -| approx_kl | 0.012510036 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.572 | -| explained_variance | -0.637 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 31760 | -| policy_gradient_loss | -0.00186 | -| std | 0.429 | -| value_loss | 5.03e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3178 | -| time_elapsed | 31379 | -| total_timesteps | 406784 | -| train/ | | -| approx_kl | 0.02085847 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.573 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 31770 | -| policy_gradient_loss | -0.0062 | -| std | 0.429 | -| value_loss | 6.66e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 12 | -| iterations | 3179 | -| time_elapsed | 31382 | -| total_timesteps | 406912 | -| train/ | | -| approx_kl | 0.006486337 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.575 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 31780 | -| policy_gradient_loss | -0.00104 | -| std | 0.431 | -| value_loss | 2.15e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3180 | -| time_elapsed | 31385 | -| total_timesteps | 407040 | -| train/ | | -| approx_kl | 0.008417945 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -0.00285 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 31790 | -| policy_gradient_loss | -0.00392 | -| std | 0.433 | -| value_loss | 2.26e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3181 | -| time_elapsed | 31391 | -| total_timesteps | 407168 | -| train/ | | -| approx_kl | 0.0124311205 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | 0.743 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 31800 | -| policy_gradient_loss | -0.00607 | -| std | 0.433 | -| value_loss | 0.001 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3182 | -| time_elapsed | 31395 | -| total_timesteps | 407296 | -| train/ | | -| approx_kl | 0.009744557 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 31810 | -| policy_gradient_loss | -0.00119 | -| std | 0.435 | -| value_loss | 3.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3183 | -| time_elapsed | 31399 | -| total_timesteps | 407424 | -| train/ | | -| approx_kl | 0.009250465 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.645 | -| learning_rate | 0.0003 | -| loss | -0.000499 | -| n_updates | 31820 | -| policy_gradient_loss | -0.00141 | -| std | 0.435 | -| value_loss | 1.55e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3184 | -| time_elapsed | 31402 | -| total_timesteps | 407552 | -| train/ | | -| approx_kl | 0.0005288429 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.000204 | -| n_updates | 31830 | -| policy_gradient_loss | -7.7e-05 | -| std | 0.436 | -| value_loss | 1.24e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3185 | -| time_elapsed | 31406 | -| total_timesteps | 407680 | -| train/ | | -| approx_kl | 0.013079148 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 31840 | -| policy_gradient_loss | -0.00563 | -| std | 0.436 | -| value_loss | 9.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3186 | -| time_elapsed | 31410 | -| total_timesteps | 407808 | -| train/ | | -| approx_kl | 0.0056955013 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 31850 | -| policy_gradient_loss | -0.00127 | -| std | 0.437 | -| value_loss | 1.01e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3187 | -| time_elapsed | 31412 | -| total_timesteps | 407936 | -| train/ | | -| approx_kl | 0.0014105281 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | -0.00788 | -| n_updates | 31860 | -| policy_gradient_loss | 0.000597 | -| std | 0.437 | -| value_loss | 1.62e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3188 | -| time_elapsed | 31415 | -| total_timesteps | 408064 | -| train/ | | -| approx_kl | 0.0010676859 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 31870 | -| policy_gradient_loss | 0.000586 | -| std | 0.438 | -| value_loss | 4.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3189 | -| time_elapsed | 31422 | -| total_timesteps | 408192 | -| train/ | | -| approx_kl | 0.014550714 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | 0.561 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 31880 | -| policy_gradient_loss | -0.00454 | -| std | 0.438 | -| value_loss | 0.00618 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3190 | -| time_elapsed | 31425 | -| total_timesteps | 408320 | -| train/ | | -| approx_kl | 0.0137429 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -6.73 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 31890 | -| policy_gradient_loss | -0.00206 | -| std | 0.438 | -| value_loss | 1.83e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3191 | -| time_elapsed | 31428 | -| total_timesteps | 408448 | -| train/ | | -| approx_kl | 4.0519517e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -4.79 | -| learning_rate | 0.0003 | -| loss | -0.000152 | -| n_updates | 31900 | -| policy_gradient_loss | 0.000235 | -| std | 0.439 | -| value_loss | 8.04e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 12 | -| iterations | 3192 | -| time_elapsed | 31433 | -| total_timesteps | 408576 | -| train/ | | -| approx_kl | 0.012269848 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.345 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 31910 | -| policy_gradient_loss | -0.00366 | -| std | 0.44 | -| value_loss | 3.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 13 | -| iterations | 3193 | -| time_elapsed | 31437 | -| total_timesteps | 408704 | -| train/ | | -| approx_kl | 0.01005303 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 31920 | -| policy_gradient_loss | -0.00166 | -| std | 0.439 | -| value_loss | 2.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 13 | -| iterations | 3194 | -| time_elapsed | 31439 | -| total_timesteps | 408832 | -| train/ | | -| approx_kl | 0.010732432 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | 0.00398 | -| learning_rate | 0.0003 | -| loss | -0.00361 | -| n_updates | 31930 | -| policy_gradient_loss | -0.00347 | -| std | 0.438 | -| value_loss | 2.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 13 | -| iterations | 3195 | -| time_elapsed | 31442 | -| total_timesteps | 408960 | -| train/ | | -| approx_kl | 0.018955138 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 31940 | -| policy_gradient_loss | -0.00931 | -| std | 0.438 | -| value_loss | 3.11e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3196 | -| time_elapsed | 31446 | -| total_timesteps | 409088 | -| train/ | | -| approx_kl | 0.0012911474 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.000308 | -| n_updates | 31950 | -| policy_gradient_loss | 0.000358 | -| std | 0.437 | -| value_loss | 1.31e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3197 | -| time_elapsed | 31454 | -| total_timesteps | 409216 | -| train/ | | -| approx_kl | 0.058660228 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | 0.554 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 31960 | -| policy_gradient_loss | -0.00281 | -| std | 0.436 | -| value_loss | 0.00687 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3198 | -| time_elapsed | 31457 | -| total_timesteps | 409344 | -| train/ | | -| approx_kl | 0.00085071824 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.00036 | -| n_updates | 31970 | -| policy_gradient_loss | -7.82e-05 | -| std | 0.436 | -| value_loss | 1.3e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3199 | -| time_elapsed | 31459 | -| total_timesteps | 409472 | -| train/ | | -| approx_kl | 0.0097342115 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -8.37 | -| learning_rate | 0.0003 | -| loss | -0.00863 | -| n_updates | 31980 | -| policy_gradient_loss | -0.00312 | -| std | 0.436 | -| value_loss | 5.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3200 | -| time_elapsed | 31462 | -| total_timesteps | 409600 | -| train/ | | -| approx_kl | 0.007566971 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.643 | -| learning_rate | 0.0003 | -| loss | -2.23e-05 | -| n_updates | 31990 | -| policy_gradient_loss | -0.000196 | -| std | 0.436 | -| value_loss | 1.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3201 | -| time_elapsed | 31464 | -| total_timesteps | 409728 | -| train/ | | -| approx_kl | 0.010702232 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 32000 | -| policy_gradient_loss | -0.00146 | -| std | 0.437 | -| value_loss | 1.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3202 | -| time_elapsed | 31467 | -| total_timesteps | 409856 | -| train/ | | -| approx_kl | 0.012916672 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.0075 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 32010 | -| policy_gradient_loss | -0.00684 | -| std | 0.437 | -| value_loss | 1.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3203 | -| time_elapsed | 31469 | -| total_timesteps | 409984 | -| train/ | | -| approx_kl | 0.0062714787 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -0.0662 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 32020 | -| policy_gradient_loss | -0.000839 | -| std | 0.436 | -| value_loss | 1.01e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3204 | -| time_elapsed | 31472 | -| total_timesteps | 410112 | -| train/ | | -| approx_kl | 0.010311409 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.00236 | -| learning_rate | 0.0003 | -| loss | -0.00545 | -| n_updates | 32030 | -| policy_gradient_loss | -0.00247 | -| std | 0.435 | -| value_loss | 1.05e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3205 | -| time_elapsed | 31481 | -| total_timesteps | 410240 | -| train/ | | -| approx_kl | 0.0573853 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | 0.688 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 32040 | -| policy_gradient_loss | -0.0118 | -| std | 0.434 | -| value_loss | 0.000747 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3206 | -| time_elapsed | 31484 | -| total_timesteps | 410368 | -| train/ | | -| approx_kl | 0.003248061 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.000946 | -| n_updates | 32050 | -| policy_gradient_loss | -0.000318 | -| std | 0.434 | -| value_loss | 4.92e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3207 | -| time_elapsed | 31486 | -| total_timesteps | 410496 | -| train/ | | -| approx_kl | 0.0045190337 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -32 | -| learning_rate | 0.0003 | -| loss | -0.00941 | -| n_updates | 32060 | -| policy_gradient_loss | -0.00699 | -| std | 0.434 | -| value_loss | 3.29e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3208 | -| time_elapsed | 31489 | -| total_timesteps | 410624 | -| train/ | | -| approx_kl | 0.042166587 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -3.31 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 32070 | -| policy_gradient_loss | -0.0104 | -| std | 0.434 | -| value_loss | 7.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3209 | -| time_elapsed | 31493 | -| total_timesteps | 410752 | -| train/ | | -| approx_kl | 0.003513482 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -0.91 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 32080 | -| policy_gradient_loss | -0.000548 | -| std | 0.433 | -| value_loss | 3.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3210 | -| time_elapsed | 31497 | -| total_timesteps | 410880 | -| train/ | | -| approx_kl | 0.007671579 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 0.000701 | -| n_updates | 32090 | -| policy_gradient_loss | 0.000213 | -| std | 0.433 | -| value_loss | 1.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3211 | -| time_elapsed | 31500 | -| total_timesteps | 411008 | -| train/ | | -| approx_kl | 0.008679816 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00635 | -| n_updates | 32100 | -| policy_gradient_loss | -0.00252 | -| std | 0.433 | -| value_loss | 1.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3212 | -| time_elapsed | 31509 | -| total_timesteps | 411136 | -| train/ | | -| approx_kl | 0.004106221 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | 0.521 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 32110 | -| policy_gradient_loss | -0.0116 | -| std | 0.433 | -| value_loss | 0.00921 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3213 | -| time_elapsed | 31511 | -| total_timesteps | 411264 | -| train/ | | -| approx_kl | 0.00018746266 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -123 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 32120 | -| policy_gradient_loss | -0.00258 | -| std | 0.433 | -| value_loss | 7.01e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3214 | -| time_elapsed | 31514 | -| total_timesteps | 411392 | -| train/ | | -| approx_kl | 0.018016454 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -30.3 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 32130 | -| policy_gradient_loss | -0.00641 | -| std | 0.433 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3215 | -| time_elapsed | 31518 | -| total_timesteps | 411520 | -| train/ | | -| approx_kl | 0.011045868 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -3.24 | -| learning_rate | 0.0003 | -| loss | 0.000762 | -| n_updates | 32140 | -| policy_gradient_loss | 0.000369 | -| std | 0.434 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3216 | -| time_elapsed | 31521 | -| total_timesteps | 411648 | -| train/ | | -| approx_kl | 0.0059162946 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.000863 | -| n_updates | 32150 | -| policy_gradient_loss | -0.000769 | -| std | 0.435 | -| value_loss | 9.65e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3217 | -| time_elapsed | 31524 | -| total_timesteps | 411776 | -| train/ | | -| approx_kl | 0.008049812 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | 0.00425 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 32160 | -| policy_gradient_loss | -0.00206 | -| std | 0.435 | -| value_loss | 1.13e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3218 | -| time_elapsed | 31527 | -| total_timesteps | 411904 | -| train/ | | -| approx_kl | 3.4032855e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | 0.0058 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 32170 | -| policy_gradient_loss | -3.02e-05 | -| std | 0.436 | -| value_loss | 8.03e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3219 | -| time_elapsed | 31530 | -| total_timesteps | 412032 | -| train/ | | -| approx_kl | 0.008443896 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 32180 | -| policy_gradient_loss | -0.00109 | -| std | 0.438 | -| value_loss | 8.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3220 | -| time_elapsed | 31537 | -| total_timesteps | 412160 | -| train/ | | -| approx_kl | 0.002496615 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | 0.693 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 32190 | -| policy_gradient_loss | -0.00873 | -| std | 0.439 | -| value_loss | 0.00235 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3221 | -| time_elapsed | 31540 | -| total_timesteps | 412288 | -| train/ | | -| approx_kl | 0.011500424 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.324 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 32200 | -| policy_gradient_loss | -0.00248 | -| std | 0.441 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3222 | -| time_elapsed | 31544 | -| total_timesteps | 412416 | -| train/ | | -| approx_kl | 0.015711114 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -3.53 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 32210 | -| policy_gradient_loss | -0.00681 | -| std | 0.441 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3223 | -| time_elapsed | 31548 | -| total_timesteps | 412544 | -| train/ | | -| approx_kl | 0.012717671 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 32220 | -| policy_gradient_loss | 0.000646 | -| std | 0.442 | -| value_loss | 3.64e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3224 | -| time_elapsed | 31551 | -| total_timesteps | 412672 | -| train/ | | -| approx_kl | 0.0016501625 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0905 | -| learning_rate | 0.0003 | -| loss | 0.00012 | -| n_updates | 32230 | -| policy_gradient_loss | 7.14e-05 | -| std | 0.442 | -| value_loss | 1.96e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3225 | -| time_elapsed | 31555 | -| total_timesteps | 412800 | -| train/ | | -| approx_kl | 0.02181756 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.0237 | -| n_updates | 32240 | -| policy_gradient_loss | -0.013 | -| std | 0.442 | -| value_loss | 1.31e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3226 | -| time_elapsed | 31558 | -| total_timesteps | 412928 | -| train/ | | -| approx_kl | 0.00038567302 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.000459 | -| n_updates | 32250 | -| policy_gradient_loss | 0.000573 | -| std | 0.442 | -| value_loss | 1.23e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3227 | -| time_elapsed | 31561 | -| total_timesteps | 413056 | -| train/ | | -| approx_kl | 0.00085352804 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.000632 | -| n_updates | 32260 | -| policy_gradient_loss | -8.42e-05 | -| std | 0.442 | -| value_loss | 1.13e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3228 | -| time_elapsed | 31567 | -| total_timesteps | 413184 | -| train/ | | -| approx_kl | 0.11954748 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | 0.591 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 32270 | -| policy_gradient_loss | -0.000645 | -| std | 0.441 | -| value_loss | 0.00574 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3229 | -| time_elapsed | 31570 | -| total_timesteps | 413312 | -| train/ | | -| approx_kl | 0.012234834 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -8.88 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 32280 | -| policy_gradient_loss | -0.00228 | -| std | 0.44 | -| value_loss | 2.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3230 | -| time_elapsed | 31573 | -| total_timesteps | 413440 | -| train/ | | -| approx_kl | 0.018976662 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -5.03 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 32290 | -| policy_gradient_loss | -0.00207 | -| std | 0.44 | -| value_loss | 7.33e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3231 | -| time_elapsed | 31576 | -| total_timesteps | 413568 | -| train/ | | -| approx_kl | 0.009936636 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.386 | -| learning_rate | 0.0003 | -| loss | 0.000687 | -| n_updates | 32300 | -| policy_gradient_loss | -0.000439 | -| std | 0.439 | -| value_loss | 2.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3232 | -| time_elapsed | 31579 | -| total_timesteps | 413696 | -| train/ | | -| approx_kl | 0.018123932 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.00938 | -| learning_rate | 0.0003 | -| loss | -0.00968 | -| n_updates | 32310 | -| policy_gradient_loss | -0.00731 | -| std | 0.438 | -| value_loss | 2.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3233 | -| time_elapsed | 31582 | -| total_timesteps | 413824 | -| train/ | | -| approx_kl | 0.010641259 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 32320 | -| policy_gradient_loss | -0.00307 | -| std | 0.438 | -| value_loss | 1.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 13 | -| iterations | 3234 | -| time_elapsed | 31586 | -| total_timesteps | 413952 | -| train/ | | -| approx_kl | 0.014699147 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.00436 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 32330 | -| policy_gradient_loss | -0.00625 | -| std | 0.437 | -| value_loss | 2.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3235 | -| time_elapsed | 31591 | -| total_timesteps | 414080 | -| train/ | | -| approx_kl | 0.018226558 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 32340 | -| policy_gradient_loss | -0.00447 | -| std | 0.437 | -| value_loss | 1.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3236 | -| time_elapsed | 31597 | -| total_timesteps | 414208 | -| train/ | | -| approx_kl | 0.08995059 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | 0.575 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 32350 | -| policy_gradient_loss | -0.00977 | -| std | 0.436 | -| value_loss | 0.00688 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3237 | -| time_elapsed | 31601 | -| total_timesteps | 414336 | -| train/ | | -| approx_kl | 0.025401566 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -2.58 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 32360 | -| policy_gradient_loss | -0.0047 | -| std | 0.437 | -| value_loss | 1.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3238 | -| time_elapsed | 31602 | -| total_timesteps | 414464 | -| train/ | | -| approx_kl | 0.0029333362 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -3.34 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 32370 | -| policy_gradient_loss | -0.00185 | -| std | 0.437 | -| value_loss | 1.12e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3239 | -| time_elapsed | 31605 | -| total_timesteps | 414592 | -| train/ | | -| approx_kl | 0.0005772987 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 32380 | -| policy_gradient_loss | 0.00123 | -| std | 0.437 | -| value_loss | 3.34e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3240 | -| time_elapsed | 31607 | -| total_timesteps | 414720 | -| train/ | | -| approx_kl | 0.011818275 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -0.00868 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 32390 | -| policy_gradient_loss | -0.00256 | -| std | 0.436 | -| value_loss | 1.6e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3241 | -| time_elapsed | 31610 | -| total_timesteps | 414848 | -| train/ | | -| approx_kl | 0.0011622701 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.000159 | -| n_updates | 32400 | -| policy_gradient_loss | -1.46e-05 | -| std | 0.437 | -| value_loss | 6.76e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3242 | -| time_elapsed | 31614 | -| total_timesteps | 414976 | -| train/ | | -| approx_kl | 0.010479616 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | -0.00585 | -| n_updates | 32410 | -| policy_gradient_loss | -0.0033 | -| std | 0.438 | -| value_loss | 7.16e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3243 | -| time_elapsed | 31617 | -| total_timesteps | 415104 | -| train/ | | -| approx_kl | 0.0076012686 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | 0.00159 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 32420 | -| policy_gradient_loss | -0.0049 | -| std | 0.438 | -| value_loss | 4.72e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3244 | -| time_elapsed | 31625 | -| total_timesteps | 415232 | -| train/ | | -| approx_kl | 0.057646003 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | 0.567 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 32430 | -| policy_gradient_loss | -0.00346 | -| std | 0.438 | -| value_loss | 0.00755 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3245 | -| time_elapsed | 31628 | -| total_timesteps | 415360 | -| train/ | | -| approx_kl | 0.018916443 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -12.1 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 32440 | -| policy_gradient_loss | -0.00826 | -| std | 0.437 | -| value_loss | 1.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3246 | -| time_elapsed | 31632 | -| total_timesteps | 415488 | -| train/ | | -| approx_kl | 0.022739874 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -9.35 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 32450 | -| policy_gradient_loss | -0.00457 | -| std | 0.437 | -| value_loss | 7.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3247 | -| time_elapsed | 31635 | -| total_timesteps | 415616 | -| train/ | | -| approx_kl | 0.007474401 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.696 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 32460 | -| policy_gradient_loss | -0.0012 | -| std | 0.438 | -| value_loss | 2.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3248 | -| time_elapsed | 31639 | -| total_timesteps | 415744 | -| train/ | | -| approx_kl | 0.004156865 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.00341 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 32470 | -| policy_gradient_loss | -0.000615 | -| std | 0.437 | -| value_loss | 1.7e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 13 | -| iterations | 3249 | -| time_elapsed | 31642 | -| total_timesteps | 415872 | -| train/ | | -| approx_kl | 0.0020980595 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 32480 | -| policy_gradient_loss | -0.000209 | -| std | 0.437 | -| value_loss | 1.79e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3250 | -| time_elapsed | 31646 | -| total_timesteps | 416000 | -| train/ | | -| approx_kl | 0.0008061291 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.00328 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 32490 | -| policy_gradient_loss | 0.00141 | -| std | 0.436 | -| value_loss | 1.42e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3251 | -| time_elapsed | 31650 | -| total_timesteps | 416128 | -| train/ | | -| approx_kl | 0.0014959206 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | 0.00977 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 32500 | -| policy_gradient_loss | 0.000323 | -| std | 0.434 | -| value_loss | 2.14e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3252 | -| time_elapsed | 31658 | -| total_timesteps | 416256 | -| train/ | | -| approx_kl | 0.049184307 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | 0.565 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 32510 | -| policy_gradient_loss | -0.00931 | -| std | 0.434 | -| value_loss | 0.00798 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3253 | -| time_elapsed | 31660 | -| total_timesteps | 416384 | -| train/ | | -| approx_kl | 0.0282506 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -3.92 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 32520 | -| policy_gradient_loss | -0.0139 | -| std | 0.433 | -| value_loss | 5.03e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3254 | -| time_elapsed | 31663 | -| total_timesteps | 416512 | -| train/ | | -| approx_kl | 0.017987836 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 32530 | -| policy_gradient_loss | -0.0069 | -| std | 0.433 | -| value_loss | 2.24e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3255 | -| time_elapsed | 31666 | -| total_timesteps | 416640 | -| train/ | | -| approx_kl | 3.580004e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -0.00914 | -| learning_rate | 0.0003 | -| loss | -0.000421 | -| n_updates | 32540 | -| policy_gradient_loss | -0.000135 | -| std | 0.434 | -| value_loss | 2.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3256 | -| time_elapsed | 31669 | -| total_timesteps | 416768 | -| train/ | | -| approx_kl | 0.014302725 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 32550 | -| policy_gradient_loss | -0.0068 | -| std | 0.435 | -| value_loss | 3.69e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3257 | -| time_elapsed | 31673 | -| total_timesteps | 416896 | -| train/ | | -| approx_kl | 4.5806868e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | 0.00886 | -| learning_rate | 0.0003 | -| loss | -0.000206 | -| n_updates | 32560 | -| policy_gradient_loss | 2.78e-05 | -| std | 0.437 | -| value_loss | 2.08e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3258 | -| time_elapsed | 31677 | -| total_timesteps | 417024 | -| train/ | | -| approx_kl | 0.021974966 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 32570 | -| policy_gradient_loss | -0.00656 | -| std | 0.438 | -| value_loss | 2.9e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3259 | -| time_elapsed | 31685 | -| total_timesteps | 417152 | -| train/ | | -| approx_kl | 0.38197574 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | 0.291 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 32580 | -| policy_gradient_loss | -0.0107 | -| std | 0.439 | -| value_loss | 0.00102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3260 | -| time_elapsed | 31689 | -| total_timesteps | 417280 | -| train/ | | -| approx_kl | 0.018009901 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -0.0836 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 32590 | -| policy_gradient_loss | -0.00656 | -| std | 0.439 | -| value_loss | 5.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3261 | -| time_elapsed | 31693 | -| total_timesteps | 417408 | -| train/ | | -| approx_kl | 0.004670006 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 32600 | -| policy_gradient_loss | -0.00143 | -| std | 0.44 | -| value_loss | 4.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3262 | -| time_elapsed | 31696 | -| total_timesteps | 417536 | -| train/ | | -| approx_kl | 0.009591209 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 32610 | -| policy_gradient_loss | -0.00289 | -| std | 0.44 | -| value_loss | 2.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3263 | -| time_elapsed | 31698 | -| total_timesteps | 417664 | -| train/ | | -| approx_kl | 0.00639511 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.0805 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 32620 | -| policy_gradient_loss | -0.000924 | -| std | 0.44 | -| value_loss | 2.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3264 | -| time_elapsed | 31700 | -| total_timesteps | 417792 | -| train/ | | -| approx_kl | 0.005220377 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 32630 | -| policy_gradient_loss | -0.00144 | -| std | 0.44 | -| value_loss | 2.62e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3265 | -| time_elapsed | 31704 | -| total_timesteps | 417920 | -| train/ | | -| approx_kl | 0.00058891135 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.000669 | -| n_updates | 32640 | -| policy_gradient_loss | 0.000935 | -| std | 0.44 | -| value_loss | 1.25e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3266 | -| time_elapsed | 31707 | -| total_timesteps | 418048 | -| train/ | | -| approx_kl | 0.010132777 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 32650 | -| policy_gradient_loss | -0.00287 | -| std | 0.44 | -| value_loss | 1.87e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3267 | -| time_elapsed | 31713 | -| total_timesteps | 418176 | -| train/ | | -| approx_kl | 0.01023896 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | 0.577 | -| learning_rate | 0.0003 | -| loss | -0.00562 | -| n_updates | 32660 | -| policy_gradient_loss | -0.00475 | -| std | 0.44 | -| value_loss | 0.00743 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3268 | -| time_elapsed | 31717 | -| total_timesteps | 418304 | -| train/ | | -| approx_kl | 0.0044359444 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | -0.00864 | -| n_updates | 32670 | -| policy_gradient_loss | -0.00213 | -| std | 0.439 | -| value_loss | 2.01e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3269 | -| time_elapsed | 31722 | -| total_timesteps | 418432 | -| train/ | | -| approx_kl | 0.013619471 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | 0.000582 | -| n_updates | 32680 | -| policy_gradient_loss | -0.000275 | -| std | 0.44 | -| value_loss | 1.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3270 | -| time_elapsed | 31725 | -| total_timesteps | 418560 | -| train/ | | -| approx_kl | 0.007961342 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 32690 | -| policy_gradient_loss | -0.00119 | -| std | 0.44 | -| value_loss | 8.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3271 | -| time_elapsed | 31727 | -| total_timesteps | 418688 | -| train/ | | -| approx_kl | 0.012432943 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -0.0716 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 32700 | -| policy_gradient_loss | -0.00521 | -| std | 0.439 | -| value_loss | 5.78e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3272 | -| time_elapsed | 31730 | -| total_timesteps | 418816 | -| train/ | | -| approx_kl | 0.00980472 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.00169 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 32710 | -| policy_gradient_loss | -0.00212 | -| std | 0.438 | -| value_loss | 3.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3273 | -| time_elapsed | 31735 | -| total_timesteps | 418944 | -| train/ | | -| approx_kl | 0.007737077 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.0024 | -| learning_rate | 0.0003 | -| loss | -0.00998 | -| n_updates | 32720 | -| policy_gradient_loss | -0.00337 | -| std | 0.439 | -| value_loss | 2.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3274 | -| time_elapsed | 31739 | -| total_timesteps | 419072 | -| train/ | | -| approx_kl | 0.026466222 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 32730 | -| policy_gradient_loss | -0.007 | -| std | 0.439 | -| value_loss | 6.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3275 | -| time_elapsed | 31746 | -| total_timesteps | 419200 | -| train/ | | -| approx_kl | 0.014987594 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | 0.728 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 32740 | -| policy_gradient_loss | -0.00244 | -| std | 0.439 | -| value_loss | 0.000822 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3276 | -| time_elapsed | 31750 | -| total_timesteps | 419328 | -| train/ | | -| approx_kl | 0.033054005 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | -0.000869 | -| n_updates | 32750 | -| policy_gradient_loss | -0.00247 | -| std | 0.44 | -| value_loss | 2.31e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3277 | -| time_elapsed | 31754 | -| total_timesteps | 419456 | -| train/ | | -| approx_kl | 0.01578885 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 32760 | -| policy_gradient_loss | -0.0105 | -| std | 0.439 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3278 | -| time_elapsed | 31757 | -| total_timesteps | 419584 | -| train/ | | -| approx_kl | 0.025192862 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -4.66 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 32770 | -| policy_gradient_loss | -0.00352 | -| std | 0.439 | -| value_loss | 1.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3279 | -| time_elapsed | 31760 | -| total_timesteps | 419712 | -| train/ | | -| approx_kl | 0.00900985 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.454 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 32780 | -| policy_gradient_loss | -0.00288 | -| std | 0.438 | -| value_loss | 8.77e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3280 | -| time_elapsed | 31764 | -| total_timesteps | 419840 | -| train/ | | -| approx_kl | 0.0071094204 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 32790 | -| policy_gradient_loss | -0.000962 | -| std | 0.437 | -| value_loss | 5.74e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3281 | -| time_elapsed | 31766 | -| total_timesteps | 419968 | -| train/ | | -| approx_kl | 0.011764645 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.0872 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 32800 | -| policy_gradient_loss | -0.00336 | -| std | 0.437 | -| value_loss | 7.44e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3282 | -| time_elapsed | 31768 | -| total_timesteps | 420096 | -| train/ | | -| approx_kl | 0.00826004 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.00882 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 32810 | -| policy_gradient_loss | -0.0012 | -| std | 0.437 | -| value_loss | 4.09e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3283 | -| time_elapsed | 31775 | -| total_timesteps | 420224 | -| train/ | | -| approx_kl | 0.03425107 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | 0.579 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 32820 | -| policy_gradient_loss | -0.0129 | -| std | 0.438 | -| value_loss | 0.00766 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3284 | -| time_elapsed | 31780 | -| total_timesteps | 420352 | -| train/ | | -| approx_kl | 0.00083624595 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -5.31 | -| learning_rate | 0.0003 | -| loss | 9.21e-05 | -| n_updates | 32830 | -| policy_gradient_loss | 0.000367 | -| std | 0.439 | -| value_loss | 1.48e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3285 | -| time_elapsed | 31785 | -| total_timesteps | 420480 | -| train/ | | -| approx_kl | 0.0006121171 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | 0.000155 | -| n_updates | 32840 | -| policy_gradient_loss | 9.35e-05 | -| std | 0.44 | -| value_loss | 7.71e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3286 | -| time_elapsed | 31788 | -| total_timesteps | 420608 | -| train/ | | -| approx_kl | 0.009841364 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.763 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 32850 | -| policy_gradient_loss | -0.00128 | -| std | 0.44 | -| value_loss | 1.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3287 | -| time_elapsed | 31791 | -| total_timesteps | 420736 | -| train/ | | -| approx_kl | 0.005970498 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 32860 | -| policy_gradient_loss | -0.0012 | -| std | 0.442 | -| value_loss | 1.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3288 | -| time_elapsed | 31794 | -| total_timesteps | 420864 | -| train/ | | -| approx_kl | 0.003611904 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 32870 | -| policy_gradient_loss | -0.00147 | -| std | 0.444 | -| value_loss | 8.28e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3289 | -| time_elapsed | 31797 | -| total_timesteps | 420992 | -| train/ | | -| approx_kl | 0.00017870101 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | 0.0061 | -| learning_rate | 0.0003 | -| loss | -0.000572 | -| n_updates | 32880 | -| policy_gradient_loss | 0.000494 | -| std | 0.445 | -| value_loss | 3.68e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3290 | -| time_elapsed | 31800 | -| total_timesteps | 421120 | -| train/ | | -| approx_kl | 0.001678599 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 32890 | -| policy_gradient_loss | 0.000201 | -| std | 0.445 | -| value_loss | 4.77e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3291 | -| time_elapsed | 31809 | -| total_timesteps | 421248 | -| train/ | | -| approx_kl | 3.8859434e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | 0.772 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 32900 | -| policy_gradient_loss | -4.52e-05 | -| std | 0.445 | -| value_loss | 0.000757 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3292 | -| time_elapsed | 31811 | -| total_timesteps | 421376 | -| train/ | | -| approx_kl | 0.016252395 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 32910 | -| policy_gradient_loss | -0.00116 | -| std | 0.445 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3293 | -| time_elapsed | 31814 | -| total_timesteps | 421504 | -| train/ | | -| approx_kl | 0.004290159 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -19.1 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 32920 | -| policy_gradient_loss | -0.000452 | -| std | 0.444 | -| value_loss | 8.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3294 | -| time_elapsed | 31817 | -| total_timesteps | 421632 | -| train/ | | -| approx_kl | 0.007684958 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -4.18 | -| learning_rate | 0.0003 | -| loss | -0.00092 | -| n_updates | 32930 | -| policy_gradient_loss | -0.000961 | -| std | 0.443 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3295 | -| time_elapsed | 31819 | -| total_timesteps | 421760 | -| train/ | | -| approx_kl | 0.012666376 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -0.39 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 32940 | -| policy_gradient_loss | -0.00462 | -| std | 0.443 | -| value_loss | 6.81e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3296 | -| time_elapsed | 31823 | -| total_timesteps | 421888 | -| train/ | | -| approx_kl | 0.015750587 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | 0.00475 | -| learning_rate | 0.0003 | -| loss | -0.0371 | -| n_updates | 32950 | -| policy_gradient_loss | -0.0176 | -| std | 0.443 | -| value_loss | 2.48e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3297 | -| time_elapsed | 31825 | -| total_timesteps | 422016 | -| train/ | | -| approx_kl | 0.00040434883 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 32960 | -| policy_gradient_loss | 0.00232 | -| std | 0.443 | -| value_loss | 3.84e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3298 | -| time_elapsed | 31833 | -| total_timesteps | 422144 | -| train/ | | -| approx_kl | 0.0012203637 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | 0.687 | -| learning_rate | 0.0003 | -| loss | -0.00507 | -| n_updates | 32970 | -| policy_gradient_loss | -0.000314 | -| std | 0.442 | -| value_loss | 0.000646 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3299 | -| time_elapsed | 31838 | -| total_timesteps | 422272 | -| train/ | | -| approx_kl | 0.019299619 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -4.67 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 32980 | -| policy_gradient_loss | -0.00131 | -| std | 0.442 | -| value_loss | 5.67e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3300 | -| time_elapsed | 31841 | -| total_timesteps | 422400 | -| train/ | | -| approx_kl | 7.3830597e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -18.6 | -| learning_rate | 0.0003 | -| loss | -3.64e-05 | -| n_updates | 32990 | -| policy_gradient_loss | -3.26e-06 | -| std | 0.442 | -| value_loss | 1.21e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3301 | -| time_elapsed | 31845 | -| total_timesteps | 422528 | -| train/ | | -| approx_kl | 0.01493538 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 33000 | -| policy_gradient_loss | -0.00557 | -| std | 0.441 | -| value_loss | 3.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3302 | -| time_elapsed | 31849 | -| total_timesteps | 422656 | -| train/ | | -| approx_kl | 0.030597284 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 33010 | -| policy_gradient_loss | -0.017 | -| std | 0.441 | -| value_loss | 8.4e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3303 | -| time_elapsed | 31852 | -| total_timesteps | 422784 | -| train/ | | -| approx_kl | 0.006892233 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 33020 | -| policy_gradient_loss | -0.00081 | -| std | 0.442 | -| value_loss | 1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3304 | -| time_elapsed | 31856 | -| total_timesteps | 422912 | -| train/ | | -| approx_kl | 0.01274216 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 33030 | -| policy_gradient_loss | -0.00205 | -| std | 0.443 | -| value_loss | 9.23e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3305 | -| time_elapsed | 31859 | -| total_timesteps | 423040 | -| train/ | | -| approx_kl | 0.010794013 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -0.0851 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 33040 | -| policy_gradient_loss | -0.000965 | -| std | 0.443 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3306 | -| time_elapsed | 31866 | -| total_timesteps | 423168 | -| train/ | | -| approx_kl | 0.0015887157 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.000685 | -| n_updates | 33050 | -| policy_gradient_loss | -0.000721 | -| std | 0.442 | -| value_loss | 0.00195 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3307 | -| time_elapsed | 31870 | -| total_timesteps | 423296 | -| train/ | | -| approx_kl | 0.014950787 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.673 | -| learning_rate | 0.0003 | -| loss | -0.00767 | -| n_updates | 33060 | -| policy_gradient_loss | -0.00619 | -| std | 0.44 | -| value_loss | 5.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3308 | -| time_elapsed | 31874 | -| total_timesteps | 423424 | -| train/ | | -| approx_kl | 0.015418918 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -5.74 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 33070 | -| policy_gradient_loss | -0.00719 | -| std | 0.44 | -| value_loss | 9.13e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3309 | -| time_elapsed | 31878 | -| total_timesteps | 423552 | -| train/ | | -| approx_kl | 0.0036284246 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.755 | -| learning_rate | 0.0003 | -| loss | -0.0077 | -| n_updates | 33080 | -| policy_gradient_loss | -0.00199 | -| std | 0.44 | -| value_loss | 5.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3310 | -| time_elapsed | 31882 | -| total_timesteps | 423680 | -| train/ | | -| approx_kl | 0.019928489 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 33090 | -| policy_gradient_loss | -0.0127 | -| std | 0.44 | -| value_loss | 1.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3311 | -| time_elapsed | 31885 | -| total_timesteps | 423808 | -| train/ | | -| approx_kl | 0.012309054 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.724 | -| learning_rate | 0.0003 | -| loss | -0.000626 | -| n_updates | 33100 | -| policy_gradient_loss | -0.00194 | -| std | 0.44 | -| value_loss | 8.26e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3312 | -| time_elapsed | 31889 | -| total_timesteps | 423936 | -| train/ | | -| approx_kl | 0.013432357 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | 0.00338 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 33110 | -| policy_gradient_loss | -0.00257 | -| std | 0.441 | -| value_loss | 4.15e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3313 | -| time_elapsed | 31892 | -| total_timesteps | 424064 | -| train/ | | -| approx_kl | 0.014834695 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 33120 | -| policy_gradient_loss | -0.0109 | -| std | 0.441 | -| value_loss | 4.94e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3314 | -| time_elapsed | 31897 | -| total_timesteps | 424192 | -| train/ | | -| approx_kl | 0.0035829267 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | 0.741 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 33130 | -| policy_gradient_loss | -0.00528 | -| std | 0.441 | -| value_loss | 0.00219 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3315 | -| time_elapsed | 31899 | -| total_timesteps | 424320 | -| train/ | | -| approx_kl | 0.017590895 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 33140 | -| policy_gradient_loss | -0.0062 | -| std | 0.441 | -| value_loss | 1.86e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3316 | -| time_elapsed | 31901 | -| total_timesteps | 424448 | -| train/ | | -| approx_kl | 0.0011318338 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | 9.57e-05 | -| n_updates | 33150 | -| policy_gradient_loss | 0.000143 | -| std | 0.443 | -| value_loss | 2.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3317 | -| time_elapsed | 31905 | -| total_timesteps | 424576 | -| train/ | | -| approx_kl | 0.011891859 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -0.235 | -| learning_rate | 0.0003 | -| loss | -0.00453 | -| n_updates | 33160 | -| policy_gradient_loss | -0.003 | -| std | 0.444 | -| value_loss | 2e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3318 | -| time_elapsed | 31908 | -| total_timesteps | 424704 | -| train/ | | -| approx_kl | 0.02307182 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.00774 | -| n_updates | 33170 | -| policy_gradient_loss | -0.00628 | -| std | 0.445 | -| value_loss | 1.24e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3319 | -| time_elapsed | 31912 | -| total_timesteps | 424832 | -| train/ | | -| approx_kl | 0.0075309244 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 33180 | -| policy_gradient_loss | -0.00231 | -| std | 0.445 | -| value_loss | 1.03e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3320 | -| time_elapsed | 31916 | -| total_timesteps | 424960 | -| train/ | | -| approx_kl | 0.0048266044 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | -0.000448 | -| n_updates | 33190 | -| policy_gradient_loss | -0.0003 | -| std | 0.445 | -| value_loss | 1.01e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3321 | -| time_elapsed | 31920 | -| total_timesteps | 425088 | -| train/ | | -| approx_kl | 0.004133025 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 33200 | -| policy_gradient_loss | -0.000538 | -| std | 0.445 | -| value_loss | 4.26e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3322 | -| time_elapsed | 31929 | -| total_timesteps | 425216 | -| train/ | | -| approx_kl | 0.003599567 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | 0.768 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 33210 | -| policy_gradient_loss | -0.0072 | -| std | 0.445 | -| value_loss | 0.00171 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3323 | -| time_elapsed | 31932 | -| total_timesteps | 425344 | -| train/ | | -| approx_kl | 0.00039112032 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.000487 | -| n_updates | 33220 | -| policy_gradient_loss | 0.000721 | -| std | 0.445 | -| value_loss | 1.12e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3324 | -| time_elapsed | 31935 | -| total_timesteps | 425472 | -| train/ | | -| approx_kl | 0.019170815 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -0.92 | -| learning_rate | 0.0003 | -| loss | -5.24e-05 | -| n_updates | 33230 | -| policy_gradient_loss | -0.00156 | -| std | 0.445 | -| value_loss | 4.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3325 | -| time_elapsed | 31939 | -| total_timesteps | 425600 | -| train/ | | -| approx_kl | 0.0019617616 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 33240 | -| policy_gradient_loss | -0.000322 | -| std | 0.446 | -| value_loss | 3.03e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3326 | -| time_elapsed | 31943 | -| total_timesteps | 425728 | -| train/ | | -| approx_kl | 0.00026851008 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.614 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.000736 | -| n_updates | 33250 | -| policy_gradient_loss | -0.000295 | -| std | 0.449 | -| value_loss | 1.31e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3327 | -| time_elapsed | 31946 | -| total_timesteps | 425856 | -| train/ | | -| approx_kl | 0.016568452 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -0.0925 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 33260 | -| policy_gradient_loss | -0.00624 | -| std | 0.45 | -| value_loss | 7.35e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3328 | -| time_elapsed | 31950 | -| total_timesteps | 425984 | -| train/ | | -| approx_kl | 1.4013611e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.623 | -| explained_variance | 0.00157 | -| learning_rate | 0.0003 | -| loss | -0.000158 | -| n_updates | 33270 | -| policy_gradient_loss | 8.5e-05 | -| std | 0.452 | -| value_loss | 5.77e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3329 | -| time_elapsed | 31953 | -| total_timesteps | 426112 | -| train/ | | -| approx_kl | 2.98284e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.625 | -| explained_variance | -0.0954 | -| learning_rate | 0.0003 | -| loss | 4.81e-05 | -| n_updates | 33280 | -| policy_gradient_loss | 0.000115 | -| std | 0.452 | -| value_loss | 5.37e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3330 | -| time_elapsed | 31963 | -| total_timesteps | 426240 | -| train/ | | -| approx_kl | 0.005585975 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.624 | -| explained_variance | 0.583 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 33290 | -| policy_gradient_loss | -0.0129 | -| std | 0.451 | -| value_loss | 0.00805 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3331 | -| time_elapsed | 31965 | -| total_timesteps | 426368 | -| train/ | | -| approx_kl | 0.0012616436 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.624 | -| explained_variance | -223 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 33300 | -| policy_gradient_loss | -0.000275 | -| std | 0.452 | -| value_loss | 5.28e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3332 | -| time_elapsed | 31969 | -| total_timesteps | 426496 | -| train/ | | -| approx_kl | 0.021603517 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.627 | -| explained_variance | -227 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 33310 | -| policy_gradient_loss | -0.00196 | -| std | 0.453 | -| value_loss | 2.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3333 | -| time_elapsed | 31972 | -| total_timesteps | 426624 | -| train/ | | -| approx_kl | 0.021865254 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | -0.629 | -| explained_variance | -21.7 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 33320 | -| policy_gradient_loss | -0.00175 | -| std | 0.455 | -| value_loss | 1.42e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3334 | -| time_elapsed | 31975 | -| total_timesteps | 426752 | -| train/ | | -| approx_kl | 0.01645736 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.631 | -| explained_variance | -0.504 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 33330 | -| policy_gradient_loss | -0.00389 | -| std | 0.455 | -| value_loss | 2.26e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3335 | -| time_elapsed | 31978 | -| total_timesteps | 426880 | -| train/ | | -| approx_kl | 0.0012390504 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.632 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | -0.000717 | -| n_updates | 33340 | -| policy_gradient_loss | -0.000105 | -| std | 0.455 | -| value_loss | 1.91e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3336 | -| time_elapsed | 31981 | -| total_timesteps | 427008 | -| train/ | | -| approx_kl | 0.0047358302 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.631 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.00722 | -| n_updates | 33350 | -| policy_gradient_loss | -0.00195 | -| std | 0.454 | -| value_loss | 1.02e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3337 | -| time_elapsed | 31990 | -| total_timesteps | 427136 | -| train/ | | -| approx_kl | 0.0029727323 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.629 | -| explained_variance | 0.786 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 33360 | -| policy_gradient_loss | -0.0107 | -| std | 0.454 | -| value_loss | 0.00157 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3338 | -| time_elapsed | 31994 | -| total_timesteps | 427264 | -| train/ | | -| approx_kl | 0.00030657346 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.628 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 33370 | -| policy_gradient_loss | 0.00388 | -| std | 0.454 | -| value_loss | 1.29e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3339 | -| time_elapsed | 31999 | -| total_timesteps | 427392 | -| train/ | | -| approx_kl | 0.0006391504 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.629 | -| explained_variance | -29.3 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 33380 | -| policy_gradient_loss | 0.000234 | -| std | 0.454 | -| value_loss | 3.39e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3340 | -| time_elapsed | 32002 | -| total_timesteps | 427520 | -| train/ | | -| approx_kl | 0.0017306111 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.628 | -| explained_variance | -6.68 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 33390 | -| policy_gradient_loss | 3.55e-05 | -| std | 0.454 | -| value_loss | 8.19e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3341 | -| time_elapsed | 32006 | -| total_timesteps | 427648 | -| train/ | | -| approx_kl | 0.00075749867 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.628 | -| explained_variance | -0.258 | -| learning_rate | 0.0003 | -| loss | -0.00574 | -| n_updates | 33400 | -| policy_gradient_loss | 0.00165 | -| std | 0.454 | -| value_loss | 3.42e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3342 | -| time_elapsed | 32009 | -| total_timesteps | 427776 | -| train/ | | -| approx_kl | 0.01832918 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.629 | -| explained_variance | -0.068 | -| learning_rate | 0.0003 | -| loss | 0.00334 | -| n_updates | 33410 | -| policy_gradient_loss | -0.000211 | -| std | 0.454 | -| value_loss | 1.82e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3343 | -| time_elapsed | 32012 | -| total_timesteps | 427904 | -| train/ | | -| approx_kl | 0.017633647 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.629 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 33420 | -| policy_gradient_loss | -0.00775 | -| std | 0.454 | -| value_loss | 1.33e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3344 | -| time_elapsed | 32015 | -| total_timesteps | 428032 | -| train/ | | -| approx_kl | 0.0127157625 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.628 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.000778 | -| n_updates | 33430 | -| policy_gradient_loss | -0.000608 | -| std | 0.453 | -| value_loss | 1.96e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3345 | -| time_elapsed | 32021 | -| total_timesteps | 428160 | -| train/ | | -| approx_kl | 0.037062503 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.627 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 33440 | -| policy_gradient_loss | -0.0181 | -| std | 0.453 | -| value_loss | 0.00059 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3346 | -| time_elapsed | 32026 | -| total_timesteps | 428288 | -| train/ | | -| approx_kl | 0.03460889 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | -0.626 | -| explained_variance | -20.3 | -| learning_rate | 0.0003 | -| loss | -0.00655 | -| n_updates | 33450 | -| policy_gradient_loss | -0.00523 | -| std | 0.452 | -| value_loss | 1.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3347 | -| time_elapsed | 32028 | -| total_timesteps | 428416 | -| train/ | | -| approx_kl | 0.005886012 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.624 | -| explained_variance | -29.3 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 33460 | -| policy_gradient_loss | -0.00108 | -| std | 0.451 | -| value_loss | 8.31e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3348 | -| time_elapsed | 32031 | -| total_timesteps | 428544 | -| train/ | | -| approx_kl | 0.0024884767 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -4.51 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 33470 | -| policy_gradient_loss | -0.000822 | -| std | 0.449 | -| value_loss | 1.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3349 | -| time_elapsed | 32034 | -| total_timesteps | 428672 | -| train/ | | -| approx_kl | 0.025923373 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 33480 | -| policy_gradient_loss | -0.0132 | -| std | 0.449 | -| value_loss | 7.64e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3350 | -| time_elapsed | 32036 | -| total_timesteps | 428800 | -| train/ | | -| approx_kl | 0.00015133317 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.0921 | -| learning_rate | 0.0003 | -| loss | -0.000218 | -| n_updates | 33490 | -| policy_gradient_loss | -6.76e-05 | -| std | 0.449 | -| value_loss | 2.87e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 13 | -| iterations | 3351 | -| time_elapsed | 32039 | -| total_timesteps | 428928 | -| train/ | | -| approx_kl | 0.010055482 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.000597 | -| n_updates | 33500 | -| policy_gradient_loss | -0.00082 | -| std | 0.45 | -| value_loss | 2.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3352 | -| time_elapsed | 32042 | -| total_timesteps | 429056 | -| train/ | | -| approx_kl | 0.0126487855 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 33510 | -| policy_gradient_loss | -0.00388 | -| std | 0.45 | -| value_loss | 1.75e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3353 | -| time_elapsed | 32048 | -| total_timesteps | 429184 | -| train/ | | -| approx_kl | 0.026345853 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 33520 | -| policy_gradient_loss | -0.0189 | -| std | 0.45 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3354 | -| time_elapsed | 32050 | -| total_timesteps | 429312 | -| train/ | | -| approx_kl | 0.023622986 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 33530 | -| policy_gradient_loss | -0.00625 | -| std | 0.449 | -| value_loss | 2.75e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3355 | -| time_elapsed | 32053 | -| total_timesteps | 429440 | -| train/ | | -| approx_kl | 0.0007802611 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -3.15 | -| learning_rate | 0.0003 | -| loss | -0.000762 | -| n_updates | 33540 | -| policy_gradient_loss | -0.000317 | -| std | 0.449 | -| value_loss | 1.36e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3356 | -| time_elapsed | 32055 | -| total_timesteps | 429568 | -| train/ | | -| approx_kl | 0.010153606 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.617 | -| explained_variance | -0.576 | -| learning_rate | 0.0003 | -| loss | 0.000295 | -| n_updates | 33550 | -| policy_gradient_loss | -0.000684 | -| std | 0.449 | -| value_loss | 1.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3357 | -| time_elapsed | 32058 | -| total_timesteps | 429696 | -| train/ | | -| approx_kl | 0.00615352 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.482 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 33560 | -| policy_gradient_loss | -0.00107 | -| std | 0.449 | -| value_loss | 2.65e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3358 | -| time_elapsed | 32062 | -| total_timesteps | 429824 | -| train/ | | -| approx_kl | 0.01245104 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -0.092 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 33570 | -| policy_gradient_loss | -0.00654 | -| std | 0.448 | -| value_loss | 1.46e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3359 | -| time_elapsed | 32065 | -| total_timesteps | 429952 | -| train/ | | -| approx_kl | 0.014705941 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | 0.0016 | -| learning_rate | 0.0003 | -| loss | -0.000244 | -| n_updates | 33580 | -| policy_gradient_loss | -0.0015 | -| std | 0.448 | -| value_loss | 8.9e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3360 | -| time_elapsed | 32070 | -| total_timesteps | 430080 | -| train/ | | -| approx_kl | 0.0077843843 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.614 | -| explained_variance | -0.000302 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 33590 | -| policy_gradient_loss | -0.00246 | -| std | 0.447 | -| value_loss | 7.7e-09 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3361 | -| time_elapsed | 32077 | -| total_timesteps | 430208 | -| train/ | | -| approx_kl | 0.08982 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.613 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.0266 | -| n_updates | 33600 | -| policy_gradient_loss | -0.0177 | -| std | 0.447 | -| value_loss | 0.000434 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3362 | -| time_elapsed | 32081 | -| total_timesteps | 430336 | -| train/ | | -| approx_kl | 0.013255641 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.613 | -| explained_variance | -24.9 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 33610 | -| policy_gradient_loss | -0.0022 | -| std | 0.446 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3363 | -| time_elapsed | 32085 | -| total_timesteps | 430464 | -| train/ | | -| approx_kl | 0.0005132712 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.612 | -| explained_variance | -46.4 | -| learning_rate | 0.0003 | -| loss | 0.000259 | -| n_updates | 33620 | -| policy_gradient_loss | 0.00059 | -| std | 0.446 | -| value_loss | 6.43e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3364 | -| time_elapsed | 32088 | -| total_timesteps | 430592 | -| train/ | | -| approx_kl | 0.031891223 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -5.2 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 33630 | -| policy_gradient_loss | -0.00737 | -| std | 0.445 | -| value_loss | 1.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3365 | -| time_elapsed | 32092 | -| total_timesteps | 430720 | -| train/ | | -| approx_kl | 0.0040206164 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -0.0942 | -| learning_rate | 0.0003 | -| loss | -0.000143 | -| n_updates | 33640 | -| policy_gradient_loss | 6.59e-06 | -| std | 0.444 | -| value_loss | 2.93e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3366 | -| time_elapsed | 32096 | -| total_timesteps | 430848 | -| train/ | | -| approx_kl | 0.00060613523 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 33650 | -| policy_gradient_loss | 2.82e-06 | -| std | 0.444 | -| value_loss | 2.52e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3367 | -| time_elapsed | 32100 | -| total_timesteps | 430976 | -| train/ | | -| approx_kl | 0.0004101121 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | 1.56e-05 | -| n_updates | 33660 | -| policy_gradient_loss | 0.000167 | -| std | 0.445 | -| value_loss | 1.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3368 | -| time_elapsed | 32104 | -| total_timesteps | 431104 | -| train/ | | -| approx_kl | 0.005549956 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 33670 | -| policy_gradient_loss | -0.000675 | -| std | 0.446 | -| value_loss | 7.88e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3369 | -| time_elapsed | 32113 | -| total_timesteps | 431232 | -| train/ | | -| approx_kl | 0.019133706 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.613 | -| explained_variance | 0.615 | -| learning_rate | 0.0003 | -| loss | -0.00742 | -| n_updates | 33680 | -| policy_gradient_loss | -0.00857 | -| std | 0.447 | -| value_loss | 0.00683 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3370 | -| time_elapsed | 32117 | -| total_timesteps | 431360 | -| train/ | | -| approx_kl | 0.024259742 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.613 | -| explained_variance | -768 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 33690 | -| policy_gradient_loss | -0.00698 | -| std | 0.447 | -| value_loss | 1.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3371 | -| time_elapsed | 32121 | -| total_timesteps | 431488 | -| train/ | | -| approx_kl | 0.010054371 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.614 | -| explained_variance | -831 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 33700 | -| policy_gradient_loss | 0.00073 | -| std | 0.447 | -| value_loss | 7.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3372 | -| time_elapsed | 32125 | -| total_timesteps | 431616 | -| train/ | | -| approx_kl | 0.012799991 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -645 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 33710 | -| policy_gradient_loss | -0.00459 | -| std | 0.448 | -| value_loss | 3.43e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3373 | -| time_elapsed | 32128 | -| total_timesteps | 431744 | -| train/ | | -| approx_kl | 0.03307407 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -25.2 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 33720 | -| policy_gradient_loss | -0.00403 | -| std | 0.448 | -| value_loss | 6.1e-10 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3374 | -| time_elapsed | 32132 | -| total_timesteps | 431872 | -| train/ | | -| approx_kl | 2.6058406e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -2.01 | -| learning_rate | 0.0003 | -| loss | 5.19e-05 | -| n_updates | 33730 | -| policy_gradient_loss | 0.00053 | -| std | 0.448 | -| value_loss | 1.14e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3375 | -| time_elapsed | 32136 | -| total_timesteps | 432000 | -| train/ | | -| approx_kl | 0.013630385 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -0.508 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 33740 | -| policy_gradient_loss | -0.00387 | -| std | 0.448 | -| value_loss | 5.5e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3376 | -| time_elapsed | 32138 | -| total_timesteps | 432128 | -| train/ | | -| approx_kl | 0.0011379695 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | 0.00567 | -| learning_rate | 0.0003 | -| loss | -0.000575 | -| n_updates | 33750 | -| policy_gradient_loss | -0.000212 | -| std | 0.447 | -| value_loss | 2.88e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3377 | -| time_elapsed | 32145 | -| total_timesteps | 432256 | -| train/ | | -| approx_kl | 0.007876549 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.614 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 33760 | -| policy_gradient_loss | -0.00553 | -| std | 0.447 | -| value_loss | 0.000437 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3378 | -| time_elapsed | 32147 | -| total_timesteps | 432384 | -| train/ | | -| approx_kl | 0.00087174866 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -40.3 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 33770 | -| policy_gradient_loss | 0.00116 | -| std | 0.448 | -| value_loss | 1.29e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3379 | -| time_elapsed | 32151 | -| total_timesteps | 432512 | -| train/ | | -| approx_kl | 0.001351058 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -60.5 | -| learning_rate | 0.0003 | -| loss | -0.00796 | -| n_updates | 33780 | -| policy_gradient_loss | 0.0012 | -| std | 0.448 | -| value_loss | 6.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3380 | -| time_elapsed | 32154 | -| total_timesteps | 432640 | -| train/ | | -| approx_kl | 0.05123624 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -19 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 33790 | -| policy_gradient_loss | -0.0154 | -| std | 0.448 | -| value_loss | 8.42e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3381 | -| time_elapsed | 32158 | -| total_timesteps | 432768 | -| train/ | | -| approx_kl | 0.0059397793 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | 0.000916 | -| n_updates | 33800 | -| policy_gradient_loss | 0.000589 | -| std | 0.448 | -| value_loss | 2.37e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3382 | -| time_elapsed | 32161 | -| total_timesteps | 432896 | -| train/ | | -| approx_kl | 0.01406875 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00506 | -| n_updates | 33810 | -| policy_gradient_loss | -0.00317 | -| std | 0.448 | -| value_loss | 1.12e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3383 | -| time_elapsed | 32164 | -| total_timesteps | 433024 | -| train/ | | -| approx_kl | 0.007867018 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.000615 | -| n_updates | 33820 | -| policy_gradient_loss | -0.000725 | -| std | 0.448 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3384 | -| time_elapsed | 32173 | -| total_timesteps | 433152 | -| train/ | | -| approx_kl | 0.0028947517 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 33830 | -| policy_gradient_loss | -0.0127 | -| std | 0.448 | -| value_loss | 0.00323 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3385 | -| time_elapsed | 32177 | -| total_timesteps | 433280 | -| train/ | | -| approx_kl | 0.019475985 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.617 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 33840 | -| policy_gradient_loss | -0.00664 | -| std | 0.448 | -| value_loss | 3.34e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3386 | -| time_elapsed | 32180 | -| total_timesteps | 433408 | -| train/ | | -| approx_kl | 3.387849e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -185 | -| learning_rate | 0.0003 | -| loss | 0.000296 | -| n_updates | 33850 | -| policy_gradient_loss | 0.00159 | -| std | 0.449 | -| value_loss | 1.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3387 | -| time_elapsed | 32184 | -| total_timesteps | 433536 | -| train/ | | -| approx_kl | 0.036819033 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -19.9 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 33860 | -| policy_gradient_loss | -0.0067 | -| std | 0.449 | -| value_loss | 1.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3388 | -| time_elapsed | 32186 | -| total_timesteps | 433664 | -| train/ | | -| approx_kl | 0.02212624 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 33870 | -| policy_gradient_loss | -0.00983 | -| std | 0.45 | -| value_loss | 3.22e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3389 | -| time_elapsed | 32189 | -| total_timesteps | 433792 | -| train/ | | -| approx_kl | 0.008382755 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -0.0798 | -| learning_rate | 0.0003 | -| loss | -0.00095 | -| n_updates | 33880 | -| policy_gradient_loss | -0.00096 | -| std | 0.449 | -| value_loss | 2.95e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 13 | -| iterations | 3390 | -| time_elapsed | 32193 | -| total_timesteps | 433920 | -| train/ | | -| approx_kl | 0.018503863 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 33890 | -| policy_gradient_loss | -0.0125 | -| std | 0.449 | -| value_loss | 3.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3391 | -| time_elapsed | 32197 | -| total_timesteps | 434048 | -| train/ | | -| approx_kl | 0.004030927 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00725 | -| n_updates | 33900 | -| policy_gradient_loss | -0.00125 | -| std | 0.449 | -| value_loss | 1.09e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3392 | -| time_elapsed | 32204 | -| total_timesteps | 434176 | -| train/ | | -| approx_kl | 0.023315743 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 33910 | -| policy_gradient_loss | -0.00683 | -| std | 0.45 | -| value_loss | 0.00054 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3393 | -| time_elapsed | 32208 | -| total_timesteps | 434304 | -| train/ | | -| approx_kl | 0.0019234421 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -21.8 | -| learning_rate | 0.0003 | -| loss | -0.00063 | -| n_updates | 33920 | -| policy_gradient_loss | -0.000251 | -| std | 0.45 | -| value_loss | 3.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3394 | -| time_elapsed | 32212 | -| total_timesteps | 434432 | -| train/ | | -| approx_kl | 0.013671215 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -33.7 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 33930 | -| policy_gradient_loss | -0.00596 | -| std | 0.45 | -| value_loss | 2.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3395 | -| time_elapsed | 32216 | -| total_timesteps | 434560 | -| train/ | | -| approx_kl | 0.024584467 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 33940 | -| policy_gradient_loss | -0.012 | -| std | 0.45 | -| value_loss | 2.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3396 | -| time_elapsed | 32219 | -| total_timesteps | 434688 | -| train/ | | -| approx_kl | 0.017063625 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.621 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 33950 | -| policy_gradient_loss | -0.00407 | -| std | 0.45 | -| value_loss | 1.76e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3397 | -| time_elapsed | 32223 | -| total_timesteps | 434816 | -| train/ | | -| approx_kl | 0.01570237 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 33960 | -| policy_gradient_loss | -0.00815 | -| std | 0.45 | -| value_loss | 1.56e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3398 | -| time_elapsed | 32225 | -| total_timesteps | 434944 | -| train/ | | -| approx_kl | 0.0044919113 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -0.000103 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 33970 | -| policy_gradient_loss | -0.00311 | -| std | 0.45 | -| value_loss | 1.51e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3399 | -| time_elapsed | 32229 | -| total_timesteps | 435072 | -| train/ | | -| approx_kl | 0.00026122783 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | -0.000701 | -| n_updates | 33980 | -| policy_gradient_loss | 0.000641 | -| std | 0.449 | -| value_loss | 1.01e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3400 | -| time_elapsed | 32235 | -| total_timesteps | 435200 | -| train/ | | -| approx_kl | 0.02474389 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | 0.776 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 33990 | -| policy_gradient_loss | -0.0149 | -| std | 0.45 | -| value_loss | 0.00243 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3401 | -| time_elapsed | 32239 | -| total_timesteps | 435328 | -| train/ | | -| approx_kl | 0.019252682 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -62.4 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 34000 | -| policy_gradient_loss | -0.0144 | -| std | 0.449 | -| value_loss | 2.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3402 | -| time_elapsed | 32243 | -| total_timesteps | 435456 | -| train/ | | -| approx_kl | 0.008145665 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -96.2 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 34010 | -| policy_gradient_loss | -0.000893 | -| std | 0.45 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3403 | -| time_elapsed | 32246 | -| total_timesteps | 435584 | -| train/ | | -| approx_kl | 0.014944784 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -4.54 | -| learning_rate | 0.0003 | -| loss | -0.000958 | -| n_updates | 34020 | -| policy_gradient_loss | -0.00164 | -| std | 0.45 | -| value_loss | 8.99e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3404 | -| time_elapsed | 32249 | -| total_timesteps | 435712 | -| train/ | | -| approx_kl | 0.011634526 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.622 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 34030 | -| policy_gradient_loss | -0.00328 | -| std | 0.451 | -| value_loss | 5.36e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3405 | -| time_elapsed | 32252 | -| total_timesteps | 435840 | -| train/ | | -| approx_kl | 0.014230545 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.622 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 34040 | -| policy_gradient_loss | -0.00358 | -| std | 0.451 | -| value_loss | 4.91e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3406 | -| time_elapsed | 32255 | -| total_timesteps | 435968 | -| train/ | | -| approx_kl | 0.011793889 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.622 | -| explained_variance | -0.0697 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 34050 | -| policy_gradient_loss | -0.00219 | -| std | 0.45 | -| value_loss | 3.3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3407 | -| time_elapsed | 32258 | -| total_timesteps | 436096 | -| train/ | | -| approx_kl | 0.010623681 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 34060 | -| policy_gradient_loss | -0.00323 | -| std | 0.45 | -| value_loss | 6.46e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3408 | -| time_elapsed | 32267 | -| total_timesteps | 436224 | -| train/ | | -| approx_kl | 0.007523533 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | 0.874 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 34070 | -| policy_gradient_loss | -0.00259 | -| std | 0.449 | -| value_loss | 0.000366 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3409 | -| time_elapsed | 32272 | -| total_timesteps | 436352 | -| train/ | | -| approx_kl | 0.01658577 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -62.6 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 34080 | -| policy_gradient_loss | -0.00665 | -| std | 0.449 | -| value_loss | 1.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3410 | -| time_elapsed | 32275 | -| total_timesteps | 436480 | -| train/ | | -| approx_kl | 0.001970153 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -50.4 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 34090 | -| policy_gradient_loss | -0.000191 | -| std | 0.449 | -| value_loss | 4.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3411 | -| time_elapsed | 32278 | -| total_timesteps | 436608 | -| train/ | | -| approx_kl | 0.036358498 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -0.617 | -| explained_variance | -5.77 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 34100 | -| policy_gradient_loss | -0.0142 | -| std | 0.448 | -| value_loss | 7.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3412 | -| time_elapsed | 32282 | -| total_timesteps | 436736 | -| train/ | | -| approx_kl | 0.018682167 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -0.617 | -| explained_variance | -0.525 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 34110 | -| policy_gradient_loss | -0.00284 | -| std | 0.449 | -| value_loss | 4.34e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3413 | -| time_elapsed | 32285 | -| total_timesteps | 436864 | -| train/ | | -| approx_kl | 0.0058175963 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -0.0882 | -| learning_rate | 0.0003 | -| loss | -0.00055 | -| n_updates | 34120 | -| policy_gradient_loss | -0.000636 | -| std | 0.449 | -| value_loss | 1.28e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3414 | -| time_elapsed | 32288 | -| total_timesteps | 436992 | -| train/ | | -| approx_kl | 0.010670469 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 34130 | -| policy_gradient_loss | -0.00283 | -| std | 0.449 | -| value_loss | 1.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3415 | -| time_elapsed | 32291 | -| total_timesteps | 437120 | -| train/ | | -| approx_kl | 0.003952253 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | 0.00329 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 34140 | -| policy_gradient_loss | -0.000925 | -| std | 0.446 | -| value_loss | 9.96e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3416 | -| time_elapsed | 32300 | -| total_timesteps | 437248 | -| train/ | | -| approx_kl | 0.016760834 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.611 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 34150 | -| policy_gradient_loss | -0.0122 | -| std | 0.445 | -| value_loss | 0.00204 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3417 | -| time_elapsed | 32305 | -| total_timesteps | 437376 | -| train/ | | -| approx_kl | 0.031134991 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -202 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 34160 | -| policy_gradient_loss | -0.00888 | -| std | 0.445 | -| value_loss | 2.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3418 | -| time_elapsed | 32309 | -| total_timesteps | 437504 | -| train/ | | -| approx_kl | 0.03801522 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -262 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 34170 | -| policy_gradient_loss | -0.0149 | -| std | 0.444 | -| value_loss | 1.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3419 | -| time_elapsed | 32313 | -| total_timesteps | 437632 | -| train/ | | -| approx_kl | 0.023201808 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -28.2 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 34180 | -| policy_gradient_loss | -0.00712 | -| std | 0.444 | -| value_loss | 9.85e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3420 | -| time_elapsed | 32317 | -| total_timesteps | 437760 | -| train/ | | -| approx_kl | 0.0028692072 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.000219 | -| n_updates | 34190 | -| policy_gradient_loss | -9.1e-05 | -| std | 0.445 | -| value_loss | 1.54e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3421 | -| time_elapsed | 32319 | -| total_timesteps | 437888 | -| train/ | | -| approx_kl | 0.0014091684 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.611 | -| explained_variance | -0.0996 | -| learning_rate | 0.0003 | -| loss | -0.000835 | -| n_updates | 34200 | -| policy_gradient_loss | -0.000309 | -| std | 0.447 | -| value_loss | 1.05e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3422 | -| time_elapsed | 32323 | -| total_timesteps | 438016 | -| train/ | | -| approx_kl | 0.013430877 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.614 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 34210 | -| policy_gradient_loss | -0.0029 | -| std | 0.448 | -| value_loss | 9.04e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3423 | -| time_elapsed | 32332 | -| total_timesteps | 438144 | -| train/ | | -| approx_kl | 0.007974076 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | 0.691 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 34220 | -| policy_gradient_loss | -0.00304 | -| std | 0.448 | -| value_loss | 0.00565 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3424 | -| time_elapsed | 32334 | -| total_timesteps | 438272 | -| train/ | | -| approx_kl | 0.016286464 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -1.11e+03 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 34230 | -| policy_gradient_loss | -0.00301 | -| std | 0.448 | -| value_loss | 4.36e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3425 | -| time_elapsed | 32338 | -| total_timesteps | 438400 | -| train/ | | -| approx_kl | 5.197013e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -1.11e+03 | -| learning_rate | 0.0003 | -| loss | -0.000233 | -| n_updates | 34240 | -| policy_gradient_loss | 0.00206 | -| std | 0.448 | -| value_loss | 1.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3426 | -| time_elapsed | 32341 | -| total_timesteps | 438528 | -| train/ | | -| approx_kl | 0.022902567 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -1.12e+03 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 34250 | -| policy_gradient_loss | -0.00989 | -| std | 0.448 | -| value_loss | 5.8e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3427 | -| time_elapsed | 32344 | -| total_timesteps | 438656 | -| train/ | | -| approx_kl | 0.0026622084 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -284 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 34260 | -| policy_gradient_loss | -0.00036 | -| std | 0.448 | -| value_loss | 1.37e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3428 | -| time_elapsed | 32348 | -| total_timesteps | 438784 | -| train/ | | -| approx_kl | 7.736497e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.617 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -8.65e-05 | -| n_updates | 34270 | -| policy_gradient_loss | 0.000194 | -| std | 0.448 | -| value_loss | 1.2e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3429 | -| time_elapsed | 32351 | -| total_timesteps | 438912 | -| train/ | | -| approx_kl | 0.0014562418 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -3.04 | -| learning_rate | 0.0003 | -| loss | -0.000526 | -| n_updates | 34280 | -| policy_gradient_loss | -0.000261 | -| std | 0.446 | -| value_loss | 2.76e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3430 | -| time_elapsed | 32356 | -| total_timesteps | 439040 | -| train/ | | -| approx_kl | 0.011639522 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 34290 | -| policy_gradient_loss | -0.00447 | -| std | 0.444 | -| value_loss | 2.31e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3431 | -| time_elapsed | 32363 | -| total_timesteps | 439168 | -| train/ | | -| approx_kl | 0.00090194447 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.00955 | -| n_updates | 34300 | -| policy_gradient_loss | -0.00733 | -| std | 0.443 | -| value_loss | 0.00122 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3432 | -| time_elapsed | 32367 | -| total_timesteps | 439296 | -| train/ | | -| approx_kl | 0.010757205 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -40 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 34310 | -| policy_gradient_loss | -0.00212 | -| std | 0.441 | -| value_loss | 1.48e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3433 | -| time_elapsed | 32371 | -| total_timesteps | 439424 | -| train/ | | -| approx_kl | 2.4630455e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -48.1 | -| learning_rate | 0.0003 | -| loss | -0.000473 | -| n_updates | 34320 | -| policy_gradient_loss | 0.00107 | -| std | 0.44 | -| value_loss | 7.28e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3434 | -| time_elapsed | 32374 | -| total_timesteps | 439552 | -| train/ | | -| approx_kl | 0.046918504 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 34330 | -| policy_gradient_loss | -0.0155 | -| std | 0.44 | -| value_loss | 2.33e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3435 | -| time_elapsed | 32378 | -| total_timesteps | 439680 | -| train/ | | -| approx_kl | 0.011818666 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -1.92 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 34340 | -| policy_gradient_loss | -0.000613 | -| std | 0.44 | -| value_loss | 3.76e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3436 | -| time_elapsed | 32382 | -| total_timesteps | 439808 | -| train/ | | -| approx_kl | 0.009917736 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.572 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 34350 | -| policy_gradient_loss | -0.00169 | -| std | 0.441 | -| value_loss | 4.48e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 13 | -| iterations | 3437 | -| time_elapsed | 32385 | -| total_timesteps | 439936 | -| train/ | | -| approx_kl | 0.01810935 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 34360 | -| policy_gradient_loss | -0.00977 | -| std | 0.442 | -| value_loss | 4.73e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3438 | -| time_elapsed | 32388 | -| total_timesteps | 440064 | -| train/ | | -| approx_kl | 0.001348536 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.00134 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 34370 | -| policy_gradient_loss | 0.000311 | -| std | 0.442 | -| value_loss | 4.56e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3439 | -| time_elapsed | 32395 | -| total_timesteps | 440192 | -| train/ | | -| approx_kl | 0.027233608 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 34380 | -| policy_gradient_loss | -0.0143 | -| std | 0.442 | -| value_loss | 0.0004 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3440 | -| time_elapsed | 32399 | -| total_timesteps | 440320 | -| train/ | | -| approx_kl | 0.020254249 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -66.8 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 34390 | -| policy_gradient_loss | -0.00182 | -| std | 0.442 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3441 | -| time_elapsed | 32403 | -| total_timesteps | 440448 | -| train/ | | -| approx_kl | 0.011969837 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -53.1 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 34400 | -| policy_gradient_loss | -0.00408 | -| std | 0.442 | -| value_loss | 4.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3442 | -| time_elapsed | 32407 | -| total_timesteps | 440576 | -| train/ | | -| approx_kl | 0.016818935 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -3.5 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 34410 | -| policy_gradient_loss | -0.00199 | -| std | 0.441 | -| value_loss | 6.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3443 | -| time_elapsed | 32410 | -| total_timesteps | 440704 | -| train/ | | -| approx_kl | 0.013502493 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 34420 | -| policy_gradient_loss | -0.00262 | -| std | 0.441 | -| value_loss | 4.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3444 | -| time_elapsed | 32414 | -| total_timesteps | 440832 | -| train/ | | -| approx_kl | 0.016491424 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.00512 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 34430 | -| policy_gradient_loss | -0.0117 | -| std | 0.441 | -| value_loss | 3.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 13 | -| iterations | 3445 | -| time_elapsed | 32417 | -| total_timesteps | 440960 | -| train/ | | -| approx_kl | 0.029773438 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.00341 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 34440 | -| policy_gradient_loss | -0.00937 | -| std | 0.442 | -| value_loss | 1.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3446 | -| time_elapsed | 32421 | -| total_timesteps | 441088 | -| train/ | | -| approx_kl | 0.009846944 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.00441 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 34450 | -| policy_gradient_loss | -0.00244 | -| std | 0.442 | -| value_loss | 1.57e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3447 | -| time_elapsed | 32427 | -| total_timesteps | 441216 | -| train/ | | -| approx_kl | 0.0074104834 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 34460 | -| policy_gradient_loss | -0.00119 | -| std | 0.441 | -| value_loss | 0.00304 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3448 | -| time_elapsed | 32431 | -| total_timesteps | 441344 | -| train/ | | -| approx_kl | 0.0064659305 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -763 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 34470 | -| policy_gradient_loss | -0.00199 | -| std | 0.441 | -| value_loss | 2.53e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3449 | -| time_elapsed | 32433 | -| total_timesteps | 441472 | -| train/ | | -| approx_kl | 0.003368844 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -634 | -| learning_rate | 0.0003 | -| loss | 0.000897 | -| n_updates | 34480 | -| policy_gradient_loss | 0.00068 | -| std | 0.441 | -| value_loss | 8.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3450 | -| time_elapsed | 32436 | -| total_timesteps | 441600 | -| train/ | | -| approx_kl | 0.012694551 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -23.7 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 34490 | -| policy_gradient_loss | -0.0026 | -| std | 0.442 | -| value_loss | 2.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3451 | -| time_elapsed | 32438 | -| total_timesteps | 441728 | -| train/ | | -| approx_kl | 3.634859e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -3.08 | -| learning_rate | 0.0003 | -| loss | -0.000478 | -| n_updates | 34500 | -| policy_gradient_loss | 0.0018 | -| std | 0.442 | -| value_loss | 1.29e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3452 | -| time_elapsed | 32442 | -| total_timesteps | 441856 | -| train/ | | -| approx_kl | 0.0016945126 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.63 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 34510 | -| policy_gradient_loss | 0.000165 | -| std | 0.442 | -| value_loss | 9.29e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3453 | -| time_elapsed | 32445 | -| total_timesteps | 441984 | -| train/ | | -| approx_kl | 0.011587065 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 34520 | -| policy_gradient_loss | 0.000493 | -| std | 0.442 | -| value_loss | 6.2e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3454 | -| time_elapsed | 32448 | -| total_timesteps | 442112 | -| train/ | | -| approx_kl | 0.006527217 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 34530 | -| policy_gradient_loss | -0.0025 | -| std | 0.442 | -| value_loss | 2.03e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3455 | -| time_elapsed | 32457 | -| total_timesteps | 442240 | -| train/ | | -| approx_kl | 0.012547519 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 34540 | -| policy_gradient_loss | -0.00309 | -| std | 0.441 | -| value_loss | 0.00102 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3456 | -| time_elapsed | 32462 | -| total_timesteps | 442368 | -| train/ | | -| approx_kl | 0.0071708946 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -162 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 34550 | -| policy_gradient_loss | -0.00714 | -| std | 0.442 | -| value_loss | 2.33e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3457 | -| time_elapsed | 32465 | -| total_timesteps | 442496 | -| train/ | | -| approx_kl | 0.015720956 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -160 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 34560 | -| policy_gradient_loss | -0.00451 | -| std | 0.442 | -| value_loss | 9.12e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3458 | -| time_elapsed | 32468 | -| total_timesteps | 442624 | -| train/ | | -| approx_kl | 0.0045418683 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -54.6 | -| learning_rate | 0.0003 | -| loss | 0.00077 | -| n_updates | 34570 | -| policy_gradient_loss | 0.000656 | -| std | 0.442 | -| value_loss | 1.11e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3459 | -| time_elapsed | 32472 | -| total_timesteps | 442752 | -| train/ | | -| approx_kl | 0.015435081 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 34580 | -| policy_gradient_loss | -0.0114 | -| std | 0.442 | -| value_loss | 8.91e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 13 | -| iterations | 3460 | -| time_elapsed | 32476 | -| total_timesteps | 442880 | -| train/ | | -| approx_kl | 0.01135825 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.533 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 34590 | -| policy_gradient_loss | -0.00585 | -| std | 0.442 | -| value_loss | 1.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3461 | -| time_elapsed | 32480 | -| total_timesteps | 443008 | -| train/ | | -| approx_kl | 0.014342589 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 34600 | -| policy_gradient_loss | 0.000343 | -| std | 0.442 | -| value_loss | 2.09e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3462 | -| time_elapsed | 32487 | -| total_timesteps | 443136 | -| train/ | | -| approx_kl | 0.010332828 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.761 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 34610 | -| policy_gradient_loss | -0.0112 | -| std | 0.442 | -| value_loss | 0.00238 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3463 | -| time_elapsed | 32489 | -| total_timesteps | 443264 | -| train/ | | -| approx_kl | 0.0019117494 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -128 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 34620 | -| policy_gradient_loss | -0.000102 | -| std | 0.443 | -| value_loss | 6.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3464 | -| time_elapsed | 32492 | -| total_timesteps | 443392 | -| train/ | | -| approx_kl | 0.024990302 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -299 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 34630 | -| policy_gradient_loss | -0.00989 | -| std | 0.443 | -| value_loss | 2.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3465 | -| time_elapsed | 32496 | -| total_timesteps | 443520 | -| train/ | | -| approx_kl | 0.020550545 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -31.5 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 34640 | -| policy_gradient_loss | -0.00451 | -| std | 0.443 | -| value_loss | 7.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3466 | -| time_elapsed | 32498 | -| total_timesteps | 443648 | -| train/ | | -| approx_kl | 0.006106876 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.000206 | -| n_updates | 34650 | -| policy_gradient_loss | -0.000259 | -| std | 0.443 | -| value_loss | 1.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3467 | -| time_elapsed | 32502 | -| total_timesteps | 443776 | -| train/ | | -| approx_kl | 0.006094232 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | -0.000444 | -| n_updates | 34660 | -| policy_gradient_loss | -0.000599 | -| std | 0.444 | -| value_loss | 1.67e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3468 | -| time_elapsed | 32505 | -| total_timesteps | 443904 | -| train/ | | -| approx_kl | 0.0042393776 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | 0.0057 | -| learning_rate | 0.0003 | -| loss | -0.000427 | -| n_updates | 34670 | -| policy_gradient_loss | -0.000395 | -| std | 0.445 | -| value_loss | 1.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3469 | -| time_elapsed | 32508 | -| total_timesteps | 444032 | -| train/ | | -| approx_kl | 0.015232066 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 34680 | -| policy_gradient_loss | -0.00934 | -| std | 0.445 | -| value_loss | 1.2e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3470 | -| time_elapsed | 32516 | -| total_timesteps | 444160 | -| train/ | | -| approx_kl | 0.0042902203 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 34690 | -| policy_gradient_loss | -0.00936 | -| std | 0.445 | -| value_loss | 0.000369 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3471 | -| time_elapsed | 32519 | -| total_timesteps | 444288 | -| train/ | | -| approx_kl | 0.0009195311 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -44.9 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 34700 | -| policy_gradient_loss | 0.000673 | -| std | 0.445 | -| value_loss | 3.56e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3472 | -| time_elapsed | 32522 | -| total_timesteps | 444416 | -| train/ | | -| approx_kl | 0.000855227 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.61 | -| explained_variance | -55.9 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 34710 | -| policy_gradient_loss | 0.000343 | -| std | 0.445 | -| value_loss | 1.8e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3473 | -| time_elapsed | 32524 | -| total_timesteps | 444544 | -| train/ | | -| approx_kl | 0.01613889 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -7.54 | -| learning_rate | 0.0003 | -| loss | -0.000537 | -| n_updates | 34720 | -| policy_gradient_loss | -0.000717 | -| std | 0.444 | -| value_loss | 2.44e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3474 | -| time_elapsed | 32527 | -| total_timesteps | 444672 | -| train/ | | -| approx_kl | 0.020723054 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 34730 | -| policy_gradient_loss | -0.00805 | -| std | 0.444 | -| value_loss | 8.91e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3475 | -| time_elapsed | 32532 | -| total_timesteps | 444800 | -| train/ | | -| approx_kl | 0.019230235 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -0.0704 | -| learning_rate | 0.0003 | -| loss | 0.000415 | -| n_updates | 34740 | -| policy_gradient_loss | -0.00196 | -| std | 0.444 | -| value_loss | 9.43e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3476 | -| time_elapsed | 32536 | -| total_timesteps | 444928 | -| train/ | | -| approx_kl | 0.0020477744 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -0.0781 | -| learning_rate | 0.0003 | -| loss | -0.000776 | -| n_updates | 34750 | -| policy_gradient_loss | -0.000312 | -| std | 0.444 | -| value_loss | 3.32e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3477 | -| time_elapsed | 32540 | -| total_timesteps | 445056 | -| train/ | | -| approx_kl | 0.005164153 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -0.00936 | -| learning_rate | 0.0003 | -| loss | -0.00883 | -| n_updates | 34760 | -| policy_gradient_loss | -0.00265 | -| std | 0.444 | -| value_loss | 5.53e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3478 | -| time_elapsed | 32547 | -| total_timesteps | 445184 | -| train/ | | -| approx_kl | 0.00061560865 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 34770 | -| policy_gradient_loss | -0.00622 | -| std | 0.445 | -| value_loss | 0.00031 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3479 | -| time_elapsed | 32550 | -| total_timesteps | 445312 | -| train/ | | -| approx_kl | 0.004560695 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -212 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 34780 | -| policy_gradient_loss | -0.0015 | -| std | 0.445 | -| value_loss | 3.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3480 | -| time_elapsed | 32553 | -| total_timesteps | 445440 | -| train/ | | -| approx_kl | 0.013820644 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -295 | -| learning_rate | 0.0003 | -| loss | 0.000345 | -| n_updates | 34790 | -| policy_gradient_loss | -0.000538 | -| std | 0.445 | -| value_loss | 2.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3481 | -| time_elapsed | 32556 | -| total_timesteps | 445568 | -| train/ | | -| approx_kl | 0.01047397 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -243 | -| learning_rate | 0.0003 | -| loss | -0.00846 | -| n_updates | 34800 | -| policy_gradient_loss | -0.00293 | -| std | 0.445 | -| value_loss | 1.65e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3482 | -| time_elapsed | 32559 | -| total_timesteps | 445696 | -| train/ | | -| approx_kl | 2.8640963e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -95.9 | -| learning_rate | 0.0003 | -| loss | -0.000766 | -| n_updates | 34810 | -| policy_gradient_loss | 0.00279 | -| std | 0.445 | -| value_loss | 1.32e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3483 | -| time_elapsed | 32563 | -| total_timesteps | 445824 | -| train/ | | -| approx_kl | 0.014789348 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 34820 | -| policy_gradient_loss | -0.00972 | -| std | 0.445 | -| value_loss | 1.6e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3484 | -| time_elapsed | 32566 | -| total_timesteps | 445952 | -| train/ | | -| approx_kl | 0.008911353 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 34830 | -| policy_gradient_loss | -0.00135 | -| std | 0.445 | -| value_loss | 4.72e-12 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3485 | -| time_elapsed | 32571 | -| total_timesteps | 446080 | -| train/ | | -| approx_kl | 0.0018188558 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.611 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 34840 | -| policy_gradient_loss | -0.000229 | -| std | 0.447 | -| value_loss | 5.76e-12 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3486 | -| time_elapsed | 32577 | -| total_timesteps | 446208 | -| train/ | | -| approx_kl | 0.028848475 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -11.5 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 34850 | -| policy_gradient_loss | -0.00684 | -| std | 0.448 | -| value_loss | 0.00361 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3487 | -| time_elapsed | 32581 | -| total_timesteps | 446336 | -| train/ | | -| approx_kl | 0.0020248909 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -1.84e+03 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 34860 | -| policy_gradient_loss | -0.00176 | -| std | 0.45 | -| value_loss | 1.74e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3488 | -| time_elapsed | 32584 | -| total_timesteps | 446464 | -| train/ | | -| approx_kl | 0.0073868744 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.622 | -| explained_variance | -1.13e+03 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 34870 | -| policy_gradient_loss | -0.00392 | -| std | 0.451 | -| value_loss | 4.32e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3489 | -| time_elapsed | 32586 | -| total_timesteps | 446592 | -| train/ | | -| approx_kl | 0.029193453 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.624 | -| explained_variance | -88.9 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 34880 | -| policy_gradient_loss | -0.00238 | -| std | 0.451 | -| value_loss | 1.95e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3490 | -| time_elapsed | 32588 | -| total_timesteps | 446720 | -| train/ | | -| approx_kl | 0.0143771535 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.623 | -| explained_variance | -1.84 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 34890 | -| policy_gradient_loss | -0.00541 | -| std | 0.451 | -| value_loss | 1.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3491 | -| time_elapsed | 32591 | -| total_timesteps | 446848 | -| train/ | | -| approx_kl | 0.012083784 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | -0.62 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 34900 | -| policy_gradient_loss | -0.00223 | -| std | 0.449 | -| value_loss | 1.36e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3492 | -| time_elapsed | 32594 | -| total_timesteps | 446976 | -| train/ | | -| approx_kl | 0.0070191985 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 34910 | -| policy_gradient_loss | -0.00644 | -| std | 0.448 | -| value_loss | 1.27e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3493 | -| time_elapsed | 32598 | -| total_timesteps | 447104 | -| train/ | | -| approx_kl | 0.020748297 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 34920 | -| policy_gradient_loss | -0.00587 | -| std | 0.448 | -| value_loss | 1.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3494 | -| time_elapsed | 32605 | -| total_timesteps | 447232 | -| train/ | | -| approx_kl | 0.01050763 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 34930 | -| policy_gradient_loss | -0.0115 | -| std | 0.448 | -| value_loss | 0.00188 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3495 | -| time_elapsed | 32609 | -| total_timesteps | 447360 | -| train/ | | -| approx_kl | 0.0010442203 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.615 | -| explained_variance | -86.9 | -| learning_rate | 0.0003 | -| loss | 0.000204 | -| n_updates | 34940 | -| policy_gradient_loss | 0.000148 | -| std | 0.448 | -| value_loss | 2.72e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3496 | -| time_elapsed | 32612 | -| total_timesteps | 447488 | -| train/ | | -| approx_kl | 0.010651475 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.617 | -| explained_variance | -274 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 34950 | -| policy_gradient_loss | -0.00168 | -| std | 0.449 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3497 | -| time_elapsed | 32615 | -| total_timesteps | 447616 | -| train/ | | -| approx_kl | 0.037239347 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -7.04 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 34960 | -| policy_gradient_loss | -0.0149 | -| std | 0.449 | -| value_loss | 5.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3498 | -| time_elapsed | 32618 | -| total_timesteps | 447744 | -| train/ | | -| approx_kl | 0.010872806 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -218 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 34970 | -| policy_gradient_loss | -0.00972 | -| std | 0.449 | -| value_loss | 7.49e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3499 | -| time_elapsed | 32620 | -| total_timesteps | 447872 | -| train/ | | -| approx_kl | 0.04443557 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | -0.619 | -| explained_variance | -9.26 | -| learning_rate | 0.0003 | -| loss | -0.026 | -| n_updates | 34980 | -| policy_gradient_loss | -0.0173 | -| std | 0.449 | -| value_loss | 1.66e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3500 | -| time_elapsed | 32623 | -| total_timesteps | 448000 | -| train/ | | -| approx_kl | 0.0016771704 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | -0.0834 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 34990 | -| policy_gradient_loss | -6.8e-05 | -| std | 0.449 | -| value_loss | 2.4e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3501 | -| time_elapsed | 32626 | -| total_timesteps | 448128 | -| train/ | | -| approx_kl | 0.0023777941 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.618 | -| explained_variance | 0.00243 | -| learning_rate | 0.0003 | -| loss | 0.000136 | -| n_updates | 35000 | -| policy_gradient_loss | 0.000387 | -| std | 0.448 | -| value_loss | 1.79e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3502 | -| time_elapsed | 32632 | -| total_timesteps | 448256 | -| train/ | | -| approx_kl | 0.017896265 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.00638 | -| n_updates | 35010 | -| policy_gradient_loss | -0.00467 | -| std | 0.448 | -| value_loss | 7.31e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3503 | -| time_elapsed | 32636 | -| total_timesteps | 448384 | -| train/ | | -| approx_kl | 1.7046928e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.616 | -| explained_variance | -1.15e+03 | -| learning_rate | 0.0003 | -| loss | -0.000141 | -| n_updates | 35020 | -| policy_gradient_loss | -3.65e-05 | -| std | 0.447 | -| value_loss | 2.17e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3504 | -| time_elapsed | 32640 | -| total_timesteps | 448512 | -| train/ | | -| approx_kl | 7.2721625e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.613 | -| explained_variance | -1.54e+03 | -| learning_rate | 0.0003 | -| loss | -0.000393 | -| n_updates | 35030 | -| policy_gradient_loss | -0.000169 | -| std | 0.446 | -| value_loss | 5.43e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3505 | -| time_elapsed | 32644 | -| total_timesteps | 448640 | -| train/ | | -| approx_kl | 1.7083483e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.609 | -| explained_variance | -416 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 35040 | -| policy_gradient_loss | -4.69e-05 | -| std | 0.444 | -| value_loss | 5.48e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3506 | -| time_elapsed | 32648 | -| total_timesteps | 448768 | -| train/ | | -| approx_kl | 0.014876835 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -245 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 35050 | -| policy_gradient_loss | -0.00224 | -| std | 0.444 | -| value_loss | 3.48e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3507 | -| time_elapsed | 32651 | -| total_timesteps | 448896 | -| train/ | | -| approx_kl | 0.0007986545 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -6.93 | -| learning_rate | 0.0003 | -| loss | -0.00454 | -| n_updates | 35060 | -| policy_gradient_loss | 0.000933 | -| std | 0.443 | -| value_loss | 1.6e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3508 | -| time_elapsed | 32654 | -| total_timesteps | 449024 | -| train/ | | -| approx_kl | 0.00090963347 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -0.28 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 35070 | -| policy_gradient_loss | 0.00101 | -| std | 0.443 | -| value_loss | 6.3e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3509 | -| time_elapsed | 32662 | -| total_timesteps | 449152 | -| train/ | | -| approx_kl | 0.037490055 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | 0.819 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 35080 | -| policy_gradient_loss | -0.0111 | -| std | 0.443 | -| value_loss | 0.00265 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3510 | -| time_elapsed | 32665 | -| total_timesteps | 449280 | -| train/ | | -| approx_kl | 0.035473976 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -760 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 35090 | -| policy_gradient_loss | -0.011 | -| std | 0.443 | -| value_loss | 5.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3511 | -| time_elapsed | 32669 | -| total_timesteps | 449408 | -| train/ | | -| approx_kl | 0.030532807 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -2.56e+03 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 35100 | -| policy_gradient_loss | -0.0142 | -| std | 0.442 | -| value_loss | 2.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3512 | -| time_elapsed | 32673 | -| total_timesteps | 449536 | -| train/ | | -| approx_kl | 0.012563033 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -7.64e+03 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 35110 | -| policy_gradient_loss | -0.00718 | -| std | 0.442 | -| value_loss | 2.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3513 | -| time_elapsed | 32677 | -| total_timesteps | 449664 | -| train/ | | -| approx_kl | 0.0054279743 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 35120 | -| policy_gradient_loss | -0.00563 | -| std | 0.442 | -| value_loss | 1.82e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3514 | -| time_elapsed | 32682 | -| total_timesteps | 449792 | -| train/ | | -| approx_kl | 0.0009275682 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.905 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 35130 | -| policy_gradient_loss | 0.000664 | -| std | 0.442 | -| value_loss | 3.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3515 | -| time_elapsed | 32685 | -| total_timesteps | 449920 | -| train/ | | -| approx_kl | 0.020599319 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | 0.00506 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 35140 | -| policy_gradient_loss | -0.0121 | -| std | 0.442 | -| value_loss | 2.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3516 | -| time_elapsed | 32689 | -| total_timesteps | 450048 | -| train/ | | -| approx_kl | 0.01171081 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 35150 | -| policy_gradient_loss | -0.000789 | -| std | 0.442 | -| value_loss | 2.59e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3517 | -| time_elapsed | 32694 | -| total_timesteps | 450176 | -| train/ | | -| approx_kl | 0.0101046935 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 35160 | -| policy_gradient_loss | -0.0112 | -| std | 0.442 | -| value_loss | 0.00215 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3518 | -| time_elapsed | 32698 | -| total_timesteps | 450304 | -| train/ | | -| approx_kl | 0.025163975 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -646 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 35170 | -| policy_gradient_loss | -0.00292 | -| std | 0.442 | -| value_loss | 3.76e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3519 | -| time_elapsed | 32702 | -| total_timesteps | 450432 | -| train/ | | -| approx_kl | 0.0045934943 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -4.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 35180 | -| policy_gradient_loss | -0.00325 | -| std | 0.441 | -| value_loss | 2.01e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3520 | -| time_elapsed | 32705 | -| total_timesteps | 450560 | -| train/ | | -| approx_kl | 0.00040149363 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -307 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 35190 | -| policy_gradient_loss | 0.00153 | -| std | 0.44 | -| value_loss | 1.25e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3521 | -| time_elapsed | 32708 | -| total_timesteps | 450688 | -| train/ | | -| approx_kl | 0.039418492 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -144 | -| learning_rate | 0.0003 | -| loss | -0.00926 | -| n_updates | 35200 | -| policy_gradient_loss | -0.00573 | -| std | 0.44 | -| value_loss | 3.66e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3522 | -| time_elapsed | 32711 | -| total_timesteps | 450816 | -| train/ | | -| approx_kl | 0.023176294 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 35210 | -| policy_gradient_loss | -0.0047 | -| std | 0.441 | -| value_loss | 1.03e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3523 | -| time_elapsed | 32713 | -| total_timesteps | 450944 | -| train/ | | -| approx_kl | 0.008689264 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 35220 | -| policy_gradient_loss | -0.00115 | -| std | 0.441 | -| value_loss | 5.61e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3524 | -| time_elapsed | 32717 | -| total_timesteps | 451072 | -| train/ | | -| approx_kl | 0.004175962 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 35230 | -| policy_gradient_loss | -0.000614 | -| std | 0.44 | -| value_loss | 7.5e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3525 | -| time_elapsed | 32722 | -| total_timesteps | 451200 | -| train/ | | -| approx_kl | 0.015921729 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 35240 | -| policy_gradient_loss | -0.00201 | -| std | 0.439 | -| value_loss | 0.00147 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3526 | -| time_elapsed | 32726 | -| total_timesteps | 451328 | -| train/ | | -| approx_kl | 0.019626392 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -6.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 35250 | -| policy_gradient_loss | -0.00815 | -| std | 0.438 | -| value_loss | 6.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3527 | -| time_elapsed | 32730 | -| total_timesteps | 451456 | -| train/ | | -| approx_kl | 0.040095568 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -1.47e+04 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 35260 | -| policy_gradient_loss | -0.0122 | -| std | 0.438 | -| value_loss | 1.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3528 | -| time_elapsed | 32734 | -| total_timesteps | 451584 | -| train/ | | -| approx_kl | 0.014579465 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -723 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 35270 | -| policy_gradient_loss | -0.00437 | -| std | 0.437 | -| value_loss | 7.25e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3529 | -| time_elapsed | 32737 | -| total_timesteps | 451712 | -| train/ | | -| approx_kl | 0.0061046924 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -325 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 35280 | -| policy_gradient_loss | -0.00139 | -| std | 0.437 | -| value_loss | 2.79e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3530 | -| time_elapsed | 32740 | -| total_timesteps | 451840 | -| train/ | | -| approx_kl | 0.00026417314 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -18.1 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 35290 | -| policy_gradient_loss | 0.00138 | -| std | 0.436 | -| value_loss | 5.79e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3531 | -| time_elapsed | 32743 | -| total_timesteps | 451968 | -| train/ | | -| approx_kl | 0.0011595865 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | -0.00359 | -| n_updates | 35300 | -| policy_gradient_loss | 0.000261 | -| std | 0.435 | -| value_loss | 2.07e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3532 | -| time_elapsed | 32747 | -| total_timesteps | 452096 | -| train/ | | -| approx_kl | 0.022308502 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -1.21 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 35310 | -| policy_gradient_loss | -0.00347 | -| std | 0.435 | -| value_loss | 8.79e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3533 | -| time_elapsed | 32755 | -| total_timesteps | 452224 | -| train/ | | -| approx_kl | 0.012661835 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 35320 | -| policy_gradient_loss | -0.0108 | -| std | 0.434 | -| value_loss | 0.00386 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3534 | -| time_elapsed | 32759 | -| total_timesteps | 452352 | -| train/ | | -| approx_kl | 0.025181513 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -1.72e+03 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 35330 | -| policy_gradient_loss | -0.00667 | -| std | 0.434 | -| value_loss | 1.43e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3535 | -| time_elapsed | 32762 | -| total_timesteps | 452480 | -| train/ | | -| approx_kl | 0.0051327934 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -2.05e+03 | -| learning_rate | 0.0003 | -| loss | 0.000873 | -| n_updates | 35340 | -| policy_gradient_loss | 0.000833 | -| std | 0.433 | -| value_loss | 5.73e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3536 | -| time_elapsed | 32766 | -| total_timesteps | 452608 | -| train/ | | -| approx_kl | 0.0064813327 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -249 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 35350 | -| policy_gradient_loss | -0.00331 | -| std | 0.432 | -| value_loss | 1.56e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3537 | -| time_elapsed | 32768 | -| total_timesteps | 452736 | -| train/ | | -| approx_kl | 0.0028651038 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -987 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 35360 | -| policy_gradient_loss | -0.000698 | -| std | 0.433 | -| value_loss | 8.91e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3538 | -| time_elapsed | 32770 | -| total_timesteps | 452864 | -| train/ | | -| approx_kl | 0.0016226533 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -139 | -| learning_rate | 0.0003 | -| loss | 0.000498 | -| n_updates | 35370 | -| policy_gradient_loss | 0.000532 | -| std | 0.434 | -| value_loss | 5.81e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3539 | -| time_elapsed | 32773 | -| total_timesteps | 452992 | -| train/ | | -| approx_kl | 0.012155994 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -7.52 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 35380 | -| policy_gradient_loss | -0.00331 | -| std | 0.435 | -| value_loss | 3.44e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3540 | -| time_elapsed | 32776 | -| total_timesteps | 453120 | -| train/ | | -| approx_kl | 0.020832513 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.903 | -| learning_rate | 0.0003 | -| loss | -0.00623 | -| n_updates | 35390 | -| policy_gradient_loss | -0.00661 | -| std | 0.435 | -| value_loss | 7.11e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3541 | -| time_elapsed | 32785 | -| total_timesteps | 453248 | -| train/ | | -| approx_kl | 0.019066915 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | -0.0096 | -| n_updates | 35400 | -| policy_gradient_loss | -0.00501 | -| std | 0.436 | -| value_loss | 0.000287 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3542 | -| time_elapsed | 32788 | -| total_timesteps | 453376 | -| train/ | | -| approx_kl | 0.018251218 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -3e+03 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 35410 | -| policy_gradient_loss | -0.0134 | -| std | 0.435 | -| value_loss | 4.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3543 | -| time_elapsed | 32791 | -| total_timesteps | 453504 | -| train/ | | -| approx_kl | 0.017362999 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -1.27e+04 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 35420 | -| policy_gradient_loss | -0.00501 | -| std | 0.435 | -| value_loss | 1.61e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3544 | -| time_elapsed | 32793 | -| total_timesteps | 453632 | -| train/ | | -| approx_kl | 7.4457144e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -266 | -| learning_rate | 0.0003 | -| loss | 0.000449 | -| n_updates | 35430 | -| policy_gradient_loss | 0.0015 | -| std | 0.434 | -| value_loss | 2.29e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3545 | -| time_elapsed | 32796 | -| total_timesteps | 453760 | -| train/ | | -| approx_kl | 0.0018295508 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -52.3 | -| learning_rate | 0.0003 | -| loss | -0.00391 | -| n_updates | 35440 | -| policy_gradient_loss | -0.000177 | -| std | 0.434 | -| value_loss | 5.62e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3546 | -| time_elapsed | 32799 | -| total_timesteps | 453888 | -| train/ | | -| approx_kl | 0.0006788103 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -9.01 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 35450 | -| policy_gradient_loss | 0.00184 | -| std | 0.435 | -| value_loss | 1.08e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3547 | -| time_elapsed | 32802 | -| total_timesteps | 454016 | -| train/ | | -| approx_kl | 0.028654233 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.00963 | -| n_updates | 35460 | -| policy_gradient_loss | -0.00953 | -| std | 0.435 | -| value_loss | 3.46e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3548 | -| time_elapsed | 32810 | -| total_timesteps | 454144 | -| train/ | | -| approx_kl | 0.014983574 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | 0.447 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 35470 | -| policy_gradient_loss | -0.00478 | -| std | 0.436 | -| value_loss | 0.00136 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3549 | -| time_elapsed | 32814 | -| total_timesteps | 454272 | -| train/ | | -| approx_kl | 0.042112797 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -2.92e+03 | -| learning_rate | 0.0003 | -| loss | 6.23e-06 | -| n_updates | 35480 | -| policy_gradient_loss | -0.00347 | -| std | 0.436 | -| value_loss | 4.99e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3550 | -| time_elapsed | 32818 | -| total_timesteps | 454400 | -| train/ | | -| approx_kl | 0.00073143 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -2.64e+03 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 35490 | -| policy_gradient_loss | -0.000698 | -| std | 0.439 | -| value_loss | 1.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3551 | -| time_elapsed | 32821 | -| total_timesteps | 454528 | -| train/ | | -| approx_kl | 0.006713243 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -34.6 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 35500 | -| policy_gradient_loss | -0.00511 | -| std | 0.441 | -| value_loss | 3.51e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3552 | -| time_elapsed | 32824 | -| total_timesteps | 454656 | -| train/ | | -| approx_kl | 0.01475809 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -25.2 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 35510 | -| policy_gradient_loss | -0.0032 | -| std | 0.442 | -| value_loss | 4.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3553 | -| time_elapsed | 32827 | -| total_timesteps | 454784 | -| train/ | | -| approx_kl | 0.009949076 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.604 | -| explained_variance | -0.911 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 35520 | -| policy_gradient_loss | -0.00157 | -| std | 0.443 | -| value_loss | 1.09e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3554 | -| time_elapsed | 32830 | -| total_timesteps | 454912 | -| train/ | | -| approx_kl | 0.0022109903 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -0.0652 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 35530 | -| policy_gradient_loss | -0.000486 | -| std | 0.444 | -| value_loss | 5.02e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3555 | -| time_elapsed | 32833 | -| total_timesteps | 455040 | -| train/ | | -| approx_kl | 0.004923433 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | 0.00586 | -| learning_rate | 0.0003 | -| loss | 2.79e-05 | -| n_updates | 35540 | -| policy_gradient_loss | 3.26e-05 | -| std | 0.444 | -| value_loss | 7.95e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3556 | -| time_elapsed | 32841 | -| total_timesteps | 455168 | -| train/ | | -| approx_kl | 0.008220684 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | 0.934 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 35550 | -| policy_gradient_loss | -0.00125 | -| std | 0.444 | -| value_loss | 0.000725 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3557 | -| time_elapsed | 32846 | -| total_timesteps | 455296 | -| train/ | | -| approx_kl | 0.018283391 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -458 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 35560 | -| policy_gradient_loss | -0.00133 | -| std | 0.444 | -| value_loss | 3.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3558 | -| time_elapsed | 32850 | -| total_timesteps | 455424 | -| train/ | | -| approx_kl | 0.027094012 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -1.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 35570 | -| policy_gradient_loss | -0.0102 | -| std | 0.444 | -| value_loss | 7.99e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3559 | -| time_elapsed | 32854 | -| total_timesteps | 455552 | -| train/ | | -| approx_kl | 0.0021148124 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.606 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 35580 | -| policy_gradient_loss | -0.000251 | -| std | 0.443 | -| value_loss | 7.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3560 | -| time_elapsed | 32858 | -| total_timesteps | 455680 | -| train/ | | -| approx_kl | 0.001961781 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -5.26 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 35590 | -| policy_gradient_loss | -0.00124 | -| std | 0.444 | -| value_loss | 6.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3561 | -| time_elapsed | 32862 | -| total_timesteps | 455808 | -| train/ | | -| approx_kl | 0.013142543 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -0.0807 | -| learning_rate | 0.0003 | -| loss | 0.000787 | -| n_updates | 35600 | -| policy_gradient_loss | -0.00076 | -| std | 0.444 | -| value_loss | 5.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3562 | -| time_elapsed | 32866 | -| total_timesteps | 455936 | -| train/ | | -| approx_kl | 0.012192933 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -5.74 | -| learning_rate | 0.0003 | -| loss | -0.00627 | -| n_updates | 35610 | -| policy_gradient_loss | -0.00291 | -| std | 0.444 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3563 | -| time_elapsed | 32869 | -| total_timesteps | 456064 | -| train/ | | -| approx_kl | 0.023569914 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | 0.000401 | -| n_updates | 35620 | -| policy_gradient_loss | -0.00329 | -| std | 0.444 | -| value_loss | 2.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3564 | -| time_elapsed | 32875 | -| total_timesteps | 456192 | -| train/ | | -| approx_kl | 0.015498806 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.607 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | -0.005 | -| n_updates | 35630 | -| policy_gradient_loss | -0.00295 | -| std | 0.444 | -| value_loss | 0.00435 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3565 | -| time_elapsed | 32877 | -| total_timesteps | 456320 | -| train/ | | -| approx_kl | 4.3576583e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -2.48e+03 | -| learning_rate | 0.0003 | -| loss | -0.000116 | -| n_updates | 35640 | -| policy_gradient_loss | 0.00156 | -| std | 0.445 | -| value_loss | 1.92e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3566 | -| time_elapsed | 32881 | -| total_timesteps | 456448 | -| train/ | | -| approx_kl | 0.0011912514 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.608 | -| explained_variance | -4.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 35650 | -| policy_gradient_loss | 4.12e-06 | -| std | 0.444 | -| value_loss | 5.24e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3567 | -| time_elapsed | 32884 | -| total_timesteps | 456576 | -| train/ | | -| approx_kl | 0.044598803 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | -0.605 | -| explained_variance | -55.7 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 35660 | -| policy_gradient_loss | -0.00823 | -| std | 0.443 | -| value_loss | 2.48e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3568 | -| time_elapsed | 32889 | -| total_timesteps | 456704 | -| train/ | | -| approx_kl | 0.02485506 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -62.3 | -| learning_rate | 0.0003 | -| loss | 0.000994 | -| n_updates | 35670 | -| policy_gradient_loss | -0.000777 | -| std | 0.442 | -| value_loss | 3.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3569 | -| time_elapsed | 32892 | -| total_timesteps | 456832 | -| train/ | | -| approx_kl | 0.012759816 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.603 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 35680 | -| policy_gradient_loss | -0.00207 | -| std | 0.442 | -| value_loss | 3.45e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3570 | -| time_elapsed | 32896 | -| total_timesteps | 456960 | -| train/ | | -| approx_kl | 0.0009905654 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | 0.00548 | -| learning_rate | 0.0003 | -| loss | 0.000493 | -| n_updates | 35690 | -| policy_gradient_loss | 0.000476 | -| std | 0.442 | -| value_loss | 4.97e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3571 | -| time_elapsed | 32900 | -| total_timesteps | 457088 | -| train/ | | -| approx_kl | 0.008616414 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.00738 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 35700 | -| policy_gradient_loss | -0.00508 | -| std | 0.441 | -| value_loss | 1.07e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3572 | -| time_elapsed | 32909 | -| total_timesteps | 457216 | -| train/ | | -| approx_kl | 0.029305246 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | 0.343 | -| learning_rate | 0.0003 | -| loss | -0.00692 | -| n_updates | 35710 | -| policy_gradient_loss | -0.00328 | -| std | 0.441 | -| value_loss | 0.000906 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3573 | -| time_elapsed | 32913 | -| total_timesteps | 457344 | -| train/ | | -| approx_kl | 0.019091202 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -5.41e+03 | -| learning_rate | 0.0003 | -| loss | -0.000296 | -| n_updates | 35720 | -| policy_gradient_loss | -0.000738 | -| std | 0.441 | -| value_loss | 4.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3574 | -| time_elapsed | 32915 | -| total_timesteps | 457472 | -| train/ | | -| approx_kl | 0.014997638 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -8.58e+03 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 35730 | -| policy_gradient_loss | -0.00712 | -| std | 0.44 | -| value_loss | 8.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3575 | -| time_elapsed | 32918 | -| total_timesteps | 457600 | -| train/ | | -| approx_kl | 0.032330304 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -116 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 35740 | -| policy_gradient_loss | -0.0122 | -| std | 0.441 | -| value_loss | 1.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3576 | -| time_elapsed | 32922 | -| total_timesteps | 457728 | -| train/ | | -| approx_kl | 0.010846835 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -8.32 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 35750 | -| policy_gradient_loss | -0.0107 | -| std | 0.44 | -| value_loss | 2.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3577 | -| time_elapsed | 32926 | -| total_timesteps | 457856 | -| train/ | | -| approx_kl | 0.043744903 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -4 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 35760 | -| policy_gradient_loss | -0.0151 | -| std | 0.44 | -| value_loss | 8.72e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 13 | -| iterations | 3578 | -| time_elapsed | 32931 | -| total_timesteps | 457984 | -| train/ | | -| approx_kl | 0.016985288 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.741 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 35770 | -| policy_gradient_loss | -0.00373 | -| std | 0.441 | -| value_loss | 4.58e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3579 | -| time_elapsed | 32935 | -| total_timesteps | 458112 | -| train/ | | -| approx_kl | 0.013174142 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 35780 | -| policy_gradient_loss | -0.00909 | -| std | 0.441 | -| value_loss | 2.13e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3580 | -| time_elapsed | 32943 | -| total_timesteps | 458240 | -| train/ | | -| approx_kl | 0.0068002883 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | -0.00983 | -| n_updates | 35790 | -| policy_gradient_loss | -0.00388 | -| std | 0.441 | -| value_loss | 0.0031 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3581 | -| time_elapsed | 32946 | -| total_timesteps | 458368 | -| train/ | | -| approx_kl | 0.052510392 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -75.7 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 35800 | -| policy_gradient_loss | -0.00623 | -| std | 0.441 | -| value_loss | 3.89e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3582 | -| time_elapsed | 32949 | -| total_timesteps | 458496 | -| train/ | | -| approx_kl | 0.0033580628 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -96.5 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 35810 | -| policy_gradient_loss | -0.00299 | -| std | 0.44 | -| value_loss | 1.68e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3583 | -| time_elapsed | 32952 | -| total_timesteps | 458624 | -| train/ | | -| approx_kl | 0.013278985 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -5.15 | -| learning_rate | 0.0003 | -| loss | -0.000776 | -| n_updates | 35820 | -| policy_gradient_loss | -0.00138 | -| std | 0.439 | -| value_loss | 1.45e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3584 | -| time_elapsed | 32956 | -| total_timesteps | 458752 | -| train/ | | -| approx_kl | 9.5143914e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00031 | -| n_updates | 35830 | -| policy_gradient_loss | -0.000127 | -| std | 0.438 | -| value_loss | 1.38e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3585 | -| time_elapsed | 32959 | -| total_timesteps | 458880 | -| train/ | | -| approx_kl | 0.010154547 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | 0.00457 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 35840 | -| policy_gradient_loss | -0.00213 | -| std | 0.436 | -| value_loss | 2.92e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3586 | -| time_elapsed | 32962 | -| total_timesteps | 459008 | -| train/ | | -| approx_kl | 0.0056747543 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | 0.00104 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 35850 | -| policy_gradient_loss | -0.00166 | -| std | 0.435 | -| value_loss | 2.02e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3587 | -| time_elapsed | 32972 | -| total_timesteps | 459136 | -| train/ | | -| approx_kl | 0.0018355288 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -4.61 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 35860 | -| policy_gradient_loss | 0.00039 | -| std | 0.435 | -| value_loss | 0.00207 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3588 | -| time_elapsed | 32975 | -| total_timesteps | 459264 | -| train/ | | -| approx_kl | 0.009363285 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -2.62e+03 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 35870 | -| policy_gradient_loss | -0.00837 | -| std | 0.436 | -| value_loss | 1.45e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3589 | -| time_elapsed | 32978 | -| total_timesteps | 459392 | -| train/ | | -| approx_kl | 0.0073116394 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -5.74e+03 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 35880 | -| policy_gradient_loss | -0.0033 | -| std | 0.437 | -| value_loss | 3.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3590 | -| time_elapsed | 32981 | -| total_timesteps | 459520 | -| train/ | | -| approx_kl | 0.009727193 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -161 | -| learning_rate | 0.0003 | -| loss | 0.000335 | -| n_updates | 35890 | -| policy_gradient_loss | 2.41e-05 | -| std | 0.436 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3591 | -| time_elapsed | 32984 | -| total_timesteps | 459648 | -| train/ | | -| approx_kl | 0.014986908 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -1.71 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 35900 | -| policy_gradient_loss | -0.00421 | -| std | 0.435 | -| value_loss | 6.82e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3592 | -| time_elapsed | 32986 | -| total_timesteps | 459776 | -| train/ | | -| approx_kl | 0.00064251386 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.674 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 35910 | -| policy_gradient_loss | 0.000689 | -| std | 0.435 | -| value_loss | 5.05e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3593 | -| time_elapsed | 32989 | -| total_timesteps | 459904 | -| train/ | | -| approx_kl | 0.026428007 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 35920 | -| policy_gradient_loss | -0.00334 | -| std | 0.436 | -| value_loss | 4.82e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3594 | -| time_elapsed | 32992 | -| total_timesteps | 460032 | -| train/ | | -| approx_kl | 0.011138698 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | -0.0084 | -| n_updates | 35930 | -| policy_gradient_loss | -0.00545 | -| std | 0.436 | -| value_loss | 3.09e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3595 | -| time_elapsed | 32999 | -| total_timesteps | 460160 | -| train/ | | -| approx_kl | 0.011059215 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | 0.689 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 35940 | -| policy_gradient_loss | -0.00196 | -| std | 0.436 | -| value_loss | 0.00465 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3596 | -| time_elapsed | 33002 | -| total_timesteps | 460288 | -| train/ | | -| approx_kl | 0.00032288837 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -1.16e+03 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 35950 | -| policy_gradient_loss | 0.000917 | -| std | 0.435 | -| value_loss | 2.19e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3597 | -| time_elapsed | 33004 | -| total_timesteps | 460416 | -| train/ | | -| approx_kl | 0.0011766795 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -2.12e+03 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 35960 | -| policy_gradient_loss | 0.000394 | -| std | 0.436 | -| value_loss | 8.23e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3598 | -| time_elapsed | 33008 | -| total_timesteps | 460544 | -| train/ | | -| approx_kl | 0.050659303 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -368 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 35970 | -| policy_gradient_loss | -0.00885 | -| std | 0.436 | -| value_loss | 3.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3599 | -| time_elapsed | 33010 | -| total_timesteps | 460672 | -| train/ | | -| approx_kl | 0.0078277085 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -7.15 | -| learning_rate | 0.0003 | -| loss | 0.000467 | -| n_updates | 35980 | -| policy_gradient_loss | 0.000231 | -| std | 0.436 | -| value_loss | 1.01e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3600 | -| time_elapsed | 33012 | -| total_timesteps | 460800 | -| train/ | | -| approx_kl | 0.0058200303 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00899 | -| n_updates | 35990 | -| policy_gradient_loss | -0.00259 | -| std | 0.436 | -| value_loss | 7.62e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 13 | -| iterations | 3601 | -| time_elapsed | 33014 | -| total_timesteps | 460928 | -| train/ | | -| approx_kl | 0.00016855286 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 36000 | -| policy_gradient_loss | 0.00225 | -| std | 0.436 | -| value_loss | 7.01e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3602 | -| time_elapsed | 33016 | -| total_timesteps | 461056 | -| train/ | | -| approx_kl | 0.0063496847 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.000175 | -| n_updates | 36010 | -| policy_gradient_loss | 4.15e-05 | -| std | 0.437 | -| value_loss | 7.01e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3603 | -| time_elapsed | 33021 | -| total_timesteps | 461184 | -| train/ | | -| approx_kl | 0.00679518 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 36020 | -| policy_gradient_loss | -0.00808 | -| std | 0.438 | -| value_loss | 0.00253 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3604 | -| time_elapsed | 33024 | -| total_timesteps | 461312 | -| train/ | | -| approx_kl | 0.0058599934 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -51.4 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 36030 | -| policy_gradient_loss | -0.00142 | -| std | 0.438 | -| value_loss | 2.92e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3605 | -| time_elapsed | 33027 | -| total_timesteps | 461440 | -| train/ | | -| approx_kl | 3.326754e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -187 | -| learning_rate | 0.0003 | -| loss | -7.53e-05 | -| n_updates | 36040 | -| policy_gradient_loss | 0.000598 | -| std | 0.44 | -| value_loss | 1.77e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3606 | -| time_elapsed | 33031 | -| total_timesteps | 461568 | -| train/ | | -| approx_kl | 0.0216058 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -7.06 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 36050 | -| policy_gradient_loss | -0.0025 | -| std | 0.442 | -| value_loss | 2.08e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3607 | -| time_elapsed | 33033 | -| total_timesteps | 461696 | -| train/ | | -| approx_kl | 0.00903281 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -4.2 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 36060 | -| policy_gradient_loss | -0.00132 | -| std | 0.442 | -| value_loss | 1.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3608 | -| time_elapsed | 33037 | -| total_timesteps | 461824 | -| train/ | | -| approx_kl | 0.004198432 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 36070 | -| policy_gradient_loss | -0.000703 | -| std | 0.44 | -| value_loss | 2.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3609 | -| time_elapsed | 33040 | -| total_timesteps | 461952 | -| train/ | | -| approx_kl | 0.01646832 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.0713 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 36080 | -| policy_gradient_loss | -0.00837 | -| std | 0.438 | -| value_loss | 1.56e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3610 | -| time_elapsed | 33043 | -| total_timesteps | 462080 | -| train/ | | -| approx_kl | 0.0036615224 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.00674 | -| n_updates | 36090 | -| policy_gradient_loss | -0.00139 | -| std | 0.438 | -| value_loss | 1.47e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3611 | -| time_elapsed | 33049 | -| total_timesteps | 462208 | -| train/ | | -| approx_kl | 0.0009275095 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 36100 | -| policy_gradient_loss | -0.000347 | -| std | 0.437 | -| value_loss | 0.000257 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3612 | -| time_elapsed | 33052 | -| total_timesteps | 462336 | -| train/ | | -| approx_kl | 0.017956365 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -903 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 36110 | -| policy_gradient_loss | -0.00145 | -| std | 0.436 | -| value_loss | 2.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3613 | -| time_elapsed | 33055 | -| total_timesteps | 462464 | -| train/ | | -| approx_kl | 0.008147979 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -304 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 36120 | -| policy_gradient_loss | -0.00149 | -| std | 0.437 | -| value_loss | 5.91e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3614 | -| time_elapsed | 33058 | -| total_timesteps | 462592 | -| train/ | | -| approx_kl | 5.955482e-05 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -0.718 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 36130 | -| policy_gradient_loss | 0.00401 | -| std | 0.437 | -| value_loss | 1.04e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3615 | -| time_elapsed | 33060 | -| total_timesteps | 462720 | -| train/ | | -| approx_kl | 0.0011844106 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.592 | -| explained_variance | -3.7 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 36140 | -| policy_gradient_loss | 0.000127 | -| std | 0.438 | -| value_loss | 2.89e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 13 | -| iterations | 3616 | -| time_elapsed | 33063 | -| total_timesteps | 462848 | -| train/ | | -| approx_kl | 0.0065113646 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | 0.00015 | -| n_updates | 36150 | -| policy_gradient_loss | -0.000111 | -| std | 0.438 | -| value_loss | 1.18e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 14 | -| iterations | 3617 | -| time_elapsed | 33065 | -| total_timesteps | 462976 | -| train/ | | -| approx_kl | 0.0070711463 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 36160 | -| policy_gradient_loss | -0.00561 | -| std | 0.439 | -| value_loss | 8.06e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3618 | -| time_elapsed | 33067 | -| total_timesteps | 463104 | -| train/ | | -| approx_kl | 0.01108193 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.000884 | -| n_updates | 36170 | -| policy_gradient_loss | -0.000631 | -| std | 0.44 | -| value_loss | 1.84e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3619 | -| time_elapsed | 33075 | -| total_timesteps | 463232 | -| train/ | | -| approx_kl | 0.018761214 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 36180 | -| policy_gradient_loss | -0.00947 | -| std | 0.441 | -| value_loss | 0.00183 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3620 | -| time_elapsed | 33078 | -| total_timesteps | 463360 | -| train/ | | -| approx_kl | 0.029922225 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -208 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 36190 | -| policy_gradient_loss | -0.0117 | -| std | 0.442 | -| value_loss | 1.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3621 | -| time_elapsed | 33081 | -| total_timesteps | 463488 | -| train/ | | -| approx_kl | 0.011678282 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 36200 | -| policy_gradient_loss | -0.00144 | -| std | 0.441 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3622 | -| time_elapsed | 33084 | -| total_timesteps | 463616 | -| train/ | | -| approx_kl | 0.0013580322 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.00713 | -| n_updates | 36210 | -| policy_gradient_loss | 1.76e-05 | -| std | 0.441 | -| value_loss | 3.71e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3623 | -| time_elapsed | 33087 | -| total_timesteps | 463744 | -| train/ | | -| approx_kl | 0.03653104 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -8.01 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 36220 | -| policy_gradient_loss | -0.00733 | -| std | 0.441 | -| value_loss | 1.55e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 14 | -| iterations | 3624 | -| time_elapsed | 33089 | -| total_timesteps | 463872 | -| train/ | | -| approx_kl | 0.009799547 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.567 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 36230 | -| policy_gradient_loss | -0.00867 | -| std | 0.441 | -| value_loss | 1.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3625 | -| time_elapsed | 33092 | -| total_timesteps | 464000 | -| train/ | | -| approx_kl | 0.004144798 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.000543 | -| n_updates | 36240 | -| policy_gradient_loss | 0.000517 | -| std | 0.442 | -| value_loss | 2.06e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3626 | -| time_elapsed | 33097 | -| total_timesteps | 464128 | -| train/ | | -| approx_kl | 0.0058820257 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.602 | -| explained_variance | -0.00391 | -| learning_rate | 0.0003 | -| loss | -0.00843 | -| n_updates | 36250 | -| policy_gradient_loss | -0.0025 | -| std | 0.442 | -| value_loss | 2.71e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3627 | -| time_elapsed | 33105 | -| total_timesteps | 464256 | -| train/ | | -| approx_kl | 0.00018345681 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.000666 | -| n_updates | 36260 | -| policy_gradient_loss | 0.000241 | -| std | 0.44 | -| value_loss | 9.16e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3628 | -| time_elapsed | 33109 | -| total_timesteps | 464384 | -| train/ | | -| approx_kl | 0.00080457586 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -820 | -| learning_rate | 0.0003 | -| loss | 0.000489 | -| n_updates | 36270 | -| policy_gradient_loss | 0.000385 | -| std | 0.44 | -| value_loss | 1.47e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3629 | -| time_elapsed | 33113 | -| total_timesteps | 464512 | -| train/ | | -| approx_kl | 0.011203112 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 36280 | -| policy_gradient_loss | -0.0016 | -| std | 0.441 | -| value_loss | 6.18e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3630 | -| time_elapsed | 33116 | -| total_timesteps | 464640 | -| train/ | | -| approx_kl | 0.0014536018 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -0.611 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 36290 | -| policy_gradient_loss | 8.88e-05 | -| std | 0.44 | -| value_loss | 2.66e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3631 | -| time_elapsed | 33119 | -| total_timesteps | 464768 | -| train/ | | -| approx_kl | 0.00065230276 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 36300 | -| policy_gradient_loss | 0.000398 | -| std | 0.441 | -| value_loss | 4.05e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3632 | -| time_elapsed | 33122 | -| total_timesteps | 464896 | -| train/ | | -| approx_kl | 0.0007801892 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -3.59 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 36310 | -| policy_gradient_loss | 0.00025 | -| std | 0.441 | -| value_loss | 1e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3633 | -| time_elapsed | 33126 | -| total_timesteps | 465024 | -| train/ | | -| approx_kl | 0.029810477 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | -0.00994 | -| n_updates | 36320 | -| policy_gradient_loss | -0.00992 | -| std | 0.441 | -| value_loss | 1.07e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3634 | -| time_elapsed | 33133 | -| total_timesteps | 465152 | -| train/ | | -| approx_kl | 0.019066293 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | 0.803 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 36330 | -| policy_gradient_loss | -0.00301 | -| std | 0.441 | -| value_loss | 0.00264 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3635 | -| time_elapsed | 33137 | -| total_timesteps | 465280 | -| train/ | | -| approx_kl | 0.028127197 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -685 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 36340 | -| policy_gradient_loss | -0.00781 | -| std | 0.44 | -| value_loss | 1.36e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3636 | -| time_elapsed | 33139 | -| total_timesteps | 465408 | -| train/ | | -| approx_kl | 0.013003685 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -2.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.00971 | -| n_updates | 36350 | -| policy_gradient_loss | -0.00414 | -| std | 0.44 | -| value_loss | 4.93e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3637 | -| time_elapsed | 33143 | -| total_timesteps | 465536 | -| train/ | | -| approx_kl | 6.4042397e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -640 | -| learning_rate | 0.0003 | -| loss | 0.000443 | -| n_updates | 36360 | -| policy_gradient_loss | 0.00393 | -| std | 0.44 | -| value_loss | 6.03e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3638 | -| time_elapsed | 33147 | -| total_timesteps | 465664 | -| train/ | | -| approx_kl | 0.02327394 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | -0.598 | -| explained_variance | -55.2 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 36370 | -| policy_gradient_loss | -0.0108 | -| std | 0.44 | -| value_loss | 7.8e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3639 | -| time_elapsed | 33150 | -| total_timesteps | 465792 | -| train/ | | -| approx_kl | 0.013801877 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.00701 | -| n_updates | 36380 | -| policy_gradient_loss | -0.00321 | -| std | 0.439 | -| value_loss | 2.71e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3640 | -| time_elapsed | 33153 | -| total_timesteps | 465920 | -| train/ | | -| approx_kl | 0.03335067 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 36390 | -| policy_gradient_loss | -0.0164 | -| std | 0.439 | -| value_loss | 3.66e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3641 | -| time_elapsed | 33156 | -| total_timesteps | 466048 | -| train/ | | -| approx_kl | 0.008706765 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.377 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 36400 | -| policy_gradient_loss | -0.00352 | -| std | 0.439 | -| value_loss | 2.08e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3642 | -| time_elapsed | 33163 | -| total_timesteps | 466176 | -| train/ | | -| approx_kl | 0.021571832 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 36410 | -| policy_gradient_loss | -0.0113 | -| std | 0.438 | -| value_loss | 0.00278 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3643 | -| time_elapsed | 33166 | -| total_timesteps | 466304 | -| train/ | | -| approx_kl | 0.026822135 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -2.65e+03 | -| learning_rate | 0.0003 | -| loss | -0.0096 | -| n_updates | 36420 | -| policy_gradient_loss | -0.00654 | -| std | 0.438 | -| value_loss | 6.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3644 | -| time_elapsed | 33170 | -| total_timesteps | 466432 | -| train/ | | -| approx_kl | 0.02149917 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -4.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 36430 | -| policy_gradient_loss | -0.0165 | -| std | 0.438 | -| value_loss | 3.65e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3645 | -| time_elapsed | 33174 | -| total_timesteps | 466560 | -| train/ | | -| approx_kl | 0.00067931577 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -1.59e+04 | -| learning_rate | 0.0003 | -| loss | -0.000377 | -| n_updates | 36440 | -| policy_gradient_loss | -0.000102 | -| std | 0.438 | -| value_loss | 3.4e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3646 | -| time_elapsed | 33177 | -| total_timesteps | 466688 | -| train/ | | -| approx_kl | 0.029611794 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -1.1e+03 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 36450 | -| policy_gradient_loss | -0.0063 | -| std | 0.439 | -| value_loss | 4.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3647 | -| time_elapsed | 33181 | -| total_timesteps | 466816 | -| train/ | | -| approx_kl | 0.08096729 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -1.8e+03 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 36460 | -| policy_gradient_loss | -0.00907 | -| std | 0.438 | -| value_loss | 1.64e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3648 | -| time_elapsed | 33184 | -| total_timesteps | 466944 | -| train/ | | -| approx_kl | 0.021212084 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -145 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 36470 | -| policy_gradient_loss | -0.00169 | -| std | 0.438 | -| value_loss | 2.79e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3649 | -| time_elapsed | 33188 | -| total_timesteps | 467072 | -| train/ | | -| approx_kl | 0.0009783702 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -7.44 | -| learning_rate | 0.0003 | -| loss | -0.00053 | -| n_updates | 36480 | -| policy_gradient_loss | -0.000181 | -| std | 0.44 | -| value_loss | 4.95e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3650 | -| time_elapsed | 33194 | -| total_timesteps | 467200 | -| train/ | | -| approx_kl | 0.017958976 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.6 | -| explained_variance | -0.425 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 36490 | -| policy_gradient_loss | -0.00739 | -| std | 0.442 | -| value_loss | 0.00236 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3651 | -| time_elapsed | 33198 | -| total_timesteps | 467328 | -| train/ | | -| approx_kl | 0.0018973555 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.601 | -| explained_variance | -683 | -| learning_rate | 0.0003 | -| loss | 8.31e-05 | -| n_updates | 36500 | -| policy_gradient_loss | 4.62e-05 | -| std | 0.441 | -| value_loss | 5.41e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3652 | -| time_elapsed | 33201 | -| total_timesteps | 467456 | -| train/ | | -| approx_kl | 0.0014784103 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.599 | -| explained_variance | -2.21e+03 | -| learning_rate | 0.0003 | -| loss | -0.000649 | -| n_updates | 36510 | -| policy_gradient_loss | -0.000312 | -| std | 0.44 | -| value_loss | 1.87e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3653 | -| time_elapsed | 33204 | -| total_timesteps | 467584 | -| train/ | | -| approx_kl | 0.029535264 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -21.1 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 36520 | -| policy_gradient_loss | -0.00485 | -| std | 0.439 | -| value_loss | 8.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3654 | -| time_elapsed | 33207 | -| total_timesteps | 467712 | -| train/ | | -| approx_kl | 0.03545864 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -3.57 | -| learning_rate | 0.0003 | -| loss | 6.35e-05 | -| n_updates | 36530 | -| policy_gradient_loss | -0.00314 | -| std | 0.439 | -| value_loss | 1.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3655 | -| time_elapsed | 33210 | -| total_timesteps | 467840 | -| train/ | | -| approx_kl | 0.0013601088 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -0.00724 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 36540 | -| policy_gradient_loss | -0.00017 | -| std | 0.439 | -| value_loss | 2.61e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3656 | -| time_elapsed | 33214 | -| total_timesteps | 467968 | -| train/ | | -| approx_kl | 0.015899863 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | 0.00793 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 36550 | -| policy_gradient_loss | -0.00851 | -| std | 0.439 | -| value_loss | 2.45e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3657 | -| time_elapsed | 33218 | -| total_timesteps | 468096 | -| train/ | | -| approx_kl | 0.0146033 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | 0.00498 | -| learning_rate | 0.0003 | -| loss | -0.00753 | -| n_updates | 36560 | -| policy_gradient_loss | -0.00568 | -| std | 0.439 | -| value_loss | 2.78e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3658 | -| time_elapsed | 33224 | -| total_timesteps | 468224 | -| train/ | | -| approx_kl | 0.029515924 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | 0.0518 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 36570 | -| policy_gradient_loss | -0.0078 | -| std | 0.439 | -| value_loss | 0.00157 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3659 | -| time_elapsed | 33228 | -| total_timesteps | 468352 | -| train/ | | -| approx_kl | 0.00065527647 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.596 | -| explained_variance | -1.37e+03 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 36580 | -| policy_gradient_loss | 0.00138 | -| std | 0.439 | -| value_loss | 5.1e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3660 | -| time_elapsed | 33232 | -| total_timesteps | 468480 | -| train/ | | -| approx_kl | 0.0011000978 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -259 | -| learning_rate | 0.0003 | -| loss | -0.00516 | -| n_updates | 36590 | -| policy_gradient_loss | 0.000668 | -| std | 0.44 | -| value_loss | 1.82e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3661 | -| time_elapsed | 33235 | -| total_timesteps | 468608 | -| train/ | | -| approx_kl | 0.0008221399 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -18.2 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 36600 | -| policy_gradient_loss | 0.000753 | -| std | 0.44 | -| value_loss | 1.09e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3662 | -| time_elapsed | 33239 | -| total_timesteps | 468736 | -| train/ | | -| approx_kl | 0.0010362593 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.597 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 36610 | -| policy_gradient_loss | 0.000377 | -| std | 0.439 | -| value_loss | 1.98e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3663 | -| time_elapsed | 33244 | -| total_timesteps | 468864 | -| train/ | | -| approx_kl | 0.024802778 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.595 | -| explained_variance | -0.00811 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 36620 | -| policy_gradient_loss | -0.0124 | -| std | 0.439 | -| value_loss | 1.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3664 | -| time_elapsed | 33247 | -| total_timesteps | 468992 | -| train/ | | -| approx_kl | 0.011170708 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.594 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 36630 | -| policy_gradient_loss | -0.00788 | -| std | 0.438 | -| value_loss | 8.89e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3665 | -| time_elapsed | 33251 | -| total_timesteps | 469120 | -| train/ | | -| approx_kl | 0.0023550512 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.593 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | -0.00034 | -| n_updates | 36640 | -| policy_gradient_loss | -0.000177 | -| std | 0.438 | -| value_loss | 1.56e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3666 | -| time_elapsed | 33261 | -| total_timesteps | 469248 | -| train/ | | -| approx_kl | 0.013824305 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 36650 | -| policy_gradient_loss | -0.00163 | -| std | 0.437 | -| value_loss | 2.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3667 | -| time_elapsed | 33265 | -| total_timesteps | 469376 | -| train/ | | -| approx_kl | 0.004242935 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -129 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 36660 | -| policy_gradient_loss | -0.00113 | -| std | 0.436 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3668 | -| time_elapsed | 33269 | -| total_timesteps | 469504 | -| train/ | | -| approx_kl | 0.024753792 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 36670 | -| policy_gradient_loss | -0.0135 | -| std | 0.436 | -| value_loss | 4.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3669 | -| time_elapsed | 33274 | -| total_timesteps | 469632 | -| train/ | | -| approx_kl | 0.014014669 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 36680 | -| policy_gradient_loss | -0.00938 | -| std | 0.435 | -| value_loss | 2.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3670 | -| time_elapsed | 33277 | -| total_timesteps | 469760 | -| train/ | | -| approx_kl | 0.012578668 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 36690 | -| policy_gradient_loss | -0.00355 | -| std | 0.434 | -| value_loss | 1.74e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3671 | -| time_elapsed | 33281 | -| total_timesteps | 469888 | -| train/ | | -| approx_kl | 0.009607345 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.000308 | -| n_updates | 36700 | -| policy_gradient_loss | -0.00116 | -| std | 0.434 | -| value_loss | 2.87e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3672 | -| time_elapsed | 33284 | -| total_timesteps | 470016 | -| train/ | | -| approx_kl | 0.009878115 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 36710 | -| policy_gradient_loss | -0.00632 | -| std | 0.434 | -| value_loss | 1.6e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3673 | -| time_elapsed | 33293 | -| total_timesteps | 470144 | -| train/ | | -| approx_kl | 0.0022232234 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 36720 | -| policy_gradient_loss | -0.000395 | -| std | 0.434 | -| value_loss | 3.81e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3674 | -| time_elapsed | 33297 | -| total_timesteps | 470272 | -| train/ | | -| approx_kl | 0.0005608904 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -52.9 | -| learning_rate | 0.0003 | -| loss | -0.00439 | -| n_updates | 36730 | -| policy_gradient_loss | 0.00146 | -| std | 0.433 | -| value_loss | 3.22e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3675 | -| time_elapsed | 33301 | -| total_timesteps | 470400 | -| train/ | | -| approx_kl | 0.0009779327 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -99.3 | -| learning_rate | 0.0003 | -| loss | 0.00061 | -| n_updates | 36740 | -| policy_gradient_loss | 0.00056 | -| std | 0.434 | -| value_loss | 1.62e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3676 | -| time_elapsed | 33305 | -| total_timesteps | 470528 | -| train/ | | -| approx_kl | 0.009552244 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -3 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 36750 | -| policy_gradient_loss | -0.00261 | -| std | 0.435 | -| value_loss | 5.63e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3677 | -| time_elapsed | 33309 | -| total_timesteps | 470656 | -| train/ | | -| approx_kl | 0.0033245927 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 36760 | -| policy_gradient_loss | -0.00172 | -| std | 0.435 | -| value_loss | 2.48e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3678 | -| time_elapsed | 33313 | -| total_timesteps | 470784 | -| train/ | | -| approx_kl | 0.019768964 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 36770 | -| policy_gradient_loss | -0.00168 | -| std | 0.436 | -| value_loss | 1.93e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3679 | -| time_elapsed | 33316 | -| total_timesteps | 470912 | -| train/ | | -| approx_kl | 0.0126084555 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 36780 | -| policy_gradient_loss | -0.0103 | -| std | 0.436 | -| value_loss | 5.53e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3680 | -| time_elapsed | 33320 | -| total_timesteps | 471040 | -| train/ | | -| approx_kl | 0.004844296 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -0.00224 | -| learning_rate | 0.0003 | -| loss | 0.000302 | -| n_updates | 36790 | -| policy_gradient_loss | 0.000106 | -| std | 0.436 | -| value_loss | 1.04e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3681 | -| time_elapsed | 33327 | -| total_timesteps | 471168 | -| train/ | | -| approx_kl | 0.0037651774 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.000275 | -| n_updates | 36800 | -| policy_gradient_loss | -0.00047 | -| std | 0.435 | -| value_loss | 0.00164 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3682 | -| time_elapsed | 33331 | -| total_timesteps | 471296 | -| train/ | | -| approx_kl | 0.005911426 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -1.94e+03 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 36810 | -| policy_gradient_loss | -0.00218 | -| std | 0.434 | -| value_loss | 2.15e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3683 | -| time_elapsed | 33336 | -| total_timesteps | 471424 | -| train/ | | -| approx_kl | 0.04520325 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -1.35e+03 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 36820 | -| policy_gradient_loss | -0.00791 | -| std | 0.434 | -| value_loss | 5.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3684 | -| time_elapsed | 33339 | -| total_timesteps | 471552 | -| train/ | | -| approx_kl | 0.032818194 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 36830 | -| policy_gradient_loss | -0.0031 | -| std | 0.434 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3685 | -| time_elapsed | 33343 | -| total_timesteps | 471680 | -| train/ | | -| approx_kl | 0.0001452372 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -15.6 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 36840 | -| policy_gradient_loss | 0.0016 | -| std | 0.434 | -| value_loss | 2.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3686 | -| time_elapsed | 33348 | -| total_timesteps | 471808 | -| train/ | | -| approx_kl | 0.017248895 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -0.956 | -| learning_rate | 0.0003 | -| loss | 0.00174 | -| n_updates | 36850 | -| policy_gradient_loss | -0.00142 | -| std | 0.433 | -| value_loss | 7.34e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3687 | -| time_elapsed | 33351 | -| total_timesteps | 471936 | -| train/ | | -| approx_kl | 0.0108542 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 36860 | -| policy_gradient_loss | -0.00181 | -| std | 0.432 | -| value_loss | 5.97e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3688 | -| time_elapsed | 33355 | -| total_timesteps | 472064 | -| train/ | | -| approx_kl | 0.009470627 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 36870 | -| policy_gradient_loss | -0.00208 | -| std | 0.431 | -| value_loss | 2.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3689 | -| time_elapsed | 33360 | -| total_timesteps | 472192 | -| train/ | | -| approx_kl | 0.006836402 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.578 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 36880 | -| policy_gradient_loss | -0.00168 | -| std | 0.432 | -| value_loss | 0.000646 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3690 | -| time_elapsed | 33363 | -| total_timesteps | 472320 | -| train/ | | -| approx_kl | 0.04588843 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -949 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 36890 | -| policy_gradient_loss | -0.00547 | -| std | 0.431 | -| value_loss | 5.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3691 | -| time_elapsed | 33367 | -| total_timesteps | 472448 | -| train/ | | -| approx_kl | 0.03629879 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.578 | -| explained_variance | -766 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 36900 | -| policy_gradient_loss | -0.0153 | -| std | 0.431 | -| value_loss | 6.18e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3692 | -| time_elapsed | 33371 | -| total_timesteps | 472576 | -| train/ | | -| approx_kl | 0.027567595 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -45.6 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 36910 | -| policy_gradient_loss | -0.0056 | -| std | 0.431 | -| value_loss | 5.11e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3693 | -| time_elapsed | 33374 | -| total_timesteps | 472704 | -| train/ | | -| approx_kl | 0.0008314301 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -9.87 | -| learning_rate | 0.0003 | -| loss | -0.0063 | -| n_updates | 36920 | -| policy_gradient_loss | 0.00101 | -| std | 0.431 | -| value_loss | 2.2e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3694 | -| time_elapsed | 33378 | -| total_timesteps | 472832 | -| train/ | | -| approx_kl | 0.00081888307 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 36930 | -| policy_gradient_loss | 0.00071 | -| std | 0.431 | -| value_loss | 5.9e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.2 | -| time/ | | -| fps | 14 | -| iterations | 3695 | -| time_elapsed | 33381 | -| total_timesteps | 472960 | -| train/ | | -| approx_kl | 0.017182898 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 36940 | -| policy_gradient_loss | -0.0005 | -| std | 0.431 | -| value_loss | 5.74e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3696 | -| time_elapsed | 33385 | -| total_timesteps | 473088 | -| train/ | | -| approx_kl | 0.006845736 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | -0.000701 | -| n_updates | 36950 | -| policy_gradient_loss | -0.000751 | -| std | 0.431 | -| value_loss | 6.44e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3697 | -| time_elapsed | 33390 | -| total_timesteps | 473216 | -| train/ | | -| approx_kl | 5.640788e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.000381 | -| n_updates | 36960 | -| policy_gradient_loss | -0.000173 | -| std | 0.43 | -| value_loss | 8.77e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3698 | -| time_elapsed | 33394 | -| total_timesteps | 473344 | -| train/ | | -| approx_kl | 0.020100158 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.574 | -| explained_variance | -4.21e+03 | -| learning_rate | 0.0003 | -| loss | -0.00464 | -| n_updates | 36970 | -| policy_gradient_loss | -0.00213 | -| std | 0.429 | -| value_loss | 6.21e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3699 | -| time_elapsed | 33396 | -| total_timesteps | 473472 | -| train/ | | -| approx_kl | 0.00019772002 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.574 | -| explained_variance | -380 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 36980 | -| policy_gradient_loss | 0.00093 | -| std | 0.43 | -| value_loss | 9.25e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3700 | -| time_elapsed | 33399 | -| total_timesteps | 473600 | -| train/ | | -| approx_kl | 0.0013108414 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | -28.1 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 36990 | -| policy_gradient_loss | 0.000245 | -| std | 0.431 | -| value_loss | 1.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3701 | -| time_elapsed | 33402 | -| total_timesteps | 473728 | -| train/ | | -| approx_kl | 0.040150013 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 37000 | -| policy_gradient_loss | -0.00861 | -| std | 0.431 | -| value_loss | 2.12e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3702 | -| time_elapsed | 33405 | -| total_timesteps | 473856 | -| train/ | | -| approx_kl | 0.0019239332 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 8.55e-05 | -| n_updates | 37010 | -| policy_gradient_loss | 4.67e-05 | -| std | 0.431 | -| value_loss | 7.56e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3703 | -| time_elapsed | 33409 | -| total_timesteps | 473984 | -| train/ | | -| approx_kl | 0.016313884 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 37020 | -| policy_gradient_loss | -0.00312 | -| std | 0.431 | -| value_loss | 5.64e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3704 | -| time_elapsed | 33412 | -| total_timesteps | 474112 | -| train/ | | -| approx_kl | 0.0051369853 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | -0.000946 | -| n_updates | 37030 | -| policy_gradient_loss | -0.000576 | -| std | 0.433 | -| value_loss | 2.97e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3705 | -| time_elapsed | 33420 | -| total_timesteps | 474240 | -| train/ | | -| approx_kl | 0.0094011 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 37040 | -| policy_gradient_loss | -0.00995 | -| std | 0.434 | -| value_loss | 0.000773 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3706 | -| time_elapsed | 33423 | -| total_timesteps | 474368 | -| train/ | | -| approx_kl | 0.0017655105 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -5.9e+03 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 37050 | -| policy_gradient_loss | -0.000129 | -| std | 0.434 | -| value_loss | 2.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3707 | -| time_elapsed | 33427 | -| total_timesteps | 474496 | -| train/ | | -| approx_kl | 0.010910734 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -4.27e+03 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 37060 | -| policy_gradient_loss | -0.000291 | -| std | 0.436 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3708 | -| time_elapsed | 33430 | -| total_timesteps | 474624 | -| train/ | | -| approx_kl | 0.012056031 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -30 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 37070 | -| policy_gradient_loss | -0.00173 | -| std | 0.437 | -| value_loss | 3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3709 | -| time_elapsed | 33433 | -| total_timesteps | 474752 | -| train/ | | -| approx_kl | 0.019593054 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -315 | -| learning_rate | 0.0003 | -| loss | -0.000749 | -| n_updates | 37080 | -| policy_gradient_loss | -0.00111 | -| std | 0.436 | -| value_loss | 2.55e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3710 | -| time_elapsed | 33437 | -| total_timesteps | 474880 | -| train/ | | -| approx_kl | 0.00052841054 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.589 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | -0.000294 | -| n_updates | 37090 | -| policy_gradient_loss | -0.000116 | -| std | 0.435 | -| value_loss | 8.53e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3711 | -| time_elapsed | 33439 | -| total_timesteps | 475008 | -| train/ | | -| approx_kl | 0.007734785 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 37100 | -| policy_gradient_loss | -0.00188 | -| std | 0.435 | -| value_loss | 3.62e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3712 | -| time_elapsed | 33448 | -| total_timesteps | 475136 | -| train/ | | -| approx_kl | 0.00986062 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 37110 | -| policy_gradient_loss | -0.000934 | -| std | 0.435 | -| value_loss | 4.41e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3713 | -| time_elapsed | 33451 | -| total_timesteps | 475264 | -| train/ | | -| approx_kl | 0.00785278 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -483 | -| learning_rate | 0.0003 | -| loss | -0.00686 | -| n_updates | 37120 | -| policy_gradient_loss | -0.00233 | -| std | 0.436 | -| value_loss | 2.98e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3714 | -| time_elapsed | 33455 | -| total_timesteps | 475392 | -| train/ | | -| approx_kl | 2.743653e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -62.4 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 37130 | -| policy_gradient_loss | 0.000731 | -| std | 0.435 | -| value_loss | 1.9e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3715 | -| time_elapsed | 33458 | -| total_timesteps | 475520 | -| train/ | | -| approx_kl | 0.027773108 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 37140 | -| policy_gradient_loss | -0.00718 | -| std | 0.434 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3716 | -| time_elapsed | 33461 | -| total_timesteps | 475648 | -| train/ | | -| approx_kl | 0.015739786 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -5.54 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 37150 | -| policy_gradient_loss | -0.0102 | -| std | 0.433 | -| value_loss | 4.22e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3717 | -| time_elapsed | 33466 | -| total_timesteps | 475776 | -| train/ | | -| approx_kl | 0.0013869894 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -0.00207 | -| learning_rate | 0.0003 | -| loss | -0.000142 | -| n_updates | 37160 | -| policy_gradient_loss | -7.79e-05 | -| std | 0.432 | -| value_loss | 4.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3718 | -| time_elapsed | 33469 | -| total_timesteps | 475904 | -| train/ | | -| approx_kl | 0.015452115 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 37170 | -| policy_gradient_loss | -0.00754 | -| std | 0.432 | -| value_loss | 1.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3719 | -| time_elapsed | 33473 | -| total_timesteps | 476032 | -| train/ | | -| approx_kl | 0.006463879 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -4.75 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 37180 | -| policy_gradient_loss | -0.000868 | -| std | 0.433 | -| value_loss | 1.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3720 | -| time_elapsed | 33479 | -| total_timesteps | 476160 | -| train/ | | -| approx_kl | 0.015548221 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 37190 | -| policy_gradient_loss | -0.00272 | -| std | 0.434 | -| value_loss | 1.46e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3721 | -| time_elapsed | 33482 | -| total_timesteps | 476288 | -| train/ | | -| approx_kl | 0.0015912154 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -767 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 37200 | -| policy_gradient_loss | -0.000219 | -| std | 0.434 | -| value_loss | 3.25e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3722 | -| time_elapsed | 33486 | -| total_timesteps | 476416 | -| train/ | | -| approx_kl | 0.004097494 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -86.4 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 37210 | -| policy_gradient_loss | -0.000641 | -| std | 0.433 | -| value_loss | 4.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3723 | -| time_elapsed | 33489 | -| total_timesteps | 476544 | -| train/ | | -| approx_kl | 0.034271836 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -108 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 37220 | -| policy_gradient_loss | -0.00983 | -| std | 0.432 | -| value_loss | 4.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3724 | -| time_elapsed | 33494 | -| total_timesteps | 476672 | -| train/ | | -| approx_kl | 0.041639943 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -65.2 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 37230 | -| policy_gradient_loss | -0.00647 | -| std | 0.432 | -| value_loss | 8.09e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3725 | -| time_elapsed | 33498 | -| total_timesteps | 476800 | -| train/ | | -| approx_kl | 7.0247566e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.808 | -| learning_rate | 0.0003 | -| loss | 0.000247 | -| n_updates | 37240 | -| policy_gradient_loss | 0.000696 | -| std | 0.431 | -| value_loss | 5.01e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3726 | -| time_elapsed | 33501 | -| total_timesteps | 476928 | -| train/ | | -| approx_kl | 0.015009873 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -2.85e-05 | -| n_updates | 37250 | -| policy_gradient_loss | -0.00131 | -| std | 0.433 | -| value_loss | 2.88e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3727 | -| time_elapsed | 33506 | -| total_timesteps | 477056 | -| train/ | | -| approx_kl | 0.011002414 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | 0.000742 | -| learning_rate | 0.0003 | -| loss | -0.000165 | -| n_updates | 37260 | -| policy_gradient_loss | -0.00155 | -| std | 0.433 | -| value_loss | 4.05e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3728 | -| time_elapsed | 33512 | -| total_timesteps | 477184 | -| train/ | | -| approx_kl | 0.009033842 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 37270 | -| policy_gradient_loss | -0.00202 | -| std | 0.433 | -| value_loss | 0.000425 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3729 | -| time_elapsed | 33515 | -| total_timesteps | 477312 | -| train/ | | -| approx_kl | 0.0031643203 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -3.5e+03 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 37280 | -| policy_gradient_loss | 0.00078 | -| std | 0.433 | -| value_loss | 3.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3730 | -| time_elapsed | 33518 | -| total_timesteps | 477440 | -| train/ | | -| approx_kl | 0.017130792 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -1.37e+04 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 37290 | -| policy_gradient_loss | -0.0072 | -| std | 0.433 | -| value_loss | 3.96e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3731 | -| time_elapsed | 33521 | -| total_timesteps | 477568 | -| train/ | | -| approx_kl | 0.0002609077 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -53.3 | -| learning_rate | 0.0003 | -| loss | -0.000803 | -| n_updates | 37300 | -| policy_gradient_loss | 0.000122 | -| std | 0.432 | -| value_loss | 1.09e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3732 | -| time_elapsed | 33524 | -| total_timesteps | 477696 | -| train/ | | -| approx_kl | 0.0035929503 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -0.343 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 37310 | -| policy_gradient_loss | -0.00088 | -| std | 0.431 | -| value_loss | 1.13e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3733 | -| time_elapsed | 33527 | -| total_timesteps | 477824 | -| train/ | | -| approx_kl | 0.00043918286 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | -0.497 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 37320 | -| policy_gradient_loss | 0.00338 | -| std | 0.43 | -| value_loss | 6.64e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3734 | -| time_elapsed | 33530 | -| total_timesteps | 477952 | -| train/ | | -| approx_kl | 0.001243647 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.575 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 37330 | -| policy_gradient_loss | 0.000237 | -| std | 0.43 | -| value_loss | 1.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3735 | -| time_elapsed | 33531 | -| total_timesteps | 478080 | -| train/ | | -| approx_kl | 0.018478058 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | -0.00419 | -| learning_rate | 0.0003 | -| loss | -0.0063 | -| n_updates | 37340 | -| policy_gradient_loss | -0.00699 | -| std | 0.43 | -| value_loss | 6.36e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3736 | -| time_elapsed | 33538 | -| total_timesteps | 478208 | -| train/ | | -| approx_kl | 0.0018393965 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.000635 | -| n_updates | 37350 | -| policy_gradient_loss | -0.000253 | -| std | 0.431 | -| value_loss | 0.00012 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3737 | -| time_elapsed | 33541 | -| total_timesteps | 478336 | -| train/ | | -| approx_kl | 0.013366205 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -2.93e+03 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 37360 | -| policy_gradient_loss | -0.00756 | -| std | 0.432 | -| value_loss | 3.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3738 | -| time_elapsed | 33544 | -| total_timesteps | 478464 | -| train/ | | -| approx_kl | 0.014761171 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -605 | -| learning_rate | 0.0003 | -| loss | -0.00557 | -| n_updates | 37370 | -| policy_gradient_loss | -0.00258 | -| std | 0.432 | -| value_loss | 6.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3739 | -| time_elapsed | 33547 | -| total_timesteps | 478592 | -| train/ | | -| approx_kl | 0.04183886 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -8.33 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 37380 | -| policy_gradient_loss | -0.0112 | -| std | 0.432 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3740 | -| time_elapsed | 33550 | -| total_timesteps | 478720 | -| train/ | | -| approx_kl | 0.009545492 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -30.6 | -| learning_rate | 0.0003 | -| loss | -0.00476 | -| n_updates | 37390 | -| policy_gradient_loss | -0.00179 | -| std | 0.432 | -| value_loss | 1.17e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3741 | -| time_elapsed | 33553 | -| total_timesteps | 478848 | -| train/ | | -| approx_kl | 0.00013255375 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 37400 | -| policy_gradient_loss | 0.000838 | -| std | 0.433 | -| value_loss | 4.58e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3742 | -| time_elapsed | 33555 | -| total_timesteps | 478976 | -| train/ | | -| approx_kl | 0.0016816761 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -489 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 37410 | -| policy_gradient_loss | 0.000261 | -| std | 0.434 | -| value_loss | 3.27e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3743 | -| time_elapsed | 33558 | -| total_timesteps | 479104 | -| train/ | | -| approx_kl | 4.9251365e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.584 | -| explained_variance | -2.25 | -| learning_rate | 0.0003 | -| loss | 0.000143 | -| n_updates | 37420 | -| policy_gradient_loss | 0.00055 | -| std | 0.433 | -| value_loss | 1.37e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3744 | -| time_elapsed | 33569 | -| total_timesteps | 479232 | -| train/ | | -| approx_kl | 0.015253778 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.582 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 37430 | -| policy_gradient_loss | -0.0103 | -| std | 0.433 | -| value_loss | 0.000121 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3745 | -| time_elapsed | 33573 | -| total_timesteps | 479360 | -| train/ | | -| approx_kl | 0.0012658734 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | -2.5e+03 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 37440 | -| policy_gradient_loss | -0.000223 | -| std | 0.434 | -| value_loss | 9.87e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3746 | -| time_elapsed | 33576 | -| total_timesteps | 479488 | -| train/ | | -| approx_kl | 0.0062000756 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -4.69e+03 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 37450 | -| policy_gradient_loss | -0.00116 | -| std | 0.435 | -| value_loss | 2.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3747 | -| time_elapsed | 33579 | -| total_timesteps | 479616 | -| train/ | | -| approx_kl | 0.020482197 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -98.6 | -| learning_rate | 0.0003 | -| loss | -0.00626 | -| n_updates | 37460 | -| policy_gradient_loss | -0.00581 | -| std | 0.435 | -| value_loss | 1.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3748 | -| time_elapsed | 33582 | -| total_timesteps | 479744 | -| train/ | | -| approx_kl | 0.009245412 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.587 | -| explained_variance | -2.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 37470 | -| policy_gradient_loss | -0.00376 | -| std | 0.435 | -| value_loss | 2.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3749 | -| time_elapsed | 33585 | -| total_timesteps | 479872 | -| train/ | | -| approx_kl | 0.034086205 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -337 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 37480 | -| policy_gradient_loss | -0.0101 | -| std | 0.435 | -| value_loss | 1.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3750 | -| time_elapsed | 33587 | -| total_timesteps | 480000 | -| train/ | | -| approx_kl | 0.009074771 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -2.28 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 37490 | -| policy_gradient_loss | -0.00785 | -| std | 0.434 | -| value_loss | 5.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3751 | -| time_elapsed | 33590 | -| total_timesteps | 480128 | -| train/ | | -| approx_kl | 0.012121147 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.585 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00803 | -| n_updates | 37500 | -| policy_gradient_loss | -0.00415 | -| std | 0.434 | -| value_loss | 3.38e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3752 | -| time_elapsed | 33596 | -| total_timesteps | 480256 | -| train/ | | -| approx_kl | 0.0013145779 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.586 | -| explained_variance | -0.889 | -| learning_rate | 0.0003 | -| loss | -0.000457 | -| n_updates | 37510 | -| policy_gradient_loss | -0.000162 | -| std | 0.435 | -| value_loss | 0.00267 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3753 | -| time_elapsed | 33599 | -| total_timesteps | 480384 | -| train/ | | -| approx_kl | 0.026206369 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | -2.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 37520 | -| policy_gradient_loss | -0.0114 | -| std | 0.436 | -| value_loss | 6.68e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3754 | -| time_elapsed | 33601 | -| total_timesteps | 480512 | -| train/ | | -| approx_kl | 0.01467699 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.59 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 37530 | -| policy_gradient_loss | -0.0107 | -| std | 0.437 | -| value_loss | 5.15e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3755 | -| time_elapsed | 33604 | -| total_timesteps | 480640 | -| train/ | | -| approx_kl | 0.0012464088 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.357 | -| learning_rate | 0.0003 | -| loss | -0.00021 | -| n_updates | 37540 | -| policy_gradient_loss | -9.44e-05 | -| std | 0.437 | -| value_loss | 2.84e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3756 | -| time_elapsed | 33607 | -| total_timesteps | 480768 | -| train/ | | -| approx_kl | 0.018196125 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 37550 | -| policy_gradient_loss | -0.00264 | -| std | 0.437 | -| value_loss | 3.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 14 | -| iterations | 3757 | -| time_elapsed | 33610 | -| total_timesteps | 480896 | -| train/ | | -| approx_kl | 0.01606354 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -0.591 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 37560 | -| policy_gradient_loss | -0.00338 | -| std | 0.437 | -| value_loss | 1.45e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3758 | -| time_elapsed | 33613 | -| total_timesteps | 481024 | -| train/ | | -| approx_kl | 0.00055764755 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.588 | -| explained_variance | 0.00188 | -| learning_rate | 0.0003 | -| loss | -0.000954 | -| n_updates | 37570 | -| policy_gradient_loss | -0.000418 | -| std | 0.434 | -| value_loss | 7.29e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3759 | -| time_elapsed | 33620 | -| total_timesteps | 481152 | -| train/ | | -| approx_kl | 0.014476868 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.583 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 37580 | -| policy_gradient_loss | -0.0101 | -| std | 0.433 | -| value_loss | 0.00308 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3760 | -| time_elapsed | 33623 | -| total_timesteps | 481280 | -| train/ | | -| approx_kl | 0.029302452 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -89.5 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 37590 | -| policy_gradient_loss | -0.0138 | -| std | 0.432 | -| value_loss | 7.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3761 | -| time_elapsed | 33626 | -| total_timesteps | 481408 | -| train/ | | -| approx_kl | 0.018593237 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.58 | -| explained_variance | -202 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 37600 | -| policy_gradient_loss | -0.00277 | -| std | 0.432 | -| value_loss | 3.78e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3762 | -| time_elapsed | 33629 | -| total_timesteps | 481536 | -| train/ | | -| approx_kl | 6.47523e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | 0.000724 | -| n_updates | 37610 | -| policy_gradient_loss | 0.00271 | -| std | 0.433 | -| value_loss | 7.73e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3763 | -| time_elapsed | 33633 | -| total_timesteps | 481664 | -| train/ | | -| approx_kl | 0.0065422114 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.581 | -| explained_variance | -2.98 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 37620 | -| policy_gradient_loss | -0.000405 | -| std | 0.432 | -| value_loss | 7.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3764 | -| time_elapsed | 33636 | -| total_timesteps | 481792 | -| train/ | | -| approx_kl | 0.016347783 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.579 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 37630 | -| policy_gradient_loss | -0.0118 | -| std | 0.431 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.18 | -| time/ | | -| fps | 14 | -| iterations | 3765 | -| time_elapsed | 33640 | -| total_timesteps | 481920 | -| train/ | | -| approx_kl | 0.012799887 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.578 | -| explained_variance | -0.0711 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 37640 | -| policy_gradient_loss | -0.00387 | -| std | 0.431 | -| value_loss | 7.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3766 | -| time_elapsed | 33643 | -| total_timesteps | 482048 | -| train/ | | -| approx_kl | 0.010513039 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | 0.00223 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 37650 | -| policy_gradient_loss | -0.0077 | -| std | 0.431 | -| value_loss | 2.47e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3767 | -| time_elapsed | 33650 | -| total_timesteps | 482176 | -| train/ | | -| approx_kl | 7.380522e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | 2.76e-05 | -| n_updates | 37660 | -| policy_gradient_loss | 0.000899 | -| std | 0.43 | -| value_loss | 0.00246 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3768 | -| time_elapsed | 33654 | -| total_timesteps | 482304 | -| train/ | | -| approx_kl | 0.017226642 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.575 | -| explained_variance | -658 | -| learning_rate | 0.0003 | -| loss | -0.000805 | -| n_updates | 37670 | -| policy_gradient_loss | -0.000786 | -| std | 0.43 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3769 | -| time_elapsed | 33656 | -| total_timesteps | 482432 | -| train/ | | -| approx_kl | 0.021023363 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -529 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 37680 | -| policy_gradient_loss | -0.00368 | -| std | 0.431 | -| value_loss | 1.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3770 | -| time_elapsed | 33660 | -| total_timesteps | 482560 | -| train/ | | -| approx_kl | 0.017358446 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | -0.577 | -| explained_variance | -20.6 | -| learning_rate | 0.0003 | -| loss | -0.000356 | -| n_updates | 37690 | -| policy_gradient_loss | -0.00093 | -| std | 0.431 | -| value_loss | 2.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3771 | -| time_elapsed | 33663 | -| total_timesteps | 482688 | -| train/ | | -| approx_kl | 0.016622404 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.576 | -| explained_variance | -2.82 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 37700 | -| policy_gradient_loss | -0.00228 | -| std | 0.43 | -| value_loss | 4.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3772 | -| time_elapsed | 33665 | -| total_timesteps | 482816 | -| train/ | | -| approx_kl | 0.010424629 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.574 | -| explained_variance | -0.386 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 37710 | -| policy_gradient_loss | -0.00223 | -| std | 0.429 | -| value_loss | 3.92e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 14 | -| iterations | 3773 | -| time_elapsed | 33669 | -| total_timesteps | 482944 | -| train/ | | -| approx_kl | 8.324394e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.571 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 37720 | -| policy_gradient_loss | -0.00165 | -| std | 0.426 | -| value_loss | 5.26e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3774 | -| time_elapsed | 33673 | -| total_timesteps | 483072 | -| train/ | | -| approx_kl | 0.010170961 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.562 | -| explained_variance | 0.00629 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 37730 | -| policy_gradient_loss | -0.00822 | -| std | 0.423 | -| value_loss | 2.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3775 | -| time_elapsed | 33679 | -| total_timesteps | 483200 | -| train/ | | -| approx_kl | 0.021652453 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.558 | -| explained_variance | -8 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 37740 | -| policy_gradient_loss | -0.0118 | -| std | 0.422 | -| value_loss | 0.00451 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3776 | -| time_elapsed | 33683 | -| total_timesteps | 483328 | -| train/ | | -| approx_kl | 0.012932264 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -1e+03 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 37750 | -| policy_gradient_loss | -0.00565 | -| std | 0.422 | -| value_loss | 2.54e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3777 | -| time_elapsed | 33686 | -| total_timesteps | 483456 | -| train/ | | -| approx_kl | 0.00150657 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -3.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 37760 | -| policy_gradient_loss | -3.4e-05 | -| std | 0.422 | -| value_loss | 1.04e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3778 | -| time_elapsed | 33690 | -| total_timesteps | 483584 | -| train/ | | -| approx_kl | 0.00052427035 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -4.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.000704 | -| n_updates | 37770 | -| policy_gradient_loss | 0.000351 | -| std | 0.422 | -| value_loss | 3.24e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3779 | -| time_elapsed | 33693 | -| total_timesteps | 483712 | -| train/ | | -| approx_kl | 0.0018696114 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.00766 | -| n_updates | 37780 | -| policy_gradient_loss | -0.000222 | -| std | 0.422 | -| value_loss | 3.55e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3780 | -| time_elapsed | 33697 | -| total_timesteps | 483840 | -| train/ | | -| approx_kl | 0.00067662913 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -47.4 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 37790 | -| policy_gradient_loss | 0.000889 | -| std | 0.422 | -| value_loss | 3.63e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 14 | -| iterations | 3781 | -| time_elapsed | 33701 | -| total_timesteps | 483968 | -| train/ | | -| approx_kl | 0.038583428 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -4.08 | -| learning_rate | 0.0003 | -| loss | -0.00797 | -| n_updates | 37800 | -| policy_gradient_loss | -0.0086 | -| std | 0.422 | -| value_loss | 3.85e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3782 | -| time_elapsed | 33704 | -| total_timesteps | 484096 | -| train/ | | -| approx_kl | 0.00871161 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | -0.00877 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 37810 | -| policy_gradient_loss | -0.00205 | -| std | 0.422 | -| value_loss | 1.51e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3783 | -| time_elapsed | 33712 | -| total_timesteps | 484224 | -| train/ | | -| approx_kl | 0.024410151 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 37820 | -| policy_gradient_loss | -0.00265 | -| std | 0.421 | -| value_loss | 0.00432 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3784 | -| time_elapsed | 33715 | -| total_timesteps | 484352 | -| train/ | | -| approx_kl | 0.0025459218 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -1.75e+03 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 37830 | -| policy_gradient_loss | -0.00035 | -| std | 0.421 | -| value_loss | 5.59e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3785 | -| time_elapsed | 33719 | -| total_timesteps | 484480 | -| train/ | | -| approx_kl | 0.04727924 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 37840 | -| policy_gradient_loss | -0.00852 | -| std | 0.421 | -| value_loss | 1.63e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3786 | -| time_elapsed | 33722 | -| total_timesteps | 484608 | -| train/ | | -| approx_kl | 0.007512442 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.000406 | -| n_updates | 37850 | -| policy_gradient_loss | -0.000485 | -| std | 0.421 | -| value_loss | 2.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3787 | -| time_elapsed | 33725 | -| total_timesteps | 484736 | -| train/ | | -| approx_kl | 0.008206442 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -6.2 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 37860 | -| policy_gradient_loss | -0.00078 | -| std | 0.421 | -| value_loss | 2.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3788 | -| time_elapsed | 33729 | -| total_timesteps | 484864 | -| train/ | | -| approx_kl | 0.0029970545 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 37870 | -| policy_gradient_loss | -0.000454 | -| std | 0.42 | -| value_loss | 2.87e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.84 | -| time/ | | -| fps | 14 | -| iterations | 3789 | -| time_elapsed | 33733 | -| total_timesteps | 484992 | -| train/ | | -| approx_kl | 0.017941635 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 37880 | -| policy_gradient_loss | -0.00343 | -| std | 0.42 | -| value_loss | 8.71e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3790 | -| time_elapsed | 33736 | -| total_timesteps | 485120 | -| train/ | | -| approx_kl | 0.0029253445 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | -0.000215 | -| n_updates | 37890 | -| policy_gradient_loss | -0.000198 | -| std | 0.42 | -| value_loss | 4.06e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3791 | -| time_elapsed | 33746 | -| total_timesteps | 485248 | -| train/ | | -| approx_kl | 0.01552547 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | 0.914 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 37900 | -| policy_gradient_loss | -0.00145 | -| std | 0.419 | -| value_loss | 0.0014 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3792 | -| time_elapsed | 33750 | -| total_timesteps | 485376 | -| train/ | | -| approx_kl | 0.043942258 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -580 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 37910 | -| policy_gradient_loss | -0.00506 | -| std | 0.419 | -| value_loss | 1.88e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3793 | -| time_elapsed | 33754 | -| total_timesteps | 485504 | -| train/ | | -| approx_kl | 0.00032042642 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -446 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 37920 | -| policy_gradient_loss | 0.00373 | -| std | 0.418 | -| value_loss | 2.36e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3794 | -| time_elapsed | 33758 | -| total_timesteps | 485632 | -| train/ | | -| approx_kl | 0.030608246 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -77.3 | -| learning_rate | 0.0003 | -| loss | -0.000327 | -| n_updates | 37930 | -| policy_gradient_loss | -0.00248 | -| std | 0.418 | -| value_loss | 5.29e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3795 | -| time_elapsed | 33762 | -| total_timesteps | 485760 | -| train/ | | -| approx_kl | 0.0074423365 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -0.698 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 37940 | -| policy_gradient_loss | -0.00171 | -| std | 0.419 | -| value_loss | 1.14e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.74 | -| time/ | | -| fps | 14 | -| iterations | 3796 | -| time_elapsed | 33765 | -| total_timesteps | 485888 | -| train/ | | -| approx_kl | 0.0013032169 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -0.34 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 37950 | -| policy_gradient_loss | -7.69e-05 | -| std | 0.42 | -| value_loss | 3.19e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3797 | -| time_elapsed | 33770 | -| total_timesteps | 486016 | -| train/ | | -| approx_kl | 0.025319297 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | -0.00996 | -| n_updates | 37960 | -| policy_gradient_loss | -0.00914 | -| std | 0.421 | -| value_loss | 3.21e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3798 | -| time_elapsed | 33780 | -| total_timesteps | 486144 | -| train/ | | -| approx_kl | 0.0134230945 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | 0.709 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 37970 | -| policy_gradient_loss | -0.00726 | -| std | 0.421 | -| value_loss | 0.0018 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3799 | -| time_elapsed | 33784 | -| total_timesteps | 486272 | -| train/ | | -| approx_kl | 1.6600825e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -1.26e-05 | -| n_updates | 37980 | -| policy_gradient_loss | 0.00156 | -| std | 0.421 | -| value_loss | 5.44e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3800 | -| time_elapsed | 33787 | -| total_timesteps | 486400 | -| train/ | | -| approx_kl | 0.03473534 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -16.3 | -| learning_rate | 0.0003 | -| loss | -0.00867 | -| n_updates | 37990 | -| policy_gradient_loss | -0.00608 | -| std | 0.421 | -| value_loss | 2.6e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3801 | -| time_elapsed | 33790 | -| total_timesteps | 486528 | -| train/ | | -| approx_kl | 0.02262292 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 38000 | -| policy_gradient_loss | -0.015 | -| std | 0.42 | -| value_loss | 3.47e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3802 | -| time_elapsed | 33793 | -| total_timesteps | 486656 | -| train/ | | -| approx_kl | 0.016887568 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 38010 | -| policy_gradient_loss | -0.00313 | -| std | 0.421 | -| value_loss | 1.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3803 | -| time_elapsed | 33797 | -| total_timesteps | 486784 | -| train/ | | -| approx_kl | 0.009107342 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | -0.00692 | -| n_updates | 38020 | -| policy_gradient_loss | -0.00475 | -| std | 0.422 | -| value_loss | 7.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.55 | -| time/ | | -| fps | 14 | -| iterations | 3804 | -| time_elapsed | 33801 | -| total_timesteps | 486912 | -| train/ | | -| approx_kl | 0.0055405614 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.557 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.000831 | -| n_updates | 38030 | -| policy_gradient_loss | -0.000608 | -| std | 0.422 | -| value_loss | 4.08e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3805 | -| time_elapsed | 33804 | -| total_timesteps | 487040 | -| train/ | | -| approx_kl | 0.019492552 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.556 | -| explained_variance | 0.00636 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 38040 | -| policy_gradient_loss | -0.00855 | -| std | 0.422 | -| value_loss | 6.5e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3806 | -| time_elapsed | 33811 | -| total_timesteps | 487168 | -| train/ | | -| approx_kl | 0.0036148326 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.557 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 38050 | -| policy_gradient_loss | -0.00237 | -| std | 0.422 | -| value_loss | 0.00129 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3807 | -| time_elapsed | 33815 | -| total_timesteps | 487296 | -| train/ | | -| approx_kl | 0.03430599 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -0.557 | -| explained_variance | -47.9 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 38060 | -| policy_gradient_loss | -0.00219 | -| std | 0.422 | -| value_loss | 1.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3808 | -| time_elapsed | 33817 | -| total_timesteps | 487424 | -| train/ | | -| approx_kl | 0.019172404 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 38070 | -| policy_gradient_loss | -0.00413 | -| std | 0.421 | -| value_loss | 6.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3809 | -| time_elapsed | 33819 | -| total_timesteps | 487552 | -| train/ | | -| approx_kl | 0.016840128 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -1.94 | -| learning_rate | 0.0003 | -| loss | -0.00817 | -| n_updates | 38080 | -| policy_gradient_loss | -0.00459 | -| std | 0.421 | -| value_loss | 6.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3810 | -| time_elapsed | 33822 | -| total_timesteps | 487680 | -| train/ | | -| approx_kl | 0.013742844 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -0.317 | -| learning_rate | 0.0003 | -| loss | 0.000889 | -| n_updates | 38090 | -| policy_gradient_loss | -0.000941 | -| std | 0.421 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3811 | -| time_elapsed | 33825 | -| total_timesteps | 487808 | -| train/ | | -| approx_kl | 0.010740253 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 38100 | -| policy_gradient_loss | -0.00248 | -| std | 0.421 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3812 | -| time_elapsed | 33828 | -| total_timesteps | 487936 | -| train/ | | -| approx_kl | 0.020325037 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 38110 | -| policy_gradient_loss | -0.00415 | -| std | 0.421 | -| value_loss | 1.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3813 | -| time_elapsed | 33832 | -| total_timesteps | 488064 | -| train/ | | -| approx_kl | 0.016758071 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | 0.00515 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 38120 | -| policy_gradient_loss | -0.00833 | -| std | 0.421 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3814 | -| time_elapsed | 33837 | -| total_timesteps | 488192 | -| train/ | | -| approx_kl | 0.015574476 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -15.7 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 38130 | -| policy_gradient_loss | -0.00726 | -| std | 0.421 | -| value_loss | 0.0073 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3815 | -| time_elapsed | 33840 | -| total_timesteps | 488320 | -| train/ | | -| approx_kl | 0.021406882 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -238 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 38140 | -| policy_gradient_loss | -0.00181 | -| std | 0.421 | -| value_loss | 1.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3816 | -| time_elapsed | 33843 | -| total_timesteps | 488448 | -| train/ | | -| approx_kl | 0.017923664 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -234 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 38150 | -| policy_gradient_loss | -0.00989 | -| std | 0.42 | -| value_loss | 3.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3817 | -| time_elapsed | 33846 | -| total_timesteps | 488576 | -| train/ | | -| approx_kl | 0.0027235385 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -0.469 | -| learning_rate | 0.0003 | -| loss | 0.000442 | -| n_updates | 38160 | -| policy_gradient_loss | 0.000325 | -| std | 0.42 | -| value_loss | 1.26e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3818 | -| time_elapsed | 33850 | -| total_timesteps | 488704 | -| train/ | | -| approx_kl | 0.01251701 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -0.883 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 38170 | -| policy_gradient_loss | -0.00194 | -| std | 0.42 | -| value_loss | 7.83e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3819 | -| time_elapsed | 33854 | -| total_timesteps | 488832 | -| train/ | | -| approx_kl | 0.010265726 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 38180 | -| policy_gradient_loss | -0.00674 | -| std | 0.42 | -| value_loss | 3.56e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3820 | -| time_elapsed | 33857 | -| total_timesteps | 488960 | -| train/ | | -| approx_kl | 3.256905e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.000939 | -| n_updates | 38190 | -| policy_gradient_loss | 0.00344 | -| std | 0.421 | -| value_loss | 5.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3821 | -| time_elapsed | 33861 | -| total_timesteps | 489088 | -| train/ | | -| approx_kl | 0.022260875 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.0824 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 38200 | -| policy_gradient_loss | -0.00432 | -| std | 0.421 | -| value_loss | 3.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3822 | -| time_elapsed | 33868 | -| total_timesteps | 489216 | -| train/ | | -| approx_kl | 0.016475854 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.00566 | -| n_updates | 38210 | -| policy_gradient_loss | -0.00258 | -| std | 0.42 | -| value_loss | 0.000226 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3823 | -| time_elapsed | 33872 | -| total_timesteps | 489344 | -| train/ | | -| approx_kl | 0.03684784 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -687 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 38220 | -| policy_gradient_loss | -0.0128 | -| std | 0.42 | -| value_loss | 2.37e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3824 | -| time_elapsed | 33875 | -| total_timesteps | 489472 | -| train/ | | -| approx_kl | 0.01467257 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -459 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 38230 | -| policy_gradient_loss | -0.00285 | -| std | 0.42 | -| value_loss | 6.63e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3825 | -| time_elapsed | 33877 | -| total_timesteps | 489600 | -| train/ | | -| approx_kl | 2.2649765e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | 0.000216 | -| n_updates | 38240 | -| policy_gradient_loss | 0.00498 | -| std | 0.42 | -| value_loss | 2.12e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3826 | -| time_elapsed | 33881 | -| total_timesteps | 489728 | -| train/ | | -| approx_kl | 0.001608084 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -584 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 38250 | -| policy_gradient_loss | -1.91e-05 | -| std | 0.42 | -| value_loss | 3.06e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3827 | -| time_elapsed | 33885 | -| total_timesteps | 489856 | -| train/ | | -| approx_kl | 0.00069603254 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -58.5 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 38260 | -| policy_gradient_loss | 0.00062 | -| std | 0.42 | -| value_loss | 1.31e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3828 | -| time_elapsed | 33888 | -| total_timesteps | 489984 | -| train/ | | -| approx_kl | 0.00076283375 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -3.17 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 38270 | -| policy_gradient_loss | 0.00019 | -| std | 0.42 | -| value_loss | 4.98e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3829 | -| time_elapsed | 33891 | -| total_timesteps | 490112 | -| train/ | | -| approx_kl | 0.024657167 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -6.78 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 38280 | -| policy_gradient_loss | -0.0131 | -| std | 0.421 | -| value_loss | 5.06e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3830 | -| time_elapsed | 33897 | -| total_timesteps | 490240 | -| train/ | | -| approx_kl | 0.014357975 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.00711 | -| n_updates | 38290 | -| policy_gradient_loss | -0.00324 | -| std | 0.421 | -| value_loss | 0.00101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3831 | -| time_elapsed | 33900 | -| total_timesteps | 490368 | -| train/ | | -| approx_kl | 0.043751936 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -6.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.00828 | -| n_updates | 38300 | -| policy_gradient_loss | -0.006 | -| std | 0.421 | -| value_loss | 8.01e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3832 | -| time_elapsed | 33902 | -| total_timesteps | 490496 | -| train/ | | -| approx_kl | 0.00040220772 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -1.79e+03 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 38310 | -| policy_gradient_loss | 0.00104 | -| std | 0.421 | -| value_loss | 1.22e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3833 | -| time_elapsed | 33905 | -| total_timesteps | 490624 | -| train/ | | -| approx_kl | 0.03303023 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -359 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 38320 | -| policy_gradient_loss | -0.00624 | -| std | 0.421 | -| value_loss | 1.59e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3834 | -| time_elapsed | 33909 | -| total_timesteps | 490752 | -| train/ | | -| approx_kl | 0.008024331 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -51.5 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 38330 | -| policy_gradient_loss | -0.000821 | -| std | 0.419 | -| value_loss | 4.69e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.54 | -| time/ | | -| fps | 14 | -| iterations | 3835 | -| time_elapsed | 33912 | -| total_timesteps | 490880 | -| train/ | | -| approx_kl | 0.005721679 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -24.4 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 38340 | -| policy_gradient_loss | -0.00141 | -| std | 0.419 | -| value_loss | 4e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3836 | -| time_elapsed | 33915 | -| total_timesteps | 491008 | -| train/ | | -| approx_kl | 0.00022251019 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -0.741 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 38350 | -| policy_gradient_loss | 0.000981 | -| std | 0.419 | -| value_loss | 2.7e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3837 | -| time_elapsed | 33924 | -| total_timesteps | 491136 | -| train/ | | -| approx_kl | 0.044421505 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 38360 | -| policy_gradient_loss | -0.00823 | -| std | 0.419 | -| value_loss | 0.000846 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3838 | -| time_elapsed | 33927 | -| total_timesteps | 491264 | -| train/ | | -| approx_kl | 0.0052774283 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -958 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 38370 | -| policy_gradient_loss | -0.00404 | -| std | 0.419 | -| value_loss | 9.38e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3839 | -| time_elapsed | 33931 | -| total_timesteps | 491392 | -| train/ | | -| approx_kl | 0.055131257 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -390 | -| learning_rate | 0.0003 | -| loss | -0.00971 | -| n_updates | 38380 | -| policy_gradient_loss | -0.00629 | -| std | 0.419 | -| value_loss | 2.04e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3840 | -| time_elapsed | 33934 | -| total_timesteps | 491520 | -| train/ | | -| approx_kl | 0.00073500234 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -3.37 | -| learning_rate | 0.0003 | -| loss | 0.000651 | -| n_updates | 38390 | -| policy_gradient_loss | 0.000819 | -| std | 0.418 | -| value_loss | 3.2e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3841 | -| time_elapsed | 33937 | -| total_timesteps | 491648 | -| train/ | | -| approx_kl | 0.0055625457 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.546 | -| explained_variance | -8.98 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 38400 | -| policy_gradient_loss | -0.00384 | -| std | 0.417 | -| value_loss | 6.72e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3842 | -| time_elapsed | 33940 | -| total_timesteps | 491776 | -| train/ | | -| approx_kl | 0.0038599544 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | -3.71e-05 | -| n_updates | 38410 | -| policy_gradient_loss | 1.55e-05 | -| std | 0.417 | -| value_loss | 7.74e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.53 | -| time/ | | -| fps | 14 | -| iterations | 3843 | -| time_elapsed | 33943 | -| total_timesteps | 491904 | -| train/ | | -| approx_kl | 0.026023231 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.546 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 38420 | -| policy_gradient_loss | -0.00896 | -| std | 0.418 | -| value_loss | 7.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3844 | -| time_elapsed | 33947 | -| total_timesteps | 492032 | -| train/ | | -| approx_kl | 0.005224454 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.547 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 38430 | -| policy_gradient_loss | -0.003 | -| std | 0.419 | -| value_loss | 9.63e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3845 | -| time_elapsed | 33955 | -| total_timesteps | 492160 | -| train/ | | -| approx_kl | 0.0020397955 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.000362 | -| n_updates | 38440 | -| policy_gradient_loss | 0.00024 | -| std | 0.419 | -| value_loss | 4.05e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3846 | -| time_elapsed | 33959 | -| total_timesteps | 492288 | -| train/ | | -| approx_kl | 0.010718925 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -3.26e+03 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 38450 | -| policy_gradient_loss | -0.00103 | -| std | 0.418 | -| value_loss | 7.62e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3847 | -| time_elapsed | 33963 | -| total_timesteps | 492416 | -| train/ | | -| approx_kl | 0.0038600957 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.546 | -| explained_variance | -1.6e+03 | -| learning_rate | 0.0003 | -| loss | -0.000177 | -| n_updates | 38460 | -| policy_gradient_loss | -0.000134 | -| std | 0.417 | -| value_loss | 6.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3848 | -| time_elapsed | 33966 | -| total_timesteps | 492544 | -| train/ | | -| approx_kl | 0.012917285 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | -1.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 38470 | -| policy_gradient_loss | -0.00636 | -| std | 0.416 | -| value_loss | 5.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3849 | -| time_elapsed | 33970 | -| total_timesteps | 492672 | -| train/ | | -| approx_kl | 0.031911764 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -70.7 | -| learning_rate | 0.0003 | -| loss | -0.00569 | -| n_updates | 38480 | -| policy_gradient_loss | -0.00365 | -| std | 0.416 | -| value_loss | 5.62e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3850 | -| time_elapsed | 33973 | -| total_timesteps | 492800 | -| train/ | | -| approx_kl | 0.017865803 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -0.398 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 38490 | -| policy_gradient_loss | -0.00477 | -| std | 0.416 | -| value_loss | 5.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 14 | -| iterations | 3851 | -| time_elapsed | 33977 | -| total_timesteps | 492928 | -| train/ | | -| approx_kl | 0.013274625 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 38500 | -| policy_gradient_loss | -0.00765 | -| std | 0.416 | -| value_loss | 7.15e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3852 | -| time_elapsed | 33981 | -| total_timesteps | 493056 | -| train/ | | -| approx_kl | 0.018339813 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 38510 | -| policy_gradient_loss | -0.00538 | -| std | 0.416 | -| value_loss | 9.06e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3853 | -| time_elapsed | 33988 | -| total_timesteps | 493184 | -| train/ | | -| approx_kl | 0.01823076 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 38520 | -| policy_gradient_loss | -0.0046 | -| std | 0.415 | -| value_loss | 0.000508 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3854 | -| time_elapsed | 33992 | -| total_timesteps | 493312 | -| train/ | | -| approx_kl | 0.030375285 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.54 | -| explained_variance | -1.63e+03 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 38530 | -| policy_gradient_loss | -0.00139 | -| std | 0.415 | -| value_loss | 2.69e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3855 | -| time_elapsed | 33997 | -| total_timesteps | 493440 | -| train/ | | -| approx_kl | 0.0058099665 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.54 | -| explained_variance | -8.17e+03 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 38540 | -| policy_gradient_loss | -0.00528 | -| std | 0.415 | -| value_loss | 3.36e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3856 | -| time_elapsed | 34001 | -| total_timesteps | 493568 | -| train/ | | -| approx_kl | 0.047092393 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | -0.539 | -| explained_variance | -288 | -| learning_rate | 0.0003 | -| loss | -0.00765 | -| n_updates | 38550 | -| policy_gradient_loss | -0.00705 | -| std | 0.415 | -| value_loss | 7e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3857 | -| time_elapsed | 34004 | -| total_timesteps | 493696 | -| train/ | | -| approx_kl | 0.0064270645 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.538 | -| explained_variance | -655 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 38560 | -| policy_gradient_loss | -0.00189 | -| std | 0.414 | -| value_loss | 1.23e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3858 | -| time_elapsed | 34007 | -| total_timesteps | 493824 | -| train/ | | -| approx_kl | 0.0001783329 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.537 | -| explained_variance | -3.28 | -| learning_rate | 0.0003 | -| loss | -0.00487 | -| n_updates | 38570 | -| policy_gradient_loss | 0.00531 | -| std | 0.414 | -| value_loss | 1.73e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 14 | -| iterations | 3859 | -| time_elapsed | 34011 | -| total_timesteps | 493952 | -| train/ | | -| approx_kl | 0.00150015 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.536 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 38580 | -| policy_gradient_loss | 0.000367 | -| std | 0.414 | -| value_loss | 2.87e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3860 | -| time_elapsed | 34015 | -| total_timesteps | 494080 | -| train/ | | -| approx_kl | 0.00313965 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.534 | -| explained_variance | -0.626 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 38590 | -| policy_gradient_loss | 0.000388 | -| std | 0.412 | -| value_loss | 2.58e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3861 | -| time_elapsed | 34021 | -| total_timesteps | 494208 | -| train/ | | -| approx_kl | 0.038784146 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | -0.531 | -| explained_variance | 0.0272 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 38600 | -| policy_gradient_loss | -0.00808 | -| std | 0.411 | -| value_loss | 0.00255 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3862 | -| time_elapsed | 34024 | -| total_timesteps | 494336 | -| train/ | | -| approx_kl | 0.015935838 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.529 | -| explained_variance | -1.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.000865 | -| n_updates | 38610 | -| policy_gradient_loss | -0.00114 | -| std | 0.41 | -| value_loss | 1.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3863 | -| time_elapsed | 34028 | -| total_timesteps | 494464 | -| train/ | | -| approx_kl | 0.008719009 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.528 | -| explained_variance | -795 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 38620 | -| policy_gradient_loss | -0.00923 | -| std | 0.41 | -| value_loss | 2.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3864 | -| time_elapsed | 34030 | -| total_timesteps | 494592 | -| train/ | | -| approx_kl | 0.020477436 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.528 | -| explained_variance | -9.02 | -| learning_rate | 0.0003 | -| loss | -0.0072 | -| n_updates | 38630 | -| policy_gradient_loss | -0.00407 | -| std | 0.411 | -| value_loss | 6.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3865 | -| time_elapsed | 34034 | -| total_timesteps | 494720 | -| train/ | | -| approx_kl | 0.000805249 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.53 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 38640 | -| policy_gradient_loss | -8.27e-05 | -| std | 0.412 | -| value_loss | 5.99e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3866 | -| time_elapsed | 34038 | -| total_timesteps | 494848 | -| train/ | | -| approx_kl | 0.0015561823 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.534 | -| explained_variance | -0.648 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 38650 | -| policy_gradient_loss | -8.69e-05 | -| std | 0.414 | -| value_loss | 4.61e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 14 | -| iterations | 3867 | -| time_elapsed | 34041 | -| total_timesteps | 494976 | -| train/ | | -| approx_kl | 0.0007260903 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.537 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 38660 | -| policy_gradient_loss | 0.000742 | -| std | 0.414 | -| value_loss | 7.32e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3868 | -| time_elapsed | 34045 | -| total_timesteps | 495104 | -| train/ | | -| approx_kl | 0.01712453 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.538 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | 0.00071 | -| n_updates | 38670 | -| policy_gradient_loss | -0.00197 | -| std | 0.414 | -| value_loss | 1.76e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3869 | -| time_elapsed | 34055 | -| total_timesteps | 495232 | -| train/ | | -| approx_kl | 0.0282958 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.538 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 38680 | -| policy_gradient_loss | -0.00246 | -| std | 0.415 | -| value_loss | 0.00178 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3870 | -| time_elapsed | 34059 | -| total_timesteps | 495360 | -| train/ | | -| approx_kl | 0.049955204 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | -0.539 | -| explained_variance | -3.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 38690 | -| policy_gradient_loss | -0.011 | -| std | 0.415 | -| value_loss | 1.86e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3871 | -| time_elapsed | 34062 | -| total_timesteps | 495488 | -| train/ | | -| approx_kl | 0.010439312 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.54 | -| explained_variance | -2.64e+03 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 38700 | -| policy_gradient_loss | -0.00574 | -| std | 0.415 | -| value_loss | 4.3e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3872 | -| time_elapsed | 34066 | -| total_timesteps | 495616 | -| train/ | | -| approx_kl | 0.0013603489 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | -55.7 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 38710 | -| policy_gradient_loss | 0.000394 | -| std | 0.416 | -| value_loss | 9.18e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3873 | -| time_elapsed | 34069 | -| total_timesteps | 495744 | -| train/ | | -| approx_kl | 0.00080251996 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | -0.763 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 38720 | -| policy_gradient_loss | 0.000452 | -| std | 0.415 | -| value_loss | 1.68e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 14 | -| iterations | 3874 | -| time_elapsed | 34073 | -| total_timesteps | 495872 | -| train/ | | -| approx_kl | 0.00095372135 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.54 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00442 | -| n_updates | 38730 | -| policy_gradient_loss | 0.00063 | -| std | 0.415 | -| value_loss | 1.69e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3875 | -| time_elapsed | 34077 | -| total_timesteps | 496000 | -| train/ | | -| approx_kl | 0.021518067 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.54 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 38740 | -| policy_gradient_loss | -0.00533 | -| std | 0.415 | -| value_loss | 6.73e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3876 | -| time_elapsed | 34080 | -| total_timesteps | 496128 | -| train/ | | -| approx_kl | 5.14742e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.54 | -| explained_variance | 0.00389 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 38750 | -| policy_gradient_loss | -3.66e-05 | -| std | 0.415 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3877 | -| time_elapsed | 34088 | -| total_timesteps | 496256 | -| train/ | | -| approx_kl | 0.014733456 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.538 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 38760 | -| policy_gradient_loss | -0.00937 | -| std | 0.414 | -| value_loss | 0.000962 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3878 | -| time_elapsed | 34092 | -| total_timesteps | 496384 | -| train/ | | -| approx_kl | 0.028641118 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.538 | -| explained_variance | -98.1 | -| learning_rate | 0.0003 | -| loss | -0.00513 | -| n_updates | 38770 | -| policy_gradient_loss | -0.00271 | -| std | 0.415 | -| value_loss | 2.14e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3879 | -| time_elapsed | 34095 | -| total_timesteps | 496512 | -| train/ | | -| approx_kl | 0.00025525037 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | -196 | -| learning_rate | 0.0003 | -| loss | -0.000978 | -| n_updates | 38780 | -| policy_gradient_loss | 0.00038 | -| std | 0.416 | -| value_loss | 9.91e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3880 | -| time_elapsed | 34098 | -| total_timesteps | 496640 | -| train/ | | -| approx_kl | 0.025768923 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.544 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 38790 | -| policy_gradient_loss | -0.004 | -| std | 0.417 | -| value_loss | 9.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3881 | -| time_elapsed | 34102 | -| total_timesteps | 496768 | -| train/ | | -| approx_kl | 0.016233038 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.544 | -| explained_variance | -4.15 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 38800 | -| policy_gradient_loss | -0.00486 | -| std | 0.417 | -| value_loss | 2.5e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3882 | -| time_elapsed | 34105 | -| total_timesteps | 496896 | -| train/ | | -| approx_kl | 0.0011129312 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 38810 | -| policy_gradient_loss | 0.000163 | -| std | 0.417 | -| value_loss | 2.51e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3883 | -| time_elapsed | 34108 | -| total_timesteps | 497024 | -| train/ | | -| approx_kl | 0.0010039429 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.000884 | -| n_updates | 38820 | -| policy_gradient_loss | 3.49e-05 | -| std | 0.419 | -| value_loss | 2.27e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3884 | -| time_elapsed | 34117 | -| total_timesteps | 497152 | -| train/ | | -| approx_kl | 0.013382258 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 38830 | -| policy_gradient_loss | -0.00831 | -| std | 0.421 | -| value_loss | 5.39e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3885 | -| time_elapsed | 34121 | -| total_timesteps | 497280 | -| train/ | | -| approx_kl | 4.2256434e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -14.7 | -| learning_rate | 0.0003 | -| loss | -1.88e-05 | -| n_updates | 38840 | -| policy_gradient_loss | 0.00134 | -| std | 0.422 | -| value_loss | 1.78e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3886 | -| time_elapsed | 34124 | -| total_timesteps | 497408 | -| train/ | | -| approx_kl | 0.04078366 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -28 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 38850 | -| policy_gradient_loss | -0.00573 | -| std | 0.421 | -| value_loss | 9.8e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3887 | -| time_elapsed | 34127 | -| total_timesteps | 497536 | -| train/ | | -| approx_kl | 0.002626477 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -2.04 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 38860 | -| policy_gradient_loss | -0.000816 | -| std | 0.421 | -| value_loss | 2.99e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3888 | -| time_elapsed | 34130 | -| total_timesteps | 497664 | -| train/ | | -| approx_kl | 0.000508829 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.439 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 38870 | -| policy_gradient_loss | 0.000424 | -| std | 0.421 | -| value_loss | 1.74e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3889 | -| time_elapsed | 34134 | -| total_timesteps | 497792 | -| train/ | | -| approx_kl | 0.0011288864 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.553 | -| explained_variance | -0.0885 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 38880 | -| policy_gradient_loss | 0.000287 | -| std | 0.421 | -| value_loss | 8.53e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 14 | -| iterations | 3890 | -| time_elapsed | 34138 | -| total_timesteps | 497920 | -| train/ | | -| approx_kl | 0.017770708 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -0.00288 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 38890 | -| policy_gradient_loss | -0.00513 | -| std | 0.42 | -| value_loss | 1.36e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3891 | -| time_elapsed | 34141 | -| total_timesteps | 498048 | -| train/ | | -| approx_kl | 0.009827136 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 38900 | -| policy_gradient_loss | -0.0052 | -| std | 0.42 | -| value_loss | 3.08e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3892 | -| time_elapsed | 34147 | -| total_timesteps | 498176 | -| train/ | | -| approx_kl | 0.0005639894 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | 0.826 | -| learning_rate | 0.0003 | -| loss | 0.000915 | -| n_updates | 38910 | -| policy_gradient_loss | 0.000121 | -| std | 0.419 | -| value_loss | 0.00223 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3893 | -| time_elapsed | 34151 | -| total_timesteps | 498304 | -| train/ | | -| approx_kl | 0.009724213 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | -1.77e+03 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 38920 | -| policy_gradient_loss | -0.00124 | -| std | 0.419 | -| value_loss | 3.35e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3894 | -| time_elapsed | 34154 | -| total_timesteps | 498432 | -| train/ | | -| approx_kl | 6.8759546e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | -4e+03 | -| learning_rate | 0.0003 | -| loss | 6.99e-05 | -| n_updates | 38930 | -| policy_gradient_loss | 0.00057 | -| std | 0.42 | -| value_loss | 7.83e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3895 | -| time_elapsed | 34158 | -| total_timesteps | 498560 | -| train/ | | -| approx_kl | 0.003729649 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -62.1 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 38940 | -| policy_gradient_loss | -0.000775 | -| std | 0.42 | -| value_loss | 5.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3896 | -| time_elapsed | 34161 | -| total_timesteps | 498688 | -| train/ | | -| approx_kl | 0.02049166 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -4.04 | -| learning_rate | 0.0003 | -| loss | -0.000591 | -| n_updates | 38950 | -| policy_gradient_loss | -0.00168 | -| std | 0.419 | -| value_loss | 9.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3897 | -| time_elapsed | 34165 | -| total_timesteps | 498816 | -| train/ | | -| approx_kl | 0.013251786 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -0.784 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 38960 | -| policy_gradient_loss | -0.0022 | -| std | 0.419 | -| value_loss | 1.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3898 | -| time_elapsed | 34168 | -| total_timesteps | 498944 | -| train/ | | -| approx_kl | 0.007927927 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 38970 | -| policy_gradient_loss | -0.00147 | -| std | 0.419 | -| value_loss | 8.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3899 | -| time_elapsed | 34171 | -| total_timesteps | 499072 | -| train/ | | -| approx_kl | 0.008184403 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 38980 | -| policy_gradient_loss | -0.00246 | -| std | 0.418 | -| value_loss | 6.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3900 | -| time_elapsed | 34176 | -| total_timesteps | 499200 | -| train/ | | -| approx_kl | 0.018778643 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.547 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -0.000684 | -| n_updates | 38990 | -| policy_gradient_loss | -0.0011 | -| std | 0.418 | -| value_loss | 0.00267 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3901 | -| time_elapsed | 34179 | -| total_timesteps | 499328 | -| train/ | | -| approx_kl | 0.021615269 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.547 | -| explained_variance | -4.01e+03 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 39000 | -| policy_gradient_loss | -0.00207 | -| std | 0.418 | -| value_loss | 3.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3902 | -| time_elapsed | 34182 | -| total_timesteps | 499456 | -| train/ | | -| approx_kl | 0.008796257 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -8.7e+03 | -| learning_rate | 0.0003 | -| loss | -0.000846 | -| n_updates | 39010 | -| policy_gradient_loss | -0.000666 | -| std | 0.417 | -| value_loss | 3.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3903 | -| time_elapsed | 34186 | -| total_timesteps | 499584 | -| train/ | | -| approx_kl | 0.030884782 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | -719 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 39020 | -| policy_gradient_loss | -0.0097 | -| std | 0.416 | -| value_loss | 2.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3904 | -| time_elapsed | 34189 | -| total_timesteps | 499712 | -| train/ | | -| approx_kl | 0.039181843 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -574 | -| learning_rate | 0.0003 | -| loss | -0.00683 | -| n_updates | 39030 | -| policy_gradient_loss | -0.00577 | -| std | 0.416 | -| value_loss | 4.91e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3905 | -| time_elapsed | 34191 | -| total_timesteps | 499840 | -| train/ | | -| approx_kl | 0.0049887225 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -7.67 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 39040 | -| policy_gradient_loss | -0.00107 | -| std | 0.416 | -| value_loss | 4.87e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 14 | -| iterations | 3906 | -| time_elapsed | 34194 | -| total_timesteps | 499968 | -| train/ | | -| approx_kl | 0.00024581165 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | -5.5 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 39050 | -| policy_gradient_loss | 0.00136 | -| std | 0.416 | -| value_loss | 7.2e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3907 | -| time_elapsed | 34197 | -| total_timesteps | 500096 | -| train/ | | -| approx_kl | 0.0013058286 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | -0.746 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 39060 | -| policy_gradient_loss | 0.000537 | -| std | 0.416 | -| value_loss | 3.81e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3908 | -| time_elapsed | 34205 | -| total_timesteps | 500224 | -| train/ | | -| approx_kl | 0.021708708 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 39070 | -| policy_gradient_loss | -0.0017 | -| std | 0.416 | -| value_loss | 1.58e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3909 | -| time_elapsed | 34209 | -| total_timesteps | 500352 | -| train/ | | -| approx_kl | 0.046769053 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.541 | -| explained_variance | -312 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 39080 | -| policy_gradient_loss | -0.00547 | -| std | 0.416 | -| value_loss | 2.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3910 | -| time_elapsed | 34212 | -| total_timesteps | 500480 | -| train/ | | -| approx_kl | 0.007825814 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -207 | -| learning_rate | 0.0003 | -| loss | 0.00162 | -| n_updates | 39090 | -| policy_gradient_loss | 0.00132 | -| std | 0.416 | -| value_loss | 8.87e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3911 | -| time_elapsed | 34216 | -| total_timesteps | 500608 | -| train/ | | -| approx_kl | 0.0067159114 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.544 | -| explained_variance | -11.6 | -| learning_rate | 0.0003 | -| loss | -0.00797 | -| n_updates | 39100 | -| policy_gradient_loss | -0.00263 | -| std | 0.417 | -| value_loss | 4.25e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3912 | -| time_elapsed | 34219 | -| total_timesteps | 500736 | -| train/ | | -| approx_kl | 0.006995789 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -0.702 | -| learning_rate | 0.0003 | -| loss | 0.000555 | -| n_updates | 39110 | -| policy_gradient_loss | 0.000368 | -| std | 0.418 | -| value_loss | 1.74e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3913 | -| time_elapsed | 34223 | -| total_timesteps | 500864 | -| train/ | | -| approx_kl | 0.0135126375 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.546 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 39120 | -| policy_gradient_loss | -0.00256 | -| std | 0.417 | -| value_loss | 1.86e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 14 | -| iterations | 3914 | -| time_elapsed | 34228 | -| total_timesteps | 500992 | -| train/ | | -| approx_kl | 0.012140928 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | 0.00553 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 39130 | -| policy_gradient_loss | -0.00332 | -| std | 0.417 | -| value_loss | 9.65e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3915 | -| time_elapsed | 34232 | -| total_timesteps | 501120 | -| train/ | | -| approx_kl | 0.01002751 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -0.00569 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 39140 | -| policy_gradient_loss | -0.00508 | -| std | 0.418 | -| value_loss | 1.09e-10 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3916 | -| time_elapsed | 34241 | -| total_timesteps | 501248 | -| train/ | | -| approx_kl | 0.00051975716 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.546 | -| explained_variance | -7.07 | -| learning_rate | 0.0003 | -| loss | 0.00116 | -| n_updates | 39150 | -| policy_gradient_loss | 0.000584 | -| std | 0.418 | -| value_loss | 0.00197 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3917 | -| time_elapsed | 34245 | -| total_timesteps | 501376 | -| train/ | | -| approx_kl | 0.025611375 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -3.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 39160 | -| policy_gradient_loss | -0.0054 | -| std | 0.419 | -| value_loss | 1.22e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3918 | -| time_elapsed | 34249 | -| total_timesteps | 501504 | -| train/ | | -| approx_kl | 0.0005013107 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -1.22e+03 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 39170 | -| policy_gradient_loss | 0.00408 | -| std | 0.419 | -| value_loss | 3.52e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3919 | -| time_elapsed | 34253 | -| total_timesteps | 501632 | -| train/ | | -| approx_kl | 0.030796908 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -16.3 | -| learning_rate | 0.0003 | -| loss | -0.00586 | -| n_updates | 39180 | -| policy_gradient_loss | -0.00632 | -| std | 0.419 | -| value_loss | 1.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3920 | -| time_elapsed | 34256 | -| total_timesteps | 501760 | -| train/ | | -| approx_kl | 0.009679547 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | -0.522 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 39190 | -| policy_gradient_loss | -0.00309 | -| std | 0.42 | -| value_loss | 2.02e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3921 | -| time_elapsed | 34259 | -| total_timesteps | 501888 | -| train/ | | -| approx_kl | 0.01923704 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 39200 | -| policy_gradient_loss | -0.00452 | -| std | 0.42 | -| value_loss | 2.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3922 | -| time_elapsed | 34263 | -| total_timesteps | 502016 | -| train/ | | -| approx_kl | 0.011387383 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.551 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 39210 | -| policy_gradient_loss | -0.00298 | -| std | 0.42 | -| value_loss | 2.27e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3923 | -| time_elapsed | 34272 | -| total_timesteps | 502144 | -| train/ | | -| approx_kl | 0.0001813306 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | 0.000558 | -| n_updates | 39220 | -| policy_gradient_loss | 1.24e-06 | -| std | 0.419 | -| value_loss | 0.00138 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3924 | -| time_elapsed | 34276 | -| total_timesteps | 502272 | -| train/ | | -| approx_kl | 0.01313713 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -943 | -| learning_rate | 0.0003 | -| loss | -0.00956 | -| n_updates | 39230 | -| policy_gradient_loss | -0.00395 | -| std | 0.419 | -| value_loss | 1.22e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3925 | -| time_elapsed | 34280 | -| total_timesteps | 502400 | -| train/ | | -| approx_kl | 0.038665377 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -391 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 39240 | -| policy_gradient_loss | -0.0115 | -| std | 0.419 | -| value_loss | 4.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3926 | -| time_elapsed | 34283 | -| total_timesteps | 502528 | -| train/ | | -| approx_kl | 0.012193823 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -43.3 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 39250 | -| policy_gradient_loss | -0.00452 | -| std | 0.419 | -| value_loss | 4.06e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3927 | -| time_elapsed | 34286 | -| total_timesteps | 502656 | -| train/ | | -| approx_kl | 3.7252903e-08 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -0.787 | -| learning_rate | 0.0003 | -| loss | -2.14e-05 | -| n_updates | 39260 | -| policy_gradient_loss | 0.00274 | -| std | 0.419 | -| value_loss | 1.48e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3928 | -| time_elapsed | 34288 | -| total_timesteps | 502784 | -| train/ | | -| approx_kl | 0.0017864967 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | -0.0079 | -| learning_rate | 0.0003 | -| loss | -0.00781 | -| n_updates | 39270 | -| policy_gradient_loss | -0.000153 | -| std | 0.419 | -| value_loss | 7.69e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 14 | -| iterations | 3929 | -| time_elapsed | 34292 | -| total_timesteps | 502912 | -| train/ | | -| approx_kl | 0.01605793 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 39280 | -| policy_gradient_loss | -0.00084 | -| std | 0.419 | -| value_loss | 4.81e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3930 | -| time_elapsed | 34296 | -| total_timesteps | 503040 | -| train/ | | -| approx_kl | 0.0105085755 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 39290 | -| policy_gradient_loss | -0.00833 | -| std | 0.419 | -| value_loss | 1.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3931 | -| time_elapsed | 34304 | -| total_timesteps | 503168 | -| train/ | | -| approx_kl | 0.039073452 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | -0.548 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 39300 | -| policy_gradient_loss | -0.0115 | -| std | 0.419 | -| value_loss | 0.000474 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3932 | -| time_elapsed | 34307 | -| total_timesteps | 503296 | -| train/ | | -| approx_kl | 0.019941345 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -402 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 39310 | -| policy_gradient_loss | -0.00374 | -| std | 0.419 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3933 | -| time_elapsed | 34311 | -| total_timesteps | 503424 | -| train/ | | -| approx_kl | 3.769202e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | -1.48e+03 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 39320 | -| policy_gradient_loss | 0.00127 | -| std | 0.419 | -| value_loss | 6.02e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3934 | -| time_elapsed | 34314 | -| total_timesteps | 503552 | -| train/ | | -| approx_kl | 0.0008650073 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | -106 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 39330 | -| policy_gradient_loss | 7.97e-05 | -| std | 0.42 | -| value_loss | 2.87e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3935 | -| time_elapsed | 34315 | -| total_timesteps | 503680 | -| train/ | | -| approx_kl | 0.0012005984 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.552 | -| explained_variance | -43.1 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 39340 | -| policy_gradient_loss | 0.000328 | -| std | 0.421 | -| value_loss | 3.05e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3936 | -| time_elapsed | 34317 | -| total_timesteps | 503808 | -| train/ | | -| approx_kl | 0.000660412 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -3.72 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 39350 | -| policy_gradient_loss | 0.000375 | -| std | 0.421 | -| value_loss | 3.74e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 14 | -| iterations | 3937 | -| time_elapsed | 34319 | -| total_timesteps | 503936 | -| train/ | | -| approx_kl | 0.01848545 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -0.0762 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 39360 | -| policy_gradient_loss | -0.00805 | -| std | 0.422 | -| value_loss | 3.86e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3938 | -| time_elapsed | 34322 | -| total_timesteps | 504064 | -| train/ | | -| approx_kl | 0.009922208 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.557 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 39370 | -| policy_gradient_loss | -0.00242 | -| std | 0.423 | -| value_loss | 1.51e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3939 | -| time_elapsed | 34327 | -| total_timesteps | 504192 | -| train/ | | -| approx_kl | 0.016377416 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.558 | -| explained_variance | 0.657 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 39380 | -| policy_gradient_loss | -0.00771 | -| std | 0.423 | -| value_loss | 0.000549 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3940 | -| time_elapsed | 34329 | -| total_timesteps | 504320 | -| train/ | | -| approx_kl | 0.015478343 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.557 | -| explained_variance | -258 | -| learning_rate | 0.0003 | -| loss | -0.000394 | -| n_updates | 39390 | -| policy_gradient_loss | -0.000627 | -| std | 0.422 | -| value_loss | 6.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3941 | -| time_elapsed | 34331 | -| total_timesteps | 504448 | -| train/ | | -| approx_kl | 0.01140147 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -482 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 39400 | -| policy_gradient_loss | -0.00786 | -| std | 0.421 | -| value_loss | 2.53e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3942 | -| time_elapsed | 34334 | -| total_timesteps | 504576 | -| train/ | | -| approx_kl | 0.02556135 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -3.95 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 39410 | -| policy_gradient_loss | -0.0115 | -| std | 0.421 | -| value_loss | 9.9e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3943 | -| time_elapsed | 34338 | -| total_timesteps | 504704 | -| train/ | | -| approx_kl | 0.011481421 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.555 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 39420 | -| policy_gradient_loss | -0.00575 | -| std | 0.421 | -| value_loss | 2.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3944 | -| time_elapsed | 34341 | -| total_timesteps | 504832 | -| train/ | | -| approx_kl | 0.011974037 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | 0.00068 | -| n_updates | 39430 | -| policy_gradient_loss | -0.00069 | -| std | 0.421 | -| value_loss | 1.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 14 | -| iterations | 3945 | -| time_elapsed | 34345 | -| total_timesteps | 504960 | -| train/ | | -| approx_kl | 0.008973875 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00803 | -| n_updates | 39440 | -| policy_gradient_loss | -0.00302 | -| std | 0.422 | -| value_loss | 2.73e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3946 | -| time_elapsed | 34349 | -| total_timesteps | 505088 | -| train/ | | -| approx_kl | 0.0017021641 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.557 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | -0.000281 | -| n_updates | 39450 | -| policy_gradient_loss | 5.09e-05 | -| std | 0.423 | -| value_loss | 7.67e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3947 | -| time_elapsed | 34356 | -| total_timesteps | 505216 | -| train/ | | -| approx_kl | 0.006738539 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.56 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 39460 | -| policy_gradient_loss | -0.0045 | -| std | 0.424 | -| value_loss | 0.0031 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3948 | -| time_elapsed | 34360 | -| total_timesteps | 505344 | -| train/ | | -| approx_kl | 0.04255244 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | -0.562 | -| explained_variance | -178 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 39470 | -| policy_gradient_loss | -0.00515 | -| std | 0.425 | -| value_loss | 1.26e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3949 | -| time_elapsed | 34363 | -| total_timesteps | 505472 | -| train/ | | -| approx_kl | 2.993294e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.564 | -| explained_variance | -377 | -| learning_rate | 0.0003 | -| loss | 0.000752 | -| n_updates | 39480 | -| policy_gradient_loss | 0.00336 | -| std | 0.425 | -| value_loss | 2.93e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3950 | -| time_elapsed | 34367 | -| total_timesteps | 505600 | -| train/ | | -| approx_kl | 0.0073720114 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.564 | -| explained_variance | -4.26 | -| learning_rate | 0.0003 | -| loss | -5.84e-05 | -| n_updates | 39490 | -| policy_gradient_loss | -0.00017 | -| std | 0.426 | -| value_loss | 3.57e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3951 | -| time_elapsed | 34371 | -| total_timesteps | 505728 | -| train/ | | -| approx_kl | 0.013849138 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.565 | -| explained_variance | -0.385 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 39500 | -| policy_gradient_loss | -0.00545 | -| std | 0.425 | -| value_loss | 5.45e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3952 | -| time_elapsed | 34374 | -| total_timesteps | 505856 | -| train/ | | -| approx_kl | 0.00089919264 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.563 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | -0.000676 | -| n_updates | 39510 | -| policy_gradient_loss | -0.000226 | -| std | 0.424 | -| value_loss | 7.31e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3953 | -| time_elapsed | 34376 | -| total_timesteps | 505984 | -| train/ | | -| approx_kl | 0.0059205787 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.56 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 39520 | -| policy_gradient_loss | -0.000928 | -| std | 0.422 | -| value_loss | 1.5e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3954 | -| time_elapsed | 34380 | -| total_timesteps | 506112 | -| train/ | | -| approx_kl | 0.012988072 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.554 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 39530 | -| policy_gradient_loss | -0.00262 | -| std | 0.42 | -| value_loss | 9.4e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3955 | -| time_elapsed | 34389 | -| total_timesteps | 506240 | -| train/ | | -| approx_kl | 0.012112497 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.55 | -| explained_variance | 0.826 | -| learning_rate | 0.0003 | -| loss | -0.00763 | -| n_updates | 39540 | -| policy_gradient_loss | -0.00315 | -| std | 0.419 | -| value_loss | 0.00214 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3956 | -| time_elapsed | 34393 | -| total_timesteps | 506368 | -| train/ | | -| approx_kl | 0.04933612 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -3.2e+03 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 39550 | -| policy_gradient_loss | -0.00384 | -| std | 0.419 | -| value_loss | 4.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3957 | -| time_elapsed | 34396 | -| total_timesteps | 506496 | -| train/ | | -| approx_kl | 0.030935107 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -1.39e+03 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 39560 | -| policy_gradient_loss | -0.0131 | -| std | 0.419 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3958 | -| time_elapsed | 34399 | -| total_timesteps | 506624 | -| train/ | | -| approx_kl | 0.0069475644 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.549 | -| explained_variance | -92.7 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 39570 | -| policy_gradient_loss | -0.000716 | -| std | 0.418 | -| value_loss | 3.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3959 | -| time_elapsed | 34403 | -| total_timesteps | 506752 | -| train/ | | -| approx_kl | 0.0063690282 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.547 | -| explained_variance | -37.1 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 39580 | -| policy_gradient_loss | -0.00507 | -| std | 0.418 | -| value_loss | 3.29e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 14 | -| iterations | 3960 | -| time_elapsed | 34407 | -| total_timesteps | 506880 | -| train/ | | -| approx_kl | 0.0074349367 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.00176 | -| n_updates | 39590 | -| policy_gradient_loss | 0.00152 | -| std | 0.417 | -| value_loss | 5.47e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3961 | -| time_elapsed | 34411 | -| total_timesteps | 507008 | -| train/ | | -| approx_kl | 0.005098611 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | 0.00561 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 39600 | -| policy_gradient_loss | -0.00205 | -| std | 0.417 | -| value_loss | 1.92e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3962 | -| time_elapsed | 34421 | -| total_timesteps | 507136 | -| train/ | | -| approx_kl | 0.00023631006 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 39610 | -| policy_gradient_loss | 0.00103 | -| std | 0.417 | -| value_loss | 0.000433 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3963 | -| time_elapsed | 34424 | -| total_timesteps | 507264 | -| train/ | | -| approx_kl | 0.0014177999 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -689 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 39620 | -| policy_gradient_loss | 9.37e-05 | -| std | 0.418 | -| value_loss | 2.64e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3964 | -| time_elapsed | 34427 | -| total_timesteps | 507392 | -| train/ | | -| approx_kl | 7.7809906e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.545 | -| explained_variance | -499 | -| learning_rate | 0.0003 | -| loss | -0.000363 | -| n_updates | 39630 | -| policy_gradient_loss | 0.000415 | -| std | 0.417 | -| value_loss | 3.56e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3965 | -| time_elapsed | 34429 | -| total_timesteps | 507520 | -| train/ | | -| approx_kl | 0.0006631792 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | -17.1 | -| learning_rate | 0.0003 | -| loss | -0.000677 | -| n_updates | 39640 | -| policy_gradient_loss | 0.000111 | -| std | 0.416 | -| value_loss | 9.22e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3966 | -| time_elapsed | 34433 | -| total_timesteps | 507648 | -| train/ | | -| approx_kl | 0.034993947 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -27.3 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 39650 | -| policy_gradient_loss | -0.00778 | -| std | 0.416 | -| value_loss | 3.67e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3967 | -| time_elapsed | 34437 | -| total_timesteps | 507776 | -| train/ | | -| approx_kl | 0.017838638 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | 0.00181 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 39660 | -| policy_gradient_loss | -0.00877 | -| std | 0.416 | -| value_loss | 6.98e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 14 | -| iterations | 3968 | -| time_elapsed | 34441 | -| total_timesteps | 507904 | -| train/ | | -| approx_kl | 0.012534435 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 39670 | -| policy_gradient_loss | -0.00249 | -| std | 0.416 | -| value_loss | 8.54e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3969 | -| time_elapsed | 34444 | -| total_timesteps | 508032 | -| train/ | | -| approx_kl | 0.00020433543 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.543 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | -0.000329 | -| n_updates | 39680 | -| policy_gradient_loss | 0.000121 | -| std | 0.416 | -| value_loss | 5.78e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3970 | -| time_elapsed | 34453 | -| total_timesteps | 508160 | -| train/ | | -| approx_kl | 0.0046450216 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 39690 | -| policy_gradient_loss | -0.00219 | -| std | 0.416 | -| value_loss | 2.8e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3971 | -| time_elapsed | 34455 | -| total_timesteps | 508288 | -| train/ | | -| approx_kl | 0.028231848 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.542 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | -0.000108 | -| n_updates | 39700 | -| policy_gradient_loss | -0.00163 | -| std | 0.416 | -| value_loss | 1.94e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3972 | -| time_elapsed | 34458 | -| total_timesteps | 508416 | -| train/ | | -| approx_kl | 0.0021018027 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.539 | -| explained_variance | -5.67 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 39710 | -| policy_gradient_loss | -0.000479 | -| std | 0.414 | -| value_loss | 4.13e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3973 | -| time_elapsed | 34462 | -| total_timesteps | 508544 | -| train/ | | -| approx_kl | 0.01013696 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.534 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 39720 | -| policy_gradient_loss | -0.00242 | -| std | 0.412 | -| value_loss | 9.92e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3974 | -| time_elapsed | 34466 | -| total_timesteps | 508672 | -| train/ | | -| approx_kl | 0.010260003 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.53 | -| explained_variance | -0.0742 | -| learning_rate | 0.0003 | -| loss | -0.00595 | -| n_updates | 39730 | -| policy_gradient_loss | -0.00558 | -| std | 0.41 | -| value_loss | 6.77e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3975 | -| time_elapsed | 34468 | -| total_timesteps | 508800 | -| train/ | | -| approx_kl | 0.010535099 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | -0.000306 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 39740 | -| policy_gradient_loss | -0.00356 | -| std | 0.41 | -| value_loss | 5.25e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 14 | -| iterations | 3976 | -| time_elapsed | 34471 | -| total_timesteps | 508928 | -| train/ | | -| approx_kl | 0.007430669 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | 0.00472 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 39750 | -| policy_gradient_loss | -0.000856 | -| std | 0.409 | -| value_loss | 5.67e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3977 | -| time_elapsed | 34474 | -| total_timesteps | 509056 | -| train/ | | -| approx_kl | 0.0014040077 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.524 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.000978 | -| n_updates | 39760 | -| policy_gradient_loss | -0.000216 | -| std | 0.408 | -| value_loss | 1.22e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3978 | -| time_elapsed | 34480 | -| total_timesteps | 509184 | -| train/ | | -| approx_kl | 0.034659885 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 39770 | -| policy_gradient_loss | -0.00827 | -| std | 0.407 | -| value_loss | 0.000453 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3979 | -| time_elapsed | 34483 | -| total_timesteps | 509312 | -| train/ | | -| approx_kl | 0.007914502 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -1.35e+03 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 39780 | -| policy_gradient_loss | -0.000603 | -| std | 0.408 | -| value_loss | 1.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3980 | -| time_elapsed | 34486 | -| total_timesteps | 509440 | -| train/ | | -| approx_kl | 0.02688836 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.523 | -| explained_variance | -7.38e+03 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 39790 | -| policy_gradient_loss | -0.0027 | -| std | 0.409 | -| value_loss | 3.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3981 | -| time_elapsed | 34489 | -| total_timesteps | 509568 | -| train/ | | -| approx_kl | 0.021057546 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.524 | -| explained_variance | -89.9 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 39800 | -| policy_gradient_loss | -0.00154 | -| std | 0.408 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3982 | -| time_elapsed | 34493 | -| total_timesteps | 509696 | -| train/ | | -| approx_kl | 0.003518042 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | -1.33e+03 | -| learning_rate | 0.0003 | -| loss | -0.000997 | -| n_updates | 39810 | -| policy_gradient_loss | -0.000434 | -| std | 0.407 | -| value_loss | 9.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3983 | -| time_elapsed | 34496 | -| total_timesteps | 509824 | -| train/ | | -| approx_kl | 0.008641097 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.00068 | -| n_updates | 39820 | -| policy_gradient_loss | -0.000765 | -| std | 0.406 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 14 | -| iterations | 3984 | -| time_elapsed | 34500 | -| total_timesteps | 509952 | -| train/ | | -| approx_kl | 0.014016649 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -33 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 39830 | -| policy_gradient_loss | -0.00272 | -| std | 0.406 | -| value_loss | 2.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3985 | -| time_elapsed | 34504 | -| total_timesteps | 510080 | -| train/ | | -| approx_kl | 0.026865691 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -0.373 | -| learning_rate | 0.0003 | -| loss | -0.00723 | -| n_updates | 39840 | -| policy_gradient_loss | -0.00835 | -| std | 0.406 | -| value_loss | 1.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3986 | -| time_elapsed | 34510 | -| total_timesteps | 510208 | -| train/ | | -| approx_kl | 0.016914392 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 39850 | -| policy_gradient_loss | -0.0033 | -| std | 0.405 | -| value_loss | 0.000338 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3987 | -| time_elapsed | 34514 | -| total_timesteps | 510336 | -| train/ | | -| approx_kl | 1.9159634e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -4.87e+03 | -| learning_rate | 0.0003 | -| loss | -0.000116 | -| n_updates | 39860 | -| policy_gradient_loss | 0.00228 | -| std | 0.405 | -| value_loss | 2.58e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3988 | -| time_elapsed | 34518 | -| total_timesteps | 510464 | -| train/ | | -| approx_kl | 0.0016513534 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -1.22e+04 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 39870 | -| policy_gradient_loss | 2.66e-05 | -| std | 0.405 | -| value_loss | 9.41e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3989 | -| time_elapsed | 34521 | -| total_timesteps | 510592 | -| train/ | | -| approx_kl | 0.0007181242 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.514 | -| explained_variance | -186 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 39880 | -| policy_gradient_loss | 0.000901 | -| std | 0.405 | -| value_loss | 3.52e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3990 | -| time_elapsed | 34524 | -| total_timesteps | 510720 | -| train/ | | -| approx_kl | 0.01837731 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | -0.514 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 39890 | -| policy_gradient_loss | -0.000172 | -| std | 0.405 | -| value_loss | 8.69e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3991 | -| time_elapsed | 34526 | -| total_timesteps | 510848 | -| train/ | | -| approx_kl | 0.009781935 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 39900 | -| policy_gradient_loss | -0.00263 | -| std | 0.405 | -| value_loss | 1.82e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 14 | -| iterations | 3992 | -| time_elapsed | 34529 | -| total_timesteps | 510976 | -| train/ | | -| approx_kl | 0.012182988 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.0557 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 39910 | -| policy_gradient_loss | -0.00225 | -| std | 0.405 | -| value_loss | 2.04e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3993 | -| time_elapsed | 34531 | -| total_timesteps | 511104 | -| train/ | | -| approx_kl | 0.006795761 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.0755 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 39920 | -| policy_gradient_loss | -0.00314 | -| std | 0.406 | -| value_loss | 4.07e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3994 | -| time_elapsed | 34539 | -| total_timesteps | 511232 | -| train/ | | -| approx_kl | 0.018773204 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 39930 | -| policy_gradient_loss | -0.00201 | -| std | 0.406 | -| value_loss | 0.000192 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3995 | -| time_elapsed | 34543 | -| total_timesteps | 511360 | -| train/ | | -| approx_kl | 0.037115853 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -297 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 39940 | -| policy_gradient_loss | -0.00495 | -| std | 0.406 | -| value_loss | 7.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3996 | -| time_elapsed | 34547 | -| total_timesteps | 511488 | -| train/ | | -| approx_kl | 0.004677642 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -4.47 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 39950 | -| policy_gradient_loss | 0.00103 | -| std | 0.406 | -| value_loss | 0.000132 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3997 | -| time_elapsed | 34550 | -| total_timesteps | 511616 | -| train/ | | -| approx_kl | 0.009007716 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | -0.00838 | -| n_updates | 39960 | -| policy_gradient_loss | -0.00309 | -| std | 0.406 | -| value_loss | 4.54e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3998 | -| time_elapsed | 34553 | -| total_timesteps | 511744 | -| train/ | | -| approx_kl | 0.0014939173 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 39970 | -| policy_gradient_loss | 3.72e-06 | -| std | 0.406 | -| value_loss | 9.98e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 14 | -| iterations | 3999 | -| time_elapsed | 34556 | -| total_timesteps | 511872 | -| train/ | | -| approx_kl | 0.033994418 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 39980 | -| policy_gradient_loss | -0.0114 | -| std | 0.406 | -| value_loss | 4.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4000 | -| time_elapsed | 34560 | -| total_timesteps | 512000 | -| train/ | | -| approx_kl | 0.014372835 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 39990 | -| policy_gradient_loss | -0.00473 | -| std | 0.406 | -| value_loss | 5.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4001 | -| time_elapsed | 34563 | -| total_timesteps | 512128 | -| train/ | | -| approx_kl | 0.0054987213 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | 0.00244 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 40000 | -| policy_gradient_loss | -0.000762 | -| std | 0.406 | -| value_loss | 1.88e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4002 | -| time_elapsed | 34572 | -| total_timesteps | 512256 | -| train/ | | -| approx_kl | 0.049196016 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 40010 | -| policy_gradient_loss | -0.0114 | -| std | 0.407 | -| value_loss | 2.22e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4003 | -| time_elapsed | 34575 | -| total_timesteps | 512384 | -| train/ | | -| approx_kl | 0.0024470603 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.0094 | -| n_updates | 40020 | -| policy_gradient_loss | -0.000418 | -| std | 0.407 | -| value_loss | 5.76e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4004 | -| time_elapsed | 34578 | -| total_timesteps | 512512 | -| train/ | | -| approx_kl | 0.0039324313 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.000393 | -| n_updates | 40030 | -| policy_gradient_loss | 0.000358 | -| std | 0.406 | -| value_loss | 1.81e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4005 | -| time_elapsed | 34581 | -| total_timesteps | 512640 | -| train/ | | -| approx_kl | 0.007975596 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | 0.00171 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 40040 | -| policy_gradient_loss | -0.00186 | -| std | 0.406 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4006 | -| time_elapsed | 34584 | -| total_timesteps | 512768 | -| train/ | | -| approx_kl | 0.017877035 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 40050 | -| policy_gradient_loss | -0.00498 | -| std | 0.406 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 14 | -| iterations | 4007 | -| time_elapsed | 34585 | -| total_timesteps | 512896 | -| train/ | | -| approx_kl | 0.011339475 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 40060 | -| policy_gradient_loss | -0.00698 | -| std | 0.405 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4008 | -| time_elapsed | 34587 | -| total_timesteps | 513024 | -| train/ | | -| approx_kl | 0.018407283 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 40070 | -| policy_gradient_loss | -0.00367 | -| std | 0.405 | -| value_loss | 3.06e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4009 | -| time_elapsed | 34594 | -| total_timesteps | 513152 | -| train/ | | -| approx_kl | 0.00073846057 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | 0.000343 | -| n_updates | 40080 | -| policy_gradient_loss | -0.000174 | -| std | 0.406 | -| value_loss | 0.00214 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4010 | -| time_elapsed | 34598 | -| total_timesteps | 513280 | -| train/ | | -| approx_kl | 0.014484613 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -422 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 40090 | -| policy_gradient_loss | -0.01 | -| std | 0.407 | -| value_loss | 3.02e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4011 | -| time_elapsed | 34601 | -| total_timesteps | 513408 | -| train/ | | -| approx_kl | 0.014077158 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -331 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 40100 | -| policy_gradient_loss | -0.00186 | -| std | 0.406 | -| value_loss | 5.37e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4012 | -| time_elapsed | 34603 | -| total_timesteps | 513536 | -| train/ | | -| approx_kl | 0.00012004771 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 40110 | -| policy_gradient_loss | 0.000895 | -| std | 0.407 | -| value_loss | 5.19e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4013 | -| time_elapsed | 34606 | -| total_timesteps | 513664 | -| train/ | | -| approx_kl | 0.0017099224 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 40120 | -| policy_gradient_loss | 7.9e-05 | -| std | 0.408 | -| value_loss | 1.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4014 | -| time_elapsed | 34611 | -| total_timesteps | 513792 | -| train/ | | -| approx_kl | 0.019658504 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 40130 | -| policy_gradient_loss | -0.00752 | -| std | 0.408 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 14 | -| iterations | 4015 | -| time_elapsed | 34614 | -| total_timesteps | 513920 | -| train/ | | -| approx_kl | 0.016251216 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | 0.00125 | -| learning_rate | 0.0003 | -| loss | -0.0086 | -| n_updates | 40140 | -| policy_gradient_loss | -0.00646 | -| std | 0.407 | -| value_loss | 9.31e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4016 | -| time_elapsed | 34618 | -| total_timesteps | 514048 | -| train/ | | -| approx_kl | 0.0146241365 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 40150 | -| policy_gradient_loss | -0.011 | -| std | 0.407 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4017 | -| time_elapsed | 34624 | -| total_timesteps | 514176 | -| train/ | | -| approx_kl | 0.041434526 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.00545 | -| n_updates | 40160 | -| policy_gradient_loss | -0.00392 | -| std | 0.406 | -| value_loss | 0.000577 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4018 | -| time_elapsed | 34628 | -| total_timesteps | 514304 | -| train/ | | -| approx_kl | 0.008259801 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -358 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 40170 | -| policy_gradient_loss | -4.55e-05 | -| std | 0.406 | -| value_loss | 4.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4019 | -| time_elapsed | 34632 | -| total_timesteps | 514432 | -| train/ | | -| approx_kl | 0.008400921 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -598 | -| learning_rate | 0.0003 | -| loss | -0.00701 | -| n_updates | 40180 | -| policy_gradient_loss | -0.00256 | -| std | 0.407 | -| value_loss | 1.07e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4020 | -| time_elapsed | 34636 | -| total_timesteps | 514560 | -| train/ | | -| approx_kl | 6.5926695e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.000438 | -| n_updates | 40190 | -| policy_gradient_loss | 0.00109 | -| std | 0.407 | -| value_loss | 1.91e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4021 | -| time_elapsed | 34639 | -| total_timesteps | 514688 | -| train/ | | -| approx_kl | 0.038903616 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 40200 | -| policy_gradient_loss | -0.0187 | -| std | 0.407 | -| value_loss | 2.99e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4022 | -| time_elapsed | 34642 | -| total_timesteps | 514816 | -| train/ | | -| approx_kl | 0.00829047 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | -0.00387 | -| n_updates | 40210 | -| policy_gradient_loss | -0.00212 | -| std | 0.407 | -| value_loss | 1.04e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 14 | -| iterations | 4023 | -| time_elapsed | 34646 | -| total_timesteps | 514944 | -| train/ | | -| approx_kl | 0.0060743727 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | 0.00607 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 40220 | -| policy_gradient_loss | -0.00285 | -| std | 0.407 | -| value_loss | 9.27e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4024 | -| time_elapsed | 34649 | -| total_timesteps | 515072 | -| train/ | | -| approx_kl | 0.0014721579 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 40230 | -| policy_gradient_loss | -0.000753 | -| std | 0.406 | -| value_loss | 3.31e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4025 | -| time_elapsed | 34656 | -| total_timesteps | 515200 | -| train/ | | -| approx_kl | 0.0032221796 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | 0.337 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 40240 | -| policy_gradient_loss | -0.000684 | -| std | 0.406 | -| value_loss | 0.00112 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4026 | -| time_elapsed | 34660 | -| total_timesteps | 515328 | -| train/ | | -| approx_kl | 0.042424437 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -2.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 40250 | -| policy_gradient_loss | -0.0127 | -| std | 0.407 | -| value_loss | 4.06e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4027 | -| time_elapsed | 34664 | -| total_timesteps | 515456 | -| train/ | | -| approx_kl | 0.0116869435 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -5.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 40260 | -| policy_gradient_loss | -0.00183 | -| std | 0.406 | -| value_loss | 1.15e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4028 | -| time_elapsed | 34667 | -| total_timesteps | 515584 | -| train/ | | -| approx_kl | 0.04002515 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 40270 | -| policy_gradient_loss | -0.00332 | -| std | 0.405 | -| value_loss | 1.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4029 | -| time_elapsed | 34670 | -| total_timesteps | 515712 | -| train/ | | -| approx_kl | 0.004304759 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.514 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 40280 | -| policy_gradient_loss | -0.00121 | -| std | 0.405 | -| value_loss | 5.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4030 | -| time_elapsed | 34673 | -| total_timesteps | 515840 | -| train/ | | -| approx_kl | 0.019433752 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -1.75 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 40290 | -| policy_gradient_loss | -0.0105 | -| std | 0.405 | -| value_loss | 2.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 14 | -| iterations | 4031 | -| time_elapsed | 34676 | -| total_timesteps | 515968 | -| train/ | | -| approx_kl | 0.008414825 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -0.455 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 40300 | -| policy_gradient_loss | -0.0013 | -| std | 0.405 | -| value_loss | 8.56e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4032 | -| time_elapsed | 34679 | -| total_timesteps | 516096 | -| train/ | | -| approx_kl | 0.0039659585 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 40310 | -| policy_gradient_loss | -0.000447 | -| std | 0.405 | -| value_loss | 2.77e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4033 | -| time_elapsed | 34686 | -| total_timesteps | 516224 | -| train/ | | -| approx_kl | 0.02774319 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 40320 | -| policy_gradient_loss | -0.00914 | -| std | 0.405 | -| value_loss | 0.00249 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4034 | -| time_elapsed | 34689 | -| total_timesteps | 516352 | -| train/ | | -| approx_kl | 0.0015495927 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -340 | -| learning_rate | 0.0003 | -| loss | -0.000522 | -| n_updates | 40330 | -| policy_gradient_loss | -0.000195 | -| std | 0.406 | -| value_loss | 5.21e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4035 | -| time_elapsed | 34693 | -| total_timesteps | 516480 | -| train/ | | -| approx_kl | 0.009414849 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -449 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 40340 | -| policy_gradient_loss | -0.00914 | -| std | 0.406 | -| value_loss | 2.43e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4036 | -| time_elapsed | 34697 | -| total_timesteps | 516608 | -| train/ | | -| approx_kl | 0.0106096985 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -4.34 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 40350 | -| policy_gradient_loss | -0.00153 | -| std | 0.407 | -| value_loss | 1.24e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4037 | -| time_elapsed | 34701 | -| total_timesteps | 516736 | -| train/ | | -| approx_kl | 0.0013878276 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -0.535 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 40360 | -| policy_gradient_loss | 0.000187 | -| std | 0.407 | -| value_loss | 5.87e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4038 | -| time_elapsed | 34705 | -| total_timesteps | 516864 | -| train/ | | -| approx_kl | 0.0007292121 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 40370 | -| policy_gradient_loss | 0.000668 | -| std | 0.407 | -| value_loss | 2.71e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 14 | -| iterations | 4039 | -| time_elapsed | 34707 | -| total_timesteps | 516992 | -| train/ | | -| approx_kl | 0.0027300382 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | 0.00501 | -| learning_rate | 0.0003 | -| loss | 0.000146 | -| n_updates | 40380 | -| policy_gradient_loss | 0.00028 | -| std | 0.407 | -| value_loss | 1.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4040 | -| time_elapsed | 34712 | -| total_timesteps | 517120 | -| train/ | | -| approx_kl | 0.0067114946 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.00228 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 40390 | -| policy_gradient_loss | -0.00469 | -| std | 0.406 | -| value_loss | 1.31e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4041 | -| time_elapsed | 34721 | -| total_timesteps | 517248 | -| train/ | | -| approx_kl | 0.07533565 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -6.25 | -| learning_rate | 0.0003 | -| loss | -0.00867 | -| n_updates | 40400 | -| policy_gradient_loss | -0.00542 | -| std | 0.406 | -| value_loss | 0.00298 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4042 | -| time_elapsed | 34725 | -| total_timesteps | 517376 | -| train/ | | -| approx_kl | 0.027862128 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -1.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.000757 | -| n_updates | 40410 | -| policy_gradient_loss | -0.00125 | -| std | 0.406 | -| value_loss | 1.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4043 | -| time_elapsed | 34728 | -| total_timesteps | 517504 | -| train/ | | -| approx_kl | 0.001809129 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -2.73e+03 | -| learning_rate | 0.0003 | -| loss | -0.000546 | -| n_updates | 40420 | -| policy_gradient_loss | -0.000266 | -| std | 0.404 | -| value_loss | 3.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4044 | -| time_elapsed | 34732 | -| total_timesteps | 517632 | -| train/ | | -| approx_kl | 0.001485196 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.513 | -| explained_variance | -34 | -| learning_rate | 0.0003 | -| loss | -7.47e-05 | -| n_updates | 40430 | -| policy_gradient_loss | 6.95e-06 | -| std | 0.404 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4045 | -| time_elapsed | 34735 | -| total_timesteps | 517760 | -| train/ | | -| approx_kl | 0.009836571 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.514 | -| explained_variance | -89.1 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 40440 | -| policy_gradient_loss | -0.00185 | -| std | 0.405 | -| value_loss | 1.69e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 14 | -| iterations | 4046 | -| time_elapsed | 34738 | -| total_timesteps | 517888 | -| train/ | | -| approx_kl | 0.01463614 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -4 | -| learning_rate | 0.0003 | -| loss | 0.00353 | -| n_updates | 40450 | -| policy_gradient_loss | 0.0012 | -| std | 0.406 | -| value_loss | 1.04e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4047 | -| time_elapsed | 34742 | -| total_timesteps | 518016 | -| train/ | | -| approx_kl | 0.012693098 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 40460 | -| policy_gradient_loss | -0.00182 | -| std | 0.405 | -| value_loss | 1.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4048 | -| time_elapsed | 34750 | -| total_timesteps | 518144 | -| train/ | | -| approx_kl | 0.014158657 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | 0.37 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 40470 | -| policy_gradient_loss | -0.00546 | -| std | 0.405 | -| value_loss | 0.000646 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4049 | -| time_elapsed | 34754 | -| total_timesteps | 518272 | -| train/ | | -| approx_kl | 3.8906e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | 0.000199 | -| n_updates | 40480 | -| policy_gradient_loss | 0.00255 | -| std | 0.405 | -| value_loss | 4.35e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4050 | -| time_elapsed | 34757 | -| total_timesteps | 518400 | -| train/ | | -| approx_kl | 0.0018749454 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.514 | -| explained_variance | -127 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 40490 | -| policy_gradient_loss | -1.72e-05 | -| std | 0.404 | -| value_loss | 1.91e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4051 | -| time_elapsed | 34760 | -| total_timesteps | 518528 | -| train/ | | -| approx_kl | 0.0009185036 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.513 | -| explained_variance | -6.26 | -| learning_rate | 0.0003 | -| loss | -0.00641 | -| n_updates | 40500 | -| policy_gradient_loss | 0.00173 | -| std | 0.404 | -| value_loss | 1.67e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4052 | -| time_elapsed | 34765 | -| total_timesteps | 518656 | -| train/ | | -| approx_kl | 0.011292398 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.513 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 40510 | -| policy_gradient_loss | -0.00203 | -| std | 0.405 | -| value_loss | 9.47e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4053 | -| time_elapsed | 34768 | -| total_timesteps | 518784 | -| train/ | | -| approx_kl | 0.012080808 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.0924 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 40520 | -| policy_gradient_loss | -0.00297 | -| std | 0.405 | -| value_loss | 2.67e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 14 | -| iterations | 4054 | -| time_elapsed | 34772 | -| total_timesteps | 518912 | -| train/ | | -| approx_kl | 0.00043104123 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | -7.77e-05 | -| n_updates | 40530 | -| policy_gradient_loss | -3.15e-05 | -| std | 0.405 | -| value_loss | 2.85e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4055 | -| time_elapsed | 34775 | -| total_timesteps | 519040 | -| train/ | | -| approx_kl | 0.012737529 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 40540 | -| policy_gradient_loss | -0.00771 | -| std | 0.406 | -| value_loss | 9.48e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4056 | -| time_elapsed | 34785 | -| total_timesteps | 519168 | -| train/ | | -| approx_kl | 0.06580737 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 40550 | -| policy_gradient_loss | -0.0104 | -| std | 0.406 | -| value_loss | 0.00456 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4057 | -| time_elapsed | 34789 | -| total_timesteps | 519296 | -| train/ | | -| approx_kl | 0.0007532027 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -2.16e+03 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 40560 | -| policy_gradient_loss | 0.000888 | -| std | 0.406 | -| value_loss | 1.42e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4058 | -| time_elapsed | 34793 | -| total_timesteps | 519424 | -| train/ | | -| approx_kl | 0.0433499 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -1.84e+03 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 40570 | -| policy_gradient_loss | -0.00416 | -| std | 0.407 | -| value_loss | 6.62e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4059 | -| time_elapsed | 34796 | -| total_timesteps | 519552 | -| train/ | | -| approx_kl | 0.016149681 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -97.8 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 40580 | -| policy_gradient_loss | -0.000951 | -| std | 0.407 | -| value_loss | 2.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4060 | -| time_elapsed | 34799 | -| total_timesteps | 519680 | -| train/ | | -| approx_kl | 0.02511734 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -8.52 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 40590 | -| policy_gradient_loss | -0.00808 | -| std | 0.407 | -| value_loss | 5.33e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4061 | -| time_elapsed | 34803 | -| total_timesteps | 519808 | -| train/ | | -| approx_kl | 0.0015228507 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 40600 | -| policy_gradient_loss | 0.000151 | -| std | 0.407 | -| value_loss | 5.03e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 14 | -| iterations | 4062 | -| time_elapsed | 34806 | -| total_timesteps | 519936 | -| train/ | | -| approx_kl | 0.0017532972 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.000126 | -| n_updates | 40610 | -| policy_gradient_loss | 0.000357 | -| std | 0.408 | -| value_loss | 4.4e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4063 | -| time_elapsed | 34809 | -| total_timesteps | 520064 | -| train/ | | -| approx_kl | 0.011565964 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.524 | -| explained_variance | 0.00384 | -| learning_rate | 0.0003 | -| loss | -0.000231 | -| n_updates | 40620 | -| policy_gradient_loss | -0.00121 | -| std | 0.41 | -| value_loss | 2.05e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4064 | -| time_elapsed | 34816 | -| total_timesteps | 520192 | -| train/ | | -| approx_kl | 0.02288363 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00932 | -| n_updates | 40630 | -| policy_gradient_loss | -0.00444 | -| std | 0.41 | -| value_loss | 0.00121 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4065 | -| time_elapsed | 34819 | -| total_timesteps | 520320 | -| train/ | | -| approx_kl | 0.0015224083 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.528 | -| explained_variance | -722 | -| learning_rate | 0.0003 | -| loss | 0.000772 | -| n_updates | 40640 | -| policy_gradient_loss | 0.00104 | -| std | 0.41 | -| value_loss | 3.36e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4066 | -| time_elapsed | 34823 | -| total_timesteps | 520448 | -| train/ | | -| approx_kl | 0.0044790464 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -768 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 40650 | -| policy_gradient_loss | -0.00343 | -| std | 0.409 | -| value_loss | 9.86e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4067 | -| time_elapsed | 34826 | -| total_timesteps | 520576 | -| train/ | | -| approx_kl | 0.00034193275 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -31.4 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 40660 | -| policy_gradient_loss | 0.000834 | -| std | 0.409 | -| value_loss | 2.41e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4068 | -| time_elapsed | 34829 | -| total_timesteps | 520704 | -| train/ | | -| approx_kl | 0.0047333813 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -2.11 | -| learning_rate | 0.0003 | -| loss | 0.000158 | -| n_updates | 40670 | -| policy_gradient_loss | 6.13e-05 | -| std | 0.409 | -| value_loss | 1.75e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4069 | -| time_elapsed | 34833 | -| total_timesteps | 520832 | -| train/ | | -| approx_kl | 0.004717797 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 40680 | -| policy_gradient_loss | -0.000428 | -| std | 0.41 | -| value_loss | 1.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 14 | -| iterations | 4070 | -| time_elapsed | 34835 | -| total_timesteps | 520960 | -| train/ | | -| approx_kl | 0.008658936 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.529 | -| explained_variance | 0.00347 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 40690 | -| policy_gradient_loss | -0.00806 | -| std | 0.411 | -| value_loss | 2.65e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4071 | -| time_elapsed | 34839 | -| total_timesteps | 521088 | -| train/ | | -| approx_kl | 0.0001258431 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.531 | -| explained_variance | 0.00184 | -| learning_rate | 0.0003 | -| loss | -0.000852 | -| n_updates | 40700 | -| policy_gradient_loss | 0.00107 | -| std | 0.412 | -| value_loss | 7.71e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4072 | -| time_elapsed | 34846 | -| total_timesteps | 521216 | -| train/ | | -| approx_kl | 0.020184513 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.532 | -| explained_variance | 0.876 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 40710 | -| policy_gradient_loss | -0.0104 | -| std | 0.412 | -| value_loss | 0.000247 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4073 | -| time_elapsed | 34850 | -| total_timesteps | 521344 | -| train/ | | -| approx_kl | 0.023366924 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.532 | -| explained_variance | -499 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 40720 | -| policy_gradient_loss | -0.00487 | -| std | 0.412 | -| value_loss | 4.8e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4074 | -| time_elapsed | 34854 | -| total_timesteps | 521472 | -| train/ | | -| approx_kl | 0.03750363 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | -0.531 | -| explained_variance | -448 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 40730 | -| policy_gradient_loss | -0.0158 | -| std | 0.411 | -| value_loss | 4.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4075 | -| time_elapsed | 34858 | -| total_timesteps | 521600 | -| train/ | | -| approx_kl | 0.014216777 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.531 | -| explained_variance | -4.21 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 40740 | -| policy_gradient_loss | -0.00215 | -| std | 0.411 | -| value_loss | 1.8e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4076 | -| time_elapsed | 34860 | -| total_timesteps | 521728 | -| train/ | | -| approx_kl | 0.0073129106 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.529 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 40750 | -| policy_gradient_loss | -0.00399 | -| std | 0.41 | -| value_loss | 9.7e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4077 | -| time_elapsed | 34863 | -| total_timesteps | 521856 | -| train/ | | -| approx_kl | 0.020465432 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | 0.00693 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 40760 | -| policy_gradient_loss | -0.00511 | -| std | 0.409 | -| value_loss | 3.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 14 | -| iterations | 4078 | -| time_elapsed | 34865 | -| total_timesteps | 521984 | -| train/ | | -| approx_kl | 0.006160355 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -0.0618 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 40770 | -| policy_gradient_loss | -0.00199 | -| std | 0.409 | -| value_loss | 1.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4079 | -| time_elapsed | 34870 | -| total_timesteps | 522112 | -| train/ | | -| approx_kl | 0.015715502 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | 0.00502 | -| learning_rate | 0.0003 | -| loss | -0.00893 | -| n_updates | 40780 | -| policy_gradient_loss | -0.00618 | -| std | 0.409 | -| value_loss | 1.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4080 | -| time_elapsed | 34878 | -| total_timesteps | 522240 | -| train/ | | -| approx_kl | 0.021247154 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | 0.942 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 40790 | -| policy_gradient_loss | -0.00998 | -| std | 0.41 | -| value_loss | 0.000332 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4081 | -| time_elapsed | 34881 | -| total_timesteps | 522368 | -| train/ | | -| approx_kl | 0.0028125972 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | -1.68e+03 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 40800 | -| policy_gradient_loss | -0.00045 | -| std | 0.411 | -| value_loss | 6.42e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4082 | -| time_elapsed | 34885 | -| total_timesteps | 522496 | -| train/ | | -| approx_kl | 0.042405136 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -0.53 | -| explained_variance | -1.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 40810 | -| policy_gradient_loss | -0.0111 | -| std | 0.411 | -| value_loss | 3.86e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4083 | -| time_elapsed | 34888 | -| total_timesteps | 522624 | -| train/ | | -| approx_kl | 0.0043687164 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.531 | -| explained_variance | -177 | -| learning_rate | 0.0003 | -| loss | -0.0074 | -| n_updates | 40820 | -| policy_gradient_loss | -0.00181 | -| std | 0.412 | -| value_loss | 3.2e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4084 | -| time_elapsed | 34893 | -| total_timesteps | 522752 | -| train/ | | -| approx_kl | 0.00078485673 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.532 | -| explained_variance | -6.16 | -| learning_rate | 0.0003 | -| loss | 0.000709 | -| n_updates | 40830 | -| policy_gradient_loss | 0.000733 | -| std | 0.412 | -| value_loss | 8.38e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 14 | -| iterations | 4085 | -| time_elapsed | 34897 | -| total_timesteps | 522880 | -| train/ | | -| approx_kl | 0.014991367 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.531 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 40840 | -| policy_gradient_loss | -0.00308 | -| std | 0.411 | -| value_loss | 5.75e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4086 | -| time_elapsed | 34900 | -| total_timesteps | 523008 | -| train/ | | -| approx_kl | 0.0007996601 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.528 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | -0.00032 | -| n_updates | 40850 | -| policy_gradient_loss | -0.000149 | -| std | 0.41 | -| value_loss | 1.14e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4087 | -| time_elapsed | 34909 | -| total_timesteps | 523136 | -| train/ | | -| approx_kl | 0.009882748 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | 0.764 | -| learning_rate | 0.0003 | -| loss | -0.00855 | -| n_updates | 40860 | -| policy_gradient_loss | -0.00358 | -| std | 0.409 | -| value_loss | 0.0033 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4088 | -| time_elapsed | 34913 | -| total_timesteps | 523264 | -| train/ | | -| approx_kl | 0.0162338 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -134 | -| learning_rate | 0.0003 | -| loss | -0.000286 | -| n_updates | 40870 | -| policy_gradient_loss | -0.000543 | -| std | 0.41 | -| value_loss | 3.39e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4089 | -| time_elapsed | 34917 | -| total_timesteps | 523392 | -| train/ | | -| approx_kl | 0.01263631 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | -163 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 40880 | -| policy_gradient_loss | -0.00193 | -| std | 0.41 | -| value_loss | 1.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4090 | -| time_elapsed | 34921 | -| total_timesteps | 523520 | -| train/ | | -| approx_kl | 5.28472e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 40890 | -| policy_gradient_loss | 0.00305 | -| std | 0.41 | -| value_loss | 5.9e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4091 | -| time_elapsed | 34924 | -| total_timesteps | 523648 | -| train/ | | -| approx_kl | 0.0016659738 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.526 | -| explained_variance | -2.76 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 40900 | -| policy_gradient_loss | 6.48e-05 | -| std | 0.409 | -| value_loss | 3.75e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4092 | -| time_elapsed | 34928 | -| total_timesteps | 523776 | -| train/ | | -| approx_kl | 0.00062561594 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.525 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 40910 | -| policy_gradient_loss | 0.000759 | -| std | 0.409 | -| value_loss | 1.17e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 14 | -| iterations | 4093 | -| time_elapsed | 34930 | -| total_timesteps | 523904 | -| train/ | | -| approx_kl | 0.001188966 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.000605 | -| n_updates | 40920 | -| policy_gradient_loss | 0.000538 | -| std | 0.41 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4094 | -| time_elapsed | 34934 | -| total_timesteps | 524032 | -| train/ | | -| approx_kl | 0.0024581393 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.527 | -| explained_variance | 0.00291 | -| learning_rate | 0.0003 | -| loss | -0.000311 | -| n_updates | 40930 | -| policy_gradient_loss | -0.000164 | -| std | 0.409 | -| value_loss | 1.49e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4095 | -| time_elapsed | 34942 | -| total_timesteps | 524160 | -| train/ | | -| approx_kl | 0.002036792 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.524 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.000461 | -| n_updates | 40940 | -| policy_gradient_loss | -0.000318 | -| std | 0.408 | -| value_loss | 0.000412 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4096 | -| time_elapsed | 34944 | -| total_timesteps | 524288 | -| train/ | | -| approx_kl | 0.021258276 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -2.85e+03 | -| learning_rate | 0.0003 | -| loss | -0.00419 | -| n_updates | 40950 | -| policy_gradient_loss | -0.00227 | -| std | 0.407 | -| value_loss | 4.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4097 | -| time_elapsed | 34947 | -| total_timesteps | 524416 | -| train/ | | -| approx_kl | 0.054020233 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -4.59e+03 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 40960 | -| policy_gradient_loss | -0.0073 | -| std | 0.408 | -| value_loss | 6.41e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4098 | -| time_elapsed | 34951 | -| total_timesteps | 524544 | -| train/ | | -| approx_kl | 0.0014396524 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | -180 | -| learning_rate | 0.0003 | -| loss | 0.00244 | -| n_updates | 40970 | -| policy_gradient_loss | 0.00293 | -| std | 0.408 | -| value_loss | 2.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4099 | -| time_elapsed | 34956 | -| total_timesteps | 524672 | -| train/ | | -| approx_kl | 0.002865148 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | -272 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 40980 | -| policy_gradient_loss | -0.000567 | -| std | 0.407 | -| value_loss | 7.17e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4100 | -| time_elapsed | 34960 | -| total_timesteps | 524800 | -| train/ | | -| approx_kl | 0.0005565109 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -3.28 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 40990 | -| policy_gradient_loss | 0.00116 | -| std | 0.407 | -| value_loss | 7.79e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4101 | -| time_elapsed | 34964 | -| total_timesteps | 524928 | -| train/ | | -| approx_kl | 0.0013597889 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.522 | -| explained_variance | -0.885 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 41000 | -| policy_gradient_loss | 0.000327 | -| std | 0.408 | -| value_loss | 2.78e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4102 | -| time_elapsed | 34968 | -| total_timesteps | 525056 | -| train/ | | -| approx_kl | 0.01929454 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | -0.523 | -| explained_variance | -0.562 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 41010 | -| policy_gradient_loss | -0.0116 | -| std | 0.408 | -| value_loss | 1.53e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4103 | -| time_elapsed | 34974 | -| total_timesteps | 525184 | -| train/ | | -| approx_kl | 0.0007955241 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | 0.000201 | -| n_updates | 41020 | -| policy_gradient_loss | -0.000148 | -| std | 0.407 | -| value_loss | 0.00139 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4104 | -| time_elapsed | 34977 | -| total_timesteps | 525312 | -| train/ | | -| approx_kl | 0.016239256 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -6.62e+03 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 41030 | -| policy_gradient_loss | -0.00667 | -| std | 0.406 | -| value_loss | 2.32e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4105 | -| time_elapsed | 34980 | -| total_timesteps | 525440 | -| train/ | | -| approx_kl | 0.0016303102 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -1.24e+04 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 41040 | -| policy_gradient_loss | 2.87e-05 | -| std | 0.406 | -| value_loss | 5.78e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4106 | -| time_elapsed | 34982 | -| total_timesteps | 525568 | -| train/ | | -| approx_kl | 0.0035067638 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -176 | -| learning_rate | 0.0003 | -| loss | 0.000726 | -| n_updates | 41050 | -| policy_gradient_loss | 0.000518 | -| std | 0.406 | -| value_loss | 1.6e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4107 | -| time_elapsed | 34986 | -| total_timesteps | 525696 | -| train/ | | -| approx_kl | 0.018400079 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -32.6 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 41060 | -| policy_gradient_loss | -0.00654 | -| std | 0.406 | -| value_loss | 7.39e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4108 | -| time_elapsed | 34989 | -| total_timesteps | 525824 | -| train/ | | -| approx_kl | 0.0022272833 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.442 | -| learning_rate | 0.0003 | -| loss | -0.00387 | -| n_updates | 41070 | -| policy_gradient_loss | -0.000504 | -| std | 0.407 | -| value_loss | 3.62e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4109 | -| time_elapsed | 34992 | -| total_timesteps | 525952 | -| train/ | | -| approx_kl | 0.016061693 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | -0.000323 | -| n_updates | 41080 | -| policy_gradient_loss | -0.00187 | -| std | 0.406 | -| value_loss | 3.13e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4110 | -| time_elapsed | 34996 | -| total_timesteps | 526080 | -| train/ | | -| approx_kl | 0.009860875 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -588 | -| learning_rate | 0.0003 | -| loss | -0.00345 | -| n_updates | 41090 | -| policy_gradient_loss | -0.00129 | -| std | 0.406 | -| value_loss | 5.85e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4111 | -| time_elapsed | 35002 | -| total_timesteps | 526208 | -| train/ | | -| approx_kl | 0.00043779542 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 41100 | -| policy_gradient_loss | 0.00115 | -| std | 0.407 | -| value_loss | 4.96e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4112 | -| time_elapsed | 35006 | -| total_timesteps | 526336 | -| train/ | | -| approx_kl | 0.026739202 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -52.7 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 41110 | -| policy_gradient_loss | -0.0115 | -| std | 0.407 | -| value_loss | 2.17e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4113 | -| time_elapsed | 35008 | -| total_timesteps | 526464 | -| train/ | | -| approx_kl | 0.0139586 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -3.87 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 41120 | -| policy_gradient_loss | -0.00337 | -| std | 0.407 | -| value_loss | 4.34e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4114 | -| time_elapsed | 35011 | -| total_timesteps | 526592 | -| train/ | | -| approx_kl | 0.008229469 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 41130 | -| policy_gradient_loss | -0.00141 | -| std | 0.407 | -| value_loss | 3.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4115 | -| time_elapsed | 35014 | -| total_timesteps | 526720 | -| train/ | | -| approx_kl | 0.006299516 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | -0.000886 | -| n_updates | 41140 | -| policy_gradient_loss | -0.000702 | -| std | 0.405 | -| value_loss | 1.18e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4116 | -| time_elapsed | 35017 | -| total_timesteps | 526848 | -| train/ | | -| approx_kl | 0.00822284 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 41150 | -| policy_gradient_loss | -0.00106 | -| std | 0.405 | -| value_loss | 4.34e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4117 | -| time_elapsed | 35020 | -| total_timesteps | 526976 | -| train/ | | -| approx_kl | 0.0071752043 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.515 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.00913 | -| n_updates | 41160 | -| policy_gradient_loss | -0.00368 | -| std | 0.405 | -| value_loss | 4.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4118 | -| time_elapsed | 35023 | -| total_timesteps | 527104 | -| train/ | | -| approx_kl | 0.008650331 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | 0.00367 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 41170 | -| policy_gradient_loss | -0.00154 | -| std | 0.405 | -| value_loss | 1.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4119 | -| time_elapsed | 35030 | -| total_timesteps | 527232 | -| train/ | | -| approx_kl | 0.031716835 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 41180 | -| policy_gradient_loss | -0.00561 | -| std | 0.405 | -| value_loss | 0.000633 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4120 | -| time_elapsed | 35034 | -| total_timesteps | 527360 | -| train/ | | -| approx_kl | 0.0024953482 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.516 | -| explained_variance | -885 | -| learning_rate | 0.0003 | -| loss | 0.000939 | -| n_updates | 41190 | -| policy_gradient_loss | 0.00107 | -| std | 0.405 | -| value_loss | 5.53e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4121 | -| time_elapsed | 35036 | -| total_timesteps | 527488 | -| train/ | | -| approx_kl | 0.0050844206 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.513 | -| explained_variance | -1.33e+03 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 41200 | -| policy_gradient_loss | -0.000852 | -| std | 0.403 | -| value_loss | 9.54e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4122 | -| time_elapsed | 35040 | -| total_timesteps | 527616 | -| train/ | | -| approx_kl | 0.00046010152 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -50.8 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 41210 | -| policy_gradient_loss | 0.00145 | -| std | 0.403 | -| value_loss | 2.08e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4123 | -| time_elapsed | 35044 | -| total_timesteps | 527744 | -| train/ | | -| approx_kl | 0.01376643 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -24.4 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 41220 | -| policy_gradient_loss | -0.000732 | -| std | 0.403 | -| value_loss | 1.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4124 | -| time_elapsed | 35048 | -| total_timesteps | 527872 | -| train/ | | -| approx_kl | 0.012946233 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | 0.000277 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 41230 | -| policy_gradient_loss | -0.00551 | -| std | 0.403 | -| value_loss | 8.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4125 | -| time_elapsed | 35051 | -| total_timesteps | 528000 | -| train/ | | -| approx_kl | 0.001121318 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -0.000428 | -| n_updates | 41240 | -| policy_gradient_loss | -0.000152 | -| std | 0.404 | -| value_loss | 8.91e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4126 | -| time_elapsed | 35055 | -| total_timesteps | 528128 | -| train/ | | -| approx_kl | 0.01839514 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | 0.00303 | -| learning_rate | 0.0003 | -| loss | 0.000578 | -| n_updates | 41250 | -| policy_gradient_loss | -0.00183 | -| std | 0.403 | -| value_loss | 7.25e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4127 | -| time_elapsed | 35064 | -| total_timesteps | 528256 | -| train/ | | -| approx_kl | 0.020785525 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 41260 | -| policy_gradient_loss | -0.00408 | -| std | 0.403 | -| value_loss | 0.00127 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4128 | -| time_elapsed | 35067 | -| total_timesteps | 528384 | -| train/ | | -| approx_kl | 5.045673e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -3.52e+03 | -| learning_rate | 0.0003 | -| loss | -0.000528 | -| n_updates | 41270 | -| policy_gradient_loss | 0.00448 | -| std | 0.402 | -| value_loss | 9.67e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4129 | -| time_elapsed | 35070 | -| total_timesteps | 528512 | -| train/ | | -| approx_kl | 0.05215906 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -3.77e+03 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 41280 | -| policy_gradient_loss | -0.00758 | -| std | 0.402 | -| value_loss | 4.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4130 | -| time_elapsed | 35073 | -| total_timesteps | 528640 | -| train/ | | -| approx_kl | 0.028898649 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -169 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 41290 | -| policy_gradient_loss | -0.0131 | -| std | 0.402 | -| value_loss | 1.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4131 | -| time_elapsed | 35076 | -| total_timesteps | 528768 | -| train/ | | -| approx_kl | 0.012965418 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -54 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 41300 | -| policy_gradient_loss | -0.00645 | -| std | 0.402 | -| value_loss | 3.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4132 | -| time_elapsed | 35078 | -| total_timesteps | 528896 | -| train/ | | -| approx_kl | 0.026743189 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 41310 | -| policy_gradient_loss | -0.0114 | -| std | 0.402 | -| value_loss | 5.21e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4133 | -| time_elapsed | 35081 | -| total_timesteps | 529024 | -| train/ | | -| approx_kl | 0.01218125 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -2.32 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 41320 | -| policy_gradient_loss | -0.00611 | -| std | 0.401 | -| value_loss | 1.03e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4134 | -| time_elapsed | 35090 | -| total_timesteps | 529152 | -| train/ | | -| approx_kl | 0.027247079 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.00838 | -| n_updates | 41330 | -| policy_gradient_loss | -0.00801 | -| std | 0.401 | -| value_loss | 0.000133 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4135 | -| time_elapsed | 35094 | -| total_timesteps | 529280 | -| train/ | | -| approx_kl | 0.012593932 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -1.24e+03 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 41340 | -| policy_gradient_loss | -0.00768 | -| std | 0.401 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4136 | -| time_elapsed | 35098 | -| total_timesteps | 529408 | -| train/ | | -| approx_kl | 0.012979452 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -826 | -| learning_rate | 0.0003 | -| loss | -0.00269 | -| n_updates | 41350 | -| policy_gradient_loss | -0.00154 | -| std | 0.4 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4137 | -| time_elapsed | 35101 | -| total_timesteps | 529536 | -| train/ | | -| approx_kl | 0.0052804495 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -21.6 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 41360 | -| policy_gradient_loss | -0.000892 | -| std | 0.399 | -| value_loss | 2.17e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4138 | -| time_elapsed | 35105 | -| total_timesteps | 529664 | -| train/ | | -| approx_kl | 0.0058347774 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -23.7 | -| learning_rate | 0.0003 | -| loss | 0.000316 | -| n_updates | 41370 | -| policy_gradient_loss | 0.000215 | -| std | 0.4 | -| value_loss | 1.38e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4139 | -| time_elapsed | 35110 | -| total_timesteps | 529792 | -| train/ | | -| approx_kl | 0.018267583 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -0.757 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 41380 | -| policy_gradient_loss | -0.0104 | -| std | 0.401 | -| value_loss | 3.41e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 15 | -| iterations | 4140 | -| time_elapsed | 35113 | -| total_timesteps | 529920 | -| train/ | | -| approx_kl | 0.008399351 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 41390 | -| policy_gradient_loss | -0.00253 | -| std | 0.401 | -| value_loss | 1.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4141 | -| time_elapsed | 35116 | -| total_timesteps | 530048 | -| train/ | | -| approx_kl | 0.011290323 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -0.074 | -| learning_rate | 0.0003 | -| loss | 0.0013 | -| n_updates | 41400 | -| policy_gradient_loss | 0.000326 | -| std | 0.402 | -| value_loss | 1.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4142 | -| time_elapsed | 35122 | -| total_timesteps | 530176 | -| train/ | | -| approx_kl | 0.008712303 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 41410 | -| policy_gradient_loss | -0.00497 | -| std | 0.402 | -| value_loss | 0.000184 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4143 | -| time_elapsed | 35126 | -| total_timesteps | 530304 | -| train/ | | -| approx_kl | 0.043858446 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -1.11e+04 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 41420 | -| policy_gradient_loss | -0.00635 | -| std | 0.402 | -| value_loss | 2.74e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4144 | -| time_elapsed | 35129 | -| total_timesteps | 530432 | -| train/ | | -| approx_kl | 5.4749195e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -2.01e+03 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 41430 | -| policy_gradient_loss | 0.00241 | -| std | 0.403 | -| value_loss | 7.91e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4145 | -| time_elapsed | 35132 | -| total_timesteps | 530560 | -| train/ | | -| approx_kl | 0.019083597 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -43.7 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 41440 | -| policy_gradient_loss | -0.00418 | -| std | 0.403 | -| value_loss | 2.83e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4146 | -| time_elapsed | 35137 | -| total_timesteps | 530688 | -| train/ | | -| approx_kl | 0.012820725 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -6.57 | -| learning_rate | 0.0003 | -| loss | -0.00476 | -| n_updates | 41450 | -| policy_gradient_loss | -0.0024 | -| std | 0.403 | -| value_loss | 8.68e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4147 | -| time_elapsed | 35141 | -| total_timesteps | 530816 | -| train/ | | -| approx_kl | 0.0021488077 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 41460 | -| policy_gradient_loss | 5.98e-05 | -| std | 0.403 | -| value_loss | 2.89e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4148 | -| time_elapsed | 35144 | -| total_timesteps | 530944 | -| train/ | | -| approx_kl | 0.034065392 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 41470 | -| policy_gradient_loss | -0.0187 | -| std | 0.403 | -| value_loss | 5.08e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4149 | -| time_elapsed | 35147 | -| total_timesteps | 531072 | -| train/ | | -| approx_kl | 0.021432498 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 41480 | -| policy_gradient_loss | -0.0084 | -| std | 0.404 | -| value_loss | 5.51e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4150 | -| time_elapsed | 35152 | -| total_timesteps | 531200 | -| train/ | | -| approx_kl | 0.029114226 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.512 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 41490 | -| policy_gradient_loss | -0.0139 | -| std | 0.404 | -| value_loss | 0.000453 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4151 | -| time_elapsed | 35155 | -| total_timesteps | 531328 | -| train/ | | -| approx_kl | 0.007186888 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.512 | -| explained_variance | -1.54e+03 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 41500 | -| policy_gradient_loss | -0.0035 | -| std | 0.404 | -| value_loss | 8.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4152 | -| time_elapsed | 35158 | -| total_timesteps | 531456 | -| train/ | | -| approx_kl | 0.022032222 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -0.513 | -| explained_variance | -1.17e+03 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 41510 | -| policy_gradient_loss | -0.00146 | -| std | 0.404 | -| value_loss | 6.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4153 | -| time_elapsed | 35160 | -| total_timesteps | 531584 | -| train/ | | -| approx_kl | 0.010245315 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -3.38 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 41520 | -| policy_gradient_loss | -0.00137 | -| std | 0.403 | -| value_loss | 9.39e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4154 | -| time_elapsed | 35164 | -| total_timesteps | 531712 | -| train/ | | -| approx_kl | 0.0050232895 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 41530 | -| policy_gradient_loss | -0.00269 | -| std | 0.403 | -| value_loss | 5.97e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4155 | -| time_elapsed | 35168 | -| total_timesteps | 531840 | -| train/ | | -| approx_kl | 0.00035450072 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 41540 | -| policy_gradient_loss | 0.00212 | -| std | 0.403 | -| value_loss | 2.59e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 15 | -| iterations | 4156 | -| time_elapsed | 35172 | -| total_timesteps | 531968 | -| train/ | | -| approx_kl | 0.019770253 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -2.34e-05 | -| n_updates | 41550 | -| policy_gradient_loss | -0.00274 | -| std | 0.403 | -| value_loss | 6.58e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4157 | -| time_elapsed | 35177 | -| total_timesteps | 532096 | -| train/ | | -| approx_kl | 0.0096149985 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -0.00301 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 41560 | -| policy_gradient_loss | -0.00191 | -| std | 0.403 | -| value_loss | 7.46e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4158 | -| time_elapsed | 35186 | -| total_timesteps | 532224 | -| train/ | | -| approx_kl | 0.0072534345 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 41570 | -| policy_gradient_loss | -0.00531 | -| std | 0.402 | -| value_loss | 0.00338 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4159 | -| time_elapsed | 35189 | -| total_timesteps | 532352 | -| train/ | | -| approx_kl | 0.0017898032 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -136 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 41580 | -| policy_gradient_loss | -0.000262 | -| std | 0.401 | -| value_loss | 5.3e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4160 | -| time_elapsed | 35193 | -| total_timesteps | 532480 | -| train/ | | -| approx_kl | 0.0258666 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -156 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 41590 | -| policy_gradient_loss | -0.0144 | -| std | 0.4 | -| value_loss | 3.15e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4161 | -| time_elapsed | 35197 | -| total_timesteps | 532608 | -| train/ | | -| approx_kl | 0.0119090155 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 41600 | -| policy_gradient_loss | -0.00144 | -| std | 0.401 | -| value_loss | 1.31e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4162 | -| time_elapsed | 35201 | -| total_timesteps | 532736 | -| train/ | | -| approx_kl | 0.010164453 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -2.84 | -| learning_rate | 0.0003 | -| loss | -0.00055 | -| n_updates | 41610 | -| policy_gradient_loss | -0.000715 | -| std | 0.402 | -| value_loss | 3.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4163 | -| time_elapsed | 35204 | -| total_timesteps | 532864 | -| train/ | | -| approx_kl | 0.008229118 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | -0.000403 | -| n_updates | 41620 | -| policy_gradient_loss | -0.000833 | -| std | 0.402 | -| value_loss | 2.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 15 | -| iterations | 4164 | -| time_elapsed | 35208 | -| total_timesteps | 532992 | -| train/ | | -| approx_kl | 0.015177533 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 41630 | -| policy_gradient_loss | -0.00336 | -| std | 0.402 | -| value_loss | 1.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4165 | -| time_elapsed | 35212 | -| total_timesteps | 533120 | -| train/ | | -| approx_kl | 0.014122495 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 41640 | -| policy_gradient_loss | -0.00329 | -| std | 0.402 | -| value_loss | 6.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4166 | -| time_elapsed | 35221 | -| total_timesteps | 533248 | -| train/ | | -| approx_kl | 0.018552732 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | 0.661 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 41650 | -| policy_gradient_loss | -0.0057 | -| std | 0.403 | -| value_loss | 0.000995 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4167 | -| time_elapsed | 35224 | -| total_timesteps | 533376 | -| train/ | | -| approx_kl | 4.2156084e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -315 | -| learning_rate | 0.0003 | -| loss | 0.000445 | -| n_updates | 41660 | -| policy_gradient_loss | 0.0019 | -| std | 0.402 | -| value_loss | 2.87e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4168 | -| time_elapsed | 35227 | -| total_timesteps | 533504 | -| train/ | | -| approx_kl | 0.0051431637 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -392 | -| learning_rate | 0.0003 | -| loss | 0.000118 | -| n_updates | 41670 | -| policy_gradient_loss | 4.76e-05 | -| std | 0.401 | -| value_loss | 9.63e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4169 | -| time_elapsed | 35231 | -| total_timesteps | 533632 | -| train/ | | -| approx_kl | 0.019374628 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -7.2 | -| learning_rate | 0.0003 | -| loss | -0.00569 | -| n_updates | 41680 | -| policy_gradient_loss | -0.0041 | -| std | 0.401 | -| value_loss | 2.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4170 | -| time_elapsed | 35234 | -| total_timesteps | 533760 | -| train/ | | -| approx_kl | 0.004136738 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -355 | -| learning_rate | 0.0003 | -| loss | -0.00896 | -| n_updates | 41690 | -| policy_gradient_loss | -0.00205 | -| std | 0.4 | -| value_loss | 9.66e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4171 | -| time_elapsed | 35237 | -| total_timesteps | 533888 | -| train/ | | -| approx_kl | 0.00035668816 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.503 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 41700 | -| policy_gradient_loss | 0.00313 | -| std | 0.4 | -| value_loss | 4.77e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4172 | -| time_elapsed | 35240 | -| total_timesteps | 534016 | -| train/ | | -| approx_kl | 0.001261594 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -50 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 41710 | -| policy_gradient_loss | 0.000353 | -| std | 0.4 | -| value_loss | 1.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4173 | -| time_elapsed | 35248 | -| total_timesteps | 534144 | -| train/ | | -| approx_kl | 0.0008795073 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.501 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.00419 | -| n_updates | 41720 | -| policy_gradient_loss | 0.000876 | -| std | 0.399 | -| value_loss | 0.000177 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4174 | -| time_elapsed | 35252 | -| total_timesteps | 534272 | -| train/ | | -| approx_kl | 0.04307659 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | -0.501 | -| explained_variance | -80.7 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 41730 | -| policy_gradient_loss | -0.0145 | -| std | 0.399 | -| value_loss | 2.93e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4175 | -| time_elapsed | 35255 | -| total_timesteps | 534400 | -| train/ | | -| approx_kl | 0.0060685147 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.501 | -| explained_variance | -61.8 | -| learning_rate | 0.0003 | -| loss | -0.00358 | -| n_updates | 41740 | -| policy_gradient_loss | -0.00093 | -| std | 0.4 | -| value_loss | 7.83e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4176 | -| time_elapsed | 35260 | -| total_timesteps | 534528 | -| train/ | | -| approx_kl | 0.019768663 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -0.408 | -| learning_rate | 0.0003 | -| loss | 0.00529 | -| n_updates | 41750 | -| policy_gradient_loss | 0.00103 | -| std | 0.401 | -| value_loss | 6.4e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4177 | -| time_elapsed | 35264 | -| total_timesteps | 534656 | -| train/ | | -| approx_kl | 0.00914433 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | -0.722 | -| learning_rate | 0.0003 | -| loss | -0.00494 | -| n_updates | 41760 | -| policy_gradient_loss | -0.00195 | -| std | 0.402 | -| value_loss | 6.92e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4178 | -| time_elapsed | 35266 | -| total_timesteps | 534784 | -| train/ | | -| approx_kl | 0.0012990865 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | 0.0045 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 41770 | -| policy_gradient_loss | 8.85e-06 | -| std | 0.403 | -| value_loss | 3.7e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4179 | -| time_elapsed | 35270 | -| total_timesteps | 534912 | -| train/ | | -| approx_kl | 0.023049071 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 41780 | -| policy_gradient_loss | -0.00903 | -| std | 0.403 | -| value_loss | 3.14e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4180 | -| time_elapsed | 35274 | -| total_timesteps | 535040 | -| train/ | | -| approx_kl | 0.011603051 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -0.00125 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 41790 | -| policy_gradient_loss | -0.00237 | -| std | 0.402 | -| value_loss | 1.99e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4181 | -| time_elapsed | 35281 | -| total_timesteps | 535168 | -| train/ | | -| approx_kl | 0.01425217 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | 0.953 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 41800 | -| policy_gradient_loss | -0.00788 | -| std | 0.402 | -| value_loss | 0.000509 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4182 | -| time_elapsed | 35284 | -| total_timesteps | 535296 | -| train/ | | -| approx_kl | 0.004097793 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -1.7e+03 | -| learning_rate | 0.0003 | -| loss | -0.00738 | -| n_updates | 41810 | -| policy_gradient_loss | -0.00139 | -| std | 0.402 | -| value_loss | 2.64e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4183 | -| time_elapsed | 35287 | -| total_timesteps | 535424 | -| train/ | | -| approx_kl | 0.03384985 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -589 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 41820 | -| policy_gradient_loss | -0.0113 | -| std | 0.402 | -| value_loss | 1.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4184 | -| time_elapsed | 35290 | -| total_timesteps | 535552 | -| train/ | | -| approx_kl | 0.010165368 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 41830 | -| policy_gradient_loss | -0.00107 | -| std | 0.402 | -| value_loss | 5.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4185 | -| time_elapsed | 35293 | -| total_timesteps | 535680 | -| train/ | | -| approx_kl | 0.019314162 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -7.31 | -| learning_rate | 0.0003 | -| loss | -0.000548 | -| n_updates | 41840 | -| policy_gradient_loss | -0.00163 | -| std | 0.401 | -| value_loss | 6.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4186 | -| time_elapsed | 35296 | -| total_timesteps | 535808 | -| train/ | | -| approx_kl | 0.017872432 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.00667 | -| n_updates | 41850 | -| policy_gradient_loss | -0.00585 | -| std | 0.401 | -| value_loss | 3.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4187 | -| time_elapsed | 35298 | -| total_timesteps | 535936 | -| train/ | | -| approx_kl | 0.008796207 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | -0.000243 | -| n_updates | 41860 | -| policy_gradient_loss | -0.00065 | -| std | 0.401 | -| value_loss | 1.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4188 | -| time_elapsed | 35300 | -| total_timesteps | 536064 | -| train/ | | -| approx_kl | 0.016293516 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 41870 | -| policy_gradient_loss | -0.0106 | -| std | 0.401 | -| value_loss | 3.98e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4189 | -| time_elapsed | 35306 | -| total_timesteps | 536192 | -| train/ | | -| approx_kl | 0.0037693898 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.00594 | -| n_updates | 41880 | -| policy_gradient_loss | -0.00136 | -| std | 0.401 | -| value_loss | 0.000344 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4190 | -| time_elapsed | 35310 | -| total_timesteps | 536320 | -| train/ | | -| approx_kl | 0.0003559189 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -2e+03 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 41890 | -| policy_gradient_loss | 0.00343 | -| std | 0.4 | -| value_loss | 1.49e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4191 | -| time_elapsed | 35314 | -| total_timesteps | 536448 | -| train/ | | -| approx_kl | 0.04401113 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | -0.503 | -| explained_variance | -841 | -| learning_rate | 0.0003 | -| loss | -0.00944 | -| n_updates | 41900 | -| policy_gradient_loss | -0.00701 | -| std | 0.4 | -| value_loss | 5.33e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4192 | -| time_elapsed | 35318 | -| total_timesteps | 536576 | -| train/ | | -| approx_kl | 0.0043443358 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -25.1 | -| learning_rate | 0.0003 | -| loss | -0.00923 | -| n_updates | 41910 | -| policy_gradient_loss | -0.00243 | -| std | 0.4 | -| value_loss | 1.14e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4193 | -| time_elapsed | 35321 | -| total_timesteps | 536704 | -| train/ | | -| approx_kl | 0.00029730168 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -5.84 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 41920 | -| policy_gradient_loss | 0.0015 | -| std | 0.4 | -| value_loss | 5.7e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4194 | -| time_elapsed | 35324 | -| total_timesteps | 536832 | -| train/ | | -| approx_kl | 0.0011684203 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -0.67 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 41930 | -| policy_gradient_loss | 0.000588 | -| std | 0.4 | -| value_loss | 3.32e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4195 | -| time_elapsed | 35327 | -| total_timesteps | 536960 | -| train/ | | -| approx_kl | 0.00913491 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -0.00227 | -| learning_rate | 0.0003 | -| loss | 0.000439 | -| n_updates | 41940 | -| policy_gradient_loss | 2e-05 | -| std | 0.4 | -| value_loss | 1.25e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4196 | -| time_elapsed | 35330 | -| total_timesteps | 537088 | -| train/ | | -| approx_kl | 0.0015819347 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | 0.00486 | -| learning_rate | 0.0003 | -| loss | 1.17e-05 | -| n_updates | 41950 | -| policy_gradient_loss | 7.06e-06 | -| std | 0.399 | -| value_loss | 1.89e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4197 | -| time_elapsed | 35337 | -| total_timesteps | 537216 | -| train/ | | -| approx_kl | 0.0008313975 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.5 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.000225 | -| n_updates | 41960 | -| policy_gradient_loss | -0.000192 | -| std | 0.398 | -| value_loss | 0.00067 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4198 | -| time_elapsed | 35340 | -| total_timesteps | 537344 | -| train/ | | -| approx_kl | 0.009749956 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | -5.9e+03 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 41970 | -| policy_gradient_loss | -0.00712 | -| std | 0.397 | -| value_loss | 2.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4199 | -| time_elapsed | 35344 | -| total_timesteps | 537472 | -| train/ | | -| approx_kl | 0.008099065 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.495 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | 0.000271 | -| n_updates | 41980 | -| policy_gradient_loss | 2.87e-05 | -| std | 0.397 | -| value_loss | 0.000162 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4200 | -| time_elapsed | 35347 | -| total_timesteps | 537600 | -| train/ | | -| approx_kl | 0.017189313 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.496 | -| explained_variance | -4.32 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 41990 | -| policy_gradient_loss | -0.00603 | -| std | 0.397 | -| value_loss | 0.000185 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4201 | -| time_elapsed | 35350 | -| total_timesteps | 537728 | -| train/ | | -| approx_kl | 0.021234188 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | -0.554 | -| learning_rate | 0.0003 | -| loss | -0.00671 | -| n_updates | 42000 | -| policy_gradient_loss | -0.00691 | -| std | 0.398 | -| value_loss | 0.000135 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4202 | -| time_elapsed | 35352 | -| total_timesteps | 537856 | -| train/ | | -| approx_kl | 0.015426034 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | -6.32 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 42010 | -| policy_gradient_loss | -0.00163 | -| std | 0.398 | -| value_loss | 7.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 15 | -| iterations | 4203 | -| time_elapsed | 35354 | -| total_timesteps | 537984 | -| train/ | | -| approx_kl | 0.023251787 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.496 | -| explained_variance | -0.0728 | -| learning_rate | 0.0003 | -| loss | -0.00637 | -| n_updates | 42020 | -| policy_gradient_loss | -0.00681 | -| std | 0.397 | -| value_loss | 7.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4204 | -| time_elapsed | 35357 | -| total_timesteps | 538112 | -| train/ | | -| approx_kl | 0.009086647 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.495 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.000481 | -| n_updates | 42030 | -| policy_gradient_loss | -0.00112 | -| std | 0.396 | -| value_loss | 3.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4205 | -| time_elapsed | 35365 | -| total_timesteps | 538240 | -| train/ | | -| approx_kl | 6.905524e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | -5.58 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 42040 | -| policy_gradient_loss | 2.83e-05 | -| std | 0.396 | -| value_loss | 0.00566 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4206 | -| time_elapsed | 35369 | -| total_timesteps | 538368 | -| train/ | | -| approx_kl | 0.015285246 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.494 | -| explained_variance | -2.11e+03 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 42050 | -| policy_gradient_loss | -0.00854 | -| std | 0.397 | -| value_loss | 6.88e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4207 | -| time_elapsed | 35373 | -| total_timesteps | 538496 | -| train/ | | -| approx_kl | 0.0013243405 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.494 | -| explained_variance | -165 | -| learning_rate | 0.0003 | -| loss | 0.000251 | -| n_updates | 42060 | -| policy_gradient_loss | 0.000199 | -| std | 0.396 | -| value_loss | 1.27e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4208 | -| time_elapsed | 35376 | -| total_timesteps | 538624 | -| train/ | | -| approx_kl | 0.014602516 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 42070 | -| policy_gradient_loss | -0.0109 | -| std | 0.396 | -| value_loss | 5.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4209 | -| time_elapsed | 35381 | -| total_timesteps | 538752 | -| train/ | | -| approx_kl | 0.003915476 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | -0.576 | -| learning_rate | 0.0003 | -| loss | -8.05e-05 | -| n_updates | 42080 | -| policy_gradient_loss | -9.81e-05 | -| std | 0.397 | -| value_loss | 7.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 15 | -| iterations | 4210 | -| time_elapsed | 35385 | -| total_timesteps | 538880 | -| train/ | | -| approx_kl | 0.017181655 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.494 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 42090 | -| policy_gradient_loss | -0.00454 | -| std | 0.396 | -| value_loss | 4.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4211 | -| time_elapsed | 35388 | -| total_timesteps | 539008 | -| train/ | | -| approx_kl | 0.0056338105 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.492 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.000491 | -| n_updates | 42100 | -| policy_gradient_loss | -0.000494 | -| std | 0.395 | -| value_loss | 3.32e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4212 | -| time_elapsed | 35397 | -| total_timesteps | 539136 | -| train/ | | -| approx_kl | 0.018249277 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.491 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 42110 | -| policy_gradient_loss | -0.0072 | -| std | 0.395 | -| value_loss | 0.00209 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4213 | -| time_elapsed | 35399 | -| total_timesteps | 539264 | -| train/ | | -| approx_kl | 0.00078760786 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.49 | -| explained_variance | -4.97 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 42120 | -| policy_gradient_loss | 0.00113 | -| std | 0.395 | -| value_loss | 1.16e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4214 | -| time_elapsed | 35402 | -| total_timesteps | 539392 | -| train/ | | -| approx_kl | 0.04480766 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | -0.49 | -| explained_variance | -43.2 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 42130 | -| policy_gradient_loss | -0.00633 | -| std | 0.395 | -| value_loss | 1.18e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4215 | -| time_elapsed | 35404 | -| total_timesteps | 539520 | -| train/ | | -| approx_kl | 0.0062599033 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.492 | -| explained_variance | -4.91 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 42140 | -| policy_gradient_loss | -0.000631 | -| std | 0.397 | -| value_loss | 1.43e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4216 | -| time_elapsed | 35407 | -| total_timesteps | 539648 | -| train/ | | -| approx_kl | 0.012103572 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.498 | -| explained_variance | -0.00608 | -| learning_rate | 0.0003 | -| loss | -0.0062 | -| n_updates | 42150 | -| policy_gradient_loss | -0.00275 | -| std | 0.399 | -| value_loss | 1.23e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4217 | -| time_elapsed | 35409 | -| total_timesteps | 539776 | -| train/ | | -| approx_kl | 0.0151745 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | -0.5 | -| explained_variance | -0.00915 | -| learning_rate | 0.0003 | -| loss | -0.000507 | -| n_updates | 42160 | -| policy_gradient_loss | -0.00195 | -| std | 0.399 | -| value_loss | 5.12e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4218 | -| time_elapsed | 35412 | -| total_timesteps | 539904 | -| train/ | | -| approx_kl | 0.0111595765 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.498 | -| explained_variance | 0.0055 | -| learning_rate | 0.0003 | -| loss | -0.00894 | -| n_updates | 42170 | -| policy_gradient_loss | -0.0041 | -| std | 0.398 | -| value_loss | 3.98e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4219 | -| time_elapsed | 35416 | -| total_timesteps | 540032 | -| train/ | | -| approx_kl | 0.0013751921 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | 0.00036 | -| n_updates | 42180 | -| policy_gradient_loss | 0.00027 | -| std | 0.398 | -| value_loss | 3.55e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4220 | -| time_elapsed | 35425 | -| total_timesteps | 540160 | -| train/ | | -| approx_kl | 2.3145927e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | 3.15e-05 | -| n_updates | 42190 | -| policy_gradient_loss | 4.66e-06 | -| std | 0.398 | -| value_loss | 0.000102 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4221 | -| time_elapsed | 35428 | -| total_timesteps | 540288 | -| train/ | | -| approx_kl | 0.018028941 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.498 | -| explained_variance | -1.81e+03 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 42200 | -| policy_gradient_loss | -0.00688 | -| std | 0.398 | -| value_loss | 4.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4222 | -| time_elapsed | 35431 | -| total_timesteps | 540416 | -| train/ | | -| approx_kl | 0.028854104 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | -0.498 | -| explained_variance | -7.64e+03 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 42210 | -| policy_gradient_loss | -0.0136 | -| std | 0.398 | -| value_loss | 1.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4223 | -| time_elapsed | 35434 | -| total_timesteps | 540544 | -| train/ | | -| approx_kl | 0.01171995 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.499 | -| explained_variance | -25.4 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 42220 | -| policy_gradient_loss | -0.00846 | -| std | 0.399 | -| value_loss | 5.45e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4224 | -| time_elapsed | 35436 | -| total_timesteps | 540672 | -| train/ | | -| approx_kl | 0.0003067907 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.5 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 42230 | -| policy_gradient_loss | 0.00127 | -| std | 0.399 | -| value_loss | 7.15e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4225 | -| time_elapsed | 35439 | -| total_timesteps | 540800 | -| train/ | | -| approx_kl | 0.0011367672 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.5 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.0059 | -| n_updates | 42240 | -| policy_gradient_loss | 0.000536 | -| std | 0.399 | -| value_loss | 8.47e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4226 | -| time_elapsed | 35442 | -| total_timesteps | 540928 | -| train/ | | -| approx_kl | 0.029555064 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.5 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 42250 | -| policy_gradient_loss | -0.00891 | -| std | 0.399 | -| value_loss | 7.44e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4227 | -| time_elapsed | 35444 | -| total_timesteps | 541056 | -| train/ | | -| approx_kl | 0.00960302 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.501 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | -0.000111 | -| n_updates | 42260 | -| policy_gradient_loss | -0.000982 | -| std | 0.4 | -| value_loss | 8.96e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4228 | -| time_elapsed | 35450 | -| total_timesteps | 541184 | -| train/ | | -| approx_kl | 0.013477052 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 42270 | -| policy_gradient_loss | -0.00429 | -| std | 0.401 | -| value_loss | 0.000131 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4229 | -| time_elapsed | 35454 | -| total_timesteps | 541312 | -| train/ | | -| approx_kl | 0.044173293 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -284 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 42280 | -| policy_gradient_loss | -0.00197 | -| std | 0.401 | -| value_loss | 6.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4230 | -| time_elapsed | 35458 | -| total_timesteps | 541440 | -| train/ | | -| approx_kl | 0.021706041 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -599 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 42290 | -| policy_gradient_loss | -0.00232 | -| std | 0.4 | -| value_loss | 1.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4231 | -| time_elapsed | 35461 | -| total_timesteps | 541568 | -| train/ | | -| approx_kl | 0.003736639 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.503 | -| explained_variance | -9.34 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 42300 | -| policy_gradient_loss | -0.000512 | -| std | 0.4 | -| value_loss | 9.93e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4232 | -| time_elapsed | 35464 | -| total_timesteps | 541696 | -| train/ | | -| approx_kl | 0.043211438 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 42310 | -| policy_gradient_loss | -0.00273 | -| std | 0.4 | -| value_loss | 8.12e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4233 | -| time_elapsed | 35468 | -| total_timesteps | 541824 | -| train/ | | -| approx_kl | 0.00022755447 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.503 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 42320 | -| policy_gradient_loss | 0.00202 | -| std | 0.4 | -| value_loss | 9.63e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 15 | -| iterations | 4234 | -| time_elapsed | 35471 | -| total_timesteps | 541952 | -| train/ | | -| approx_kl | 0.0011912277 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 42330 | -| policy_gradient_loss | 0.000176 | -| std | 0.401 | -| value_loss | 2.04e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4235 | -| time_elapsed | 35475 | -| total_timesteps | 542080 | -| train/ | | -| approx_kl | 0.0008177955 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -5.85 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 42340 | -| policy_gradient_loss | 0.000508 | -| std | 0.401 | -| value_loss | 4.23e-12 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4236 | -| time_elapsed | 35481 | -| total_timesteps | 542208 | -| train/ | | -| approx_kl | 0.033041142 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 42350 | -| policy_gradient_loss | -0.0126 | -| std | 0.401 | -| value_loss | 0.00197 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4237 | -| time_elapsed | 35483 | -| total_timesteps | 542336 | -| train/ | | -| approx_kl | 0.011636327 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -1.03e+03 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 42360 | -| policy_gradient_loss | -0.00127 | -| std | 0.402 | -| value_loss | 5.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4238 | -| time_elapsed | 35486 | -| total_timesteps | 542464 | -| train/ | | -| approx_kl | 0.029520817 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -3.83e+03 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 42370 | -| policy_gradient_loss | -0.00926 | -| std | 0.402 | -| value_loss | 2.35e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4239 | -| time_elapsed | 35489 | -| total_timesteps | 542592 | -| train/ | | -| approx_kl | 0.01767269 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -99.8 | -| learning_rate | 0.0003 | -| loss | -0.00834 | -| n_updates | 42380 | -| policy_gradient_loss | -0.0038 | -| std | 0.403 | -| value_loss | 7.35e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4240 | -| time_elapsed | 35492 | -| total_timesteps | 542720 | -| train/ | | -| approx_kl | 2.7441885e-05 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -16.5 | -| learning_rate | 0.0003 | -| loss | 0.000686 | -| n_updates | 42390 | -| policy_gradient_loss | 0.00438 | -| std | 0.403 | -| value_loss | 2.25e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4241 | -| time_elapsed | 35495 | -| total_timesteps | 542848 | -| train/ | | -| approx_kl | 0.0016911859 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.00661 | -| n_updates | 42400 | -| policy_gradient_loss | -0.000317 | -| std | 0.404 | -| value_loss | 5.47e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 15 | -| iterations | 4242 | -| time_elapsed | 35499 | -| total_timesteps | 542976 | -| train/ | | -| approx_kl | 0.0005773646 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.512 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 42410 | -| policy_gradient_loss | 0.000478 | -| std | 0.403 | -| value_loss | 1.29e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4243 | -| time_elapsed | 35503 | -| total_timesteps | 543104 | -| train/ | | -| approx_kl | 0.014311745 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | -0.000305 | -| n_updates | 42420 | -| policy_gradient_loss | -0.00111 | -| std | 0.403 | -| value_loss | 1.24e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4244 | -| time_elapsed | 35510 | -| total_timesteps | 543232 | -| train/ | | -| approx_kl | 0.010931276 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.00981 | -| n_updates | 42430 | -| policy_gradient_loss | -0.00362 | -| std | 0.403 | -| value_loss | 0.000773 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4245 | -| time_elapsed | 35514 | -| total_timesteps | 543360 | -| train/ | | -| approx_kl | 2.8196257e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -144 | -| learning_rate | 0.0003 | -| loss | -0.000857 | -| n_updates | 42440 | -| policy_gradient_loss | 0.00339 | -| std | 0.403 | -| value_loss | 1.03e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4246 | -| time_elapsed | 35518 | -| total_timesteps | 543488 | -| train/ | | -| approx_kl | 0.04265758 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -151 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 42450 | -| policy_gradient_loss | -0.00358 | -| std | 0.403 | -| value_loss | 4.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4247 | -| time_elapsed | 35523 | -| total_timesteps | 543616 | -| train/ | | -| approx_kl | 0.033708498 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | -0.51 | -| explained_variance | -6.51 | -| learning_rate | 0.0003 | -| loss | -0.00817 | -| n_updates | 42460 | -| policy_gradient_loss | -0.00742 | -| std | 0.403 | -| value_loss | 4.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4248 | -| time_elapsed | 35526 | -| total_timesteps | 543744 | -| train/ | | -| approx_kl | 0.007617304 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 42470 | -| policy_gradient_loss | -0.000791 | -| std | 0.403 | -| value_loss | 7.97e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4249 | -| time_elapsed | 35529 | -| total_timesteps | 543872 | -| train/ | | -| approx_kl | 0.004117211 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.511 | -| explained_variance | 0.00528 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 42480 | -| policy_gradient_loss | -0.00184 | -| std | 0.404 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4250 | -| time_elapsed | 35532 | -| total_timesteps | 544000 | -| train/ | | -| approx_kl | 0.015968623 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.514 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 42490 | -| policy_gradient_loss | -1.77e-05 | -| std | 0.405 | -| value_loss | 6.99e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4251 | -| time_elapsed | 35535 | -| total_timesteps | 544128 | -| train/ | | -| approx_kl | 0.008329719 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -0.00247 | -| learning_rate | 0.0003 | -| loss | -7.71e-05 | -| n_updates | 42500 | -| policy_gradient_loss | -0.000952 | -| std | 0.406 | -| value_loss | 2.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4252 | -| time_elapsed | 35541 | -| total_timesteps | 544256 | -| train/ | | -| approx_kl | 0.030132996 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 42510 | -| policy_gradient_loss | -0.00644 | -| std | 0.407 | -| value_loss | 6.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4253 | -| time_elapsed | 35545 | -| total_timesteps | 544384 | -| train/ | | -| approx_kl | 0.077699535 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -70.4 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 42520 | -| policy_gradient_loss | -0.00657 | -| std | 0.407 | -| value_loss | 1.57e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4254 | -| time_elapsed | 35549 | -| total_timesteps | 544512 | -| train/ | | -| approx_kl | 0.03924209 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -121 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 42530 | -| policy_gradient_loss | -0.00938 | -| std | 0.407 | -| value_loss | 1.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4255 | -| time_elapsed | 35552 | -| total_timesteps | 544640 | -| train/ | | -| approx_kl | 0.01324019 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00566 | -| n_updates | 42540 | -| policy_gradient_loss | -0.00474 | -| std | 0.407 | -| value_loss | 8.59e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4256 | -| time_elapsed | 35555 | -| total_timesteps | 544768 | -| train/ | | -| approx_kl | 0.012062692 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.519 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 42550 | -| policy_gradient_loss | -0.00137 | -| std | 0.406 | -| value_loss | 4.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4257 | -| time_elapsed | 35558 | -| total_timesteps | 544896 | -| train/ | | -| approx_kl | 0.010842023 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -0.646 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 42560 | -| policy_gradient_loss | -0.00662 | -| std | 0.406 | -| value_loss | 1.98e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4258 | -| time_elapsed | 35562 | -| total_timesteps | 545024 | -| train/ | | -| approx_kl | 0.0019240933 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.518 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 42570 | -| policy_gradient_loss | -0.000236 | -| std | 0.407 | -| value_loss | 1.87e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4259 | -| time_elapsed | 35570 | -| total_timesteps | 545152 | -| train/ | | -| approx_kl | 0.03965001 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | 0.247 | -| learning_rate | 0.0003 | -| loss | -0.00937 | -| n_updates | 42580 | -| policy_gradient_loss | -0.00822 | -| std | 0.407 | -| value_loss | 0.00127 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4260 | -| time_elapsed | 35574 | -| total_timesteps | 545280 | -| train/ | | -| approx_kl | 0.010748952 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.521 | -| explained_variance | -988 | -| learning_rate | 0.0003 | -| loss | -0.00905 | -| n_updates | 42590 | -| policy_gradient_loss | -0.00317 | -| std | 0.407 | -| value_loss | 2.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4261 | -| time_elapsed | 35577 | -| total_timesteps | 545408 | -| train/ | | -| approx_kl | 0.053413495 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | -0.52 | -| explained_variance | -3.96e+03 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 42600 | -| policy_gradient_loss | -0.00582 | -| std | 0.407 | -| value_loss | 1.03e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4262 | -| time_elapsed | 35581 | -| total_timesteps | 545536 | -| train/ | | -| approx_kl | 0.00043851277 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.517 | -| explained_variance | -190 | -| learning_rate | 0.0003 | -| loss | -0.000349 | -| n_updates | 42610 | -| policy_gradient_loss | 7.87e-05 | -| std | 0.405 | -| value_loss | 2.43e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4263 | -| time_elapsed | 35584 | -| total_timesteps | 545664 | -| train/ | | -| approx_kl | 0.009459209 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.512 | -| explained_variance | -22.4 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 42620 | -| policy_gradient_loss | -0.00211 | -| std | 0.402 | -| value_loss | 8.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4264 | -| time_elapsed | 35587 | -| total_timesteps | 545792 | -| train/ | | -| approx_kl | 0.030416792 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -3.53 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 42630 | -| policy_gradient_loss | -0.00853 | -| std | 0.402 | -| value_loss | 2.86e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4265 | -| time_elapsed | 35590 | -| total_timesteps | 545920 | -| train/ | | -| approx_kl | 0.00015598489 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | 0.000117 | -| n_updates | 42640 | -| policy_gradient_loss | 0.00027 | -| std | 0.401 | -| value_loss | 3.69e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4266 | -| time_elapsed | 35595 | -| total_timesteps | 546048 | -| train/ | | -| approx_kl | 0.004919437 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 42650 | -| policy_gradient_loss | -0.00116 | -| std | 0.399 | -| value_loss | 3.3e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4267 | -| time_elapsed | 35602 | -| total_timesteps | 546176 | -| train/ | | -| approx_kl | 0.0067320364 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.499 | -| explained_variance | 0.57 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 42660 | -| policy_gradient_loss | -0.000935 | -| std | 0.399 | -| value_loss | 0.000703 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4268 | -| time_elapsed | 35606 | -| total_timesteps | 546304 | -| train/ | | -| approx_kl | 0.064205356 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.5 | -| explained_variance | -997 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 42670 | -| policy_gradient_loss | -0.0104 | -| std | 0.399 | -| value_loss | 3.5e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4269 | -| time_elapsed | 35609 | -| total_timesteps | 546432 | -| train/ | | -| approx_kl | 0.0010322621 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.499 | -| explained_variance | -4.01e+03 | -| learning_rate | 0.0003 | -| loss | 0.000464 | -| n_updates | 42680 | -| policy_gradient_loss | 0.000628 | -| std | 0.398 | -| value_loss | 8.79e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4270 | -| time_elapsed | 35612 | -| total_timesteps | 546560 | -| train/ | | -| approx_kl | 0.022848023 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | -1.73e+03 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 42690 | -| policy_gradient_loss | -0.0106 | -| std | 0.397 | -| value_loss | 1.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4271 | -| time_elapsed | 35615 | -| total_timesteps | 546688 | -| train/ | | -| approx_kl | 0.019390529 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.496 | -| explained_variance | -562 | -| learning_rate | 0.0003 | -| loss | -0.00443 | -| n_updates | 42700 | -| policy_gradient_loss | -0.00275 | -| std | 0.397 | -| value_loss | 2.07e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4272 | -| time_elapsed | 35618 | -| total_timesteps | 546816 | -| train/ | | -| approx_kl | 0.013415659 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.496 | -| explained_variance | -248 | -| learning_rate | 0.0003 | -| loss | -0.000656 | -| n_updates | 42710 | -| policy_gradient_loss | -0.000811 | -| std | 0.397 | -| value_loss | 1.11e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 15 | -| iterations | 4273 | -| time_elapsed | 35621 | -| total_timesteps | 546944 | -| train/ | | -| approx_kl | 0.012159409 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.495 | -| explained_variance | -0.833 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 42720 | -| policy_gradient_loss | -0.00269 | -| std | 0.396 | -| value_loss | 3.07e-12 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4274 | -| time_elapsed | 35624 | -| total_timesteps | 547072 | -| train/ | | -| approx_kl | 0.013332138 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | -3.52 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 42730 | -| policy_gradient_loss | -0.00945 | -| std | 0.396 | -| value_loss | 1.58e-12 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4275 | -| time_elapsed | 35630 | -| total_timesteps | 547200 | -| train/ | | -| approx_kl | 0.0070960233 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 42740 | -| policy_gradient_loss | -0.0049 | -| std | 0.396 | -| value_loss | 0.000106 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4276 | -| time_elapsed | 35633 | -| total_timesteps | 547328 | -| train/ | | -| approx_kl | 0.00024152291 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | -218 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 42750 | -| policy_gradient_loss | 0.00148 | -| std | 0.396 | -| value_loss | 5.93e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4277 | -| time_elapsed | 35637 | -| total_timesteps | 547456 | -| train/ | | -| approx_kl | 0.0014407928 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.494 | -| explained_variance | -277 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 42760 | -| policy_gradient_loss | 5.13e-05 | -| std | 0.397 | -| value_loss | 2.38e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4278 | -| time_elapsed | 35641 | -| total_timesteps | 547584 | -| train/ | | -| approx_kl | 0.012465237 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.497 | -| explained_variance | -16.4 | -| learning_rate | 0.0003 | -| loss | -0.000788 | -| n_updates | 42770 | -| policy_gradient_loss | -0.000502 | -| std | 0.399 | -| value_loss | 1.83e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4279 | -| time_elapsed | 35645 | -| total_timesteps | 547712 | -| train/ | | -| approx_kl | 0.0091696065 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | 0.00407 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 42780 | -| policy_gradient_loss | -0.00227 | -| std | 0.4 | -| value_loss | 2.86e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4280 | -| time_elapsed | 35648 | -| total_timesteps | 547840 | -| train/ | | -| approx_kl | 0.008419952 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.505 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 42790 | -| policy_gradient_loss | -0.00301 | -| std | 0.402 | -| value_loss | 4e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4281 | -| time_elapsed | 35651 | -| total_timesteps | 547968 | -| train/ | | -| approx_kl | 0.011645046 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | -0.00769 | -| n_updates | 42800 | -| policy_gradient_loss | -0.00595 | -| std | 0.403 | -| value_loss | 6.46e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4282 | -| time_elapsed | 35655 | -| total_timesteps | 548096 | -| train/ | | -| approx_kl | 0.01029397 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.509 | -| explained_variance | 0.00308 | -| learning_rate | 0.0003 | -| loss | -0.000317 | -| n_updates | 42810 | -| policy_gradient_loss | -0.00117 | -| std | 0.402 | -| value_loss | 3.77e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4283 | -| time_elapsed | 35661 | -| total_timesteps | 548224 | -| train/ | | -| approx_kl | 0.001381705 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -5.7 | -| learning_rate | 0.0003 | -| loss | -4.42e-05 | -| n_updates | 42820 | -| policy_gradient_loss | -0.000238 | -| std | 0.402 | -| value_loss | 0.00178 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4284 | -| time_elapsed | 35665 | -| total_timesteps | 548352 | -| train/ | | -| approx_kl | 0.028638456 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | -0.508 | -| explained_variance | -800 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 42830 | -| policy_gradient_loss | -0.00271 | -| std | 0.402 | -| value_loss | 7.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4285 | -| time_elapsed | 35668 | -| total_timesteps | 548480 | -| train/ | | -| approx_kl | 0.004816278 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.507 | -| explained_variance | -511 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 42840 | -| policy_gradient_loss | -0.00301 | -| std | 0.402 | -| value_loss | 1.99e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4286 | -| time_elapsed | 35669 | -| total_timesteps | 548608 | -| train/ | | -| approx_kl | 0.02642363 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.506 | -| explained_variance | -24.9 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 42850 | -| policy_gradient_loss | -0.00167 | -| std | 0.401 | -| value_loss | 8.56e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4287 | -| time_elapsed | 35672 | -| total_timesteps | 548736 | -| train/ | | -| approx_kl | 0.006281387 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.504 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 42860 | -| policy_gradient_loss | -0.000546 | -| std | 0.4 | -| value_loss | 2.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4288 | -| time_elapsed | 35675 | -| total_timesteps | 548864 | -| train/ | | -| approx_kl | 0.002827374 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.502 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 42870 | -| policy_gradient_loss | -0.000589 | -| std | 0.398 | -| value_loss | 3e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4289 | -| time_elapsed | 35678 | -| total_timesteps | 548992 | -| train/ | | -| approx_kl | 0.0005781769 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.496 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | -0.000165 | -| n_updates | 42880 | -| policy_gradient_loss | 2.16e-06 | -| std | 0.396 | -| value_loss | 2.27e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4290 | -| time_elapsed | 35681 | -| total_timesteps | 549120 | -| train/ | | -| approx_kl | 0.008731788 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.491 | -| explained_variance | -0.0621 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 42890 | -| policy_gradient_loss | -0.00365 | -| std | 0.395 | -| value_loss | 1.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4291 | -| time_elapsed | 35692 | -| total_timesteps | 549248 | -| train/ | | -| approx_kl | 0.019602237 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.489 | -| explained_variance | 0.624 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 42900 | -| policy_gradient_loss | -0.00405 | -| std | 0.394 | -| value_loss | 0.00569 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4292 | -| time_elapsed | 35696 | -| total_timesteps | 549376 | -| train/ | | -| approx_kl | 0.019094216 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -924 | -| learning_rate | 0.0003 | -| loss | 0.000548 | -| n_updates | 42910 | -| policy_gradient_loss | 6.98e-05 | -| std | 0.394 | -| value_loss | 1.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4293 | -| time_elapsed | 35699 | -| total_timesteps | 549504 | -| train/ | | -| approx_kl | 0.019151447 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -1.48e+03 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 42920 | -| policy_gradient_loss | -0.00285 | -| std | 0.395 | -| value_loss | 3.94e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4294 | -| time_elapsed | 35703 | -| total_timesteps | 549632 | -| train/ | | -| approx_kl | 0.04063767 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | -0.489 | -| explained_variance | -45.5 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 42930 | -| policy_gradient_loss | -0.0149 | -| std | 0.395 | -| value_loss | 4.54e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4295 | -| time_elapsed | 35707 | -| total_timesteps | 549760 | -| train/ | | -| approx_kl | 0.010305315 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.489 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 42940 | -| policy_gradient_loss | -0.000925 | -| std | 0.394 | -| value_loss | 1.05e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 15 | -| iterations | 4296 | -| time_elapsed | 35710 | -| total_timesteps | 549888 | -| train/ | | -| approx_kl | 0.0043127974 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -0.905 | -| learning_rate | 0.0003 | -| loss | -0.00962 | -| n_updates | 42950 | -| policy_gradient_loss | -0.00203 | -| std | 0.395 | -| value_loss | 1.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4297 | -| time_elapsed | 35714 | -| total_timesteps | 550016 | -| train/ | | -| approx_kl | 0.018382378 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.49 | -| explained_variance | -0.0853 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 42960 | -| policy_gradient_loss | -0.00675 | -| std | 0.395 | -| value_loss | 1.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4298 | -| time_elapsed | 35723 | -| total_timesteps | 550144 | -| train/ | | -| approx_kl | 0.021005701 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -0.49 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 42970 | -| policy_gradient_loss | -0.00223 | -| std | 0.395 | -| value_loss | 0.00023 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4299 | -| time_elapsed | 35727 | -| total_timesteps | 550272 | -| train/ | | -| approx_kl | 0.015678043 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.489 | -| explained_variance | -1.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 42980 | -| policy_gradient_loss | -0.00953 | -| std | 0.394 | -| value_loss | 1.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4300 | -| time_elapsed | 35730 | -| total_timesteps | 550400 | -| train/ | | -| approx_kl | 0.023802115 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.489 | -| explained_variance | -2.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 42990 | -| policy_gradient_loss | -0.0028 | -| std | 0.395 | -| value_loss | 6.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4301 | -| time_elapsed | 35733 | -| total_timesteps | 550528 | -| train/ | | -| approx_kl | 0.03505151 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.49 | -| explained_variance | -30.3 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 43000 | -| policy_gradient_loss | -0.00282 | -| std | 0.396 | -| value_loss | 7.06e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4302 | -| time_elapsed | 35738 | -| total_timesteps | 550656 | -| train/ | | -| approx_kl | 0.0073029203 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.493 | -| explained_variance | -5.72 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 43010 | -| policy_gradient_loss | -0.0039 | -| std | 0.397 | -| value_loss | 3.94e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4303 | -| time_elapsed | 35741 | -| total_timesteps | 550784 | -| train/ | | -| approx_kl | 0.0012270557 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.494 | -| explained_variance | -2.32 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 43020 | -| policy_gradient_loss | 1.8e-05 | -| std | 0.396 | -| value_loss | 7.63e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4304 | -| time_elapsed | 35744 | -| total_timesteps | 550912 | -| train/ | | -| approx_kl | 0.0020427015 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.49 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 43030 | -| policy_gradient_loss | 0.000179 | -| std | 0.394 | -| value_loss | 9.48e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4305 | -| time_elapsed | 35747 | -| total_timesteps | 551040 | -| train/ | | -| approx_kl | 0.024903094 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -0.00812 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 43040 | -| policy_gradient_loss | -0.00551 | -| std | 0.394 | -| value_loss | 2.87e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4306 | -| time_elapsed | 35754 | -| total_timesteps | 551168 | -| train/ | | -| approx_kl | 0.02195041 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | -0.00602 | -| n_updates | 43050 | -| policy_gradient_loss | -0.0037 | -| std | 0.393 | -| value_loss | 0.00433 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4307 | -| time_elapsed | 35758 | -| total_timesteps | 551296 | -| train/ | | -| approx_kl | 0.00016209972 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.485 | -| explained_variance | -3.36e+03 | -| learning_rate | 0.0003 | -| loss | 0.000403 | -| n_updates | 43060 | -| policy_gradient_loss | 0.000948 | -| std | 0.393 | -| value_loss | 1.21e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4308 | -| time_elapsed | 35761 | -| total_timesteps | 551424 | -| train/ | | -| approx_kl | 0.043433025 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.487 | -| explained_variance | -4.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 43070 | -| policy_gradient_loss | -0.00287 | -| std | 0.394 | -| value_loss | 3.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4309 | -| time_elapsed | 35765 | -| total_timesteps | 551552 | -| train/ | | -| approx_kl | 0.010994192 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -0.489 | -| explained_variance | -173 | -| learning_rate | 0.0003 | -| loss | -0.000116 | -| n_updates | 43080 | -| policy_gradient_loss | -0.000274 | -| std | 0.394 | -| value_loss | 5.62e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4310 | -| time_elapsed | 35768 | -| total_timesteps | 551680 | -| train/ | | -| approx_kl | 0.019365996 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.487 | -| explained_variance | -870 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 43090 | -| policy_gradient_loss | -0.00717 | -| std | 0.393 | -| value_loss | 3.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4311 | -| time_elapsed | 35771 | -| total_timesteps | 551808 | -| train/ | | -| approx_kl | 0.032961678 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | -76.1 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 43100 | -| policy_gradient_loss | -0.0123 | -| std | 0.393 | -| value_loss | 3.01e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4312 | -| time_elapsed | 35775 | -| total_timesteps | 551936 | -| train/ | | -| approx_kl | 0.01905495 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | -3.79 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 43110 | -| policy_gradient_loss | -0.0102 | -| std | 0.393 | -| value_loss | 2.41e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4313 | -| time_elapsed | 35778 | -| total_timesteps | 552064 | -| train/ | | -| approx_kl | 0.026761664 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.485 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 43120 | -| policy_gradient_loss | -0.0144 | -| std | 0.393 | -| value_loss | 8.32e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4314 | -| time_elapsed | 35782 | -| total_timesteps | 552192 | -| train/ | | -| approx_kl | 0.034805834 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 43130 | -| policy_gradient_loss | -0.0122 | -| std | 0.393 | -| value_loss | 3.44e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4315 | -| time_elapsed | 35784 | -| total_timesteps | 552320 | -| train/ | | -| approx_kl | 0.029350916 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | -222 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 43140 | -| policy_gradient_loss | -0.00249 | -| std | 0.393 | -| value_loss | 3.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4316 | -| time_elapsed | 35788 | -| total_timesteps | 552448 | -| train/ | | -| approx_kl | 0.034783304 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | -0.485 | -| explained_variance | -237 | -| learning_rate | 0.0003 | -| loss | -0.00853 | -| n_updates | 43150 | -| policy_gradient_loss | -0.00729 | -| std | 0.393 | -| value_loss | 3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4317 | -| time_elapsed | 35791 | -| total_timesteps | 552576 | -| train/ | | -| approx_kl | 0.020459395 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.483 | -| explained_variance | -37.8 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 43160 | -| policy_gradient_loss | -0.00639 | -| std | 0.392 | -| value_loss | 3.49e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4318 | -| time_elapsed | 35795 | -| total_timesteps | 552704 | -| train/ | | -| approx_kl | 0.0053643314 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 43170 | -| policy_gradient_loss | -0.00196 | -| std | 0.391 | -| value_loss | 6.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4319 | -| time_elapsed | 35798 | -| total_timesteps | 552832 | -| train/ | | -| approx_kl | 0.027315738 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.48 | -| explained_variance | -0.607 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 43180 | -| policy_gradient_loss | -0.0131 | -| std | 0.391 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 15 | -| iterations | 4320 | -| time_elapsed | 35802 | -| total_timesteps | 552960 | -| train/ | | -| approx_kl | 0.013187222 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 43190 | -| policy_gradient_loss | -0.00409 | -| std | 0.392 | -| value_loss | 5.07e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4321 | -| time_elapsed | 35805 | -| total_timesteps | 553088 | -| train/ | | -| approx_kl | 0.02366699 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 43200 | -| policy_gradient_loss | -0.00848 | -| std | 0.392 | -| value_loss | 1.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4322 | -| time_elapsed | 35812 | -| total_timesteps | 553216 | -| train/ | | -| approx_kl | 0.007870537 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | 0.878 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 43210 | -| policy_gradient_loss | -0.00676 | -| std | 0.392 | -| value_loss | 0.00211 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4323 | -| time_elapsed | 35816 | -| total_timesteps | 553344 | -| train/ | | -| approx_kl | 0.0028360854 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.483 | -| explained_variance | -790 | -| learning_rate | 0.0003 | -| loss | -0.00858 | -| n_updates | 43220 | -| policy_gradient_loss | -0.00083 | -| std | 0.392 | -| value_loss | 2.62e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4324 | -| time_elapsed | 35819 | -| total_timesteps | 553472 | -| train/ | | -| approx_kl | 0.0004924191 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.484 | -| explained_variance | -6.32e+03 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 43230 | -| policy_gradient_loss | 0.000573 | -| std | 0.393 | -| value_loss | 1.76e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4325 | -| time_elapsed | 35822 | -| total_timesteps | 553600 | -| train/ | | -| approx_kl | 0.0060360543 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.485 | -| explained_variance | -231 | -| learning_rate | 0.0003 | -| loss | 0.000205 | -| n_updates | 43240 | -| policy_gradient_loss | 0.000131 | -| std | 0.394 | -| value_loss | 3.06e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4326 | -| time_elapsed | 35825 | -| total_timesteps | 553728 | -| train/ | | -| approx_kl | 0.020525776 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -45.2 | -| learning_rate | 0.0003 | -| loss | -0.00627 | -| n_updates | 43250 | -| policy_gradient_loss | -0.00363 | -| std | 0.394 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4327 | -| time_elapsed | 35828 | -| total_timesteps | 553856 | -| train/ | | -| approx_kl | 0.023227533 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -13.5 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 43260 | -| policy_gradient_loss | -0.0109 | -| std | 0.394 | -| value_loss | 4.36e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4328 | -| time_elapsed | 35832 | -| total_timesteps | 553984 | -| train/ | | -| approx_kl | 0.01130155 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.488 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 43270 | -| policy_gradient_loss | -0.00223 | -| std | 0.393 | -| value_loss | 5.58e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4329 | -| time_elapsed | 35836 | -| total_timesteps | 554112 | -| train/ | | -| approx_kl | 0.009676365 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.485 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 43280 | -| policy_gradient_loss | -0.00112 | -| std | 0.393 | -| value_loss | 6.27e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4330 | -| time_elapsed | 35845 | -| total_timesteps | 554240 | -| train/ | | -| approx_kl | 0.04047967 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.484 | -| explained_variance | 0.456 | -| learning_rate | 0.0003 | -| loss | -0.00905 | -| n_updates | 43290 | -| policy_gradient_loss | -0.00653 | -| std | 0.392 | -| value_loss | 0.0015 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4331 | -| time_elapsed | 35848 | -| total_timesteps | 554368 | -| train/ | | -| approx_kl | 0.033759005 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.484 | -| explained_variance | -1.27e+03 | -| learning_rate | 0.0003 | -| loss | -0.000415 | -| n_updates | 43300 | -| policy_gradient_loss | -0.00198 | -| std | 0.393 | -| value_loss | 6.58e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4332 | -| time_elapsed | 35851 | -| total_timesteps | 554496 | -| train/ | | -| approx_kl | 0.0073750457 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.485 | -| explained_variance | -3.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 43310 | -| policy_gradient_loss | -0.00146 | -| std | 0.393 | -| value_loss | 1.44e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4333 | -| time_elapsed | 35854 | -| total_timesteps | 554624 | -| train/ | | -| approx_kl | 0.061334655 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | -0.484 | -| explained_variance | -224 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 43320 | -| policy_gradient_loss | -0.0099 | -| std | 0.392 | -| value_loss | 5.82e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4334 | -| time_elapsed | 35858 | -| total_timesteps | 554752 | -| train/ | | -| approx_kl | 0.0012772155 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.483 | -| explained_variance | -81.8 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 43330 | -| policy_gradient_loss | 0.000486 | -| std | 0.392 | -| value_loss | 3.54e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 15 | -| iterations | 4335 | -| time_elapsed | 35862 | -| total_timesteps | 554880 | -| train/ | | -| approx_kl | 0.0008596529 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | -5.3 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 43340 | -| policy_gradient_loss | 0.000408 | -| std | 0.391 | -| value_loss | 8.08e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4336 | -| time_elapsed | 35865 | -| total_timesteps | 555008 | -| train/ | | -| approx_kl | 0.043990403 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | -0.48 | -| explained_variance | -2.02 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 43350 | -| policy_gradient_loss | -0.0109 | -| std | 0.391 | -| value_loss | 1.02e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4337 | -| time_elapsed | 35874 | -| total_timesteps | 555136 | -| train/ | | -| approx_kl | 0.0062924307 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.479 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 43360 | -| policy_gradient_loss | -0.00611 | -| std | 0.39 | -| value_loss | 8.61e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4338 | -| time_elapsed | 35878 | -| total_timesteps | 555264 | -| train/ | | -| approx_kl | 0.00016601966 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.478 | -| explained_variance | -423 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 43370 | -| policy_gradient_loss | 0.00313 | -| std | 0.39 | -| value_loss | 3.49e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4339 | -| time_elapsed | 35882 | -| total_timesteps | 555392 | -| train/ | | -| approx_kl | 0.0015737046 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.477 | -| explained_variance | -7.24 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 43380 | -| policy_gradient_loss | 0.000386 | -| std | 0.39 | -| value_loss | 1.71e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4340 | -| time_elapsed | 35885 | -| total_timesteps | 555520 | -| train/ | | -| approx_kl | 0.00084375264 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.477 | -| explained_variance | -0.333 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 43390 | -| policy_gradient_loss | 0.00178 | -| std | 0.39 | -| value_loss | 5.43e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4341 | -| time_elapsed | 35888 | -| total_timesteps | 555648 | -| train/ | | -| approx_kl | 0.008112986 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.476 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.00015 | -| n_updates | 43400 | -| policy_gradient_loss | 2.68e-05 | -| std | 0.39 | -| value_loss | 1.35e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4342 | -| time_elapsed | 35890 | -| total_timesteps | 555776 | -| train/ | | -| approx_kl | 0.0075801215 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.476 | -| explained_variance | -0.0805 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 43410 | -| policy_gradient_loss | -0.00517 | -| std | 0.39 | -| value_loss | 2.86e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 15 | -| iterations | 4343 | -| time_elapsed | 35893 | -| total_timesteps | 555904 | -| train/ | | -| approx_kl | 0.00014841883 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.477 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 43420 | -| policy_gradient_loss | 0.00296 | -| std | 0.39 | -| value_loss | 3.51e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4344 | -| time_elapsed | 35896 | -| total_timesteps | 556032 | -| train/ | | -| approx_kl | 0.018590761 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | -0.478 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 43430 | -| policy_gradient_loss | -0.00369 | -| std | 0.39 | -| value_loss | 1.55e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4345 | -| time_elapsed | 35903 | -| total_timesteps | 556160 | -| train/ | | -| approx_kl | 0.025983447 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.479 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 43440 | -| policy_gradient_loss | -0.00523 | -| std | 0.39 | -| value_loss | 0.00017 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4346 | -| time_elapsed | 35906 | -| total_timesteps | 556288 | -| train/ | | -| approx_kl | 0.00015537068 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.478 | -| explained_variance | -9.57e+03 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 43450 | -| policy_gradient_loss | 0.00499 | -| std | 0.39 | -| value_loss | 5.66e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4347 | -| time_elapsed | 35910 | -| total_timesteps | 556416 | -| train/ | | -| approx_kl | 0.006285009 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.478 | -| explained_variance | -8.76e+03 | -| learning_rate | 0.0003 | -| loss | 0.000148 | -| n_updates | 43460 | -| policy_gradient_loss | 8.12e-05 | -| std | 0.391 | -| value_loss | 2.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4348 | -| time_elapsed | 35913 | -| total_timesteps | 556544 | -| train/ | | -| approx_kl | 0.015605858 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.48 | -| explained_variance | -931 | -| learning_rate | 0.0003 | -| loss | -0.00519 | -| n_updates | 43470 | -| policy_gradient_loss | -0.00208 | -| std | 0.391 | -| value_loss | 4.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4349 | -| time_elapsed | 35916 | -| total_timesteps | 556672 | -| train/ | | -| approx_kl | 0.045371424 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | -943 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 43480 | -| policy_gradient_loss | -0.0107 | -| std | 0.392 | -| value_loss | 5.48e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4350 | -| time_elapsed | 35920 | -| total_timesteps | 556800 | -| train/ | | -| approx_kl | 0.0153165 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | -43.6 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 43490 | -| policy_gradient_loss | -0.00811 | -| std | 0.392 | -| value_loss | 3.76e-10 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 15 | -| iterations | 4351 | -| time_elapsed | 35923 | -| total_timesteps | 556928 | -| train/ | | -| approx_kl | 0.0059311376 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.483 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 43500 | -| policy_gradient_loss | -0.00276 | -| std | 0.392 | -| value_loss | 1.81e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4352 | -| time_elapsed | 35926 | -| total_timesteps | 557056 | -| train/ | | -| approx_kl | 0.00019966299 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.483 | -| explained_variance | -0.878 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 43510 | -| policy_gradient_loss | 0.00115 | -| std | 0.392 | -| value_loss | 2.99e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4353 | -| time_elapsed | 35933 | -| total_timesteps | 557184 | -| train/ | | -| approx_kl | 0.019074226 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 43520 | -| policy_gradient_loss | -0.0127 | -| std | 0.392 | -| value_loss | 0.000531 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4354 | -| time_elapsed | 35937 | -| total_timesteps | 557312 | -| train/ | | -| approx_kl | 0.020653129 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -374 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 43530 | -| policy_gradient_loss | -0.00254 | -| std | 0.391 | -| value_loss | 2.84e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4355 | -| time_elapsed | 35941 | -| total_timesteps | 557440 | -| train/ | | -| approx_kl | 0.00032291026 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.48 | -| explained_variance | -612 | -| learning_rate | 0.0003 | -| loss | -0.00626 | -| n_updates | 43540 | -| policy_gradient_loss | 0.00446 | -| std | 0.391 | -| value_loss | 1.06e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4356 | -| time_elapsed | 35945 | -| total_timesteps | 557568 | -| train/ | | -| approx_kl | 0.031015657 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 43550 | -| policy_gradient_loss | -0.0157 | -| std | 0.392 | -| value_loss | 4.98e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4357 | -| time_elapsed | 35948 | -| total_timesteps | 557696 | -| train/ | | -| approx_kl | 0.00999385 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.0011 | -| n_updates | 43560 | -| policy_gradient_loss | -0.000134 | -| std | 0.392 | -| value_loss | 6.91e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4358 | -| time_elapsed | 35951 | -| total_timesteps | 557824 | -| train/ | | -| approx_kl | 0.023805933 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -0.00995 | -| learning_rate | 0.0003 | -| loss | -0.0298 | -| n_updates | 43570 | -| policy_gradient_loss | -0.0185 | -| std | 0.391 | -| value_loss | 9.04e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 15 | -| iterations | 4359 | -| time_elapsed | 35955 | -| total_timesteps | 557952 | -| train/ | | -| approx_kl | 0.02712446 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.48 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 43580 | -| policy_gradient_loss | -0.014 | -| std | 0.391 | -| value_loss | 6.02e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4360 | -| time_elapsed | 35959 | -| total_timesteps | 558080 | -| train/ | | -| approx_kl | 0.010540278 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.000195 | -| n_updates | 43590 | -| policy_gradient_loss | -0.000807 | -| std | 0.391 | -| value_loss | 5.94e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4361 | -| time_elapsed | 35965 | -| total_timesteps | 558208 | -| train/ | | -| approx_kl | 0.014975622 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 43600 | -| policy_gradient_loss | -0.00687 | -| std | 0.391 | -| value_loss | 0.00104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4362 | -| time_elapsed | 35968 | -| total_timesteps | 558336 | -| train/ | | -| approx_kl | 0.006054456 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.482 | -| explained_variance | -568 | -| learning_rate | 0.0003 | -| loss | 0.000337 | -| n_updates | 43610 | -| policy_gradient_loss | 0.000224 | -| std | 0.392 | -| value_loss | 1.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4363 | -| time_elapsed | 35971 | -| total_timesteps | 558464 | -| train/ | | -| approx_kl | 0.015300483 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.484 | -| explained_variance | -5.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 43620 | -| policy_gradient_loss | -0.00448 | -| std | 0.393 | -| value_loss | 4.61e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4364 | -| time_elapsed | 35975 | -| total_timesteps | 558592 | -| train/ | | -| approx_kl | 3.2604206e-05 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | -134 | -| learning_rate | 0.0003 | -| loss | 0.000888 | -| n_updates | 43630 | -| policy_gradient_loss | 0.00454 | -| std | 0.394 | -| value_loss | 5.14e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4365 | -| time_elapsed | 35978 | -| total_timesteps | 558720 | -| train/ | | -| approx_kl | 0.03924526 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.486 | -| explained_variance | -37.8 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 43640 | -| policy_gradient_loss | -0.00516 | -| std | 0.393 | -| value_loss | 2.07e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4366 | -| time_elapsed | 35982 | -| total_timesteps | 558848 | -| train/ | | -| approx_kl | 0.0011087712 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.484 | -| explained_variance | -1.53 | -| learning_rate | 0.0003 | -| loss | 6.91e-05 | -| n_updates | 43650 | -| policy_gradient_loss | 0.000165 | -| std | 0.392 | -| value_loss | 2.56e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4367 | -| time_elapsed | 35986 | -| total_timesteps | 558976 | -| train/ | | -| approx_kl | 0.008724745 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.481 | -| explained_variance | -0.492 | -| learning_rate | 0.0003 | -| loss | -0.000648 | -| n_updates | 43660 | -| policy_gradient_loss | -0.00082 | -| std | 0.391 | -| value_loss | 1.07e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4368 | -| time_elapsed | 35989 | -| total_timesteps | 559104 | -| train/ | | -| approx_kl | 0.014968174 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.48 | -| explained_variance | 0.00385 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 43670 | -| policy_gradient_loss | -0.0078 | -| std | 0.391 | -| value_loss | 1.04e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4369 | -| time_elapsed | 35998 | -| total_timesteps | 559232 | -| train/ | | -| approx_kl | 0.0061868075 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.477 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 43680 | -| policy_gradient_loss | -0.000885 | -| std | 0.389 | -| value_loss | 6.59e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4370 | -| time_elapsed | 36001 | -| total_timesteps | 559360 | -| train/ | | -| approx_kl | 0.029240306 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.473 | -| explained_variance | -294 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 43690 | -| policy_gradient_loss | -0.0104 | -| std | 0.388 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4371 | -| time_elapsed | 36005 | -| total_timesteps | 559488 | -| train/ | | -| approx_kl | 0.005077144 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.471 | -| explained_variance | -216 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 43700 | -| policy_gradient_loss | -0.00117 | -| std | 0.387 | -| value_loss | 3.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4372 | -| time_elapsed | 36007 | -| total_timesteps | 559616 | -| train/ | | -| approx_kl | 0.002235535 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.469 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.000508 | -| n_updates | 43710 | -| policy_gradient_loss | 0.000561 | -| std | 0.387 | -| value_loss | 1.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4373 | -| time_elapsed | 36011 | -| total_timesteps | 559744 | -| train/ | | -| approx_kl | 0.006621009 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.469 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 43720 | -| policy_gradient_loss | -0.00132 | -| std | 0.387 | -| value_loss | 1.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4374 | -| time_elapsed | 36013 | -| total_timesteps | 559872 | -| train/ | | -| approx_kl | 0.014385463 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.472 | -| explained_variance | 0.00136 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 43730 | -| policy_gradient_loss | -0.00243 | -| std | 0.388 | -| value_loss | 8.76e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4375 | -| time_elapsed | 36017 | -| total_timesteps | 560000 | -| train/ | | -| approx_kl | 0.012890024 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.473 | -| explained_variance | -0.00121 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 43740 | -| policy_gradient_loss | -0.00302 | -| std | 0.389 | -| value_loss | 1.22e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4376 | -| time_elapsed | 36021 | -| total_timesteps | 560128 | -| train/ | | -| approx_kl | 0.0035558 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.473 | -| explained_variance | 0.00128 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 43750 | -| policy_gradient_loss | -0.00049 | -| std | 0.388 | -| value_loss | 1.06e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4377 | -| time_elapsed | 36027 | -| total_timesteps | 560256 | -| train/ | | -| approx_kl | 0.025390178 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.469 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 43760 | -| policy_gradient_loss | -0.00411 | -| std | 0.386 | -| value_loss | 0.00068 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4378 | -| time_elapsed | 36031 | -| total_timesteps | 560384 | -| train/ | | -| approx_kl | 2.1344516e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.467 | -| explained_variance | -2.57e+03 | -| learning_rate | 0.0003 | -| loss | -0.000311 | -| n_updates | 43770 | -| policy_gradient_loss | 0.00158 | -| std | 0.386 | -| value_loss | 7.24e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4379 | -| time_elapsed | 36034 | -| total_timesteps | 560512 | -| train/ | | -| approx_kl | 0.0016858999 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -570 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 43780 | -| policy_gradient_loss | 6.04e-05 | -| std | 0.386 | -| value_loss | 2.36e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4380 | -| time_elapsed | 36036 | -| total_timesteps | 560640 | -| train/ | | -| approx_kl | 0.00072919484 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 43790 | -| policy_gradient_loss | 0.00119 | -| std | 0.386 | -| value_loss | 2.65e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4381 | -| time_elapsed | 36039 | -| total_timesteps | 560768 | -| train/ | | -| approx_kl | 0.0011294242 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 43800 | -| policy_gradient_loss | 0.000478 | -| std | 0.386 | -| value_loss | 1.12e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 15 | -| iterations | 4382 | -| time_elapsed | 36041 | -| total_timesteps | 560896 | -| train/ | | -| approx_kl | 0.0009597095 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 43810 | -| policy_gradient_loss | 0.000327 | -| std | 0.386 | -| value_loss | 1.18e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4383 | -| time_elapsed | 36045 | -| total_timesteps | 561024 | -| train/ | | -| approx_kl | 0.022366486 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.467 | -| explained_variance | 0.00338 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 43820 | -| policy_gradient_loss | -0.00329 | -| std | 0.386 | -| value_loss | 7.64e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4384 | -| time_elapsed | 36054 | -| total_timesteps | 561152 | -| train/ | | -| approx_kl | 0.0114562195 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 43830 | -| policy_gradient_loss | -0.00541 | -| std | 0.385 | -| value_loss | 0.000214 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4385 | -| time_elapsed | 36058 | -| total_timesteps | 561280 | -| train/ | | -| approx_kl | 0.002210287 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.465 | -| explained_variance | -119 | -| learning_rate | 0.0003 | -| loss | -0.00748 | -| n_updates | 43840 | -| policy_gradient_loss | -0.000503 | -| std | 0.385 | -| value_loss | 5.78e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4386 | -| time_elapsed | 36061 | -| total_timesteps | 561408 | -| train/ | | -| approx_kl | 0.0011293578 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.464 | -| explained_variance | -265 | -| learning_rate | 0.0003 | -| loss | 0.00055 | -| n_updates | 43850 | -| policy_gradient_loss | 0.000589 | -| std | 0.385 | -| value_loss | 2.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4387 | -| time_elapsed | 36065 | -| total_timesteps | 561536 | -| train/ | | -| approx_kl | 0.008967986 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.463 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 43860 | -| policy_gradient_loss | -0.00599 | -| std | 0.384 | -| value_loss | 7.47e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4388 | -| time_elapsed | 36068 | -| total_timesteps | 561664 | -| train/ | | -| approx_kl | 0.019228877 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | -0.464 | -| explained_variance | -15.1 | -| learning_rate | 0.0003 | -| loss | -0.000432 | -| n_updates | 43870 | -| policy_gradient_loss | -0.000991 | -| std | 0.385 | -| value_loss | 1.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4389 | -| time_elapsed | 36073 | -| total_timesteps | 561792 | -| train/ | | -| approx_kl | 0.009185291 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 43880 | -| policy_gradient_loss | -0.00134 | -| std | 0.387 | -| value_loss | 1.22e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4390 | -| time_elapsed | 36075 | -| total_timesteps | 561920 | -| train/ | | -| approx_kl | 0.012299059 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.47 | -| explained_variance | -0.409 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 43890 | -| policy_gradient_loss | -0.000558 | -| std | 0.387 | -| value_loss | 7.65e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4391 | -| time_elapsed | 36079 | -| total_timesteps | 562048 | -| train/ | | -| approx_kl | 0.0129829645 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.471 | -| explained_variance | -0.00795 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 43900 | -| policy_gradient_loss | -0.00863 | -| std | 0.387 | -| value_loss | 5.34e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4392 | -| time_elapsed | 36086 | -| total_timesteps | 562176 | -| train/ | | -| approx_kl | 0.031169027 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | -0.47 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 43910 | -| policy_gradient_loss | -0.00242 | -| std | 0.387 | -| value_loss | 0.000932 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4393 | -| time_elapsed | 36089 | -| total_timesteps | 562304 | -| train/ | | -| approx_kl | 0.04012255 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.469 | -| explained_variance | -2.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.0078 | -| n_updates | 43920 | -| policy_gradient_loss | -0.00492 | -| std | 0.387 | -| value_loss | 8.66e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4394 | -| time_elapsed | 36092 | -| total_timesteps | 562432 | -| train/ | | -| approx_kl | 0.020416422 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | -0.468 | -| explained_variance | -14 | -| learning_rate | 0.0003 | -| loss | -0.00867 | -| n_updates | 43930 | -| policy_gradient_loss | -0.00843 | -| std | 0.386 | -| value_loss | 0.000411 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4395 | -| time_elapsed | 36096 | -| total_timesteps | 562560 | -| train/ | | -| approx_kl | 0.019486252 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.468 | -| explained_variance | -36.3 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 43940 | -| policy_gradient_loss | -0.0125 | -| std | 0.386 | -| value_loss | 0.000224 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4396 | -| time_elapsed | 36101 | -| total_timesteps | 562688 | -| train/ | | -| approx_kl | 0.028713334 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | -0.468 | -| explained_variance | -0.467 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 43950 | -| policy_gradient_loss | -0.0141 | -| std | 0.387 | -| value_loss | 0.00093 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4397 | -| time_elapsed | 36104 | -| total_timesteps | 562816 | -| train/ | | -| approx_kl | 0.016045166 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.469 | -| explained_variance | -0.000519 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 43960 | -| policy_gradient_loss | -0.00303 | -| std | 0.387 | -| value_loss | 0.000203 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 15 | -| iterations | 4398 | -| time_elapsed | 36107 | -| total_timesteps | 562944 | -| train/ | | -| approx_kl | 0.012646597 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.468 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.000148 | -| n_updates | 43970 | -| policy_gradient_loss | -0.00202 | -| std | 0.386 | -| value_loss | 2.2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4399 | -| time_elapsed | 36109 | -| total_timesteps | 563072 | -| train/ | | -| approx_kl | 0.011140272 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.468 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 43980 | -| policy_gradient_loss | -0.00519 | -| std | 0.386 | -| value_loss | 1.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4400 | -| time_elapsed | 36115 | -| total_timesteps | 563200 | -| train/ | | -| approx_kl | 0.006922179 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.468 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -5.88e-05 | -| n_updates | 43990 | -| policy_gradient_loss | -0.000145 | -| std | 0.386 | -| value_loss | 0.000139 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4401 | -| time_elapsed | 36119 | -| total_timesteps | 563328 | -| train/ | | -| approx_kl | 0.00879029 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -3.35 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 44000 | -| policy_gradient_loss | -0.00444 | -| std | 0.386 | -| value_loss | 2.06e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4402 | -| time_elapsed | 36121 | -| total_timesteps | 563456 | -| train/ | | -| approx_kl | 0.044972073 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | -0.466 | -| explained_variance | -3.73 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 44010 | -| policy_gradient_loss | -0.00821 | -| std | 0.386 | -| value_loss | 8.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4403 | -| time_elapsed | 36123 | -| total_timesteps | 563584 | -| train/ | | -| approx_kl | 0.0040628053 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.465 | -| explained_variance | -0.0743 | -| learning_rate | 0.0003 | -| loss | -0.000689 | -| n_updates | 44020 | -| policy_gradient_loss | -0.000376 | -| std | 0.385 | -| value_loss | 8.39e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4404 | -| time_elapsed | 36127 | -| total_timesteps | 563712 | -| train/ | | -| approx_kl | 0.013197657 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.464 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.000224 | -| n_updates | 44030 | -| policy_gradient_loss | -0.00139 | -| std | 0.384 | -| value_loss | 6.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4405 | -| time_elapsed | 36129 | -| total_timesteps | 563840 | -| train/ | | -| approx_kl | 0.017550219 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -0.461 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 44040 | -| policy_gradient_loss | -0.00492 | -| std | 0.384 | -| value_loss | 1.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4406 | -| time_elapsed | 36133 | -| total_timesteps | 563968 | -| train/ | | -| approx_kl | 0.012116399 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.46 | -| explained_variance | -0.000933 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 44050 | -| policy_gradient_loss | -0.00434 | -| std | 0.383 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4407 | -| time_elapsed | 36135 | -| total_timesteps | 564096 | -| train/ | | -| approx_kl | 0.015548993 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.46 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 44060 | -| policy_gradient_loss | -0.00655 | -| std | 0.383 | -| value_loss | 1.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4408 | -| time_elapsed | 36143 | -| total_timesteps | 564224 | -| train/ | | -| approx_kl | 0.01440334 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.459 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.00699 | -| n_updates | 44070 | -| policy_gradient_loss | -0.00282 | -| std | 0.383 | -| value_loss | 0.000487 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4409 | -| time_elapsed | 36147 | -| total_timesteps | 564352 | -| train/ | | -| approx_kl | 0.024572536 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.459 | -| explained_variance | -308 | -| learning_rate | 0.0003 | -| loss | -0.000313 | -| n_updates | 44080 | -| policy_gradient_loss | -0.000819 | -| std | 0.383 | -| value_loss | 2.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4410 | -| time_elapsed | 36150 | -| total_timesteps | 564480 | -| train/ | | -| approx_kl | 0.002437781 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.458 | -| explained_variance | -162 | -| learning_rate | 0.0003 | -| loss | -0.000661 | -| n_updates | 44090 | -| policy_gradient_loss | -0.000323 | -| std | 0.382 | -| value_loss | 5.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4411 | -| time_elapsed | 36154 | -| total_timesteps | 564608 | -| train/ | | -| approx_kl | 0.011331243 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.455 | -| explained_variance | -5.51 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 44100 | -| policy_gradient_loss | -0.00636 | -| std | 0.381 | -| value_loss | 1.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4412 | -| time_elapsed | 36157 | -| total_timesteps | 564736 | -| train/ | | -| approx_kl | 0.0016192778 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.451 | -| explained_variance | -2.75 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 44110 | -| policy_gradient_loss | -0.000335 | -| std | 0.379 | -| value_loss | 5.34e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4413 | -| time_elapsed | 36159 | -| total_timesteps | 564864 | -| train/ | | -| approx_kl | 0.0015086152 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.446 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 44120 | -| policy_gradient_loss | -0.000124 | -| std | 0.377 | -| value_loss | 1.88e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 15 | -| iterations | 4414 | -| time_elapsed | 36163 | -| total_timesteps | 564992 | -| train/ | | -| approx_kl | 0.00090142246 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | 0.000913 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 44130 | -| policy_gradient_loss | 0.000339 | -| std | 0.376 | -| value_loss | 1.59e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4415 | -| time_elapsed | 36166 | -| total_timesteps | 565120 | -| train/ | | -| approx_kl | 0.0047034402 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.441 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.000154 | -| n_updates | 44140 | -| policy_gradient_loss | 0.000426 | -| std | 0.376 | -| value_loss | 6.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4416 | -| time_elapsed | 36176 | -| total_timesteps | 565248 | -| train/ | | -| approx_kl | 0.024019945 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -8.01 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 44150 | -| policy_gradient_loss | -0.00208 | -| std | 0.377 | -| value_loss | 0.00572 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4417 | -| time_elapsed | 36179 | -| total_timesteps | 565376 | -| train/ | | -| approx_kl | 0.02527624 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.443 | -| explained_variance | -4.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.000578 | -| n_updates | 44160 | -| policy_gradient_loss | -0.00142 | -| std | 0.377 | -| value_loss | 3.87e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4418 | -| time_elapsed | 36183 | -| total_timesteps | 565504 | -| train/ | | -| approx_kl | 0.023048757 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -4.87e+03 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 44170 | -| policy_gradient_loss | -0.00524 | -| std | 0.376 | -| value_loss | 6.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4419 | -| time_elapsed | 36186 | -| total_timesteps | 565632 | -| train/ | | -| approx_kl | 0.017516911 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.441 | -| explained_variance | -456 | -| learning_rate | 0.0003 | -| loss | 0.000311 | -| n_updates | 44180 | -| policy_gradient_loss | -0.000113 | -| std | 0.376 | -| value_loss | 9.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4420 | -| time_elapsed | 36189 | -| total_timesteps | 565760 | -| train/ | | -| approx_kl | 0.019101407 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.439 | -| explained_variance | -13.2 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 44190 | -| policy_gradient_loss | -0.00366 | -| std | 0.375 | -| value_loss | 1.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 15 | -| iterations | 4421 | -| time_elapsed | 36193 | -| total_timesteps | 565888 | -| train/ | | -| approx_kl | 0.019321056 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.44 | -| explained_variance | -3.33 | -| learning_rate | 0.0003 | -| loss | 0.000622 | -| n_updates | 44200 | -| policy_gradient_loss | -0.00134 | -| std | 0.376 | -| value_loss | 7.36e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4422 | -| time_elapsed | 36195 | -| total_timesteps | 566016 | -| train/ | | -| approx_kl | 0.0053822664 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.44 | -| explained_variance | -0.0558 | -| learning_rate | 0.0003 | -| loss | -0.00065 | -| n_updates | 44210 | -| policy_gradient_loss | -0.00048 | -| std | 0.376 | -| value_loss | 2.86e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4423 | -| time_elapsed | 36203 | -| total_timesteps | 566144 | -| train/ | | -| approx_kl | 0.020036697 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.439 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 44220 | -| policy_gradient_loss | -0.00892 | -| std | 0.375 | -| value_loss | 0.00129 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4424 | -| time_elapsed | 36206 | -| total_timesteps | 566272 | -| train/ | | -| approx_kl | 0.0009993496 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.437 | -| explained_variance | -198 | -| learning_rate | 0.0003 | -| loss | 0.000351 | -| n_updates | 44230 | -| policy_gradient_loss | 0.000306 | -| std | 0.374 | -| value_loss | 5.6e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4425 | -| time_elapsed | 36209 | -| total_timesteps | 566400 | -| train/ | | -| approx_kl | 0.006527184 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.436 | -| explained_variance | -507 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 44240 | -| policy_gradient_loss | -0.000577 | -| std | 0.374 | -| value_loss | 2.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4426 | -| time_elapsed | 36211 | -| total_timesteps | 566528 | -| train/ | | -| approx_kl | 0.010215802 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | -11.6 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 44250 | -| policy_gradient_loss | -0.00274 | -| std | 0.373 | -| value_loss | 6.68e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4427 | -| time_elapsed | 36214 | -| total_timesteps | 566656 | -| train/ | | -| approx_kl | 0.020405818 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | -0.431 | -| explained_variance | -0.502 | -| learning_rate | 0.0003 | -| loss | 0.00588 | -| n_updates | 44260 | -| policy_gradient_loss | 0.00241 | -| std | 0.372 | -| value_loss | 6.27e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4428 | -| time_elapsed | 36217 | -| total_timesteps | 566784 | -| train/ | | -| approx_kl | 0.008080272 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.43 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 44270 | -| policy_gradient_loss | -0.000644 | -| std | 0.371 | -| value_loss | 3.55e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 15 | -| iterations | 4429 | -| time_elapsed | 36220 | -| total_timesteps | 566912 | -| train/ | | -| approx_kl | 0.012734508 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.428 | -| explained_variance | 0.00711 | -| learning_rate | 0.0003 | -| loss | -0.00977 | -| n_updates | 44280 | -| policy_gradient_loss | -0.00436 | -| std | 0.371 | -| value_loss | 1.55e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4430 | -| time_elapsed | 36223 | -| total_timesteps | 567040 | -| train/ | | -| approx_kl | 0.0024924441 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 44290 | -| policy_gradient_loss | -0.00107 | -| std | 0.37 | -| value_loss | 2.06e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4431 | -| time_elapsed | 36228 | -| total_timesteps | 567168 | -| train/ | | -| approx_kl | 0.039963126 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | -0.424 | -| explained_variance | 0.685 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 44300 | -| policy_gradient_loss | -0.00971 | -| std | 0.37 | -| value_loss | 0.000579 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4432 | -| time_elapsed | 36230 | -| total_timesteps | 567296 | -| train/ | | -| approx_kl | 0.01741328 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.423 | -| explained_variance | -139 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 44310 | -| policy_gradient_loss | -0.00132 | -| std | 0.369 | -| value_loss | 2.86e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4433 | -| time_elapsed | 36232 | -| total_timesteps | 567424 | -| train/ | | -| approx_kl | 0.010756434 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.42 | -| explained_variance | -234 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 44320 | -| policy_gradient_loss | -0.00376 | -| std | 0.368 | -| value_loss | 1.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4434 | -| time_elapsed | 36236 | -| total_timesteps | 567552 | -| train/ | | -| approx_kl | 0.038386334 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | -0.419 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 44330 | -| policy_gradient_loss | -0.014 | -| std | 0.368 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4435 | -| time_elapsed | 36239 | -| total_timesteps | 567680 | -| train/ | | -| approx_kl | 0.009059491 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.419 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.00945 | -| n_updates | 44340 | -| policy_gradient_loss | -0.00349 | -| std | 0.368 | -| value_loss | 3.33e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4436 | -| time_elapsed | 36243 | -| total_timesteps | 567808 | -| train/ | | -| approx_kl | 0.0005711098 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.42 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | -0.000967 | -| n_updates | 44350 | -| policy_gradient_loss | 0.000519 | -| std | 0.368 | -| value_loss | 2.71e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4437 | -| time_elapsed | 36246 | -| total_timesteps | 567936 | -| train/ | | -| approx_kl | 0.0217005 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.42 | -| explained_variance | 0.00696 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 44360 | -| policy_gradient_loss | -0.00625 | -| std | 0.368 | -| value_loss | 5.11e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4438 | -| time_elapsed | 36248 | -| total_timesteps | 568064 | -| train/ | | -| approx_kl | 0.012066926 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.42 | -| explained_variance | -0.0689 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 44370 | -| policy_gradient_loss | -0.0021 | -| std | 0.369 | -| value_loss | 4.9e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4439 | -| time_elapsed | 36253 | -| total_timesteps | 568192 | -| train/ | | -| approx_kl | 0.0009585568 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.422 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 44380 | -| policy_gradient_loss | 0.000408 | -| std | 0.369 | -| value_loss | 0.00141 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4440 | -| time_elapsed | 36257 | -| total_timesteps | 568320 | -| train/ | | -| approx_kl | 0.033802766 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.422 | -| explained_variance | -2.66e+03 | -| learning_rate | 0.0003 | -| loss | -0.00901 | -| n_updates | 44390 | -| policy_gradient_loss | -0.00506 | -| std | 0.369 | -| value_loss | 8.07e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4441 | -| time_elapsed | 36261 | -| total_timesteps | 568448 | -| train/ | | -| approx_kl | 0.0009865924 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.422 | -| explained_variance | -1.78e+03 | -| learning_rate | 0.0003 | -| loss | 0.000442 | -| n_updates | 44400 | -| policy_gradient_loss | 0.000582 | -| std | 0.369 | -| value_loss | 2.57e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4442 | -| time_elapsed | 36264 | -| total_timesteps | 568576 | -| train/ | | -| approx_kl | 0.0046873656 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.424 | -| explained_variance | -22.9 | -| learning_rate | 0.0003 | -| loss | -0.000143 | -| n_updates | 44410 | -| policy_gradient_loss | -0.000144 | -| std | 0.37 | -| value_loss | 4.29e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4443 | -| time_elapsed | 36268 | -| total_timesteps | 568704 | -| train/ | | -| approx_kl | 0.021898957 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | -3.8 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 44420 | -| policy_gradient_loss | -0.01 | -| std | 0.371 | -| value_loss | 1.88e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4444 | -| time_elapsed | 36271 | -| total_timesteps | 568832 | -| train/ | | -| approx_kl | 0.03724169 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | -0.427 | -| explained_variance | -0.804 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 44430 | -| policy_gradient_loss | -0.00632 | -| std | 0.371 | -| value_loss | 1.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 15 | -| iterations | 4445 | -| time_elapsed | 36273 | -| total_timesteps | 568960 | -| train/ | | -| approx_kl | 0.01229758 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.427 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 44440 | -| policy_gradient_loss | -0.00735 | -| std | 0.371 | -| value_loss | 6.91e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4446 | -| time_elapsed | 36276 | -| total_timesteps | 569088 | -| train/ | | -| approx_kl | 0.013565984 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | -0.427 | -| explained_variance | -0.00763 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 44450 | -| policy_gradient_loss | -0.000105 | -| std | 0.37 | -| value_loss | 1.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4447 | -| time_elapsed | 36282 | -| total_timesteps | 569216 | -| train/ | | -| approx_kl | 0.038310338 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | 0.706 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 44460 | -| policy_gradient_loss | -0.00438 | -| std | 0.37 | -| value_loss | 0.000687 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4448 | -| time_elapsed | 36284 | -| total_timesteps | 569344 | -| train/ | | -| approx_kl | 0.029500991 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.425 | -| explained_variance | -910 | -| learning_rate | 0.0003 | -| loss | -0.000362 | -| n_updates | 44470 | -| policy_gradient_loss | -0.00108 | -| std | 0.37 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4449 | -| time_elapsed | 36286 | -| total_timesteps | 569472 | -| train/ | | -| approx_kl | 0.011037024 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.423 | -| explained_variance | -6.16e+03 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 44480 | -| policy_gradient_loss | -0.00112 | -| std | 0.369 | -| value_loss | 5.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4450 | -| time_elapsed | 36289 | -| total_timesteps | 569600 | -| train/ | | -| approx_kl | 0.0034657032 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.419 | -| explained_variance | -41.7 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 44490 | -| policy_gradient_loss | -0.000458 | -| std | 0.367 | -| value_loss | 3.13e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4451 | -| time_elapsed | 36292 | -| total_timesteps | 569728 | -| train/ | | -| approx_kl | 0.0018636626 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -3.51 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 44500 | -| policy_gradient_loss | 0.000151 | -| std | 0.367 | -| value_loss | 1.61e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4452 | -| time_elapsed | 36295 | -| total_timesteps | 569856 | -| train/ | | -| approx_kl | 0.00092068687 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 44510 | -| policy_gradient_loss | 0.000432 | -| std | 0.367 | -| value_loss | 6.37e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 15 | -| iterations | 4453 | -| time_elapsed | 36299 | -| total_timesteps | 569984 | -| train/ | | -| approx_kl | 0.021130703 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | -1.86e-05 | -| n_updates | 44520 | -| policy_gradient_loss | -0.00304 | -| std | 0.367 | -| value_loss | 7.83e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4454 | -| time_elapsed | 36303 | -| total_timesteps | 570112 | -| train/ | | -| approx_kl | 0.009891322 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -0.00583 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 44530 | -| policy_gradient_loss | -0.00219 | -| std | 0.367 | -| value_loss | 1.93e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4455 | -| time_elapsed | 36310 | -| total_timesteps | 570240 | -| train/ | | -| approx_kl | 0.014617331 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.417 | -| explained_variance | 0.94 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 44540 | -| policy_gradient_loss | -0.0107 | -| std | 0.368 | -| value_loss | 0.000516 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4456 | -| time_elapsed | 36314 | -| total_timesteps | 570368 | -| train/ | | -| approx_kl | 0.0066199577 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.419 | -| explained_variance | -36.4 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 44550 | -| policy_gradient_loss | -0.000887 | -| std | 0.368 | -| value_loss | 6.49e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4457 | -| time_elapsed | 36318 | -| total_timesteps | 570496 | -| train/ | | -| approx_kl | 0.0072447076 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.422 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | 4.96e-05 | -| n_updates | 44560 | -| policy_gradient_loss | 0.000103 | -| std | 0.37 | -| value_loss | 3.76e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4458 | -| time_elapsed | 36321 | -| total_timesteps | 570624 | -| train/ | | -| approx_kl | 0.007828755 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.425 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 44570 | -| policy_gradient_loss | -0.000821 | -| std | 0.37 | -| value_loss | 6.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4459 | -| time_elapsed | 36324 | -| total_timesteps | 570752 | -| train/ | | -| approx_kl | 0.019860364 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | -0.345 | -| learning_rate | 0.0003 | -| loss | -0.00797 | -| n_updates | 44580 | -| policy_gradient_loss | -0.0072 | -| std | 0.37 | -| value_loss | 2.81e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 15 | -| iterations | 4460 | -| time_elapsed | 36327 | -| total_timesteps | 570880 | -| train/ | | -| approx_kl | 0.0017065597 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | -0.00642 | -| learning_rate | 0.0003 | -| loss | -0.000671 | -| n_updates | 44590 | -| policy_gradient_loss | -0.000212 | -| std | 0.371 | -| value_loss | 1.68e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4461 | -| time_elapsed | 36331 | -| total_timesteps | 571008 | -| train/ | | -| approx_kl | 0.006010721 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.427 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 44600 | -| policy_gradient_loss | -0.001 | -| std | 0.371 | -| value_loss | 1.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4462 | -| time_elapsed | 36340 | -| total_timesteps | 571136 | -| train/ | | -| approx_kl | 0.003653714 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | 0.864 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 44610 | -| policy_gradient_loss | -0.000439 | -| std | 0.371 | -| value_loss | 0.000387 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4463 | -| time_elapsed | 36345 | -| total_timesteps | 571264 | -| train/ | | -| approx_kl | 0.015812991 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | -3.44e+03 | -| learning_rate | 0.0003 | -| loss | -0.00483 | -| n_updates | 44620 | -| policy_gradient_loss | -0.00442 | -| std | 0.37 | -| value_loss | 7.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4464 | -| time_elapsed | 36348 | -| total_timesteps | 571392 | -| train/ | | -| approx_kl | 0.023159586 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | -0.425 | -| explained_variance | -355 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 44630 | -| policy_gradient_loss | -0.0127 | -| std | 0.37 | -| value_loss | 6.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4465 | -| time_elapsed | 36352 | -| total_timesteps | 571520 | -| train/ | | -| approx_kl | 0.005769573 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | -3.09 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 44640 | -| policy_gradient_loss | -0.00061 | -| std | 0.371 | -| value_loss | 1.99e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4466 | -| time_elapsed | 36355 | -| total_timesteps | 571648 | -| train/ | | -| approx_kl | 0.029272806 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | -0.427 | -| explained_variance | -0.775 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 44650 | -| policy_gradient_loss | -0.00585 | -| std | 0.371 | -| value_loss | 2.79e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4467 | -| time_elapsed | 36358 | -| total_timesteps | 571776 | -| train/ | | -| approx_kl | 0.010639774 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.429 | -| explained_variance | -0.493 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 44660 | -| policy_gradient_loss | -0.00288 | -| std | 0.372 | -| value_loss | 3.91e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 15 | -| iterations | 4468 | -| time_elapsed | 36361 | -| total_timesteps | 571904 | -| train/ | | -| approx_kl | 0.014119639 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.431 | -| explained_variance | -0.0846 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 44670 | -| policy_gradient_loss | -0.00594 | -| std | 0.373 | -| value_loss | 2.64e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4469 | -| time_elapsed | 36365 | -| total_timesteps | 572032 | -| train/ | | -| approx_kl | 0.029774252 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -0.00244 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 44680 | -| policy_gradient_loss | -0.00913 | -| std | 0.373 | -| value_loss | 3.07e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4470 | -| time_elapsed | 36373 | -| total_timesteps | 572160 | -| train/ | | -| approx_kl | 0.0228879 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.431 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | -0.00637 | -| n_updates | 44690 | -| policy_gradient_loss | -0.00315 | -| std | 0.372 | -| value_loss | 0.000755 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4471 | -| time_elapsed | 36376 | -| total_timesteps | 572288 | -| train/ | | -| approx_kl | 0.00011457456 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.43 | -| explained_variance | -3.03e+03 | -| learning_rate | 0.0003 | -| loss | -0.000624 | -| n_updates | 44700 | -| policy_gradient_loss | 0.000971 | -| std | 0.372 | -| value_loss | 2.35e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4472 | -| time_elapsed | 36379 | -| total_timesteps | 572416 | -| train/ | | -| approx_kl | 0.048918635 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -2.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 44710 | -| policy_gradient_loss | -0.00331 | -| std | 0.373 | -| value_loss | 7.92e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4473 | -| time_elapsed | 36382 | -| total_timesteps | 572544 | -| train/ | | -| approx_kl | 0.022308135 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.435 | -| explained_variance | -508 | -| learning_rate | 0.0003 | -| loss | -0.000943 | -| n_updates | 44720 | -| policy_gradient_loss | -0.00092 | -| std | 0.374 | -| value_loss | 1.26e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4474 | -| time_elapsed | 36385 | -| total_timesteps | 572672 | -| train/ | | -| approx_kl | 0.02563235 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.437 | -| explained_variance | -323 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 44730 | -| policy_gradient_loss | -0.00418 | -| std | 0.375 | -| value_loss | 3.11e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4475 | -| time_elapsed | 36387 | -| total_timesteps | 572800 | -| train/ | | -| approx_kl | 0.017171059 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -82.9 | -| learning_rate | 0.0003 | -| loss | 0.000882 | -| n_updates | 44740 | -| policy_gradient_loss | -0.000698 | -| std | 0.375 | -| value_loss | 2.86e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 15 | -| iterations | 4476 | -| time_elapsed | 36390 | -| total_timesteps | 572928 | -| train/ | | -| approx_kl | 0.006624133 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 44750 | -| policy_gradient_loss | -0.0027 | -| std | 0.375 | -| value_loss | 3.47e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4477 | -| time_elapsed | 36393 | -| total_timesteps | 573056 | -| train/ | | -| approx_kl | 0.015984945 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.437 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 44760 | -| policy_gradient_loss | -0.00383 | -| std | 0.375 | -| value_loss | 1.12e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4478 | -| time_elapsed | 36398 | -| total_timesteps | 573184 | -| train/ | | -| approx_kl | 0.0075754705 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.439 | -| explained_variance | 0.169 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 44770 | -| policy_gradient_loss | -0.000773 | -| std | 0.376 | -| value_loss | 0.00126 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4479 | -| time_elapsed | 36401 | -| total_timesteps | 573312 | -| train/ | | -| approx_kl | 0.0038076863 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -966 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 44780 | -| policy_gradient_loss | -0.00174 | -| std | 0.377 | -| value_loss | 7.63e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4480 | -| time_elapsed | 36404 | -| total_timesteps | 573440 | -| train/ | | -| approx_kl | 0.03403157 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | -1.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 44790 | -| policy_gradient_loss | -0.0137 | -| std | 0.377 | -| value_loss | 2.71e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4481 | -| time_elapsed | 36406 | -| total_timesteps | 573568 | -| train/ | | -| approx_kl | 0.0193857 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | -5.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 44800 | -| policy_gradient_loss | -0.00358 | -| std | 0.377 | -| value_loss | 1.57e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4482 | -| time_elapsed | 36409 | -| total_timesteps | 573696 | -| train/ | | -| approx_kl | 0.0059365397 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | -2.75 | -| learning_rate | 0.0003 | -| loss | -0.00374 | -| n_updates | 44810 | -| policy_gradient_loss | -0.00106 | -| std | 0.377 | -| value_loss | 6.43e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4483 | -| time_elapsed | 36412 | -| total_timesteps | 573824 | -| train/ | | -| approx_kl | 0.023094852 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | -4.48 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 44820 | -| policy_gradient_loss | -0.00436 | -| std | 0.377 | -| value_loss | 9.48e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 15 | -| iterations | 4484 | -| time_elapsed | 36414 | -| total_timesteps | 573952 | -| train/ | | -| approx_kl | 0.01437032 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 44830 | -| policy_gradient_loss | -0.00337 | -| std | 0.377 | -| value_loss | 4.95e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4485 | -| time_elapsed | 36418 | -| total_timesteps | 574080 | -| train/ | | -| approx_kl | 0.012904592 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.443 | -| explained_variance | 0.00185 | -| learning_rate | 0.0003 | -| loss | -0.000112 | -| n_updates | 44840 | -| policy_gradient_loss | -0.000854 | -| std | 0.377 | -| value_loss | 1.83e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4486 | -| time_elapsed | 36424 | -| total_timesteps | 574208 | -| train/ | | -| approx_kl | 0.013854014 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | 0.834 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 44850 | -| policy_gradient_loss | -0.00536 | -| std | 0.376 | -| value_loss | 0.000341 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4487 | -| time_elapsed | 36427 | -| total_timesteps | 574336 | -| train/ | | -| approx_kl | 0.021507649 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -180 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 44860 | -| policy_gradient_loss | -0.0135 | -| std | 0.377 | -| value_loss | 1.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4488 | -| time_elapsed | 36431 | -| total_timesteps | 574464 | -| train/ | | -| approx_kl | 0.03005929 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.443 | -| explained_variance | -175 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 44870 | -| policy_gradient_loss | -0.00723 | -| std | 0.377 | -| value_loss | 1.03e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4489 | -| time_elapsed | 36435 | -| total_timesteps | 574592 | -| train/ | | -| approx_kl | 0.00029796571 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -4.79 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 44880 | -| policy_gradient_loss | 0.00421 | -| std | 0.376 | -| value_loss | 1.43e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4490 | -| time_elapsed | 36438 | -| total_timesteps | 574720 | -| train/ | | -| approx_kl | 0.021707565 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -0.358 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 44890 | -| policy_gradient_loss | -0.00361 | -| std | 0.376 | -| value_loss | 1.15e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4491 | -| time_elapsed | 36442 | -| total_timesteps | 574848 | -| train/ | | -| approx_kl | 0.01159971 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.443 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 44900 | -| policy_gradient_loss | -0.00206 | -| std | 0.377 | -| value_loss | 3.77e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 15 | -| iterations | 4492 | -| time_elapsed | 36445 | -| total_timesteps | 574976 | -| train/ | | -| approx_kl | 0.0045860223 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | 0.00128 | -| learning_rate | 0.0003 | -| loss | -0.00473 | -| n_updates | 44910 | -| policy_gradient_loss | -0.000851 | -| std | 0.377 | -| value_loss | 1.06e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4493 | -| time_elapsed | 36449 | -| total_timesteps | 575104 | -| train/ | | -| approx_kl | 0.00060846144 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 44920 | -| policy_gradient_loss | 0.00166 | -| std | 0.377 | -| value_loss | 1.75e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4494 | -| time_elapsed | 36456 | -| total_timesteps | 575232 | -| train/ | | -| approx_kl | 0.04105644 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 44930 | -| policy_gradient_loss | -0.0133 | -| std | 0.377 | -| value_loss | 1.18e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4495 | -| time_elapsed | 36459 | -| total_timesteps | 575360 | -| train/ | | -| approx_kl | 0.008707538 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 44940 | -| policy_gradient_loss | -0.000358 | -| std | 0.378 | -| value_loss | 6.99e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4496 | -| time_elapsed | 36463 | -| total_timesteps | 575488 | -| train/ | | -| approx_kl | 0.02360752 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.446 | -| explained_variance | -324 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 44950 | -| policy_gradient_loss | -0.00719 | -| std | 0.378 | -| value_loss | 2.79e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4497 | -| time_elapsed | 36467 | -| total_timesteps | 575616 | -| train/ | | -| approx_kl | 0.0010645643 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.446 | -| explained_variance | -12.1 | -| learning_rate | 0.0003 | -| loss | -0.005 | -| n_updates | 44960 | -| policy_gradient_loss | 0.000933 | -| std | 0.378 | -| value_loss | 1.06e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4498 | -| time_elapsed | 36470 | -| total_timesteps | 575744 | -| train/ | | -| approx_kl | 0.018421791 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | -0.447 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.00215 | -| n_updates | 44970 | -| policy_gradient_loss | -0.000936 | -| std | 0.378 | -| value_loss | 4.65e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 15 | -| iterations | 4499 | -| time_elapsed | 36474 | -| total_timesteps | 575872 | -| train/ | | -| approx_kl | 0.017584022 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.447 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 44980 | -| policy_gradient_loss | -0.00561 | -| std | 0.379 | -| value_loss | 2.13e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4500 | -| time_elapsed | 36478 | -| total_timesteps | 576000 | -| train/ | | -| approx_kl | 0.006996535 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.448 | -| explained_variance | -0.00254 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 44990 | -| policy_gradient_loss | -0.00102 | -| std | 0.379 | -| value_loss | 2.67e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4501 | -| time_elapsed | 36481 | -| total_timesteps | 576128 | -| train/ | | -| approx_kl | 0.010615198 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | 0.00096 | -| learning_rate | 0.0003 | -| loss | -0.000236 | -| n_updates | 45000 | -| policy_gradient_loss | -0.001 | -| std | 0.379 | -| value_loss | 9.89e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4502 | -| time_elapsed | 36489 | -| total_timesteps | 576256 | -| train/ | | -| approx_kl | 0.012656939 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 45010 | -| policy_gradient_loss | -0.0108 | -| std | 0.379 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4503 | -| time_elapsed | 36494 | -| total_timesteps | 576384 | -| train/ | | -| approx_kl | 0.0077697663 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.45 | -| explained_variance | -45.9 | -| learning_rate | 0.0003 | -| loss | -0.000462 | -| n_updates | 45020 | -| policy_gradient_loss | -0.000525 | -| std | 0.38 | -| value_loss | 1.59e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4504 | -| time_elapsed | 36498 | -| total_timesteps | 576512 | -| train/ | | -| approx_kl | 0.015848212 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -0.452 | -| explained_variance | -193 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 45030 | -| policy_gradient_loss | -0.00134 | -| std | 0.381 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4505 | -| time_elapsed | 36501 | -| total_timesteps | 576640 | -| train/ | | -| approx_kl | 0.0045457357 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.455 | -| explained_variance | -6.83 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 45040 | -| policy_gradient_loss | -0.00128 | -| std | 0.381 | -| value_loss | 2.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4506 | -| time_elapsed | 36504 | -| total_timesteps | 576768 | -| train/ | | -| approx_kl | 0.023856102 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.455 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 45050 | -| policy_gradient_loss | -0.00839 | -| std | 0.381 | -| value_loss | 2.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4507 | -| time_elapsed | 36507 | -| total_timesteps | 576896 | -| train/ | | -| approx_kl | 0.013391651 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.455 | -| explained_variance | -0.0679 | -| learning_rate | 0.0003 | -| loss | -0.000187 | -| n_updates | 45060 | -| policy_gradient_loss | -0.00146 | -| std | 0.381 | -| value_loss | 5.18e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4508 | -| time_elapsed | 36511 | -| total_timesteps | 577024 | -| train/ | | -| approx_kl | 0.015126086 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | 0.00727 | -| learning_rate | 0.0003 | -| loss | -0.00736 | -| n_updates | 45070 | -| policy_gradient_loss | -0.00505 | -| std | 0.381 | -| value_loss | 4.66e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4509 | -| time_elapsed | 36519 | -| total_timesteps | 577152 | -| train/ | | -| approx_kl | 0.008147354 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.00779 | -| n_updates | 45080 | -| policy_gradient_loss | -0.00265 | -| std | 0.381 | -| value_loss | 8.49e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4510 | -| time_elapsed | 36523 | -| total_timesteps | 577280 | -| train/ | | -| approx_kl | 9.050639e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | -4.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 45090 | -| policy_gradient_loss | 0.00278 | -| std | 0.381 | -| value_loss | 9.93e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4511 | -| time_elapsed | 36527 | -| total_timesteps | 577408 | -| train/ | | -| approx_kl | 0.051037192 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | -2.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 45100 | -| policy_gradient_loss | -0.00632 | -| std | 0.381 | -| value_loss | 4.23e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4512 | -| time_elapsed | 36531 | -| total_timesteps | 577536 | -| train/ | | -| approx_kl | 0.0073676514 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | -305 | -| learning_rate | 0.0003 | -| loss | -0.00473 | -| n_updates | 45110 | -| policy_gradient_loss | -0.00132 | -| std | 0.381 | -| value_loss | 2.9e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4513 | -| time_elapsed | 36534 | -| total_timesteps | 577664 | -| train/ | | -| approx_kl | 0.03936582 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | -0.452 | -| explained_variance | -2.14 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 45120 | -| policy_gradient_loss | -0.00638 | -| std | 0.38 | -| value_loss | 3.41e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4514 | -| time_elapsed | 36537 | -| total_timesteps | 577792 | -| train/ | | -| approx_kl | 0.006037929 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.45 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 45130 | -| policy_gradient_loss | -0.000776 | -| std | 0.379 | -| value_loss | 1.01e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 15 | -| iterations | 4515 | -| time_elapsed | 36540 | -| total_timesteps | 577920 | -| train/ | | -| approx_kl | 0.011776347 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.448 | -| explained_variance | -0.069 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 45140 | -| policy_gradient_loss | -0.00782 | -| std | 0.378 | -| value_loss | 6.23e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4516 | -| time_elapsed | 36544 | -| total_timesteps | 578048 | -| train/ | | -| approx_kl | 0.017820098 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.447 | -| explained_variance | 0.00375 | -| learning_rate | 0.0003 | -| loss | -0.00878 | -| n_updates | 45150 | -| policy_gradient_loss | -0.00712 | -| std | 0.378 | -| value_loss | 4.03e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4517 | -| time_elapsed | 36549 | -| total_timesteps | 578176 | -| train/ | | -| approx_kl | 0.014288117 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.446 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 45160 | -| policy_gradient_loss | -0.00958 | -| std | 0.378 | -| value_loss | 5.72e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4518 | -| time_elapsed | 36551 | -| total_timesteps | 578304 | -| train/ | | -| approx_kl | 0.00065336353 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.447 | -| explained_variance | -32.4 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 45170 | -| policy_gradient_loss | 0.000662 | -| std | 0.379 | -| value_loss | 6.44e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4519 | -| time_elapsed | 36554 | -| total_timesteps | 578432 | -| train/ | | -| approx_kl | 0.0012053847 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | -237 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 45180 | -| policy_gradient_loss | 0.000322 | -| std | 0.379 | -| value_loss | 4.54e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4520 | -| time_elapsed | 36557 | -| total_timesteps | 578560 | -| train/ | | -| approx_kl | 0.053727698 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | -0.45 | -| explained_variance | -21.3 | -| learning_rate | 0.0003 | -| loss | -0.00796 | -| n_updates | 45190 | -| policy_gradient_loss | -0.00466 | -| std | 0.38 | -| value_loss | 2.71e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4521 | -| time_elapsed | 36559 | -| total_timesteps | 578688 | -| train/ | | -| approx_kl | 1.0299729e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.452 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.000202 | -| n_updates | 45200 | -| policy_gradient_loss | 0.00144 | -| std | 0.38 | -| value_loss | 9.54e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4522 | -| time_elapsed | 36563 | -| total_timesteps | 578816 | -| train/ | | -| approx_kl | 0.0018087788 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.451 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 45210 | -| policy_gradient_loss | -5.78e-05 | -| std | 0.379 | -| value_loss | 4.97e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 15 | -| iterations | 4523 | -| time_elapsed | 36567 | -| total_timesteps | 578944 | -| train/ | | -| approx_kl | 0.0014760529 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.448 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 45220 | -| policy_gradient_loss | 0.000174 | -| std | 0.378 | -| value_loss | 4.31e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4524 | -| time_elapsed | 36570 | -| total_timesteps | 579072 | -| train/ | | -| approx_kl | 0.0010320325 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.446 | -| explained_variance | 0.0104 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 45230 | -| policy_gradient_loss | 0.000638 | -| std | 0.378 | -| value_loss | 3.04e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4525 | -| time_elapsed | 36574 | -| total_timesteps | 579200 | -| train/ | | -| approx_kl | 0.048736982 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 45240 | -| policy_gradient_loss | -0.00387 | -| std | 0.377 | -| value_loss | 0.000759 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4526 | -| time_elapsed | 36576 | -| total_timesteps | 579328 | -| train/ | | -| approx_kl | 0.0015208111 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.444 | -| explained_variance | -729 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 45250 | -| policy_gradient_loss | -8.8e-05 | -| std | 0.377 | -| value_loss | 4.01e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4527 | -| time_elapsed | 36579 | -| total_timesteps | 579456 | -| train/ | | -| approx_kl | 0.0020383678 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | -2.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 45260 | -| policy_gradient_loss | 6.93e-06 | -| std | 0.378 | -| value_loss | 1.27e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4528 | -| time_elapsed | 36583 | -| total_timesteps | 579584 | -| train/ | | -| approx_kl | 0.00076452596 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.446 | -| explained_variance | -32.7 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 45270 | -| policy_gradient_loss | 0.000665 | -| std | 0.378 | -| value_loss | 2.48e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4529 | -| time_elapsed | 36587 | -| total_timesteps | 579712 | -| train/ | | -| approx_kl | 0.02502068 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.447 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 45280 | -| policy_gradient_loss | -0.0046 | -| std | 0.379 | -| value_loss | 4.62e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4530 | -| time_elapsed | 36590 | -| total_timesteps | 579840 | -| train/ | | -| approx_kl | 0.010185828 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.448 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.0013 | -| n_updates | 45290 | -| policy_gradient_loss | -0.000577 | -| std | 0.379 | -| value_loss | 2.91e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4531 | -| time_elapsed | 36594 | -| total_timesteps | 579968 | -| train/ | | -| approx_kl | 0.016067674 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.448 | -| explained_variance | 0.00802 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 45300 | -| policy_gradient_loss | -0.00816 | -| std | 0.379 | -| value_loss | 2.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4532 | -| time_elapsed | 36596 | -| total_timesteps | 580096 | -| train/ | | -| approx_kl | 0.009977455 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.448 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 45310 | -| policy_gradient_loss | -0.0014 | -| std | 0.379 | -| value_loss | 2.79e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4533 | -| time_elapsed | 36602 | -| total_timesteps | 580224 | -| train/ | | -| approx_kl | 0.013003653 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 45320 | -| policy_gradient_loss | -0.00723 | -| std | 0.379 | -| value_loss | 0.00147 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4534 | -| time_elapsed | 36605 | -| total_timesteps | 580352 | -| train/ | | -| approx_kl | 0.0011975779 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | -66.7 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 45330 | -| policy_gradient_loss | 0.000962 | -| std | 0.379 | -| value_loss | 2.26e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4535 | -| time_elapsed | 36608 | -| total_timesteps | 580480 | -| train/ | | -| approx_kl | 0.0011890689 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | -87 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 45340 | -| policy_gradient_loss | 0.000468 | -| std | 0.379 | -| value_loss | 8.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4536 | -| time_elapsed | 36612 | -| total_timesteps | 580608 | -| train/ | | -| approx_kl | 0.035215016 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.449 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 45350 | -| policy_gradient_loss | -0.00381 | -| std | 0.379 | -| value_loss | 6.08e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4537 | -| time_elapsed | 36615 | -| total_timesteps | 580736 | -| train/ | | -| approx_kl | 0.007849533 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.451 | -| explained_variance | -0.0031 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 45360 | -| policy_gradient_loss | -0.00208 | -| std | 0.38 | -| value_loss | 1.59e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4538 | -| time_elapsed | 36619 | -| total_timesteps | 580864 | -| train/ | | -| approx_kl | 0.0026843979 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | 0.00733 | -| learning_rate | 0.0003 | -| loss | -0.000509 | -| n_updates | 45370 | -| policy_gradient_loss | -0.000226 | -| std | 0.382 | -| value_loss | 2.48e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 15 | -| iterations | 4539 | -| time_elapsed | 36622 | -| total_timesteps | 580992 | -| train/ | | -| approx_kl | 0.016923942 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.457 | -| explained_variance | 0.00658 | -| learning_rate | 0.0003 | -| loss | -0.00738 | -| n_updates | 45380 | -| policy_gradient_loss | -0.00653 | -| std | 0.383 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4540 | -| time_elapsed | 36624 | -| total_timesteps | 581120 | -| train/ | | -| approx_kl | 0.013212789 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.458 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 45390 | -| policy_gradient_loss | -0.00181 | -| std | 0.382 | -| value_loss | 1.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4541 | -| time_elapsed | 36633 | -| total_timesteps | 581248 | -| train/ | | -| approx_kl | 0.008331487 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.455 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 45400 | -| policy_gradient_loss | -0.000791 | -| std | 0.381 | -| value_loss | 9.11e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4542 | -| time_elapsed | 36638 | -| total_timesteps | 581376 | -| train/ | | -| approx_kl | 0.0015925614 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.452 | -| explained_variance | -1.2e+03 | -| learning_rate | 0.0003 | -| loss | 0.000152 | -| n_updates | 45410 | -| policy_gradient_loss | 0.000126 | -| std | 0.38 | -| value_loss | 4.74e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4543 | -| time_elapsed | 36643 | -| total_timesteps | 581504 | -| train/ | | -| approx_kl | 0.018217199 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.453 | -| explained_variance | -545 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 45420 | -| policy_gradient_loss | -0.00486 | -| std | 0.381 | -| value_loss | 8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4544 | -| time_elapsed | 36646 | -| total_timesteps | 581632 | -| train/ | | -| approx_kl | 0.023918573 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.454 | -| explained_variance | -14.6 | -| learning_rate | 0.0003 | -| loss | 0.000101 | -| n_updates | 45430 | -| policy_gradient_loss | -0.00083 | -| std | 0.381 | -| value_loss | 2.6e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4545 | -| time_elapsed | 36649 | -| total_timesteps | 581760 | -| train/ | | -| approx_kl | 0.016274322 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.452 | -| explained_variance | -1.92 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 45440 | -| policy_gradient_loss | -0.0068 | -| std | 0.38 | -| value_loss | 9.12e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 15 | -| iterations | 4546 | -| time_elapsed | 36653 | -| total_timesteps | 581888 | -| train/ | | -| approx_kl | 0.007140637 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.45 | -| explained_variance | -0.00436 | -| learning_rate | 0.0003 | -| loss | -0.00387 | -| n_updates | 45450 | -| policy_gradient_loss | -0.0017 | -| std | 0.379 | -| value_loss | 4.07e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4547 | -| time_elapsed | 36656 | -| total_timesteps | 582016 | -| train/ | | -| approx_kl | 0.0024145704 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.000801 | -| n_updates | 45460 | -| policy_gradient_loss | -0.00038 | -| std | 0.376 | -| value_loss | 1.57e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4548 | -| time_elapsed | 36665 | -| total_timesteps | 582144 | -| train/ | | -| approx_kl | 0.011373986 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -0.439 | -| explained_variance | 0.0708 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 45470 | -| policy_gradient_loss | -0.00634 | -| std | 0.375 | -| value_loss | 0.00186 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4549 | -| time_elapsed | 36669 | -| total_timesteps | 582272 | -| train/ | | -| approx_kl | 0.0025604798 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.436 | -| explained_variance | -62.2 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 45480 | -| policy_gradient_loss | -0.000278 | -| std | 0.373 | -| value_loss | 2.01e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4550 | -| time_elapsed | 36673 | -| total_timesteps | 582400 | -| train/ | | -| approx_kl | 0.0008316906 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -281 | -| learning_rate | 0.0003 | -| loss | -0.0078 | -| n_updates | 45490 | -| policy_gradient_loss | 0.00195 | -| std | 0.373 | -| value_loss | 6.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4551 | -| time_elapsed | 36676 | -| total_timesteps | 582528 | -| train/ | | -| approx_kl | 0.001202351 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -1.8 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 45500 | -| policy_gradient_loss | 0.000721 | -| std | 0.373 | -| value_loss | 3.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4552 | -| time_elapsed | 36680 | -| total_timesteps | 582656 | -| train/ | | -| approx_kl | 0.018569564 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.00076 | -| n_updates | 45510 | -| policy_gradient_loss | -0.00302 | -| std | 0.372 | -| value_loss | 9.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4553 | -| time_elapsed | 36682 | -| total_timesteps | 582784 | -| train/ | | -| approx_kl | 0.011777971 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.431 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 45520 | -| policy_gradient_loss | -0.00217 | -| std | 0.373 | -| value_loss | 5.37e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 15 | -| iterations | 4554 | -| time_elapsed | 36684 | -| total_timesteps | 582912 | -| train/ | | -| approx_kl | 0.008715461 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | 0.00555 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 45530 | -| policy_gradient_loss | -0.00307 | -| std | 0.374 | -| value_loss | 5.03e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4555 | -| time_elapsed | 36688 | -| total_timesteps | 583040 | -| train/ | | -| approx_kl | 0.004371162 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.435 | -| explained_variance | 0.00551 | -| learning_rate | 0.0003 | -| loss | 0.000182 | -| n_updates | 45540 | -| policy_gradient_loss | 0.000162 | -| std | 0.373 | -| value_loss | 3.1e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4556 | -| time_elapsed | 36696 | -| total_timesteps | 583168 | -| train/ | | -| approx_kl | 0.01143196 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 45550 | -| policy_gradient_loss | -0.0109 | -| std | 0.373 | -| value_loss | 0.000289 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4557 | -| time_elapsed | 36700 | -| total_timesteps | 583296 | -| train/ | | -| approx_kl | 0.019267099 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | -1.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.00454 | -| n_updates | 45560 | -| policy_gradient_loss | -0.00223 | -| std | 0.374 | -| value_loss | 8.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4558 | -| time_elapsed | 36703 | -| total_timesteps | 583424 | -| train/ | | -| approx_kl | 0.030968994 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.435 | -| explained_variance | -1.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 45570 | -| policy_gradient_loss | -0.012 | -| std | 0.374 | -| value_loss | 3.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4559 | -| time_elapsed | 36706 | -| total_timesteps | 583552 | -| train/ | | -| approx_kl | 0.02259422 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -0.435 | -| explained_variance | -6.19 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 45580 | -| policy_gradient_loss | -0.00658 | -| std | 0.374 | -| value_loss | 3.13e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4560 | -| time_elapsed | 36708 | -| total_timesteps | 583680 | -| train/ | | -| approx_kl | 0.025327073 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.435 | -| explained_variance | -6.3 | -| learning_rate | 0.0003 | -| loss | 0.000456 | -| n_updates | 45590 | -| policy_gradient_loss | -0.00231 | -| std | 0.374 | -| value_loss | 3.43e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4561 | -| time_elapsed | 36713 | -| total_timesteps | 583808 | -| train/ | | -| approx_kl | 0.019429645 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.434 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 45600 | -| policy_gradient_loss | -0.00304 | -| std | 0.373 | -| value_loss | 1.12e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 15 | -| iterations | 4562 | -| time_elapsed | 36716 | -| total_timesteps | 583936 | -| train/ | | -| approx_kl | 0.01698404 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | -0.00103 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 45610 | -| policy_gradient_loss | -0.00778 | -| std | 0.373 | -| value_loss | 1.49e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4563 | -| time_elapsed | 36720 | -| total_timesteps | 584064 | -| train/ | | -| approx_kl | 0.013091499 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 45620 | -| policy_gradient_loss | -0.00287 | -| std | 0.373 | -| value_loss | 2.66e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4564 | -| time_elapsed | 36725 | -| total_timesteps | 584192 | -| train/ | | -| approx_kl | 0.0014854283 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.433 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | 1.33e-05 | -| n_updates | 45630 | -| policy_gradient_loss | -2.74e-05 | -| std | 0.373 | -| value_loss | 0.000196 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4565 | -| time_elapsed | 36728 | -| total_timesteps | 584320 | -| train/ | | -| approx_kl | 0.0043255966 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -1.17e+04 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 45640 | -| policy_gradient_loss | -0.00036 | -| std | 0.373 | -| value_loss | 2.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4566 | -| time_elapsed | 36731 | -| total_timesteps | 584448 | -| train/ | | -| approx_kl | 0.0053448556 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.434 | -| explained_variance | -2.91e+04 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 45650 | -| policy_gradient_loss | -0.000732 | -| std | 0.374 | -| value_loss | 2.29e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4567 | -| time_elapsed | 36734 | -| total_timesteps | 584576 | -| train/ | | -| approx_kl | 0.00691948 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.436 | -| explained_variance | -711 | -| learning_rate | 0.0003 | -| loss | 0.000671 | -| n_updates | 45660 | -| policy_gradient_loss | 0.000442 | -| std | 0.375 | -| value_loss | 5.35e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4568 | -| time_elapsed | 36737 | -| total_timesteps | 584704 | -| train/ | | -| approx_kl | 0.01993623 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -574 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 45670 | -| policy_gradient_loss | -0.00482 | -| std | 0.375 | -| value_loss | 2.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4569 | -| time_elapsed | 36740 | -| total_timesteps | 584832 | -| train/ | | -| approx_kl | 0.05220719 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -97.7 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 45680 | -| policy_gradient_loss | -0.0111 | -| std | 0.375 | -| value_loss | 8.44e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 15 | -| iterations | 4570 | -| time_elapsed | 36743 | -| total_timesteps | 584960 | -| train/ | | -| approx_kl | 0.01170869 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | -0.000597 | -| n_updates | 45690 | -| policy_gradient_loss | -0.000733 | -| std | 0.375 | -| value_loss | 4.85e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4571 | -| time_elapsed | 36746 | -| total_timesteps | 585088 | -| train/ | | -| approx_kl | 0.008784577 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.439 | -| explained_variance | -1.21 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 45700 | -| policy_gradient_loss | -0.000986 | -| std | 0.375 | -| value_loss | 2.24e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4572 | -| time_elapsed | 36753 | -| total_timesteps | 585216 | -| train/ | | -| approx_kl | 0.01152897 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.44 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 45710 | -| policy_gradient_loss | -0.00414 | -| std | 0.376 | -| value_loss | 9.95e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4573 | -| time_elapsed | 36757 | -| total_timesteps | 585344 | -| train/ | | -| approx_kl | 0.086615846 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | -0.44 | -| explained_variance | -8.82e+04 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 45720 | -| policy_gradient_loss | -0.00603 | -| std | 0.376 | -| value_loss | 7.97e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4574 | -| time_elapsed | 36761 | -| total_timesteps | 585472 | -| train/ | | -| approx_kl | 0.00010162918 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.442 | -| explained_variance | -9.28e+03 | -| learning_rate | 0.0003 | -| loss | 0.000106 | -| n_updates | 45730 | -| policy_gradient_loss | 0.00082 | -| std | 0.377 | -| value_loss | 1.36e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4575 | -| time_elapsed | 36765 | -| total_timesteps | 585600 | -| train/ | | -| approx_kl | 0.0025209968 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | -645 | -| learning_rate | 0.0003 | -| loss | -0.00343 | -| n_updates | 45740 | -| policy_gradient_loss | -0.000402 | -| std | 0.378 | -| value_loss | 1.41e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4576 | -| time_elapsed | 36769 | -| total_timesteps | 585728 | -| train/ | | -| approx_kl | 9.2678005e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.445 | -| explained_variance | -1.66e+03 | -| learning_rate | 0.0003 | -| loss | 0.000104 | -| n_updates | 45750 | -| policy_gradient_loss | 0.000567 | -| std | 0.377 | -| value_loss | 1.84e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4577 | -| time_elapsed | 36772 | -| total_timesteps | 585856 | -| train/ | | -| approx_kl | 0.0060173105 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.443 | -| explained_variance | -194 | -| learning_rate | 0.0003 | -| loss | -0.005 | -| n_updates | 45760 | -| policy_gradient_loss | -0.00148 | -| std | 0.376 | -| value_loss | 2.5e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4578 | -| time_elapsed | 36776 | -| total_timesteps | 585984 | -| train/ | | -| approx_kl | 0.0042414796 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.44 | -| explained_variance | -92.4 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 45770 | -| policy_gradient_loss | -0.00163 | -| std | 0.375 | -| value_loss | 5.54e-12 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4579 | -| time_elapsed | 36779 | -| total_timesteps | 586112 | -| train/ | | -| approx_kl | 0.0005220878 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -5.8 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 45780 | -| policy_gradient_loss | 0.00108 | -| std | 0.375 | -| value_loss | 5.03e-13 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4580 | -| time_elapsed | 36789 | -| total_timesteps | 586240 | -| train/ | | -| approx_kl | 0.045186903 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.438 | -| explained_variance | -4 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 45790 | -| policy_gradient_loss | -0.00897 | -| std | 0.375 | -| value_loss | 0.00432 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4581 | -| time_elapsed | 36792 | -| total_timesteps | 586368 | -| train/ | | -| approx_kl | 0.005943993 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.437 | -| explained_variance | -1.53e+03 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 45800 | -| policy_gradient_loss | -0.0067 | -| std | 0.375 | -| value_loss | 2e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4582 | -| time_elapsed | 36795 | -| total_timesteps | 586496 | -| train/ | | -| approx_kl | 0.0004868002 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.437 | -| explained_variance | -940 | -| learning_rate | 0.0003 | -| loss | -0.000709 | -| n_updates | 45810 | -| policy_gradient_loss | 0.000336 | -| std | 0.374 | -| value_loss | 6.56e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4583 | -| time_elapsed | 36798 | -| total_timesteps | 586624 | -| train/ | | -| approx_kl | 0.0035213844 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.435 | -| explained_variance | -2.97 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 45820 | -| policy_gradient_loss | -0.000216 | -| std | 0.373 | -| value_loss | 8.01e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4584 | -| time_elapsed | 36802 | -| total_timesteps | 586752 | -| train/ | | -| approx_kl | 0.00073313084 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.432 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 45830 | -| policy_gradient_loss | 0.00104 | -| std | 0.372 | -| value_loss | 8.93e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 15 | -| iterations | 4585 | -| time_elapsed | 36806 | -| total_timesteps | 586880 | -| train/ | | -| approx_kl | 0.023753747 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | -0.428 | -| explained_variance | -0.673 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 45840 | -| policy_gradient_loss | -0.00231 | -| std | 0.371 | -| value_loss | 5.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4586 | -| time_elapsed | 36808 | -| total_timesteps | 587008 | -| train/ | | -| approx_kl | 0.015093978 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.427 | -| explained_variance | -0.0055 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 45850 | -| policy_gradient_loss | -0.00533 | -| std | 0.371 | -| value_loss | 3.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4587 | -| time_elapsed | 36817 | -| total_timesteps | 587136 | -| train/ | | -| approx_kl | 0.008905765 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.426 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 45860 | -| policy_gradient_loss | -0.00145 | -| std | 0.37 | -| value_loss | 3.83e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4588 | -| time_elapsed | 36820 | -| total_timesteps | 587264 | -| train/ | | -| approx_kl | 0.031184684 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.425 | -| explained_variance | -50.1 | -| learning_rate | 0.0003 | -| loss | -0.0057 | -| n_updates | 45870 | -| policy_gradient_loss | -0.00412 | -| std | 0.37 | -| value_loss | 9.8e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4589 | -| time_elapsed | 36824 | -| total_timesteps | 587392 | -| train/ | | -| approx_kl | 0.0057678167 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.423 | -| explained_variance | -32.2 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 45880 | -| policy_gradient_loss | -0.00257 | -| std | 0.369 | -| value_loss | 5.18e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4590 | -| time_elapsed | 36827 | -| total_timesteps | 587520 | -| train/ | | -| approx_kl | 0.00032271305 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.423 | -| explained_variance | -3.04 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 45890 | -| policy_gradient_loss | 0.000921 | -| std | 0.37 | -| value_loss | 1.36e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4591 | -| time_elapsed | 36830 | -| total_timesteps | 587648 | -| train/ | | -| approx_kl | 0.0012907265 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.424 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.00978 | -| n_updates | 45900 | -| policy_gradient_loss | 0.00082 | -| std | 0.37 | -| value_loss | 1.78e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4592 | -| time_elapsed | 36834 | -| total_timesteps | 587776 | -| train/ | | -| approx_kl | 0.023312598 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | -0.424 | -| explained_variance | -0.0077 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 45910 | -| policy_gradient_loss | -0.00721 | -| std | 0.37 | -| value_loss | 1.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4593 | -| time_elapsed | 36837 | -| total_timesteps | 587904 | -| train/ | | -| approx_kl | 0.016115265 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.424 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 45920 | -| policy_gradient_loss | -0.00849 | -| std | 0.37 | -| value_loss | 6.03e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4594 | -| time_elapsed | 36839 | -| total_timesteps | 588032 | -| train/ | | -| approx_kl | 0.009877965 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.422 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.000585 | -| n_updates | 45930 | -| policy_gradient_loss | -0.00114 | -| std | 0.368 | -| value_loss | 7.61e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4595 | -| time_elapsed | 36846 | -| total_timesteps | 588160 | -| train/ | | -| approx_kl | 0.02158734 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.418 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 45940 | -| policy_gradient_loss | -0.0132 | -| std | 0.367 | -| value_loss | 0.000577 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4596 | -| time_elapsed | 36849 | -| total_timesteps | 588288 | -| train/ | | -| approx_kl | 0.010083441 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.417 | -| explained_variance | -1.39e+03 | -| learning_rate | 0.0003 | -| loss | -0.000754 | -| n_updates | 45950 | -| policy_gradient_loss | -0.000447 | -| std | 0.368 | -| value_loss | 2.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4597 | -| time_elapsed | 36853 | -| total_timesteps | 588416 | -| train/ | | -| approx_kl | 0.026685873 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.419 | -| explained_variance | -1.6e+03 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 45960 | -| policy_gradient_loss | -0.0059 | -| std | 0.368 | -| value_loss | 8.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4598 | -| time_elapsed | 36857 | -| total_timesteps | 588544 | -| train/ | | -| approx_kl | 0.016800603 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.42 | -| explained_variance | -25 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 45970 | -| policy_gradient_loss | -8.05e-05 | -| std | 0.368 | -| value_loss | 8.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4599 | -| time_elapsed | 36860 | -| total_timesteps | 588672 | -| train/ | | -| approx_kl | 0.012838248 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.42 | -| explained_variance | -22.4 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 45980 | -| policy_gradient_loss | -0.00167 | -| std | 0.368 | -| value_loss | 1.76e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4600 | -| time_elapsed | 36863 | -| total_timesteps | 588800 | -| train/ | | -| approx_kl | 0.0075842575 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.419 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 45990 | -| policy_gradient_loss | 0.000793 | -| std | 0.368 | -| value_loss | 3.12e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 15 | -| iterations | 4601 | -| time_elapsed | 36867 | -| total_timesteps | 588928 | -| train/ | | -| approx_kl | 0.017596763 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.418 | -| explained_variance | -0.345 | -| learning_rate | 0.0003 | -| loss | -0.000923 | -| n_updates | 46000 | -| policy_gradient_loss | -0.00231 | -| std | 0.367 | -| value_loss | 2.59e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4602 | -| time_elapsed | 36870 | -| total_timesteps | 589056 | -| train/ | | -| approx_kl | 0.010388717 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 46010 | -| policy_gradient_loss | -0.00377 | -| std | 0.366 | -| value_loss | 2.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4603 | -| time_elapsed | 36875 | -| total_timesteps | 589184 | -| train/ | | -| approx_kl | 0.013513004 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.414 | -| explained_variance | -8.86 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 46020 | -| policy_gradient_loss | -0.0106 | -| std | 0.366 | -| value_loss | 0.004 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4604 | -| time_elapsed | 36879 | -| total_timesteps | 589312 | -| train/ | | -| approx_kl | 0.015352836 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.412 | -| explained_variance | -4.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.00613 | -| n_updates | 46030 | -| policy_gradient_loss | -0.0026 | -| std | 0.365 | -| value_loss | 1.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4605 | -| time_elapsed | 36883 | -| total_timesteps | 589440 | -| train/ | | -| approx_kl | 0.021475332 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -1.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.000426 | -| n_updates | 46040 | -| policy_gradient_loss | -0.000709 | -| std | 0.363 | -| value_loss | 4.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4606 | -| time_elapsed | 36887 | -| total_timesteps | 589568 | -| train/ | | -| approx_kl | 0.018476745 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.405 | -| explained_variance | -2.43 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 46050 | -| policy_gradient_loss | -0.00918 | -| std | 0.362 | -| value_loss | 4.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4607 | -| time_elapsed | 36891 | -| total_timesteps | 589696 | -| train/ | | -| approx_kl | 0.025411284 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.402 | -| explained_variance | -29.3 | -| learning_rate | 0.0003 | -| loss | -0.00563 | -| n_updates | 46060 | -| policy_gradient_loss | -0.00441 | -| std | 0.361 | -| value_loss | 7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4608 | -| time_elapsed | 36893 | -| total_timesteps | 589824 | -| train/ | | -| approx_kl | 0.007084173 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.401 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 46070 | -| policy_gradient_loss | -0.0018 | -| std | 0.361 | -| value_loss | 1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 15 | -| iterations | 4609 | -| time_elapsed | 36896 | -| total_timesteps | 589952 | -| train/ | | -| approx_kl | 0.010682063 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.401 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 46080 | -| policy_gradient_loss | -0.00277 | -| std | 0.361 | -| value_loss | 8.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 15 | -| iterations | 4610 | -| time_elapsed | 36900 | -| total_timesteps | 590080 | -| train/ | | -| approx_kl | 0.029570414 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.401 | -| explained_variance | -0.00633 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 46090 | -| policy_gradient_loss | -0.0122 | -| std | 0.361 | -| value_loss | 1.4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 15 | -| iterations | 4611 | -| time_elapsed | 36906 | -| total_timesteps | 590208 | -| train/ | | -| approx_kl | 0.017790753 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -0.427 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 46100 | -| policy_gradient_loss | -0.00345 | -| std | 0.361 | -| value_loss | 0.00123 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 15 | -| iterations | 4612 | -| time_elapsed | 36908 | -| total_timesteps | 590336 | -| train/ | | -| approx_kl | 1.0937452e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -1.73e+03 | -| learning_rate | 0.0003 | -| loss | 0.000315 | -| n_updates | 46110 | -| policy_gradient_loss | 0.00242 | -| std | 0.361 | -| value_loss | 3.86e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 15 | -| iterations | 4613 | -| time_elapsed | 36912 | -| total_timesteps | 590464 | -| train/ | | -| approx_kl | 0.0026166826 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -3.52e+03 | -| learning_rate | 0.0003 | -| loss | -0.00405 | -| n_updates | 46120 | -| policy_gradient_loss | -9.08e-05 | -| std | 0.361 | -| value_loss | 1.57e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 15 | -| iterations | 4614 | -| time_elapsed | 36914 | -| total_timesteps | 590592 | -| train/ | | -| approx_kl | 0.0009731543 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -2.1e+03 | -| learning_rate | 0.0003 | -| loss | -0.00692 | -| n_updates | 46130 | -| policy_gradient_loss | 0.00201 | -| std | 0.361 | -| value_loss | 2.85e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 16 | -| iterations | 4615 | -| time_elapsed | 36917 | -| total_timesteps | 590720 | -| train/ | | -| approx_kl | 0.0014356053 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -17.4 | -| learning_rate | 0.0003 | -| loss | -0.00893 | -| n_updates | 46140 | -| policy_gradient_loss | 0.00117 | -| std | 0.361 | -| value_loss | 6.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 16 | -| iterations | 4616 | -| time_elapsed | 36920 | -| total_timesteps | 590848 | -| train/ | | -| approx_kl | 0.020690627 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | -0.401 | -| explained_variance | -0.724 | -| learning_rate | 0.0003 | -| loss | -0.000373 | -| n_updates | 46150 | -| policy_gradient_loss | -0.00342 | -| std | 0.362 | -| value_loss | 1.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 16 | -| iterations | 4617 | -| time_elapsed | 36922 | -| total_timesteps | 590976 | -| train/ | | -| approx_kl | 0.010342221 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.403 | -| explained_variance | -0.0819 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 46160 | -| policy_gradient_loss | -0.00163 | -| std | 0.363 | -| value_loss | 4.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4618 | -| time_elapsed | 36926 | -| total_timesteps | 591104 | -| train/ | | -| approx_kl | 0.008991742 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 46170 | -| policy_gradient_loss | -0.00225 | -| std | 0.363 | -| value_loss | 1.17e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4619 | -| time_elapsed | 36934 | -| total_timesteps | 591232 | -| train/ | | -| approx_kl | 0.025650581 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | 0.665 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 46180 | -| policy_gradient_loss | -0.00952 | -| std | 0.363 | -| value_loss | 0.00621 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4620 | -| time_elapsed | 36937 | -| total_timesteps | 591360 | -| train/ | | -| approx_kl | 0.0046217316 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -2.91e+03 | -| learning_rate | 0.0003 | -| loss | -0.00615 | -| n_updates | 46190 | -| policy_gradient_loss | -0.00124 | -| std | 0.364 | -| value_loss | 1.92e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4621 | -| time_elapsed | 36941 | -| total_timesteps | 591488 | -| train/ | | -| approx_kl | 0.00047767814 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -1.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 46200 | -| policy_gradient_loss | 0.00312 | -| std | 0.363 | -| value_loss | 1.23e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4622 | -| time_elapsed | 36944 | -| total_timesteps | 591616 | -| train/ | | -| approx_kl | 0.0011816788 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -123 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 46210 | -| policy_gradient_loss | 0.000295 | -| std | 0.363 | -| value_loss | 1.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4623 | -| time_elapsed | 36948 | -| total_timesteps | 591744 | -| train/ | | -| approx_kl | 0.0009927093 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -42.4 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 46220 | -| policy_gradient_loss | 0.000601 | -| std | 0.363 | -| value_loss | 3.11e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 16 | -| iterations | 4624 | -| time_elapsed | 36952 | -| total_timesteps | 591872 | -| train/ | | -| approx_kl | 0.00024462584 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.000138 | -| n_updates | 46230 | -| policy_gradient_loss | 0.000451 | -| std | 0.364 | -| value_loss | 4.02e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4625 | -| time_elapsed | 36955 | -| total_timesteps | 592000 | -| train/ | | -| approx_kl | 0.02008611 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 46240 | -| policy_gradient_loss | -0.0127 | -| std | 0.365 | -| value_loss | 1.36e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4626 | -| time_elapsed | 36957 | -| total_timesteps | 592128 | -| train/ | | -| approx_kl | 0.013565439 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.412 | -| explained_variance | -0.00391 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 46250 | -| policy_gradient_loss | -0.00403 | -| std | 0.365 | -| value_loss | 9.57e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4627 | -| time_elapsed | 36966 | -| total_timesteps | 592256 | -| train/ | | -| approx_kl | 0.013219289 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.412 | -| explained_variance | -3.35 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 46260 | -| policy_gradient_loss | -0.0014 | -| std | 0.366 | -| value_loss | 0.00218 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4628 | -| time_elapsed | 36970 | -| total_timesteps | 592384 | -| train/ | | -| approx_kl | 0.050273098 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | -0.413 | -| explained_variance | -3.64e+03 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 46270 | -| policy_gradient_loss | -0.0108 | -| std | 0.366 | -| value_loss | 1.68e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4629 | -| time_elapsed | 36974 | -| total_timesteps | 592512 | -| train/ | | -| approx_kl | 0.019800192 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | -0.415 | -| explained_variance | -2.7e+03 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 46280 | -| policy_gradient_loss | -0.0044 | -| std | 0.367 | -| value_loss | 4.17e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4630 | -| time_elapsed | 36978 | -| total_timesteps | 592640 | -| train/ | | -| approx_kl | 0.02028551 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -64 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 46290 | -| policy_gradient_loss | -0.0118 | -| std | 0.367 | -| value_loss | 7.57e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4631 | -| time_elapsed | 36983 | -| total_timesteps | 592768 | -| train/ | | -| approx_kl | 0.010885173 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.418 | -| explained_variance | -0.879 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 46300 | -| policy_gradient_loss | -0.00791 | -| std | 0.368 | -| value_loss | 1.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 16 | -| iterations | 4632 | -| time_elapsed | 36987 | -| total_timesteps | 592896 | -| train/ | | -| approx_kl | 0.012916331 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | -0.418 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.00184 | -| n_updates | 46310 | -| policy_gradient_loss | 0.000754 | -| std | 0.367 | -| value_loss | 4.71e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4633 | -| time_elapsed | 36991 | -| total_timesteps | 593024 | -| train/ | | -| approx_kl | 0.0066284128 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.416 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 46320 | -| policy_gradient_loss | -0.000671 | -| std | 0.366 | -| value_loss | 4.6e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4634 | -| time_elapsed | 36999 | -| total_timesteps | 593152 | -| train/ | | -| approx_kl | 0.03416565 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.412 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 46330 | -| policy_gradient_loss | -0.00713 | -| std | 0.365 | -| value_loss | 6.88e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4635 | -| time_elapsed | 37003 | -| total_timesteps | 593280 | -| train/ | | -| approx_kl | 0.0325366 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | -28.4 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 46340 | -| policy_gradient_loss | -0.00155 | -| std | 0.364 | -| value_loss | 2.35e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4636 | -| time_elapsed | 37006 | -| total_timesteps | 593408 | -| train/ | | -| approx_kl | 0.019828497 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.408 | -| explained_variance | -29.7 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 46350 | -| policy_gradient_loss | -0.00485 | -| std | 0.364 | -| value_loss | 1.05e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4637 | -| time_elapsed | 37009 | -| total_timesteps | 593536 | -| train/ | | -| approx_kl | 1.3693236e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 46360 | -| policy_gradient_loss | 0.00849 | -| std | 0.364 | -| value_loss | 1.48e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4638 | -| time_elapsed | 37012 | -| total_timesteps | 593664 | -| train/ | | -| approx_kl | 0.002289319 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.408 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 46370 | -| policy_gradient_loss | -0.000186 | -| std | 0.364 | -| value_loss | 9.68e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4639 | -| time_elapsed | 37016 | -| total_timesteps | 593792 | -| train/ | | -| approx_kl | 0.0012581288 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.000607 | -| n_updates | 46380 | -| policy_gradient_loss | 0.000598 | -| std | 0.364 | -| value_loss | 8.87e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 16 | -| iterations | 4640 | -| time_elapsed | 37020 | -| total_timesteps | 593920 | -| train/ | | -| approx_kl | 0.010557072 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | 0.000297 | -| learning_rate | 0.0003 | -| loss | -0.0269 | -| n_updates | 46390 | -| policy_gradient_loss | -0.00955 | -| std | 0.365 | -| value_loss | 2.36e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4641 | -| time_elapsed | 37023 | -| total_timesteps | 594048 | -| train/ | | -| approx_kl | 8.132635e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -0.00825 | -| learning_rate | 0.0003 | -| loss | -0.000703 | -| n_updates | 46400 | -| policy_gradient_loss | 0.00109 | -| std | 0.364 | -| value_loss | 3.95e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4642 | -| time_elapsed | 37029 | -| total_timesteps | 594176 | -| train/ | | -| approx_kl | 0.0021372023 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | 0.758 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 46410 | -| policy_gradient_loss | -6.98e-05 | -| std | 0.363 | -| value_loss | 0.00259 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4643 | -| time_elapsed | 37032 | -| total_timesteps | 594304 | -| train/ | | -| approx_kl | 0.047318034 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -96.5 | -| learning_rate | 0.0003 | -| loss | -0.00899 | -| n_updates | 46420 | -| policy_gradient_loss | -0.00684 | -| std | 0.363 | -| value_loss | 9.72e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4644 | -| time_elapsed | 37036 | -| total_timesteps | 594432 | -| train/ | | -| approx_kl | 0.0063989335 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -85.1 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 46430 | -| policy_gradient_loss | -0.00368 | -| std | 0.363 | -| value_loss | 5.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4645 | -| time_elapsed | 37038 | -| total_timesteps | 594560 | -| train/ | | -| approx_kl | 0.017516563 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -3.41 | -| learning_rate | 0.0003 | -| loss | 0.000282 | -| n_updates | 46440 | -| policy_gradient_loss | -0.000519 | -| std | 0.364 | -| value_loss | 3.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4646 | -| time_elapsed | 37042 | -| total_timesteps | 594688 | -| train/ | | -| approx_kl | 0.016603973 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.408 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.00834 | -| n_updates | 46450 | -| policy_gradient_loss | -0.0076 | -| std | 0.364 | -| value_loss | 3.02e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4647 | -| time_elapsed | 37046 | -| total_timesteps | 594816 | -| train/ | | -| approx_kl | 0.0060211346 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.000731 | -| n_updates | 46460 | -| policy_gradient_loss | -0.000745 | -| std | 0.363 | -| value_loss | 4.13e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 16 | -| iterations | 4648 | -| time_elapsed | 37049 | -| total_timesteps | 594944 | -| train/ | | -| approx_kl | 0.0137105435 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.403 | -| explained_variance | 0.00581 | -| learning_rate | 0.0003 | -| loss | -0.00964 | -| n_updates | 46470 | -| policy_gradient_loss | -0.00561 | -| std | 0.361 | -| value_loss | 1.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4649 | -| time_elapsed | 37054 | -| total_timesteps | 595072 | -| train/ | | -| approx_kl | 0.008938918 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.401 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 46480 | -| policy_gradient_loss | -0.00405 | -| std | 0.361 | -| value_loss | 6.82e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4650 | -| time_elapsed | 37060 | -| total_timesteps | 595200 | -| train/ | | -| approx_kl | 0.00299318 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 46490 | -| policy_gradient_loss | -0.00184 | -| std | 0.361 | -| value_loss | 5e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4651 | -| time_elapsed | 37064 | -| total_timesteps | 595328 | -| train/ | | -| approx_kl | 0.00076935906 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.399 | -| explained_variance | -6.14 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 46500 | -| policy_gradient_loss | 0.00174 | -| std | 0.361 | -| value_loss | 3.67e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4652 | -| time_elapsed | 37068 | -| total_timesteps | 595456 | -| train/ | | -| approx_kl | 0.001398134 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -5.36 | -| learning_rate | 0.0003 | -| loss | -0.0049 | -| n_updates | 46510 | -| policy_gradient_loss | 0.000616 | -| std | 0.361 | -| value_loss | 1.93e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4653 | -| time_elapsed | 37071 | -| total_timesteps | 595584 | -| train/ | | -| approx_kl | 0.014185499 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.399 | -| explained_variance | -0.474 | -| learning_rate | 0.0003 | -| loss | 0.00064 | -| n_updates | 46520 | -| policy_gradient_loss | -0.000171 | -| std | 0.36 | -| value_loss | 1.91e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4654 | -| time_elapsed | 37074 | -| total_timesteps | 595712 | -| train/ | | -| approx_kl | 0.010723081 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.396 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 46530 | -| policy_gradient_loss | -0.00576 | -| std | 0.359 | -| value_loss | 1.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4655 | -| time_elapsed | 37077 | -| total_timesteps | 595840 | -| train/ | | -| approx_kl | 0.020590339 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.395 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 46540 | -| policy_gradient_loss | -0.00634 | -| std | 0.359 | -| value_loss | 1.2e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4656 | -| time_elapsed | 37080 | -| total_timesteps | 595968 | -| train/ | | -| approx_kl | 0.01237238 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.00953 | -| n_updates | 46550 | -| policy_gradient_loss | -0.00481 | -| std | 0.358 | -| value_loss | 1.91e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4657 | -| time_elapsed | 37084 | -| total_timesteps | 596096 | -| train/ | | -| approx_kl | 0.01644174 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00053 | -| n_updates | 46560 | -| policy_gradient_loss | -0.00176 | -| std | 0.357 | -| value_loss | 2.16e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4658 | -| time_elapsed | 37090 | -| total_timesteps | 596224 | -| train/ | | -| approx_kl | 0.020671796 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -0.389 | -| explained_variance | -2.4 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 46570 | -| policy_gradient_loss | -0.00165 | -| std | 0.357 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4659 | -| time_elapsed | 37093 | -| total_timesteps | 596352 | -| train/ | | -| approx_kl | 0.017480688 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | -0.39 | -| explained_variance | -4.17e+03 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 46580 | -| policy_gradient_loss | -0.0102 | -| std | 0.358 | -| value_loss | 6.37e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4660 | -| time_elapsed | 37097 | -| total_timesteps | 596480 | -| train/ | | -| approx_kl | 0.0007405183 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -2.79e+03 | -| learning_rate | 0.0003 | -| loss | -3.95e-05 | -| n_updates | 46590 | -| policy_gradient_loss | -1.48e-05 | -| std | 0.357 | -| value_loss | 1.76e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4661 | -| time_elapsed | 37100 | -| total_timesteps | 596608 | -| train/ | | -| approx_kl | 0.02169274 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.389 | -| explained_variance | -65.4 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 46600 | -| policy_gradient_loss | -0.0141 | -| std | 0.357 | -| value_loss | 2.49e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4662 | -| time_elapsed | 37103 | -| total_timesteps | 596736 | -| train/ | | -| approx_kl | 0.0048519527 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.389 | -| explained_variance | -4.34 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 46610 | -| policy_gradient_loss | -0.00344 | -| std | 0.357 | -| value_loss | 4.34e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4663 | -| time_elapsed | 37106 | -| total_timesteps | 596864 | -| train/ | | -| approx_kl | 0.026858432 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.39 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.00495 | -| n_updates | 46620 | -| policy_gradient_loss | -0.00629 | -| std | 0.358 | -| value_loss | 1.99e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 16 | -| iterations | 4664 | -| time_elapsed | 37108 | -| total_timesteps | 596992 | -| train/ | | -| approx_kl | 0.012251634 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 46630 | -| policy_gradient_loss | -0.00464 | -| std | 0.358 | -| value_loss | 9.6e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4665 | -| time_elapsed | 37110 | -| total_timesteps | 597120 | -| train/ | | -| approx_kl | 0.01151807 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 46640 | -| policy_gradient_loss | -0.00679 | -| std | 0.358 | -| value_loss | 7.68e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4666 | -| time_elapsed | 37119 | -| total_timesteps | 597248 | -| train/ | | -| approx_kl | 0.027365513 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | 0.679 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 46650 | -| policy_gradient_loss | -0.00567 | -| std | 0.358 | -| value_loss | 0.00324 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4667 | -| time_elapsed | 37123 | -| total_timesteps | 597376 | -| train/ | | -| approx_kl | 0.00016107596 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.392 | -| explained_variance | -1.26e+03 | -| learning_rate | 0.0003 | -| loss | 0.00184 | -| n_updates | 46660 | -| policy_gradient_loss | 0.0048 | -| std | 0.358 | -| value_loss | 8.47e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4668 | -| time_elapsed | 37127 | -| total_timesteps | 597504 | -| train/ | | -| approx_kl | 0.050008494 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | -0.392 | -| explained_variance | -550 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 46670 | -| policy_gradient_loss | -0.00907 | -| std | 0.358 | -| value_loss | 3.68e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4669 | -| time_elapsed | 37130 | -| total_timesteps | 597632 | -| train/ | | -| approx_kl | 3.7424266e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.392 | -| explained_variance | -25.8 | -| learning_rate | 0.0003 | -| loss | 0.000541 | -| n_updates | 46680 | -| policy_gradient_loss | 0.00284 | -| std | 0.358 | -| value_loss | 1.66e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4670 | -| time_elapsed | 37133 | -| total_timesteps | 597760 | -| train/ | | -| approx_kl | 0.0049211876 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.000874 | -| n_updates | 46690 | -| policy_gradient_loss | 0.00113 | -| std | 0.359 | -| value_loss | 5.77e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4671 | -| time_elapsed | 37137 | -| total_timesteps | 597888 | -| train/ | | -| approx_kl | 0.017173363 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -0.0828 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 46700 | -| policy_gradient_loss | -0.00412 | -| std | 0.359 | -| value_loss | 5.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4672 | -| time_elapsed | 37140 | -| total_timesteps | 598016 | -| train/ | | -| approx_kl | 0.016298052 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.392 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 46710 | -| policy_gradient_loss | -0.00289 | -| std | 0.358 | -| value_loss | 4.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4673 | -| time_elapsed | 37148 | -| total_timesteps | 598144 | -| train/ | | -| approx_kl | 0.018546429 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.39 | -| explained_variance | 0.689 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 46720 | -| policy_gradient_loss | -0.0108 | -| std | 0.357 | -| value_loss | 0.000359 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4674 | -| time_elapsed | 37152 | -| total_timesteps | 598272 | -| train/ | | -| approx_kl | 0.0074454756 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.389 | -| explained_variance | -21.7 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 46730 | -| policy_gradient_loss | -0.0068 | -| std | 0.357 | -| value_loss | 3.74e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4675 | -| time_elapsed | 37156 | -| total_timesteps | 598400 | -| train/ | | -| approx_kl | 0.0206451 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.39 | -| explained_variance | -71.1 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 46740 | -| policy_gradient_loss | -0.0124 | -| std | 0.358 | -| value_loss | 2.67e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4676 | -| time_elapsed | 37158 | -| total_timesteps | 598528 | -| train/ | | -| approx_kl | 0.02977561 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.39 | -| explained_variance | -5.69 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 46750 | -| policy_gradient_loss | -0.0121 | -| std | 0.358 | -| value_loss | 3.28e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4677 | -| time_elapsed | 37162 | -| total_timesteps | 598656 | -| train/ | | -| approx_kl | 0.0011744653 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.00921 | -| n_updates | 46760 | -| policy_gradient_loss | 0.00146 | -| std | 0.358 | -| value_loss | 7.74e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4678 | -| time_elapsed | 37164 | -| total_timesteps | 598784 | -| train/ | | -| approx_kl | 0.0011792909 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.00198 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 46770 | -| policy_gradient_loss | 0.00177 | -| std | 0.358 | -| value_loss | 4.52e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4679 | -| time_elapsed | 37167 | -| total_timesteps | 598912 | -| train/ | | -| approx_kl | 0.0010718782 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | 0.00629 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 46780 | -| policy_gradient_loss | 0.000312 | -| std | 0.358 | -| value_loss | 4.65e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4680 | -| time_elapsed | 37170 | -| total_timesteps | 599040 | -| train/ | | -| approx_kl | 0.01854795 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | 0.00134 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 46790 | -| policy_gradient_loss | -0.00169 | -| std | 0.359 | -| value_loss | 4.72e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4681 | -| time_elapsed | 37176 | -| total_timesteps | 599168 | -| train/ | | -| approx_kl | 0.010633422 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 46800 | -| policy_gradient_loss | -0.000816 | -| std | 0.358 | -| value_loss | 0.000133 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4682 | -| time_elapsed | 37180 | -| total_timesteps | 599296 | -| train/ | | -| approx_kl | 0.015616916 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -1.98e+03 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 46810 | -| policy_gradient_loss | -0.00102 | -| std | 0.359 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4683 | -| time_elapsed | 37184 | -| total_timesteps | 599424 | -| train/ | | -| approx_kl | 0.026743047 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -1.92e+03 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 46820 | -| policy_gradient_loss | -0.00806 | -| std | 0.359 | -| value_loss | 4.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4684 | -| time_elapsed | 37186 | -| total_timesteps | 599552 | -| train/ | | -| approx_kl | 0.002113692 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.395 | -| explained_variance | -20.3 | -| learning_rate | 0.0003 | -| loss | -0.000253 | -| n_updates | 46830 | -| policy_gradient_loss | -0.00011 | -| std | 0.359 | -| value_loss | 1.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4685 | -| time_elapsed | 37189 | -| total_timesteps | 599680 | -| train/ | | -| approx_kl | 0.013170222 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.396 | -| explained_variance | -14.7 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 46840 | -| policy_gradient_loss | -0.00362 | -| std | 0.359 | -| value_loss | 1.63e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4686 | -| time_elapsed | 37192 | -| total_timesteps | 599808 | -| train/ | | -| approx_kl | 7.010577e-05 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.395 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 46850 | -| policy_gradient_loss | 0.00452 | -| std | 0.359 | -| value_loss | 1.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4687 | -| time_elapsed | 37196 | -| total_timesteps | 599936 | -| train/ | | -| approx_kl | 0.0015976299 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.395 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 46860 | -| policy_gradient_loss | 5.18e-05 | -| std | 0.359 | -| value_loss | 1.45e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4688 | -| time_elapsed | 37198 | -| total_timesteps | 600064 | -| train/ | | -| approx_kl | 0.00091410195 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.396 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 46870 | -| policy_gradient_loss | 0.000299 | -| std | 0.36 | -| value_loss | 4.38e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4689 | -| time_elapsed | 37204 | -| total_timesteps | 600192 | -| train/ | | -| approx_kl | 0.001073671 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.398 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.00897 | -| n_updates | 46880 | -| policy_gradient_loss | 0.000909 | -| std | 0.36 | -| value_loss | 9.95e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4690 | -| time_elapsed | 37208 | -| total_timesteps | 600320 | -| train/ | | -| approx_kl | 0.0002722321 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.4 | -| explained_variance | -2.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.0009 | -| n_updates | 46890 | -| policy_gradient_loss | 0.000215 | -| std | 0.362 | -| value_loss | 1.69e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4691 | -| time_elapsed | 37211 | -| total_timesteps | 600448 | -| train/ | | -| approx_kl | 0.002321518 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.403 | -| explained_variance | -1.81e+03 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 46900 | -| policy_gradient_loss | -4.59e-05 | -| std | 0.363 | -| value_loss | 3.96e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4692 | -| time_elapsed | 37215 | -| total_timesteps | 600576 | -| train/ | | -| approx_kl | 0.00021137623 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.405 | -| explained_variance | -12.9 | -| learning_rate | 0.0003 | -| loss | -0.000457 | -| n_updates | 46910 | -| policy_gradient_loss | 0.000412 | -| std | 0.363 | -| value_loss | 1.86e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4693 | -| time_elapsed | 37219 | -| total_timesteps | 600704 | -| train/ | | -| approx_kl | 0.0025636759 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -20 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 46920 | -| policy_gradient_loss | -0.000511 | -| std | 0.363 | -| value_loss | 4.09e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4694 | -| time_elapsed | 37223 | -| total_timesteps | 600832 | -| train/ | | -| approx_kl | 0.0008813618 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -3.89 | -| learning_rate | 0.0003 | -| loss | -0.00627 | -| n_updates | 46930 | -| policy_gradient_loss | 0.00206 | -| std | 0.363 | -| value_loss | 1.63e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4695 | -| time_elapsed | 37226 | -| total_timesteps | 600960 | -| train/ | | -| approx_kl | 0.00109229 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | -0.00289 | -| n_updates | 46940 | -| policy_gradient_loss | 0.000394 | -| std | 0.364 | -| value_loss | 4.61e-12 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4696 | -| time_elapsed | 37229 | -| total_timesteps | 601088 | -| train/ | | -| approx_kl | 0.022742853 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | -0.408 | -| explained_variance | 0.0025 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 46950 | -| policy_gradient_loss | -0.00561 | -| std | 0.364 | -| value_loss | 9.15e-13 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4697 | -| time_elapsed | 37235 | -| total_timesteps | 601216 | -| train/ | | -| approx_kl | 0.022597278 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 46960 | -| policy_gradient_loss | -0.002 | -| std | 0.364 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4698 | -| time_elapsed | 37238 | -| total_timesteps | 601344 | -| train/ | | -| approx_kl | 0.028958771 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -1.38e+03 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 46970 | -| policy_gradient_loss | -0.00416 | -| std | 0.364 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4699 | -| time_elapsed | 37241 | -| total_timesteps | 601472 | -| train/ | | -| approx_kl | 0.007955023 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -3.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.00723 | -| n_updates | 46980 | -| policy_gradient_loss | -0.00214 | -| std | 0.364 | -| value_loss | 2.43e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4700 | -| time_elapsed | 37246 | -| total_timesteps | 601600 | -| train/ | | -| approx_kl | 0.00016802689 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -171 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 46990 | -| policy_gradient_loss | 0.00402 | -| std | 0.364 | -| value_loss | 7.06e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4701 | -| time_elapsed | 37250 | -| total_timesteps | 601728 | -| train/ | | -| approx_kl | 0.0015297905 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.408 | -| explained_variance | -29.5 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 47000 | -| policy_gradient_loss | 0.000216 | -| std | 0.364 | -| value_loss | 1.4e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4702 | -| time_elapsed | 37254 | -| total_timesteps | 601856 | -| train/ | | -| approx_kl | 0.00025361124 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -4.23 | -| learning_rate | 0.0003 | -| loss | -0.000435 | -| n_updates | 47010 | -| policy_gradient_loss | 0.00038 | -| std | 0.363 | -| value_loss | 3.46e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4703 | -| time_elapsed | 37257 | -| total_timesteps | 601984 | -| train/ | | -| approx_kl | 0.00223774 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | 0.00333 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 47020 | -| policy_gradient_loss | -0.000535 | -| std | 0.363 | -| value_loss | 1.28e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4704 | -| time_elapsed | 37260 | -| total_timesteps | 602112 | -| train/ | | -| approx_kl | 0.00063308934 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -0.354 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 47030 | -| policy_gradient_loss | 0.00244 | -| std | 0.363 | -| value_loss | 5.09e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4705 | -| time_elapsed | 37270 | -| total_timesteps | 602240 | -| train/ | | -| approx_kl | 0.0013408968 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.405 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 47040 | -| policy_gradient_loss | 0.000647 | -| std | 0.362 | -| value_loss | 1.41e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4706 | -| time_elapsed | 37274 | -| total_timesteps | 602368 | -| train/ | | -| approx_kl | 0.0011032484 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.404 | -| explained_variance | -6.03 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 47050 | -| policy_gradient_loss | 0.000547 | -| std | 0.362 | -| value_loss | 7.88e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4707 | -| time_elapsed | 37277 | -| total_timesteps | 602496 | -| train/ | | -| approx_kl | 0.001033348 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.404 | -| explained_variance | -7.75 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 47060 | -| policy_gradient_loss | 0.000695 | -| std | 0.363 | -| value_loss | 3.63e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4708 | -| time_elapsed | 37281 | -| total_timesteps | 602624 | -| train/ | | -| approx_kl | 0.03359243 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | -0.405 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 47070 | -| policy_gradient_loss | -0.0104 | -| std | 0.363 | -| value_loss | 1.93e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4709 | -| time_elapsed | 37284 | -| total_timesteps | 602752 | -| train/ | | -| approx_kl | 0.012368124 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.406 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 47080 | -| policy_gradient_loss | -0.00256 | -| std | 0.364 | -| value_loss | 9.63e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 16 | -| iterations | 4710 | -| time_elapsed | 37287 | -| total_timesteps | 602880 | -| train/ | | -| approx_kl | 0.010696147 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 47090 | -| policy_gradient_loss | -0.00166 | -| std | 0.365 | -| value_loss | 4.6e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4711 | -| time_elapsed | 37290 | -| total_timesteps | 603008 | -| train/ | | -| approx_kl | 0.00981167 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | -0.0018 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 47100 | -| policy_gradient_loss | -0.00424 | -| std | 0.365 | -| value_loss | 3.14e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4712 | -| time_elapsed | 37299 | -| total_timesteps | 603136 | -| train/ | | -| approx_kl | 0.0033434806 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.411 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 47110 | -| policy_gradient_loss | -0.000561 | -| std | 0.365 | -| value_loss | 0.00115 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4713 | -| time_elapsed | 37303 | -| total_timesteps | 603264 | -| train/ | | -| approx_kl | 0.025982434 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | -2.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 47120 | -| policy_gradient_loss | -0.015 | -| std | 0.364 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4714 | -| time_elapsed | 37306 | -| total_timesteps | 603392 | -| train/ | | -| approx_kl | 0.0055904286 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.409 | -| explained_variance | -4.93e+03 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 47130 | -| policy_gradient_loss | -0.000847 | -| std | 0.365 | -| value_loss | 1.88e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4715 | -| time_elapsed | 37309 | -| total_timesteps | 603520 | -| train/ | | -| approx_kl | 0.0025493046 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.41 | -| explained_variance | -220 | -| learning_rate | 0.0003 | -| loss | 0.000295 | -| n_updates | 47140 | -| policy_gradient_loss | 0.000422 | -| std | 0.364 | -| value_loss | 3.25e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4716 | -| time_elapsed | 37313 | -| total_timesteps | 603648 | -| train/ | | -| approx_kl | 0.020389853 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | -0.407 | -| explained_variance | -39.9 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 47150 | -| policy_gradient_loss | -0.00253 | -| std | 0.363 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4717 | -| time_elapsed | 37315 | -| total_timesteps | 603776 | -| train/ | | -| approx_kl | 0.0065426314 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.405 | -| explained_variance | -0.639 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 47160 | -| policy_gradient_loss | -0.00105 | -| std | 0.363 | -| value_loss | 1.2e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 16 | -| iterations | 4718 | -| time_elapsed | 37317 | -| total_timesteps | 603904 | -| train/ | | -| approx_kl | 0.009571151 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.404 | -| explained_variance | -3.26 | -| learning_rate | 0.0003 | -| loss | -0.000362 | -| n_updates | 47170 | -| policy_gradient_loss | -0.000678 | -| std | 0.362 | -| value_loss | 2.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4719 | -| time_elapsed | 37320 | -| total_timesteps | 604032 | -| train/ | | -| approx_kl | 0.006865631 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.403 | -| explained_variance | -0.627 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 47180 | -| policy_gradient_loss | -0.00278 | -| std | 0.362 | -| value_loss | 8.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4720 | -| time_elapsed | 37328 | -| total_timesteps | 604160 | -| train/ | | -| approx_kl | 0.00338285 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.403 | -| explained_variance | -0.364 | -| learning_rate | 0.0003 | -| loss | -4.71e-05 | -| n_updates | 47190 | -| policy_gradient_loss | -0.000232 | -| std | 0.362 | -| value_loss | 0.00149 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4721 | -| time_elapsed | 37333 | -| total_timesteps | 604288 | -| train/ | | -| approx_kl | 0.025065113 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.404 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 47200 | -| policy_gradient_loss | -0.00243 | -| std | 0.362 | -| value_loss | 3.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4722 | -| time_elapsed | 37335 | -| total_timesteps | 604416 | -| train/ | | -| approx_kl | 0.011962643 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.402 | -| explained_variance | -421 | -| learning_rate | 0.0003 | -| loss | -0.00083 | -| n_updates | 47210 | -| policy_gradient_loss | -0.000729 | -| std | 0.361 | -| value_loss | 3.79e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4723 | -| time_elapsed | 37338 | -| total_timesteps | 604544 | -| train/ | | -| approx_kl | 0.018478386 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.398 | -| explained_variance | -3.36 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 47220 | -| policy_gradient_loss | -0.0125 | -| std | 0.36 | -| value_loss | 4.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4724 | -| time_elapsed | 37341 | -| total_timesteps | 604672 | -| train/ | | -| approx_kl | 0.034292378 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | -0.396 | -| explained_variance | -19.2 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 47230 | -| policy_gradient_loss | -0.0112 | -| std | 0.359 | -| value_loss | 3.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4725 | -| time_elapsed | 37344 | -| total_timesteps | 604800 | -| train/ | | -| approx_kl | 0.0130778365 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.395 | -| explained_variance | -44.1 | -| learning_rate | 0.0003 | -| loss | -0.00473 | -| n_updates | 47240 | -| policy_gradient_loss | -0.00228 | -| std | 0.359 | -| value_loss | 9.18e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4726 | -| time_elapsed | 37346 | -| total_timesteps | 604928 | -| train/ | | -| approx_kl | 0.0024563386 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -4.43 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 47250 | -| policy_gradient_loss | -0.000239 | -| std | 0.359 | -| value_loss | 2.05e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4727 | -| time_elapsed | 37348 | -| total_timesteps | 605056 | -| train/ | | -| approx_kl | 0.0008679549 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -0.00913 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 47260 | -| policy_gradient_loss | 0.00167 | -| std | 0.359 | -| value_loss | 4.67e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4728 | -| time_elapsed | 37354 | -| total_timesteps | 605184 | -| train/ | | -| approx_kl | 0.0011306843 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | 0.000896 | -| n_updates | 47270 | -| policy_gradient_loss | 0.000472 | -| std | 0.359 | -| value_loss | 0.00116 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4729 | -| time_elapsed | 37358 | -| total_timesteps | 605312 | -| train/ | | -| approx_kl | 0.021482117 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.396 | -| explained_variance | -3e+03 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 47280 | -| policy_gradient_loss | -0.00176 | -| std | 0.359 | -| value_loss | 7.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4730 | -| time_elapsed | 37360 | -| total_timesteps | 605440 | -| train/ | | -| approx_kl | 0.0068204654 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.394 | -| explained_variance | -5.2e+03 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 47290 | -| policy_gradient_loss | -0.00155 | -| std | 0.359 | -| value_loss | 2.29e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4731 | -| time_elapsed | 37362 | -| total_timesteps | 605568 | -| train/ | | -| approx_kl | 0.0002937098 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -42.9 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 47300 | -| policy_gradient_loss | 0.00294 | -| std | 0.358 | -| value_loss | 1.1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4732 | -| time_elapsed | 37364 | -| total_timesteps | 605696 | -| train/ | | -| approx_kl | 0.027203176 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -0.977 | -| learning_rate | 0.0003 | -| loss | 0.00247 | -| n_updates | 47310 | -| policy_gradient_loss | -0.00269 | -| std | 0.359 | -| value_loss | 1.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4733 | -| time_elapsed | 37367 | -| total_timesteps | 605824 | -| train/ | | -| approx_kl | 0.011154151 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -0.0895 | -| learning_rate | 0.0003 | -| loss | -0.000458 | -| n_updates | 47320 | -| policy_gradient_loss | -0.000987 | -| std | 0.358 | -| value_loss | 8.52e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 16 | -| iterations | 4734 | -| time_elapsed | 37371 | -| total_timesteps | 605952 | -| train/ | | -| approx_kl | 0.0035194848 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.00545 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 47330 | -| policy_gradient_loss | -0.000206 | -| std | 0.358 | -| value_loss | 1.29e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4735 | -| time_elapsed | 37373 | -| total_timesteps | 606080 | -| train/ | | -| approx_kl | 0.011545111 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 47340 | -| policy_gradient_loss | -0.00205 | -| std | 0.358 | -| value_loss | 5.05e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4736 | -| time_elapsed | 37380 | -| total_timesteps | 606208 | -| train/ | | -| approx_kl | 0.03152805 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 47350 | -| policy_gradient_loss | -0.00631 | -| std | 0.358 | -| value_loss | 0.000724 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4737 | -| time_elapsed | 37383 | -| total_timesteps | 606336 | -| train/ | | -| approx_kl | 0.00024150545 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -59.9 | -| learning_rate | 0.0003 | -| loss | 0.00058 | -| n_updates | 47360 | -| policy_gradient_loss | 0.00146 | -| std | 0.358 | -| value_loss | 1.07e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4738 | -| time_elapsed | 37386 | -| total_timesteps | 606464 | -| train/ | | -| approx_kl | 0.0021468466 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -258 | -| learning_rate | 0.0003 | -| loss | -0.00998 | -| n_updates | 47370 | -| policy_gradient_loss | -0.000546 | -| std | 0.358 | -| value_loss | 7.1e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4739 | -| time_elapsed | 37389 | -| total_timesteps | 606592 | -| train/ | | -| approx_kl | 0.02047088 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.393 | -| explained_variance | -13.8 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 47380 | -| policy_gradient_loss | -0.00481 | -| std | 0.358 | -| value_loss | 8.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4740 | -| time_elapsed | 37393 | -| total_timesteps | 606720 | -| train/ | | -| approx_kl | 0.015344857 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.392 | -| explained_variance | -4.13 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 47390 | -| policy_gradient_loss | -0.00264 | -| std | 0.358 | -| value_loss | 4.75e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4741 | -| time_elapsed | 37397 | -| total_timesteps | 606848 | -| train/ | | -| approx_kl | 0.0105233295 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.391 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 47400 | -| policy_gradient_loss | -0.00229 | -| std | 0.357 | -| value_loss | 3.48e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4742 | -| time_elapsed | 37400 | -| total_timesteps | 606976 | -| train/ | | -| approx_kl | 0.0076499656 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.388 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00875 | -| n_updates | 47410 | -| policy_gradient_loss | -0.0032 | -| std | 0.356 | -| value_loss | 1.97e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4743 | -| time_elapsed | 37402 | -| total_timesteps | 607104 | -| train/ | | -| approx_kl | 0.0015815818 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.382 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | -0.000613 | -| n_updates | 47420 | -| policy_gradient_loss | -0.000134 | -| std | 0.353 | -| value_loss | 8.01e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4744 | -| time_elapsed | 37410 | -| total_timesteps | 607232 | -| train/ | | -| approx_kl | 0.028148243 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.377 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 47430 | -| policy_gradient_loss | -0.0113 | -| std | 0.352 | -| value_loss | 0.003 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4745 | -| time_elapsed | 37414 | -| total_timesteps | 607360 | -| train/ | | -| approx_kl | 0.0066096783 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.375 | -| explained_variance | -255 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 47440 | -| policy_gradient_loss | -0.00951 | -| std | 0.352 | -| value_loss | 1.06e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4746 | -| time_elapsed | 37417 | -| total_timesteps | 607488 | -| train/ | | -| approx_kl | 0.008634882 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.374 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 47450 | -| policy_gradient_loss | -0.00359 | -| std | 0.352 | -| value_loss | 7.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4747 | -| time_elapsed | 37420 | -| total_timesteps | 607616 | -| train/ | | -| approx_kl | 0.01753226 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -5.13 | -| learning_rate | 0.0003 | -| loss | 0.000624 | -| n_updates | 47460 | -| policy_gradient_loss | -0.0014 | -| std | 0.351 | -| value_loss | 9.19e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4748 | -| time_elapsed | 37424 | -| total_timesteps | 607744 | -| train/ | | -| approx_kl | 0.0264922 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | 0.0017 | -| n_updates | 47470 | -| policy_gradient_loss | -0.00173 | -| std | 0.351 | -| value_loss | 3.43e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4749 | -| time_elapsed | 37426 | -| total_timesteps | 607872 | -| train/ | | -| approx_kl | 0.014604907 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | 0.00339 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 47480 | -| policy_gradient_loss | -0.00372 | -| std | 0.352 | -| value_loss | 1.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4750 | -| time_elapsed | 37429 | -| total_timesteps | 608000 | -| train/ | | -| approx_kl | 0.015342204 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.375 | -| explained_variance | -0.00949 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 47490 | -| policy_gradient_loss | -0.00954 | -| std | 0.352 | -| value_loss | 8.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4751 | -| time_elapsed | 37432 | -| total_timesteps | 608128 | -| train/ | | -| approx_kl | 0.016058642 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.376 | -| explained_variance | 0.00183 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 47500 | -| policy_gradient_loss | -0.00672 | -| std | 0.352 | -| value_loss | 3.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4752 | -| time_elapsed | 37439 | -| total_timesteps | 608256 | -| train/ | | -| approx_kl | 0.025920255 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.377 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 47510 | -| policy_gradient_loss | -0.0124 | -| std | 0.353 | -| value_loss | 0.000636 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4753 | -| time_elapsed | 37442 | -| total_timesteps | 608384 | -| train/ | | -| approx_kl | 0.027804755 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.378 | -| explained_variance | -36.4 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 47520 | -| policy_gradient_loss | -0.00352 | -| std | 0.354 | -| value_loss | 2.82e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4754 | -| time_elapsed | 37446 | -| total_timesteps | 608512 | -| train/ | | -| approx_kl | 5.3035095e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.38 | -| explained_variance | -88.8 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 47530 | -| policy_gradient_loss | 0.00444 | -| std | 0.354 | -| value_loss | 1.53e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4755 | -| time_elapsed | 37449 | -| total_timesteps | 608640 | -| train/ | | -| approx_kl | 0.01926634 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.381 | -| explained_variance | -4.61 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 47540 | -| policy_gradient_loss | -0.00261 | -| std | 0.354 | -| value_loss | 4.42e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4756 | -| time_elapsed | 37451 | -| total_timesteps | 608768 | -| train/ | | -| approx_kl | 0.014126468 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.382 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 47550 | -| policy_gradient_loss | -0.0108 | -| std | 0.355 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4757 | -| time_elapsed | 37455 | -| total_timesteps | 608896 | -| train/ | | -| approx_kl | 0.005932131 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.382 | -| explained_variance | 0.00511 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 47560 | -| policy_gradient_loss | -0.000713 | -| std | 0.354 | -| value_loss | 1.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4758 | -| time_elapsed | 37457 | -| total_timesteps | 609024 | -| train/ | | -| approx_kl | 0.009571947 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.379 | -| explained_variance | 0.00644 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 47570 | -| policy_gradient_loss | -0.00221 | -| std | 0.353 | -| value_loss | 4.69e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4759 | -| time_elapsed | 37464 | -| total_timesteps | 609152 | -| train/ | | -| approx_kl | 0.0038898983 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.376 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | 0.000451 | -| n_updates | 47580 | -| policy_gradient_loss | -9.01e-05 | -| std | 0.351 | -| value_loss | 0.00172 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4760 | -| time_elapsed | 37468 | -| total_timesteps | 609280 | -| train/ | | -| approx_kl | 0.032372754 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -772 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 47590 | -| policy_gradient_loss | -0.00564 | -| std | 0.35 | -| value_loss | 1.82e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4761 | -| time_elapsed | 37471 | -| total_timesteps | 609408 | -| train/ | | -| approx_kl | 0.056909613 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -693 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 47600 | -| policy_gradient_loss | -0.00845 | -| std | 0.35 | -| value_loss | 5.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4762 | -| time_elapsed | 37474 | -| total_timesteps | 609536 | -| train/ | | -| approx_kl | 0.053705487 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -9.82 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 47610 | -| policy_gradient_loss | -0.00888 | -| std | 0.351 | -| value_loss | 4.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4763 | -| time_elapsed | 37476 | -| total_timesteps | 609664 | -| train/ | | -| approx_kl | 0.006206428 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -7.83 | -| learning_rate | 0.0003 | -| loss | -0.000872 | -| n_updates | 47620 | -| policy_gradient_loss | -0.000569 | -| std | 0.35 | -| value_loss | 3.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4764 | -| time_elapsed | 37479 | -| total_timesteps | 609792 | -| train/ | | -| approx_kl | 0.016841626 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -0.0953 | -| learning_rate | 0.0003 | -| loss | 0.000491 | -| n_updates | 47630 | -| policy_gradient_loss | -0.00145 | -| std | 0.349 | -| value_loss | 2.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 16 | -| iterations | 4765 | -| time_elapsed | 37481 | -| total_timesteps | 609920 | -| train/ | | -| approx_kl | 0.015877727 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -6.48 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 47640 | -| policy_gradient_loss | -0.00231 | -| std | 0.349 | -| value_loss | 1.63e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4766 | -| time_elapsed | 37483 | -| total_timesteps | 610048 | -| train/ | | -| approx_kl | 0.0019874796 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 47650 | -| policy_gradient_loss | -0.000227 | -| std | 0.349 | -| value_loss | 1.61e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4767 | -| time_elapsed | 37488 | -| total_timesteps | 610176 | -| train/ | | -| approx_kl | 0.05070945 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -6.79 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 47660 | -| policy_gradient_loss | -0.00408 | -| std | 0.35 | -| value_loss | 0.00361 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4768 | -| time_elapsed | 37493 | -| total_timesteps | 610304 | -| train/ | | -| approx_kl | 0.0011053565 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -626 | -| learning_rate | 0.0003 | -| loss | -3.89e-06 | -| n_updates | 47670 | -| policy_gradient_loss | 0.000376 | -| std | 0.35 | -| value_loss | 3.39e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4769 | -| time_elapsed | 37495 | -| total_timesteps | 610432 | -| train/ | | -| approx_kl | 0.039211396 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -179 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 47680 | -| policy_gradient_loss | -0.00476 | -| std | 0.35 | -| value_loss | 1.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4770 | -| time_elapsed | 37497 | -| total_timesteps | 610560 | -| train/ | | -| approx_kl | 0.008438784 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -0.0652 | -| learning_rate | 0.0003 | -| loss | 0.000931 | -| n_updates | 47690 | -| policy_gradient_loss | 0.000883 | -| std | 0.349 | -| value_loss | 2.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4771 | -| time_elapsed | 37500 | -| total_timesteps | 610688 | -| train/ | | -| approx_kl | 0.006403421 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | -0.639 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 47700 | -| policy_gradient_loss | -0.000826 | -| std | 0.35 | -| value_loss | 3.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4772 | -| time_elapsed | 37504 | -| total_timesteps | 610816 | -| train/ | | -| approx_kl | 0.011656843 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | 0.00736 | -| learning_rate | 0.0003 | -| loss | 0.0013 | -| n_updates | 47710 | -| policy_gradient_loss | 0.000367 | -| std | 0.35 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4773 | -| time_elapsed | 37508 | -| total_timesteps | 610944 | -| train/ | | -| approx_kl | 0.011602521 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -0.0047 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 47720 | -| policy_gradient_loss | -0.00424 | -| std | 0.351 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4774 | -| time_elapsed | 37512 | -| total_timesteps | 611072 | -| train/ | | -| approx_kl | 0.0054186573 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | -0.00065 | -| n_updates | 47730 | -| policy_gradient_loss | -0.00028 | -| std | 0.35 | -| value_loss | 4.94e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4775 | -| time_elapsed | 37517 | -| total_timesteps | 611200 | -| train/ | | -| approx_kl | 0.052755527 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 47740 | -| policy_gradient_loss | -0.00781 | -| std | 0.35 | -| value_loss | 0.000213 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4776 | -| time_elapsed | 37520 | -| total_timesteps | 611328 | -| train/ | | -| approx_kl | 0.0067936764 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | -80.9 | -| learning_rate | 0.0003 | -| loss | -1.57e-05 | -| n_updates | 47750 | -| policy_gradient_loss | 6.85e-05 | -| std | 0.348 | -| value_loss | 2.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4777 | -| time_elapsed | 37525 | -| total_timesteps | 611456 | -| train/ | | -| approx_kl | 0.010014466 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -61.8 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 47760 | -| policy_gradient_loss | -0.00338 | -| std | 0.347 | -| value_loss | 9.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4778 | -| time_elapsed | 37528 | -| total_timesteps | 611584 | -| train/ | | -| approx_kl | 0.028291197 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -2.16 | -| learning_rate | 0.0003 | -| loss | -0.000592 | -| n_updates | 47770 | -| policy_gradient_loss | -0.00213 | -| std | 0.347 | -| value_loss | 1.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4779 | -| time_elapsed | 37532 | -| total_timesteps | 611712 | -| train/ | | -| approx_kl | 0.020271676 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 47780 | -| policy_gradient_loss | -0.00694 | -| std | 0.347 | -| value_loss | 6.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4780 | -| time_elapsed | 37536 | -| total_timesteps | 611840 | -| train/ | | -| approx_kl | 0.023416571 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.00771 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 47790 | -| policy_gradient_loss | -0.00445 | -| std | 0.346 | -| value_loss | 5.27e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 16 | -| iterations | 4781 | -| time_elapsed | 37539 | -| total_timesteps | 611968 | -| train/ | | -| approx_kl | 0.01845035 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 47800 | -| policy_gradient_loss | -0.00458 | -| std | 0.346 | -| value_loss | 2.63e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4782 | -| time_elapsed | 37542 | -| total_timesteps | 612096 | -| train/ | | -| approx_kl | 0.017822254 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.00526 | -| n_updates | 47810 | -| policy_gradient_loss | -0.00602 | -| std | 0.346 | -| value_loss | 1.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4783 | -| time_elapsed | 37549 | -| total_timesteps | 612224 | -| train/ | | -| approx_kl | 0.011427041 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | 0.663 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 47820 | -| policy_gradient_loss | -0.0083 | -| std | 0.347 | -| value_loss | 0.00628 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4784 | -| time_elapsed | 37553 | -| total_timesteps | 612352 | -| train/ | | -| approx_kl | 0.01201454 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -47.8 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 47830 | -| policy_gradient_loss | -0.00895 | -| std | 0.347 | -| value_loss | 8.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4785 | -| time_elapsed | 37557 | -| total_timesteps | 612480 | -| train/ | | -| approx_kl | 0.001979886 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -387 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 47840 | -| policy_gradient_loss | 0.000257 | -| std | 0.346 | -| value_loss | 1.2e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4786 | -| time_elapsed | 37559 | -| total_timesteps | 612608 | -| train/ | | -| approx_kl | 0.0010878546 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -29.9 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 47850 | -| policy_gradient_loss | 0.000681 | -| std | 0.346 | -| value_loss | 1.5e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4787 | -| time_elapsed | 37562 | -| total_timesteps | 612736 | -| train/ | | -| approx_kl | 0.0016155685 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.661 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 47860 | -| policy_gradient_loss | 0.000847 | -| std | 0.346 | -| value_loss | 3.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4788 | -| time_elapsed | 37565 | -| total_timesteps | 612864 | -| train/ | | -| approx_kl | 0.02316508 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -6.96e-05 | -| n_updates | 47870 | -| policy_gradient_loss | -0.00262 | -| std | 0.346 | -| value_loss | 1.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 16 | -| iterations | 4789 | -| time_elapsed | 37569 | -| total_timesteps | 612992 | -| train/ | | -| approx_kl | 0.008331173 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 47880 | -| policy_gradient_loss | -0.00137 | -| std | 0.347 | -| value_loss | 6.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4790 | -| time_elapsed | 37573 | -| total_timesteps | 613120 | -| train/ | | -| approx_kl | 0.012303308 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 47890 | -| policy_gradient_loss | -0.00137 | -| std | 0.348 | -| value_loss | 5.27e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4791 | -| time_elapsed | 37582 | -| total_timesteps | 613248 | -| train/ | | -| approx_kl | 0.0061224136 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.000418 | -| n_updates | 47900 | -| policy_gradient_loss | -0.000329 | -| std | 0.348 | -| value_loss | 0.00038 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4792 | -| time_elapsed | 37585 | -| total_timesteps | 613376 | -| train/ | | -| approx_kl | 0.012002189 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -477 | -| learning_rate | 0.0003 | -| loss | -0.000898 | -| n_updates | 47910 | -| policy_gradient_loss | -0.000854 | -| std | 0.348 | -| value_loss | 2.36e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4793 | -| time_elapsed | 37588 | -| total_timesteps | 613504 | -| train/ | | -| approx_kl | 0.00694429 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -660 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 47920 | -| policy_gradient_loss | -0.000686 | -| std | 0.349 | -| value_loss | 5.18e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4794 | -| time_elapsed | 37591 | -| total_timesteps | 613632 | -| train/ | | -| approx_kl | 0.0036193295 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | -20.3 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 47930 | -| policy_gradient_loss | -0.000979 | -| std | 0.349 | -| value_loss | 9.61e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4795 | -| time_elapsed | 37593 | -| total_timesteps | 613760 | -| train/ | | -| approx_kl | 0.000623683 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -8.51 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 47940 | -| policy_gradient_loss | 0.0012 | -| std | 0.35 | -| value_loss | 1.84e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4796 | -| time_elapsed | 37596 | -| total_timesteps | 613888 | -| train/ | | -| approx_kl | 0.0105007235 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -0.433 | -| learning_rate | 0.0003 | -| loss | 0.000244 | -| n_updates | 47950 | -| policy_gradient_loss | -0.00018 | -| std | 0.349 | -| value_loss | 2.34e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4797 | -| time_elapsed | 37599 | -| total_timesteps | 614016 | -| train/ | | -| approx_kl | 0.027637996 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | 0.0058 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 47960 | -| policy_gradient_loss | -0.0098 | -| std | 0.349 | -| value_loss | 1.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4798 | -| time_elapsed | 37606 | -| total_timesteps | 614144 | -| train/ | | -| approx_kl | 0.031845428 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | 0.877 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 47970 | -| policy_gradient_loss | -0.0056 | -| std | 0.349 | -| value_loss | 0.00171 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4799 | -| time_elapsed | 37608 | -| total_timesteps | 614272 | -| train/ | | -| approx_kl | 0.00031632278 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -562 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 47980 | -| policy_gradient_loss | 0.00407 | -| std | 0.349 | -| value_loss | 5.34e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4800 | -| time_elapsed | 37611 | -| total_timesteps | 614400 | -| train/ | | -| approx_kl | 0.06374653 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -7.68e+03 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 47990 | -| policy_gradient_loss | -0.00915 | -| std | 0.349 | -| value_loss | 2.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4801 | -| time_elapsed | 37614 | -| total_timesteps | 614528 | -| train/ | | -| approx_kl | 0.02610713 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -280 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 48000 | -| policy_gradient_loss | -0.0124 | -| std | 0.349 | -| value_loss | 5.69e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4802 | -| time_elapsed | 37618 | -| total_timesteps | 614656 | -| train/ | | -| approx_kl | 0.019360142 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -376 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 48010 | -| policy_gradient_loss | -0.00592 | -| std | 0.348 | -| value_loss | 9.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4803 | -| time_elapsed | 37620 | -| total_timesteps | 614784 | -| train/ | | -| approx_kl | 0.031324666 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -105 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 48020 | -| policy_gradient_loss | -0.00791 | -| std | 0.348 | -| value_loss | 3.04e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4804 | -| time_elapsed | 37624 | -| total_timesteps | 614912 | -| train/ | | -| approx_kl | 0.0016162703 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -3.43 | -| learning_rate | 0.0003 | -| loss | -0.00793 | -| n_updates | 48030 | -| policy_gradient_loss | 0.000156 | -| std | 0.348 | -| value_loss | 2.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4805 | -| time_elapsed | 37627 | -| total_timesteps | 615040 | -| train/ | | -| approx_kl | 0.022896262 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -0.746 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 48040 | -| policy_gradient_loss | -0.00661 | -| std | 0.348 | -| value_loss | 9.24e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4806 | -| time_elapsed | 37634 | -| total_timesteps | 615168 | -| train/ | | -| approx_kl | 0.011528149 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 48050 | -| policy_gradient_loss | -0.00119 | -| std | 0.348 | -| value_loss | 6.73e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4807 | -| time_elapsed | 37638 | -| total_timesteps | 615296 | -| train/ | | -| approx_kl | 0.0057145236 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -241 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 48060 | -| policy_gradient_loss | -0.00109 | -| std | 0.347 | -| value_loss | 5.68e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4808 | -| time_elapsed | 37643 | -| total_timesteps | 615424 | -| train/ | | -| approx_kl | 0.00025472417 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -198 | -| learning_rate | 0.0003 | -| loss | -0.000649 | -| n_updates | 48070 | -| policy_gradient_loss | 0.000385 | -| std | 0.346 | -| value_loss | 2.27e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4809 | -| time_elapsed | 37645 | -| total_timesteps | 615552 | -| train/ | | -| approx_kl | 0.00042679673 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -30.7 | -| learning_rate | 0.0003 | -| loss | 0.000241 | -| n_updates | 48080 | -| policy_gradient_loss | 0.000374 | -| std | 0.345 | -| value_loss | 4.39e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4810 | -| time_elapsed | 37649 | -| total_timesteps | 615680 | -| train/ | | -| approx_kl | 0.009679667 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -42.5 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 48090 | -| policy_gradient_loss | -0.00323 | -| std | 0.345 | -| value_loss | 9.42e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4811 | -| time_elapsed | 37652 | -| total_timesteps | 615808 | -| train/ | | -| approx_kl | 0.0001459918 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 48100 | -| policy_gradient_loss | 0.00344 | -| std | 0.345 | -| value_loss | 1.92e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4812 | -| time_elapsed | 37656 | -| total_timesteps | 615936 | -| train/ | | -| approx_kl | 0.01889342 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -0.0745 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 48110 | -| policy_gradient_loss | -0.0055 | -| std | 0.345 | -| value_loss | 1.8e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4813 | -| time_elapsed | 37659 | -| total_timesteps | 616064 | -| train/ | | -| approx_kl | 0.018348368 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 48120 | -| policy_gradient_loss | -0.00329 | -| std | 0.346 | -| value_loss | 4.96e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4814 | -| time_elapsed | 37665 | -| total_timesteps | 616192 | -| train/ | | -| approx_kl | 0.015788967 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 48130 | -| policy_gradient_loss | -0.0131 | -| std | 0.345 | -| value_loss | 5.9e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4815 | -| time_elapsed | 37667 | -| total_timesteps | 616320 | -| train/ | | -| approx_kl | 0.004680043 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -128 | -| learning_rate | 0.0003 | -| loss | -0.000928 | -| n_updates | 48140 | -| policy_gradient_loss | -0.000481 | -| std | 0.344 | -| value_loss | 4.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4816 | -| time_elapsed | 37669 | -| total_timesteps | 616448 | -| train/ | | -| approx_kl | 0.009607164 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -217 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 48150 | -| policy_gradient_loss | -0.00258 | -| std | 0.344 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4817 | -| time_elapsed | 37671 | -| total_timesteps | 616576 | -| train/ | | -| approx_kl | 0.008084637 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | -0.376 | -| learning_rate | 0.0003 | -| loss | -0.000706 | -| n_updates | 48160 | -| policy_gradient_loss | -0.000777 | -| std | 0.343 | -| value_loss | 6.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4818 | -| time_elapsed | 37674 | -| total_timesteps | 616704 | -| train/ | | -| approx_kl | 0.020017242 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 48170 | -| policy_gradient_loss | -0.00672 | -| std | 0.342 | -| value_loss | 1.72e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4819 | -| time_elapsed | 37677 | -| total_timesteps | 616832 | -| train/ | | -| approx_kl | 0.010997977 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.346 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 48180 | -| policy_gradient_loss | -0.00061 | -| std | 0.342 | -| value_loss | 3.27e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4820 | -| time_elapsed | 37681 | -| total_timesteps | 616960 | -| train/ | | -| approx_kl | 0.010148917 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | -0.00152 | -| learning_rate | 0.0003 | -| loss | 0.000775 | -| n_updates | 48190 | -| policy_gradient_loss | -0.000403 | -| std | 0.342 | -| value_loss | 2.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4821 | -| time_elapsed | 37685 | -| total_timesteps | 617088 | -| train/ | | -| approx_kl | 0.020298013 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | 0.00469 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 48200 | -| policy_gradient_loss | -0.00685 | -| std | 0.342 | -| value_loss | 7.97e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4822 | -| time_elapsed | 37691 | -| total_timesteps | 617216 | -| train/ | | -| approx_kl | 0.017535694 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.00971 | -| n_updates | 48210 | -| policy_gradient_loss | -0.00367 | -| std | 0.342 | -| value_loss | 0.000179 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4823 | -| time_elapsed | 37695 | -| total_timesteps | 617344 | -| train/ | | -| approx_kl | 0.017295092 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.344 | -| explained_variance | -1.06e+03 | -| learning_rate | 0.0003 | -| loss | 0.00022 | -| n_updates | 48220 | -| policy_gradient_loss | -0.000166 | -| std | 0.341 | -| value_loss | 5.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4824 | -| time_elapsed | 37698 | -| total_timesteps | 617472 | -| train/ | | -| approx_kl | 0.020299703 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.344 | -| explained_variance | -342 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 48230 | -| policy_gradient_loss | -0.00567 | -| std | 0.341 | -| value_loss | 9.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4825 | -| time_elapsed | 37700 | -| total_timesteps | 617600 | -| train/ | | -| approx_kl | 0.025442597 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | -9.35 | -| learning_rate | 0.0003 | -| loss | -0.00935 | -| n_updates | 48240 | -| policy_gradient_loss | -0.00923 | -| std | 0.341 | -| value_loss | 5.15e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4826 | -| time_elapsed | 37703 | -| total_timesteps | 617728 | -| train/ | | -| approx_kl | 0.0133199785 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 48250 | -| policy_gradient_loss | -0.00768 | -| std | 0.341 | -| value_loss | 9.4e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4827 | -| time_elapsed | 37706 | -| total_timesteps | 617856 | -| train/ | | -| approx_kl | 0.022291347 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | 0.00451 | -| learning_rate | 0.0003 | -| loss | 0.00649 | -| n_updates | 48260 | -| policy_gradient_loss | 0.0024 | -| std | 0.341 | -| value_loss | 6.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 16 | -| iterations | 4828 | -| time_elapsed | 37710 | -| total_timesteps | 617984 | -| train/ | | -| approx_kl | 0.025329856 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | 0.00355 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 48270 | -| policy_gradient_loss | -0.0166 | -| std | 0.341 | -| value_loss | 6.1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4829 | -| time_elapsed | 37713 | -| total_timesteps | 618112 | -| train/ | | -| approx_kl | 0.006942434 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.344 | -| explained_variance | -0.00537 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 48280 | -| policy_gradient_loss | -0.000784 | -| std | 0.342 | -| value_loss | 2.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4830 | -| time_elapsed | 37721 | -| total_timesteps | 618240 | -| train/ | | -| approx_kl | 0.011889694 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 48290 | -| policy_gradient_loss | -0.0108 | -| std | 0.343 | -| value_loss | 0.000292 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4831 | -| time_elapsed | 37725 | -| total_timesteps | 618368 | -| train/ | | -| approx_kl | 0.01567203 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -184 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 48300 | -| policy_gradient_loss | -0.00683 | -| std | 0.343 | -| value_loss | 1.6e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4832 | -| time_elapsed | 37728 | -| total_timesteps | 618496 | -| train/ | | -| approx_kl | 0.0014593354 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.349 | -| explained_variance | -709 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 48310 | -| policy_gradient_loss | 0.000647 | -| std | 0.343 | -| value_loss | 2.11e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4833 | -| time_elapsed | 37732 | -| total_timesteps | 618624 | -| train/ | | -| approx_kl | 0.0016107559 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.349 | -| explained_variance | -2.74e+03 | -| learning_rate | 0.0003 | -| loss | -0.00633 | -| n_updates | 48320 | -| policy_gradient_loss | 0.00112 | -| std | 0.343 | -| value_loss | 2.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4834 | -| time_elapsed | 37734 | -| total_timesteps | 618752 | -| train/ | | -| approx_kl | 0.0014081597 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 48330 | -| policy_gradient_loss | 0.000555 | -| std | 0.343 | -| value_loss | 3.38e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 16 | -| iterations | 4835 | -| time_elapsed | 37737 | -| total_timesteps | 618880 | -| train/ | | -| approx_kl | 0.0013404414 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 48340 | -| policy_gradient_loss | 0.000576 | -| std | 0.342 | -| value_loss | 2.94e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4836 | -| time_elapsed | 37740 | -| total_timesteps | 619008 | -| train/ | | -| approx_kl | 0.0054422123 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.000102 | -| n_updates | 48350 | -| policy_gradient_loss | 0.00049 | -| std | 0.342 | -| value_loss | 6.7e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4837 | -| time_elapsed | 37747 | -| total_timesteps | 619136 | -| train/ | | -| approx_kl | 0.03373073 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 48360 | -| policy_gradient_loss | -0.00743 | -| std | 0.342 | -| value_loss | 0.0022 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4838 | -| time_elapsed | 37750 | -| total_timesteps | 619264 | -| train/ | | -| approx_kl | 4.8621558e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -3.92e+03 | -| learning_rate | 0.0003 | -| loss | -0.000123 | -| n_updates | 48370 | -| policy_gradient_loss | 4.14e-05 | -| std | 0.342 | -| value_loss | 5.64e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4839 | -| time_elapsed | 37754 | -| total_timesteps | 619392 | -| train/ | | -| approx_kl | 0.030158173 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | -7.4e+03 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 48380 | -| policy_gradient_loss | -0.00258 | -| std | 0.341 | -| value_loss | 9.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4840 | -| time_elapsed | 37758 | -| total_timesteps | 619520 | -| train/ | | -| approx_kl | 0.047318656 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | -0.342 | -| explained_variance | -234 | -| learning_rate | 0.0003 | -| loss | -0.00798 | -| n_updates | 48390 | -| policy_gradient_loss | -0.00646 | -| std | 0.34 | -| value_loss | 4.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4841 | -| time_elapsed | 37760 | -| total_timesteps | 619648 | -| train/ | | -| approx_kl | 0.044447273 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | -0.341 | -| explained_variance | -100 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 48400 | -| policy_gradient_loss | -0.00966 | -| std | 0.34 | -| value_loss | 9.71e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4842 | -| time_elapsed | 37764 | -| total_timesteps | 619776 | -| train/ | | -| approx_kl | 0.031496592 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.341 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 48410 | -| policy_gradient_loss | -0.00868 | -| std | 0.34 | -| value_loss | 4.8e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 16 | -| iterations | 4843 | -| time_elapsed | 37768 | -| total_timesteps | 619904 | -| train/ | | -| approx_kl | 0.0009143939 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 48420 | -| policy_gradient_loss | -0.000243 | -| std | 0.342 | -| value_loss | 8.18e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4844 | -| time_elapsed | 37770 | -| total_timesteps | 620032 | -| train/ | | -| approx_kl | 0.0042542275 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 48430 | -| policy_gradient_loss | -0.00104 | -| std | 0.343 | -| value_loss | 6.11e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4845 | -| time_elapsed | 37777 | -| total_timesteps | 620160 | -| train/ | | -| approx_kl | 0.001765341 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | 0.44 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 48440 | -| policy_gradient_loss | 0.000192 | -| std | 0.343 | -| value_loss | 0.000686 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4846 | -| time_elapsed | 37779 | -| total_timesteps | 620288 | -| train/ | | -| approx_kl | 0.041036192 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -437 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 48450 | -| policy_gradient_loss | -0.0113 | -| std | 0.343 | -| value_loss | 2.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4847 | -| time_elapsed | 37782 | -| total_timesteps | 620416 | -| train/ | | -| approx_kl | 0.018887049 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.349 | -| explained_variance | -173 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 48460 | -| policy_gradient_loss | -0.00863 | -| std | 0.343 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4848 | -| time_elapsed | 37784 | -| total_timesteps | 620544 | -| train/ | | -| approx_kl | 0.012526182 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -266 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 48470 | -| policy_gradient_loss | -0.000872 | -| std | 0.342 | -| value_loss | 3.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4849 | -| time_elapsed | 37787 | -| total_timesteps | 620672 | -| train/ | | -| approx_kl | 0.00852244 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.346 | -| explained_variance | -0.704 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 48480 | -| policy_gradient_loss | -0.00126 | -| std | 0.341 | -| value_loss | 1.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4850 | -| time_elapsed | 37791 | -| total_timesteps | 620800 | -| train/ | | -| approx_kl | 0.013775464 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | -2.96 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 48490 | -| policy_gradient_loss | -0.002 | -| std | 0.341 | -| value_loss | 6.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4851 | -| time_elapsed | 37795 | -| total_timesteps | 620928 | -| train/ | | -| approx_kl | 0.011402918 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | -6.31e+03 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 48500 | -| policy_gradient_loss | -0.00746 | -| std | 0.341 | -| value_loss | 8.59e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4852 | -| time_elapsed | 37798 | -| total_timesteps | 621056 | -| train/ | | -| approx_kl | 0.0053445874 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.342 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 48510 | -| policy_gradient_loss | -0.00215 | -| std | 0.341 | -| value_loss | 2.64e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4853 | -| time_elapsed | 37805 | -| total_timesteps | 621184 | -| train/ | | -| approx_kl | 0.00066604465 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.342 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 48520 | -| policy_gradient_loss | 0.00118 | -| std | 0.341 | -| value_loss | 0.000167 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4854 | -| time_elapsed | 37809 | -| total_timesteps | 621312 | -| train/ | | -| approx_kl | 0.05345615 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | -0.342 | -| explained_variance | -148 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 48530 | -| policy_gradient_loss | -0.0102 | -| std | 0.34 | -| value_loss | 5.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4855 | -| time_elapsed | 37812 | -| total_timesteps | 621440 | -| train/ | | -| approx_kl | 0.010064095 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.342 | -| explained_variance | -40.3 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 48540 | -| policy_gradient_loss | -0.000889 | -| std | 0.341 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4856 | -| time_elapsed | 37816 | -| total_timesteps | 621568 | -| train/ | | -| approx_kl | 0.01131249 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.344 | -| explained_variance | -0.577 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 48550 | -| policy_gradient_loss | -0.00174 | -| std | 0.342 | -| value_loss | 2.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4857 | -| time_elapsed | 37819 | -| total_timesteps | 621696 | -| train/ | | -| approx_kl | 0.009370841 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 48560 | -| policy_gradient_loss | -0.00106 | -| std | 0.342 | -| value_loss | 1.13e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4858 | -| time_elapsed | 37821 | -| total_timesteps | 621824 | -| train/ | | -| approx_kl | 0.0070376024 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | -0.000289 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 48570 | -| policy_gradient_loss | -0.00101 | -| std | 0.342 | -| value_loss | 1.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 16 | -| iterations | 4859 | -| time_elapsed | 37824 | -| total_timesteps | 621952 | -| train/ | | -| approx_kl | 0.014154982 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.345 | -| explained_variance | -0.000203 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 48580 | -| policy_gradient_loss | -0.00652 | -| std | 0.342 | -| value_loss | 1.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4860 | -| time_elapsed | 37826 | -| total_timesteps | 622080 | -| train/ | | -| approx_kl | 0.008261158 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.346 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 48590 | -| policy_gradient_loss | -0.00244 | -| std | 0.342 | -| value_loss | 5.84e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4861 | -| time_elapsed | 37831 | -| total_timesteps | 622208 | -| train/ | | -| approx_kl | 0.052045234 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 48600 | -| policy_gradient_loss | -0.00424 | -| std | 0.342 | -| value_loss | 0.000645 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4862 | -| time_elapsed | 37835 | -| total_timesteps | 622336 | -| train/ | | -| approx_kl | 0.0058765044 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.346 | -| explained_variance | -1.51e+03 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 48610 | -| policy_gradient_loss | -0.00116 | -| std | 0.342 | -| value_loss | 5.41e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4863 | -| time_elapsed | 37839 | -| total_timesteps | 622464 | -| train/ | | -| approx_kl | 0.029902605 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.346 | -| explained_variance | -2.43e+03 | -| learning_rate | 0.0003 | -| loss | -0.000521 | -| n_updates | 48620 | -| policy_gradient_loss | -0.00167 | -| std | 0.342 | -| value_loss | 2.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4864 | -| time_elapsed | 37842 | -| total_timesteps | 622592 | -| train/ | | -| approx_kl | 0.019672932 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.346 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 48630 | -| policy_gradient_loss | -0.0049 | -| std | 0.342 | -| value_loss | 2.3e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4865 | -| time_elapsed | 37845 | -| total_timesteps | 622720 | -| train/ | | -| approx_kl | 3.096182e-06 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -33.3 | -| learning_rate | 0.0003 | -| loss | -5.67e-05 | -| n_updates | 48640 | -| policy_gradient_loss | 0.000886 | -| std | 0.342 | -| value_loss | 4.26e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4866 | -| time_elapsed | 37847 | -| total_timesteps | 622848 | -| train/ | | -| approx_kl | 0.0021178084 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -2.1 | -| learning_rate | 0.0003 | -| loss | -0.00762 | -| n_updates | 48650 | -| policy_gradient_loss | -2.05e-05 | -| std | 0.342 | -| value_loss | 1.82e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 16 | -| iterations | 4867 | -| time_elapsed | 37850 | -| total_timesteps | 622976 | -| train/ | | -| approx_kl | 0.0009829644 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.347 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 48660 | -| policy_gradient_loss | 0.000583 | -| std | 0.342 | -| value_loss | 2.41e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4868 | -| time_elapsed | 37853 | -| total_timesteps | 623104 | -| train/ | | -| approx_kl | 0.010782866 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 48670 | -| policy_gradient_loss | -0.00419 | -| std | 0.343 | -| value_loss | 2.93e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4869 | -| time_elapsed | 37860 | -| total_timesteps | 623232 | -| train/ | | -| approx_kl | 0.051423777 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 48680 | -| policy_gradient_loss | -0.00829 | -| std | 0.342 | -| value_loss | 0.00246 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4870 | -| time_elapsed | 37863 | -| total_timesteps | 623360 | -| train/ | | -| approx_kl | 0.0006052605 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -807 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 48690 | -| policy_gradient_loss | 0.000544 | -| std | 0.343 | -| value_loss | 5.79e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4871 | -| time_elapsed | 37866 | -| total_timesteps | 623488 | -| train/ | | -| approx_kl | 0.009702155 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.351 | -| explained_variance | -1.78e+03 | -| learning_rate | 0.0003 | -| loss | -0.000208 | -| n_updates | 48700 | -| policy_gradient_loss | -0.000124 | -| std | 0.345 | -| value_loss | 1.96e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4872 | -| time_elapsed | 37870 | -| total_timesteps | 623616 | -| train/ | | -| approx_kl | 0.012985547 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 48710 | -| policy_gradient_loss | -0.00195 | -| std | 0.345 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4873 | -| time_elapsed | 37874 | -| total_timesteps | 623744 | -| train/ | | -| approx_kl | 0.005778044 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -35.2 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 48720 | -| policy_gradient_loss | -0.00106 | -| std | 0.345 | -| value_loss | 7.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4874 | -| time_elapsed | 37877 | -| total_timesteps | 623872 | -| train/ | | -| approx_kl | 0.010288507 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | 0.00274 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 48730 | -| policy_gradient_loss | -0.00171 | -| std | 0.345 | -| value_loss | 2.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4875 | -| time_elapsed | 37880 | -| total_timesteps | 624000 | -| train/ | | -| approx_kl | 0.012736872 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.21 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 48740 | -| policy_gradient_loss | -0.00541 | -| std | 0.345 | -| value_loss | 1.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4876 | -| time_elapsed | 37883 | -| total_timesteps | 624128 | -| train/ | | -| approx_kl | 0.016836636 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | 0.00778 | -| n_updates | 48750 | -| policy_gradient_loss | 0.00406 | -| std | 0.345 | -| value_loss | 6.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4877 | -| time_elapsed | 37890 | -| total_timesteps | 624256 | -| train/ | | -| approx_kl | 0.009523425 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 48760 | -| policy_gradient_loss | -0.00225 | -| std | 0.345 | -| value_loss | 0.000856 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4878 | -| time_elapsed | 37893 | -| total_timesteps | 624384 | -| train/ | | -| approx_kl | 0.07806343 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -713 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 48770 | -| policy_gradient_loss | -0.00614 | -| std | 0.345 | -| value_loss | 5.19e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4879 | -| time_elapsed | 37896 | -| total_timesteps | 624512 | -| train/ | | -| approx_kl | 0.028488422 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -55.1 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 48780 | -| policy_gradient_loss | -0.0018 | -| std | 0.345 | -| value_loss | 9.04e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4880 | -| time_elapsed | 37898 | -| total_timesteps | 624640 | -| train/ | | -| approx_kl | 0.0068000774 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -2.54 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 48790 | -| policy_gradient_loss | -0.000878 | -| std | 0.346 | -| value_loss | 8.68e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4881 | -| time_elapsed | 37900 | -| total_timesteps | 624768 | -| train/ | | -| approx_kl | 0.00042553665 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -34.7 | -| learning_rate | 0.0003 | -| loss | -0.000387 | -| n_updates | 48800 | -| policy_gradient_loss | -1.37e-05 | -| std | 0.348 | -| value_loss | 9.24e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 16 | -| iterations | 4882 | -| time_elapsed | 37903 | -| total_timesteps | 624896 | -| train/ | | -| approx_kl | 0.0040424177 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | -0.621 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 48810 | -| policy_gradient_loss | -0.000681 | -| std | 0.35 | -| value_loss | 7.9e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4883 | -| time_elapsed | 37905 | -| total_timesteps | 625024 | -| train/ | | -| approx_kl | 0.0023260321 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -0.00599 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 48820 | -| policy_gradient_loss | -0.000375 | -| std | 0.352 | -| value_loss | 4.9e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4884 | -| time_elapsed | 37913 | -| total_timesteps | 625152 | -| train/ | | -| approx_kl | 0.07884441 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | -0.375 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 48830 | -| policy_gradient_loss | -0.00795 | -| std | 0.352 | -| value_loss | 0.00218 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4885 | -| time_elapsed | 37917 | -| total_timesteps | 625280 | -| train/ | | -| approx_kl | 0.0040507093 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.376 | -| explained_variance | -364 | -| learning_rate | 0.0003 | -| loss | 0.000358 | -| n_updates | 48840 | -| policy_gradient_loss | 0.000293 | -| std | 0.352 | -| value_loss | 7.9e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4886 | -| time_elapsed | 37919 | -| total_timesteps | 625408 | -| train/ | | -| approx_kl | 0.015812358 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -275 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 48850 | -| policy_gradient_loss | -0.00513 | -| std | 0.351 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4887 | -| time_elapsed | 37922 | -| total_timesteps | 625536 | -| train/ | | -| approx_kl | 0.0014929539 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | -0.372 | -| explained_variance | -0.83 | -| learning_rate | 0.0003 | -| loss | 0.000674 | -| n_updates | 48860 | -| policy_gradient_loss | 0.000782 | -| std | 0.351 | -| value_loss | 4.43e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4888 | -| time_elapsed | 37925 | -| total_timesteps | 625664 | -| train/ | | -| approx_kl | 0.013959004 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.000149 | -| n_updates | 48870 | -| policy_gradient_loss | -0.00138 | -| std | 0.351 | -| value_loss | 2.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4889 | -| time_elapsed | 37928 | -| total_timesteps | 625792 | -| train/ | | -| approx_kl | 0.014634122 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 48880 | -| policy_gradient_loss | -0.00243 | -| std | 0.35 | -| value_loss | 1.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 16 | -| iterations | 4890 | -| time_elapsed | 37932 | -| total_timesteps | 625920 | -| train/ | | -| approx_kl | 0.018438011 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | 0.000227 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 48890 | -| policy_gradient_loss | -0.00387 | -| std | 0.35 | -| value_loss | 1.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4891 | -| time_elapsed | 37935 | -| total_timesteps | 626048 | -| train/ | | -| approx_kl | 0.025030673 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -0.00323 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 48900 | -| policy_gradient_loss | -0.0116 | -| std | 0.35 | -| value_loss | 1.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4892 | -| time_elapsed | 37942 | -| total_timesteps | 626176 | -| train/ | | -| approx_kl | 0.011147025 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 48910 | -| policy_gradient_loss | -0.00902 | -| std | 0.35 | -| value_loss | 0.00268 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4893 | -| time_elapsed | 37946 | -| total_timesteps | 626304 | -| train/ | | -| approx_kl | 0.012912165 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -406 | -| learning_rate | 0.0003 | -| loss | -0.000904 | -| n_updates | 48920 | -| policy_gradient_loss | -0.000555 | -| std | 0.351 | -| value_loss | 3.85e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4894 | -| time_elapsed | 37949 | -| total_timesteps | 626432 | -| train/ | | -| approx_kl | 0.0042394227 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.374 | -| explained_variance | -1.65e+03 | -| learning_rate | 0.0003 | -| loss | -0.000902 | -| n_updates | 48930 | -| policy_gradient_loss | -0.0004 | -| std | 0.353 | -| value_loss | 1.84e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4895 | -| time_elapsed | 37952 | -| total_timesteps | 626560 | -| train/ | | -| approx_kl | 0.019013792 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.377 | -| explained_variance | -19.1 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 48940 | -| policy_gradient_loss | -0.00154 | -| std | 0.352 | -| value_loss | 9.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4896 | -| time_elapsed | 37956 | -| total_timesteps | 626688 | -| train/ | | -| approx_kl | 0.017463809 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.375 | -| explained_variance | -49.6 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 48950 | -| policy_gradient_loss | -0.00163 | -| std | 0.352 | -| value_loss | 4.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4897 | -| time_elapsed | 37958 | -| total_timesteps | 626816 | -| train/ | | -| approx_kl | 0.020093407 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.374 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.0081 | -| n_updates | 48960 | -| policy_gradient_loss | -0.00679 | -| std | 0.352 | -| value_loss | 4.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 16 | -| iterations | 4898 | -| time_elapsed | 37960 | -| total_timesteps | 626944 | -| train/ | | -| approx_kl | 0.014614362 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 48970 | -| policy_gradient_loss | -0.00234 | -| std | 0.351 | -| value_loss | 3.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4899 | -| time_elapsed | 37965 | -| total_timesteps | 627072 | -| train/ | | -| approx_kl | 0.023266692 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -3.38 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 48980 | -| policy_gradient_loss | -0.0124 | -| std | 0.351 | -| value_loss | 4.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4900 | -| time_elapsed | 37971 | -| total_timesteps | 627200 | -| train/ | | -| approx_kl | 0.031065611 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -0.469 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 48990 | -| policy_gradient_loss | -0.005 | -| std | 0.351 | -| value_loss | 0.00209 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4901 | -| time_elapsed | 37974 | -| total_timesteps | 627328 | -| train/ | | -| approx_kl | 0.058004268 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -4.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 49000 | -| policy_gradient_loss | -0.00942 | -| std | 0.351 | -| value_loss | 6.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4902 | -| time_elapsed | 37976 | -| total_timesteps | 627456 | -| train/ | | -| approx_kl | 0.025295714 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | -0.372 | -| explained_variance | -3.89e+03 | -| learning_rate | 0.0003 | -| loss | 3.35e-05 | -| n_updates | 49010 | -| policy_gradient_loss | -0.00117 | -| std | 0.351 | -| value_loss | 1.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4903 | -| time_elapsed | 37980 | -| total_timesteps | 627584 | -| train/ | | -| approx_kl | 0.022348946 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -18.5 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 49020 | -| policy_gradient_loss | -0.00236 | -| std | 0.351 | -| value_loss | 1.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4904 | -| time_elapsed | 37984 | -| total_timesteps | 627712 | -| train/ | | -| approx_kl | 0.042015146 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.372 | -| explained_variance | -90.4 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 49030 | -| policy_gradient_loss | -0.0101 | -| std | 0.351 | -| value_loss | 7.99e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4905 | -| time_elapsed | 37987 | -| total_timesteps | 627840 | -| train/ | | -| approx_kl | 0.010996721 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -2.58 | -| learning_rate | 0.0003 | -| loss | 0.000131 | -| n_updates | 49040 | -| policy_gradient_loss | -7.5e-05 | -| std | 0.351 | -| value_loss | 5.4e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 16 | -| iterations | 4906 | -| time_elapsed | 37990 | -| total_timesteps | 627968 | -| train/ | | -| approx_kl | 0.02266024 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.372 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 49050 | -| policy_gradient_loss | -0.00775 | -| std | 0.351 | -| value_loss | 6.71e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4907 | -| time_elapsed | 37993 | -| total_timesteps | 628096 | -| train/ | | -| approx_kl | 0.016241929 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.372 | -| explained_variance | 0.00826 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 49060 | -| policy_gradient_loss | -0.00932 | -| std | 0.351 | -| value_loss | 2.59e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4908 | -| time_elapsed | 37999 | -| total_timesteps | 628224 | -| train/ | | -| approx_kl | 0.01633498 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.372 | -| explained_variance | 0.851 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 49070 | -| policy_gradient_loss | -0.0134 | -| std | 0.351 | -| value_loss | 0.00206 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4909 | -| time_elapsed | 38003 | -| total_timesteps | 628352 | -| train/ | | -| approx_kl | 0.019412678 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.374 | -| explained_variance | -1.32e+03 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 49080 | -| policy_gradient_loss | -0.00155 | -| std | 0.352 | -| value_loss | 1.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4910 | -| time_elapsed | 38007 | -| total_timesteps | 628480 | -| train/ | | -| approx_kl | 0.001699971 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.375 | -| explained_variance | -2.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 49090 | -| policy_gradient_loss | -7.13e-05 | -| std | 0.353 | -| value_loss | 3.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4911 | -| time_elapsed | 38010 | -| total_timesteps | 628608 | -| train/ | | -| approx_kl | 0.026603151 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | -0.377 | -| explained_variance | -180 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 49100 | -| policy_gradient_loss | -0.00161 | -| std | 0.353 | -| value_loss | 1.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4912 | -| time_elapsed | 38013 | -| total_timesteps | 628736 | -| train/ | | -| approx_kl | 0.014730586 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.376 | -| explained_variance | -176 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 49110 | -| policy_gradient_loss | -0.00124 | -| std | 0.352 | -| value_loss | 6.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4913 | -| time_elapsed | 38016 | -| total_timesteps | 628864 | -| train/ | | -| approx_kl | 0.023815993 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | -0.374 | -| explained_variance | -19.5 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 49120 | -| policy_gradient_loss | -0.00924 | -| std | 0.351 | -| value_loss | 6.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 16 | -| iterations | 4914 | -| time_elapsed | 38019 | -| total_timesteps | 628992 | -| train/ | | -| approx_kl | 0.019087112 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.373 | -| explained_variance | -33.7 | -| learning_rate | 0.0003 | -| loss | -0.00897 | -| n_updates | 49130 | -| policy_gradient_loss | -0.00467 | -| std | 0.351 | -| value_loss | 5.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4915 | -| time_elapsed | 38022 | -| total_timesteps | 629120 | -| train/ | | -| approx_kl | 0.018233776 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.371 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 49140 | -| policy_gradient_loss | -0.00298 | -| std | 0.351 | -| value_loss | 5.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4916 | -| time_elapsed | 38031 | -| total_timesteps | 629248 | -| train/ | | -| approx_kl | 0.014110608 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.00986 | -| n_updates | 49150 | -| policy_gradient_loss | -0.00404 | -| std | 0.35 | -| value_loss | 0.00285 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4917 | -| time_elapsed | 38035 | -| total_timesteps | 629376 | -| train/ | | -| approx_kl | 4.0999614e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -1.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.000561 | -| n_updates | 49160 | -| policy_gradient_loss | 0.00179 | -| std | 0.35 | -| value_loss | 6e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4918 | -| time_elapsed | 38038 | -| total_timesteps | 629504 | -| train/ | | -| approx_kl | 0.0473327 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -378 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 49170 | -| policy_gradient_loss | -0.0167 | -| std | 0.35 | -| value_loss | 1.75e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4919 | -| time_elapsed | 38043 | -| total_timesteps | 629632 | -| train/ | | -| approx_kl | 0.0084371045 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.368 | -| explained_variance | -14.3 | -| learning_rate | 0.0003 | -| loss | 1.17e-05 | -| n_updates | 49180 | -| policy_gradient_loss | -0.000155 | -| std | 0.35 | -| value_loss | 1.3e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4920 | -| time_elapsed | 38046 | -| total_timesteps | 629760 | -| train/ | | -| approx_kl | 0.01765918 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | -7.12 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 49190 | -| policy_gradient_loss | -0.0133 | -| std | 0.349 | -| value_loss | 3.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 16 | -| iterations | 4921 | -| time_elapsed | 38050 | -| total_timesteps | 629888 | -| train/ | | -| approx_kl | 0.023499232 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | -0.807 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 49200 | -| policy_gradient_loss | -0.00749 | -| std | 0.349 | -| value_loss | 9.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4922 | -| time_elapsed | 38054 | -| total_timesteps | 630016 | -| train/ | | -| approx_kl | 0.018167783 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 49210 | -| policy_gradient_loss | -0.00778 | -| std | 0.349 | -| value_loss | 2.4e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4923 | -| time_elapsed | 38062 | -| total_timesteps | 630144 | -| train/ | | -| approx_kl | 0.0059076673 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | 0.678 | -| learning_rate | 0.0003 | -| loss | 0.000144 | -| n_updates | 49220 | -| policy_gradient_loss | 5.35e-06 | -| std | 0.35 | -| value_loss | 0.000716 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4924 | -| time_elapsed | 38066 | -| total_timesteps | 630272 | -| train/ | | -| approx_kl | 0.0147378305 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -1.3e+03 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 49230 | -| policy_gradient_loss | -0.00346 | -| std | 0.35 | -| value_loss | 7.99e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4925 | -| time_elapsed | 38070 | -| total_timesteps | 630400 | -| train/ | | -| approx_kl | 0.021395124 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -547 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 49240 | -| policy_gradient_loss | -0.00579 | -| std | 0.35 | -| value_loss | 1.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4926 | -| time_elapsed | 38074 | -| total_timesteps | 630528 | -| train/ | | -| approx_kl | 0.018319514 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -6.81 | -| learning_rate | 0.0003 | -| loss | 0.000342 | -| n_updates | 49250 | -| policy_gradient_loss | -5.07e-05 | -| std | 0.35 | -| value_loss | 1.5e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4927 | -| time_elapsed | 38078 | -| total_timesteps | 630656 | -| train/ | | -| approx_kl | 0.0059933607 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.366 | -| explained_variance | -0.495 | -| learning_rate | 0.0003 | -| loss | 1.02e-05 | -| n_updates | 49260 | -| policy_gradient_loss | -0.000443 | -| std | 0.348 | -| value_loss | 1.29e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4928 | -| time_elapsed | 38081 | -| total_timesteps | 630784 | -| train/ | | -| approx_kl | 0.0074103503 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.000342 | -| n_updates | 49270 | -| policy_gradient_loss | -0.000378 | -| std | 0.348 | -| value_loss | 3.11e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 16 | -| iterations | 4929 | -| time_elapsed | 38084 | -| total_timesteps | 630912 | -| train/ | | -| approx_kl | 0.022351516 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 49280 | -| policy_gradient_loss | -0.00784 | -| std | 0.347 | -| value_loss | 1.56e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4930 | -| time_elapsed | 38087 | -| total_timesteps | 631040 | -| train/ | | -| approx_kl | 0.0013213968 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.000164 | -| n_updates | 49290 | -| policy_gradient_loss | -6.31e-05 | -| std | 0.347 | -| value_loss | 1.46e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4931 | -| time_elapsed | 38093 | -| total_timesteps | 631168 | -| train/ | | -| approx_kl | 0.030512609 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -4.02 | -| learning_rate | 0.0003 | -| loss | -0.0074 | -| n_updates | 49300 | -| policy_gradient_loss | -0.00385 | -| std | 0.347 | -| value_loss | 0.00192 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4932 | -| time_elapsed | 38097 | -| total_timesteps | 631296 | -| train/ | | -| approx_kl | 0.057693306 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -469 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 49310 | -| policy_gradient_loss | -0.00597 | -| std | 0.347 | -| value_loss | 6.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4933 | -| time_elapsed | 38100 | -| total_timesteps | 631424 | -| train/ | | -| approx_kl | 0.018480571 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -3.49e+03 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 49320 | -| policy_gradient_loss | -0.00845 | -| std | 0.347 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4934 | -| time_elapsed | 38102 | -| total_timesteps | 631552 | -| train/ | | -| approx_kl | 0.051791493 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -796 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 49330 | -| policy_gradient_loss | -0.0115 | -| std | 0.347 | -| value_loss | 4.69e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4935 | -| time_elapsed | 38106 | -| total_timesteps | 631680 | -| train/ | | -| approx_kl | 0.00092895096 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -68.7 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 49340 | -| policy_gradient_loss | 0.000759 | -| std | 0.347 | -| value_loss | 1.05e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4936 | -| time_elapsed | 38109 | -| total_timesteps | 631808 | -| train/ | | -| approx_kl | 0.0015805974 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -13.3 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 49350 | -| policy_gradient_loss | 0.00104 | -| std | 0.347 | -| value_loss | 2.88e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4937 | -| time_elapsed | 38112 | -| total_timesteps | 631936 | -| train/ | | -| approx_kl | 0.011863584 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 49360 | -| policy_gradient_loss | 0.00127 | -| std | 0.346 | -| value_loss | 5.15e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4938 | -| time_elapsed | 38116 | -| total_timesteps | 632064 | -| train/ | | -| approx_kl | 0.026383238 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | -0.00717 | -| n_updates | 49370 | -| policy_gradient_loss | -0.00648 | -| std | 0.346 | -| value_loss | 1.37e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4939 | -| time_elapsed | 38122 | -| total_timesteps | 632192 | -| train/ | | -| approx_kl | 0.018489283 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | 0.807 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 49380 | -| policy_gradient_loss | -0.00876 | -| std | 0.346 | -| value_loss | 0.00177 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4940 | -| time_elapsed | 38125 | -| total_timesteps | 632320 | -| train/ | | -| approx_kl | 0.07159352 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 49390 | -| policy_gradient_loss | -0.00361 | -| std | 0.347 | -| value_loss | 2.28e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4941 | -| time_elapsed | 38129 | -| total_timesteps | 632448 | -| train/ | | -| approx_kl | 0.0009267004 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -145 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 49400 | -| policy_gradient_loss | 0.00132 | -| std | 0.347 | -| value_loss | 1.85e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4942 | -| time_elapsed | 38133 | -| total_timesteps | 632576 | -| train/ | | -| approx_kl | 0.0015016524 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -347 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 49410 | -| policy_gradient_loss | 0.000411 | -| std | 0.347 | -| value_loss | 2.12e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4943 | -| time_elapsed | 38136 | -| total_timesteps | 632704 | -| train/ | | -| approx_kl | 0.017982788 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.000302 | -| n_updates | 49420 | -| policy_gradient_loss | -0.000441 | -| std | 0.348 | -| value_loss | 4.97e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4944 | -| time_elapsed | 38140 | -| total_timesteps | 632832 | -| train/ | | -| approx_kl | 0.0038256939 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -0.000204 | -| n_updates | 49430 | -| policy_gradient_loss | -0.000483 | -| std | 0.35 | -| value_loss | 1.6e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4945 | -| time_elapsed | 38144 | -| total_timesteps | 632960 | -| train/ | | -| approx_kl | 0.015183801 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 49440 | -| policy_gradient_loss | -0.00305 | -| std | 0.35 | -| value_loss | 6.73e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4946 | -| time_elapsed | 38147 | -| total_timesteps | 633088 | -| train/ | | -| approx_kl | 0.004087364 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | 0.00407 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 49450 | -| policy_gradient_loss | -0.00039 | -| std | 0.348 | -| value_loss | 1.2e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4947 | -| time_elapsed | 38153 | -| total_timesteps | 633216 | -| train/ | | -| approx_kl | 0.014475829 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 49460 | -| policy_gradient_loss | -0.00265 | -| std | 0.347 | -| value_loss | 0.000144 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4948 | -| time_elapsed | 38157 | -| total_timesteps | 633344 | -| train/ | | -| approx_kl | 0.00048771594 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -190 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 49470 | -| policy_gradient_loss | 0.00073 | -| std | 0.347 | -| value_loss | 8.32e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4949 | -| time_elapsed | 38160 | -| total_timesteps | 633472 | -| train/ | | -| approx_kl | 0.057217013 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -131 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 49480 | -| policy_gradient_loss | -0.0117 | -| std | 0.347 | -| value_loss | 2.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4950 | -| time_elapsed | 38163 | -| total_timesteps | 633600 | -| train/ | | -| approx_kl | 0.002456694 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -7.53 | -| learning_rate | 0.0003 | -| loss | 4.68e-06 | -| n_updates | 49490 | -| policy_gradient_loss | 3.65e-05 | -| std | 0.348 | -| value_loss | 1.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4951 | -| time_elapsed | 38167 | -| total_timesteps | 633728 | -| train/ | | -| approx_kl | 0.015490513 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.00294 | -| n_updates | 49500 | -| policy_gradient_loss | -0.000624 | -| std | 0.348 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4952 | -| time_elapsed | 38171 | -| total_timesteps | 633856 | -| train/ | | -| approx_kl | 0.008491922 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.000951 | -| n_updates | 49510 | -| policy_gradient_loss | -0.0014 | -| std | 0.348 | -| value_loss | 4.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 16 | -| iterations | 4953 | -| time_elapsed | 38174 | -| total_timesteps | 633984 | -| train/ | | -| approx_kl | 0.020846711 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | 0.00653 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 49520 | -| policy_gradient_loss | -0.0088 | -| std | 0.347 | -| value_loss | 5.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4954 | -| time_elapsed | 38177 | -| total_timesteps | 634112 | -| train/ | | -| approx_kl | 0.011454651 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -0.00284 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 49530 | -| policy_gradient_loss | -0.00176 | -| std | 0.347 | -| value_loss | 6.94e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4955 | -| time_elapsed | 38184 | -| total_timesteps | 634240 | -| train/ | | -| approx_kl | 0.03551811 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -4.53 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 49540 | -| policy_gradient_loss | -0.00808 | -| std | 0.346 | -| value_loss | 0.00179 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4956 | -| time_elapsed | 38187 | -| total_timesteps | 634368 | -| train/ | | -| approx_kl | 0.0016349088 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -2.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 49550 | -| policy_gradient_loss | 0.00166 | -| std | 0.346 | -| value_loss | 3.66e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4957 | -| time_elapsed | 38190 | -| total_timesteps | 634496 | -| train/ | | -| approx_kl | 0.025986044 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -1.13e+03 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 49560 | -| policy_gradient_loss | -0.00727 | -| std | 0.346 | -| value_loss | 1.41e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4958 | -| time_elapsed | 38194 | -| total_timesteps | 634624 | -| train/ | | -| approx_kl | 0.00047553657 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -696 | -| learning_rate | 0.0003 | -| loss | -0.000283 | -| n_updates | 49570 | -| policy_gradient_loss | -6.14e-05 | -| std | 0.346 | -| value_loss | 1.1e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4959 | -| time_elapsed | 38196 | -| total_timesteps | 634752 | -| train/ | | -| approx_kl | 0.02737303 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -28.7 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 49580 | -| policy_gradient_loss | -0.011 | -| std | 0.346 | -| value_loss | 5.51e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 16 | -| iterations | 4960 | -| time_elapsed | 38199 | -| total_timesteps | 634880 | -| train/ | | -| approx_kl | 0.019743118 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -17.9 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 49590 | -| policy_gradient_loss | -0.00224 | -| std | 0.346 | -| value_loss | 5.58e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4961 | -| time_elapsed | 38202 | -| total_timesteps | 635008 | -| train/ | | -| approx_kl | 0.026172224 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00763 | -| n_updates | 49600 | -| policy_gradient_loss | -0.00802 | -| std | 0.347 | -| value_loss | 1.22e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4962 | -| time_elapsed | 38212 | -| total_timesteps | 635136 | -| train/ | | -| approx_kl | 0.019633578 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | 0.666 | -| learning_rate | 0.0003 | -| loss | -0.0091 | -| n_updates | 49610 | -| policy_gradient_loss | -0.00478 | -| std | 0.346 | -| value_loss | 0.00566 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4963 | -| time_elapsed | 38215 | -| total_timesteps | 635264 | -| train/ | | -| approx_kl | 1.672702e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -152 | -| learning_rate | 0.0003 | -| loss | -0.00062 | -| n_updates | 49620 | -| policy_gradient_loss | 0.00349 | -| std | 0.346 | -| value_loss | 8.06e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4964 | -| time_elapsed | 38219 | -| total_timesteps | 635392 | -| train/ | | -| approx_kl | 0.0021940116 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -2.79e+03 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 49630 | -| policy_gradient_loss | 7.44e-06 | -| std | 0.346 | -| value_loss | 3.85e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4965 | -| time_elapsed | 38222 | -| total_timesteps | 635520 | -| train/ | | -| approx_kl | 0.060242996 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -2.99e+03 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 49640 | -| policy_gradient_loss | -0.00684 | -| std | 0.347 | -| value_loss | 2.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4966 | -| time_elapsed | 38224 | -| total_timesteps | 635648 | -| train/ | | -| approx_kl | 0.011226903 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -6.66 | -| learning_rate | 0.0003 | -| loss | -0.00085 | -| n_updates | 49650 | -| policy_gradient_loss | -0.0009 | -| std | 0.346 | -| value_loss | 4.22e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4967 | -| time_elapsed | 38227 | -| total_timesteps | 635776 | -| train/ | | -| approx_kl | 0.01821912 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 49660 | -| policy_gradient_loss | -0.00133 | -| std | 0.345 | -| value_loss | 1.85e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 4968 | -| time_elapsed | 38230 | -| total_timesteps | 635904 | -| train/ | | -| approx_kl | 0.008205935 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.000606 | -| n_updates | 49670 | -| policy_gradient_loss | -0.000635 | -| std | 0.346 | -| value_loss | 7.87e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4969 | -| time_elapsed | 38233 | -| total_timesteps | 636032 | -| train/ | | -| approx_kl | 0.00917829 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 49680 | -| policy_gradient_loss | -0.00138 | -| std | 0.345 | -| value_loss | 1.38e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4970 | -| time_elapsed | 38240 | -| total_timesteps | 636160 | -| train/ | | -| approx_kl | 0.011593981 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | 0.888 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 49690 | -| policy_gradient_loss | -0.00065 | -| std | 0.345 | -| value_loss | 0.000246 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4971 | -| time_elapsed | 38243 | -| total_timesteps | 636288 | -| train/ | | -| approx_kl | 0.009626713 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -1.12e+03 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 49700 | -| policy_gradient_loss | -0.00109 | -| std | 0.345 | -| value_loss | 2.34e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4972 | -| time_elapsed | 38245 | -| total_timesteps | 636416 | -| train/ | | -| approx_kl | 0.00068784924 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -3.84e+03 | -| learning_rate | 0.0003 | -| loss | -0.00849 | -| n_updates | 49710 | -| policy_gradient_loss | 0.00334 | -| std | 0.344 | -| value_loss | 1.2e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4973 | -| time_elapsed | 38248 | -| total_timesteps | 636544 | -| train/ | | -| approx_kl | 0.031075733 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -7.95 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 49720 | -| policy_gradient_loss | -0.0152 | -| std | 0.345 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4974 | -| time_elapsed | 38250 | -| total_timesteps | 636672 | -| train/ | | -| approx_kl | 0.021586752 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -5.13 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 49730 | -| policy_gradient_loss | -0.00796 | -| std | 0.345 | -| value_loss | 1.67e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4975 | -| time_elapsed | 38253 | -| total_timesteps | 636800 | -| train/ | | -| approx_kl | 0.0017289659 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 5.24e-05 | -| n_updates | 49740 | -| policy_gradient_loss | 0.000251 | -| std | 0.346 | -| value_loss | 5.68e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 16 | -| iterations | 4976 | -| time_elapsed | 38256 | -| total_timesteps | 636928 | -| train/ | | -| approx_kl | 0.00034895446 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.00389 | -| learning_rate | 0.0003 | -| loss | -0.000371 | -| n_updates | 49750 | -| policy_gradient_loss | -2.95e-05 | -| std | 0.346 | -| value_loss | 7.57e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4977 | -| time_elapsed | 38258 | -| total_timesteps | 637056 | -| train/ | | -| approx_kl | 0.012908323 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 49760 | -| policy_gradient_loss | -0.00477 | -| std | 0.347 | -| value_loss | 1.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4978 | -| time_elapsed | 38264 | -| total_timesteps | 637184 | -| train/ | | -| approx_kl | 0.02168875 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 49770 | -| policy_gradient_loss | -0.00514 | -| std | 0.347 | -| value_loss | 0.00176 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4979 | -| time_elapsed | 38267 | -| total_timesteps | 637312 | -| train/ | | -| approx_kl | 0.07396889 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -1.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 49780 | -| policy_gradient_loss | -0.0028 | -| std | 0.347 | -| value_loss | 3.21e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4980 | -| time_elapsed | 38270 | -| total_timesteps | 637440 | -| train/ | | -| approx_kl | 0.0047816397 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -3.4e+03 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 49790 | -| policy_gradient_loss | -0.00163 | -| std | 0.347 | -| value_loss | 2.5e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4981 | -| time_elapsed | 38273 | -| total_timesteps | 637568 | -| train/ | | -| approx_kl | 0.01952263 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -6.79 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 49800 | -| policy_gradient_loss | -0.000374 | -| std | 0.348 | -| value_loss | 2.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4982 | -| time_elapsed | 38276 | -| total_timesteps | 637696 | -| train/ | | -| approx_kl | 0.011141034 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -0.0664 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 49810 | -| policy_gradient_loss | -0.00213 | -| std | 0.347 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4983 | -| time_elapsed | 38279 | -| total_timesteps | 637824 | -| train/ | | -| approx_kl | 0.013671057 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00675 | -| n_updates | 49820 | -| policy_gradient_loss | -0.00273 | -| std | 0.346 | -| value_loss | 3.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 4984 | -| time_elapsed | 38282 | -| total_timesteps | 637952 | -| train/ | | -| approx_kl | 0.012461619 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 49830 | -| policy_gradient_loss | -0.00206 | -| std | 0.346 | -| value_loss | 7.15e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4985 | -| time_elapsed | 38287 | -| total_timesteps | 638080 | -| train/ | | -| approx_kl | 0.009443075 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -0.00359 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 49840 | -| policy_gradient_loss | -0.00224 | -| std | 0.346 | -| value_loss | 2.41e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4986 | -| time_elapsed | 38295 | -| total_timesteps | 638208 | -| train/ | | -| approx_kl | 0.0018578027 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.000129 | -| n_updates | 49850 | -| policy_gradient_loss | -2.64e-05 | -| std | 0.347 | -| value_loss | 4.39e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4987 | -| time_elapsed | 38298 | -| total_timesteps | 638336 | -| train/ | | -| approx_kl | 0.026630316 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -391 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 49860 | -| policy_gradient_loss | -0.00788 | -| std | 0.347 | -| value_loss | 5.11e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4988 | -| time_elapsed | 38301 | -| total_timesteps | 638464 | -| train/ | | -| approx_kl | 0.00085952366 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -1.76e+03 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 49870 | -| policy_gradient_loss | 0.000916 | -| std | 0.347 | -| value_loss | 1.71e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4989 | -| time_elapsed | 38303 | -| total_timesteps | 638592 | -| train/ | | -| approx_kl | 0.00014377339 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -35.7 | -| learning_rate | 0.0003 | -| loss | -0.000429 | -| n_updates | 49880 | -| policy_gradient_loss | 0.000333 | -| std | 0.346 | -| value_loss | 9.23e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4990 | -| time_elapsed | 38306 | -| total_timesteps | 638720 | -| train/ | | -| approx_kl | 0.0055053593 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 49890 | -| policy_gradient_loss | -0.00114 | -| std | 0.346 | -| value_loss | 1.31e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4991 | -| time_elapsed | 38308 | -| total_timesteps | 638848 | -| train/ | | -| approx_kl | 0.026935797 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | -0.00736 | -| n_updates | 49900 | -| policy_gradient_loss | -0.0078 | -| std | 0.346 | -| value_loss | 5.76e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 4992 | -| time_elapsed | 38311 | -| total_timesteps | 638976 | -| train/ | | -| approx_kl | 0.025054999 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | 0.00189 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 49910 | -| policy_gradient_loss | -0.0113 | -| std | 0.346 | -| value_loss | 4.12e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4993 | -| time_elapsed | 38314 | -| total_timesteps | 639104 | -| train/ | | -| approx_kl | 0.0053098532 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 49920 | -| policy_gradient_loss | -0.0026 | -| std | 0.346 | -| value_loss | 4.06e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4994 | -| time_elapsed | 38323 | -| total_timesteps | 639232 | -| train/ | | -| approx_kl | 0.03322863 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | -0.000358 | -| n_updates | 49930 | -| policy_gradient_loss | -0.00125 | -| std | 0.345 | -| value_loss | 0.00129 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4995 | -| time_elapsed | 38325 | -| total_timesteps | 639360 | -| train/ | | -| approx_kl | 0.019263249 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -835 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 49940 | -| policy_gradient_loss | -0.0118 | -| std | 0.345 | -| value_loss | 2.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4996 | -| time_elapsed | 38327 | -| total_timesteps | 639488 | -| train/ | | -| approx_kl | 0.032407355 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -1.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 49950 | -| policy_gradient_loss | -0.0103 | -| std | 0.344 | -| value_loss | 5.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4997 | -| time_elapsed | 38329 | -| total_timesteps | 639616 | -| train/ | | -| approx_kl | 0.035842218 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.000137 | -| n_updates | 49960 | -| policy_gradient_loss | -0.00285 | -| std | 0.344 | -| value_loss | 2.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4998 | -| time_elapsed | 38333 | -| total_timesteps | 639744 | -| train/ | | -| approx_kl | 0.026763786 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -25.3 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 49970 | -| policy_gradient_loss | -0.00338 | -| std | 0.344 | -| value_loss | 7.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 16 | -| iterations | 4999 | -| time_elapsed | 38336 | -| total_timesteps | 639872 | -| train/ | | -| approx_kl | 0.027597439 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -7.26 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 49980 | -| policy_gradient_loss | -0.0118 | -| std | 0.345 | -| value_loss | 1.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5000 | -| time_elapsed | 38340 | -| total_timesteps | 640000 | -| train/ | | -| approx_kl | 0.008284595 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | -0.000778 | -| n_updates | 49990 | -| policy_gradient_loss | -0.000709 | -| std | 0.346 | -| value_loss | 1.68e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5001 | -| time_elapsed | 38343 | -| total_timesteps | 640128 | -| train/ | | -| approx_kl | 0.020672841 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.000975 | -| n_updates | 50000 | -| policy_gradient_loss | -0.00335 | -| std | 0.346 | -| value_loss | 1.01e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5002 | -| time_elapsed | 38350 | -| total_timesteps | 640256 | -| train/ | | -| approx_kl | 0.0048061106 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 50010 | -| policy_gradient_loss | -0.000527 | -| std | 0.346 | -| value_loss | 4.53e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5003 | -| time_elapsed | 38354 | -| total_timesteps | 640384 | -| train/ | | -| approx_kl | 0.008362261 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -635 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 50020 | -| policy_gradient_loss | -0.00274 | -| std | 0.346 | -| value_loss | 2.18e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5004 | -| time_elapsed | 38357 | -| total_timesteps | 640512 | -| train/ | | -| approx_kl | 0.04487478 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -583 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 50030 | -| policy_gradient_loss | -0.013 | -| std | 0.346 | -| value_loss | 1.07e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5005 | -| time_elapsed | 38361 | -| total_timesteps | 640640 | -| train/ | | -| approx_kl | 0.0003427798 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 50040 | -| policy_gradient_loss | 0.000861 | -| std | 0.345 | -| value_loss | 2.76e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5006 | -| time_elapsed | 38364 | -| total_timesteps | 640768 | -| train/ | | -| approx_kl | 0.0020262948 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -1.22 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 50050 | -| policy_gradient_loss | 0.000411 | -| std | 0.344 | -| value_loss | 1.54e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 16 | -| iterations | 5007 | -| time_elapsed | 38367 | -| total_timesteps | 640896 | -| train/ | | -| approx_kl | 0.00096251955 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 50060 | -| policy_gradient_loss | 0.000262 | -| std | 0.344 | -| value_loss | 5.04e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5008 | -| time_elapsed | 38370 | -| total_timesteps | 641024 | -| train/ | | -| approx_kl | 0.0008772784 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 50070 | -| policy_gradient_loss | 0.000121 | -| std | 0.345 | -| value_loss | 7.57e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5009 | -| time_elapsed | 38379 | -| total_timesteps | 641152 | -| train/ | | -| approx_kl | 0.0016915174 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -5.54 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 50080 | -| policy_gradient_loss | 3.66e-05 | -| std | 0.346 | -| value_loss | 0.00283 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5010 | -| time_elapsed | 38382 | -| total_timesteps | 641280 | -| train/ | | -| approx_kl | 0.0013771686 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -4.03e+03 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 50090 | -| policy_gradient_loss | 0.000411 | -| std | 0.347 | -| value_loss | 7.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5011 | -| time_elapsed | 38386 | -| total_timesteps | 641408 | -| train/ | | -| approx_kl | 0.0012197103 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -4.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.0097 | -| n_updates | 50100 | -| policy_gradient_loss | 0.00153 | -| std | 0.347 | -| value_loss | 1.86e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5012 | -| time_elapsed | 38390 | -| total_timesteps | 641536 | -| train/ | | -| approx_kl | 0.014930144 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -513 | -| learning_rate | 0.0003 | -| loss | 8.52e-06 | -| n_updates | 50110 | -| policy_gradient_loss | -0.000245 | -| std | 0.347 | -| value_loss | 4.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5013 | -| time_elapsed | 38395 | -| total_timesteps | 641664 | -| train/ | | -| approx_kl | 0.019359149 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -4.54 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 50120 | -| policy_gradient_loss | -0.00269 | -| std | 0.347 | -| value_loss | 8.8e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5014 | -| time_elapsed | 38398 | -| total_timesteps | 641792 | -| train/ | | -| approx_kl | 0.0317021 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.00817 | -| n_updates | 50130 | -| policy_gradient_loss | -0.00705 | -| std | 0.346 | -| value_loss | 1.01e-09 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 16 | -| iterations | 5015 | -| time_elapsed | 38402 | -| total_timesteps | 641920 | -| train/ | | -| approx_kl | 0.0049243965 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.349 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 50140 | -| policy_gradient_loss | -0.00113 | -| std | 0.347 | -| value_loss | 4.63e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5016 | -| time_elapsed | 38406 | -| total_timesteps | 642048 | -| train/ | | -| approx_kl | 0.012666522 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | 0.000372 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 50150 | -| policy_gradient_loss | -0.00437 | -| std | 0.347 | -| value_loss | 8.17e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5017 | -| time_elapsed | 38412 | -| total_timesteps | 642176 | -| train/ | | -| approx_kl | 0.022546833 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 50160 | -| policy_gradient_loss | -0.00484 | -| std | 0.348 | -| value_loss | 0.000271 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5018 | -| time_elapsed | 38416 | -| total_timesteps | 642304 | -| train/ | | -| approx_kl | 0.03987828 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -5.8e+03 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 50170 | -| policy_gradient_loss | -0.00886 | -| std | 0.348 | -| value_loss | 4.42e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5019 | -| time_elapsed | 38420 | -| total_timesteps | 642432 | -| train/ | | -| approx_kl | 0.015946392 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -442 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 50180 | -| policy_gradient_loss | -0.00128 | -| std | 0.347 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5020 | -| time_elapsed | 38423 | -| total_timesteps | 642560 | -| train/ | | -| approx_kl | 0.0136961285 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -2.64 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 50190 | -| policy_gradient_loss | -0.0104 | -| std | 0.347 | -| value_loss | 3.01e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5021 | -| time_elapsed | 38425 | -| total_timesteps | 642688 | -| train/ | | -| approx_kl | 0.011738955 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.36 | -| explained_variance | -3.89 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 50200 | -| policy_gradient_loss | -0.00621 | -| std | 0.347 | -| value_loss | 1.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5022 | -| time_elapsed | 38428 | -| total_timesteps | 642816 | -| train/ | | -| approx_kl | 0.018803995 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 50210 | -| policy_gradient_loss | -0.00607 | -| std | 0.346 | -| value_loss | 1.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 16 | -| iterations | 5023 | -| time_elapsed | 38430 | -| total_timesteps | 642944 | -| train/ | | -| approx_kl | 0.017498177 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -0.00772 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 50220 | -| policy_gradient_loss | -0.00469 | -| std | 0.346 | -| value_loss | 1.29e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5024 | -| time_elapsed | 38433 | -| total_timesteps | 643072 | -| train/ | | -| approx_kl | 0.020517392 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 50230 | -| policy_gradient_loss | -0.00377 | -| std | 0.345 | -| value_loss | 1.24e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5025 | -| time_elapsed | 38438 | -| total_timesteps | 643200 | -| train/ | | -| approx_kl | 0.013565848 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.00813 | -| n_updates | 50240 | -| policy_gradient_loss | -0.0032 | -| std | 0.345 | -| value_loss | 0.00137 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5026 | -| time_elapsed | 38442 | -| total_timesteps | 643328 | -| train/ | | -| approx_kl | 0.048625693 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -2.91e+03 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 50250 | -| policy_gradient_loss | -0.0133 | -| std | 0.344 | -| value_loss | 3.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5027 | -| time_elapsed | 38447 | -| total_timesteps | 643456 | -| train/ | | -| approx_kl | 0.016777467 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -707 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 50260 | -| policy_gradient_loss | -0.00242 | -| std | 0.344 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5028 | -| time_elapsed | 38450 | -| total_timesteps | 643584 | -| train/ | | -| approx_kl | 0.012730902 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 50270 | -| policy_gradient_loss | -0.00733 | -| std | 0.344 | -| value_loss | 2.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5029 | -| time_elapsed | 38455 | -| total_timesteps | 643712 | -| train/ | | -| approx_kl | 0.017058888 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.0241 | -| n_updates | 50280 | -| policy_gradient_loss | -0.012 | -| std | 0.344 | -| value_loss | 2.14e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5030 | -| time_elapsed | 38459 | -| total_timesteps | 643840 | -| train/ | | -| approx_kl | 0.0026357025 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -0.0092 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 50290 | -| policy_gradient_loss | -0.000159 | -| std | 0.344 | -| value_loss | 1.28e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 16 | -| iterations | 5031 | -| time_elapsed | 38462 | -| total_timesteps | 643968 | -| train/ | | -| approx_kl | 0.00017002644 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.000307 | -| n_updates | 50300 | -| policy_gradient_loss | 0.00058 | -| std | 0.344 | -| value_loss | 2.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5032 | -| time_elapsed | 38466 | -| total_timesteps | 644096 | -| train/ | | -| approx_kl | 0.019547481 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | 0.00354 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 50310 | -| policy_gradient_loss | -0.00596 | -| std | 0.344 | -| value_loss | 5.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5033 | -| time_elapsed | 38473 | -| total_timesteps | 644224 | -| train/ | | -| approx_kl | 0.027438276 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 50320 | -| policy_gradient_loss | -0.00585 | -| std | 0.344 | -| value_loss | 0.000235 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5034 | -| time_elapsed | 38478 | -| total_timesteps | 644352 | -| train/ | | -| approx_kl | 0.011995265 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -56.8 | -| learning_rate | 0.0003 | -| loss | 0.000606 | -| n_updates | 50330 | -| policy_gradient_loss | 0.000187 | -| std | 0.344 | -| value_loss | 4.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5035 | -| time_elapsed | 38482 | -| total_timesteps | 644480 | -| train/ | | -| approx_kl | 0.023837592 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.351 | -| explained_variance | -33.9 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 50340 | -| policy_gradient_loss | -0.00405 | -| std | 0.344 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5036 | -| time_elapsed | 38486 | -| total_timesteps | 644608 | -| train/ | | -| approx_kl | 0.020292018 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | -0.0969 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 50350 | -| policy_gradient_loss | -0.00487 | -| std | 0.343 | -| value_loss | 4.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5037 | -| time_elapsed | 38488 | -| total_timesteps | 644736 | -| train/ | | -| approx_kl | 0.002557817 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.351 | -| explained_variance | -0.403 | -| learning_rate | 0.0003 | -| loss | -0.000923 | -| n_updates | 50360 | -| policy_gradient_loss | -0.000362 | -| std | 0.345 | -| value_loss | 2.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5038 | -| time_elapsed | 38490 | -| total_timesteps | 644864 | -| train/ | | -| approx_kl | 0.013588326 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.262 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 50370 | -| policy_gradient_loss | -0.00847 | -| std | 0.346 | -| value_loss | 5.67e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5039 | -| time_elapsed | 38493 | -| total_timesteps | 644992 | -| train/ | | -| approx_kl | 0.0041295434 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -0.779 | -| learning_rate | 0.0003 | -| loss | 9.22e-05 | -| n_updates | 50380 | -| policy_gradient_loss | 4.99e-05 | -| std | 0.347 | -| value_loss | 3.53e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5040 | -| time_elapsed | 38495 | -| total_timesteps | 645120 | -| train/ | | -| approx_kl | 0.011892511 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 50390 | -| policy_gradient_loss | -0.00433 | -| std | 0.347 | -| value_loss | 6.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5041 | -| time_elapsed | 38505 | -| total_timesteps | 645248 | -| train/ | | -| approx_kl | 0.09006937 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | 0.0356 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 50400 | -| policy_gradient_loss | -0.0055 | -| std | 0.348 | -| value_loss | 0.000939 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5042 | -| time_elapsed | 38509 | -| total_timesteps | 645376 | -| train/ | | -| approx_kl | 0.00060298666 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -1.76e+03 | -| learning_rate | 0.0003 | -| loss | 0.0031 | -| n_updates | 50410 | -| policy_gradient_loss | 0.00505 | -| std | 0.348 | -| value_loss | 7e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5043 | -| time_elapsed | 38512 | -| total_timesteps | 645504 | -| train/ | | -| approx_kl | 0.026098799 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -3.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.00465 | -| n_updates | 50420 | -| policy_gradient_loss | -0.00409 | -| std | 0.348 | -| value_loss | 2.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5044 | -| time_elapsed | 38516 | -| total_timesteps | 645632 | -| train/ | | -| approx_kl | 0.017797118 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 50430 | -| policy_gradient_loss | -0.00718 | -| std | 0.347 | -| value_loss | 3.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5045 | -| time_elapsed | 38520 | -| total_timesteps | 645760 | -| train/ | | -| approx_kl | 0.053859755 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -123 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 50440 | -| policy_gradient_loss | -0.0036 | -| std | 0.348 | -| value_loss | 3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 16 | -| iterations | 5046 | -| time_elapsed | 38522 | -| total_timesteps | 645888 | -| train/ | | -| approx_kl | 0.029352175 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -15 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 50450 | -| policy_gradient_loss | -0.00431 | -| std | 0.349 | -| value_loss | 8.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5047 | -| time_elapsed | 38526 | -| total_timesteps | 646016 | -| train/ | | -| approx_kl | 0.022728091 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.0091 | -| n_updates | 50460 | -| policy_gradient_loss | -0.00689 | -| std | 0.349 | -| value_loss | 3.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5048 | -| time_elapsed | 38534 | -| total_timesteps | 646144 | -| train/ | | -| approx_kl | 0.023129992 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 50470 | -| policy_gradient_loss | -0.00951 | -| std | 0.35 | -| value_loss | 0.000266 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5049 | -| time_elapsed | 38537 | -| total_timesteps | 646272 | -| train/ | | -| approx_kl | 0.012670976 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -2.13e+03 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 50480 | -| policy_gradient_loss | -0.002 | -| std | 0.35 | -| value_loss | 6.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5050 | -| time_elapsed | 38541 | -| total_timesteps | 646400 | -| train/ | | -| approx_kl | 0.034391813 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -1.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 50490 | -| policy_gradient_loss | -0.00963 | -| std | 0.35 | -| value_loss | 3.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5051 | -| time_elapsed | 38545 | -| total_timesteps | 646528 | -| train/ | | -| approx_kl | 0.011320636 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.37 | -| explained_variance | -197 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 50500 | -| policy_gradient_loss | -0.0103 | -| std | 0.35 | -| value_loss | 3.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5052 | -| time_elapsed | 38548 | -| total_timesteps | 646656 | -| train/ | | -| approx_kl | 0.015182147 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | -0.369 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 50510 | -| policy_gradient_loss | -0.00616 | -| std | 0.35 | -| value_loss | 4.02e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5053 | -| time_elapsed | 38551 | -| total_timesteps | 646784 | -| train/ | | -| approx_kl | 0.012726638 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.367 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 50520 | -| policy_gradient_loss | -0.00263 | -| std | 0.349 | -| value_loss | 8.34e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 16 | -| iterations | 5054 | -| time_elapsed | 38554 | -| total_timesteps | 646912 | -| train/ | | -| approx_kl | 0.017124962 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -0.398 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 50530 | -| policy_gradient_loss | -0.00231 | -| std | 0.349 | -| value_loss | 1.19e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5055 | -| time_elapsed | 38557 | -| total_timesteps | 647040 | -| train/ | | -| approx_kl | 0.005050334 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.000876 | -| n_updates | 50540 | -| policy_gradient_loss | -0.000696 | -| std | 0.347 | -| value_loss | 2.18e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5056 | -| time_elapsed | 38563 | -| total_timesteps | 647168 | -| train/ | | -| approx_kl | 0.01085852 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | -0.000883 | -| n_updates | 50550 | -| policy_gradient_loss | -0.00122 | -| std | 0.345 | -| value_loss | 0.00313 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5057 | -| time_elapsed | 38566 | -| total_timesteps | 647296 | -| train/ | | -| approx_kl | 0.041873198 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -466 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 50560 | -| policy_gradient_loss | -0.0029 | -| std | 0.345 | -| value_loss | 4.1e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5058 | -| time_elapsed | 38569 | -| total_timesteps | 647424 | -| train/ | | -| approx_kl | 0.0016250606 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -590 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 50570 | -| policy_gradient_loss | 0.0013 | -| std | 0.345 | -| value_loss | 1.36e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5059 | -| time_elapsed | 38572 | -| total_timesteps | 647552 | -| train/ | | -| approx_kl | 0.027835276 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -66.1 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 50580 | -| policy_gradient_loss | -0.00195 | -| std | 0.344 | -| value_loss | 2.1e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5060 | -| time_elapsed | 38576 | -| total_timesteps | 647680 | -| train/ | | -| approx_kl | 3.0954834e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -2.58 | -| learning_rate | 0.0003 | -| loss | -2.14e-05 | -| n_updates | 50590 | -| policy_gradient_loss | -6.96e-06 | -| std | 0.344 | -| value_loss | 5.15e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5061 | -| time_elapsed | 38578 | -| total_timesteps | 647808 | -| train/ | | -| approx_kl | 0.012789692 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -0.0985 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 50600 | -| policy_gradient_loss | -0.00281 | -| std | 0.344 | -| value_loss | 9.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 16 | -| iterations | 5062 | -| time_elapsed | 38579 | -| total_timesteps | 647936 | -| train/ | | -| approx_kl | 0.009470491 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -0.00556 | -| learning_rate | 0.0003 | -| loss | -0.000701 | -| n_updates | 50610 | -| policy_gradient_loss | -0.00161 | -| std | 0.345 | -| value_loss | 5.07e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5063 | -| time_elapsed | 38583 | -| total_timesteps | 648064 | -| train/ | | -| approx_kl | 0.02092837 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 50620 | -| policy_gradient_loss | -0.0117 | -| std | 0.346 | -| value_loss | 1.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5064 | -| time_elapsed | 38588 | -| total_timesteps | 648192 | -| train/ | | -| approx_kl | 0.026326124 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 50630 | -| policy_gradient_loss | -0.00974 | -| std | 0.346 | -| value_loss | 9.99e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5065 | -| time_elapsed | 38590 | -| total_timesteps | 648320 | -| train/ | | -| approx_kl | 0.0003394275 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.359 | -| explained_variance | -633 | -| learning_rate | 0.0003 | -| loss | -0.000705 | -| n_updates | 50640 | -| policy_gradient_loss | 0.000651 | -| std | 0.347 | -| value_loss | 1.21e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5066 | -| time_elapsed | 38593 | -| total_timesteps | 648448 | -| train/ | | -| approx_kl | 0.05118406 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 50650 | -| policy_gradient_loss | -0.00501 | -| std | 0.347 | -| value_loss | 3.68e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5067 | -| time_elapsed | 38595 | -| total_timesteps | 648576 | -| train/ | | -| approx_kl | 0.0062692384 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -180 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 50660 | -| policy_gradient_loss | -0.00183 | -| std | 0.347 | -| value_loss | 5.36e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5068 | -| time_elapsed | 38599 | -| total_timesteps | 648704 | -| train/ | | -| approx_kl | 0.00046409573 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.362 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 50670 | -| policy_gradient_loss | 0.000988 | -| std | 0.348 | -| value_loss | 1.48e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5069 | -| time_elapsed | 38602 | -| total_timesteps | 648832 | -| train/ | | -| approx_kl | 0.0019520223 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.363 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 50680 | -| policy_gradient_loss | 0.000302 | -| std | 0.348 | -| value_loss | 1.56e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 16 | -| iterations | 5070 | -| time_elapsed | 38604 | -| total_timesteps | 648960 | -| train/ | | -| approx_kl | 0.012596959 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -0.00235 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 50690 | -| policy_gradient_loss | -0.00166 | -| std | 0.348 | -| value_loss | 6.05e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5071 | -| time_elapsed | 38607 | -| total_timesteps | 649088 | -| train/ | | -| approx_kl | 0.0192752 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 50700 | -| policy_gradient_loss | -0.0116 | -| std | 0.349 | -| value_loss | 8.86e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5072 | -| time_elapsed | 38611 | -| total_timesteps | 649216 | -| train/ | | -| approx_kl | 0.01882089 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -0.365 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 50710 | -| policy_gradient_loss | -0.00782 | -| std | 0.348 | -| value_loss | 0.000137 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5073 | -| time_elapsed | 38614 | -| total_timesteps | 649344 | -| train/ | | -| approx_kl | 0.0064216345 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.364 | -| explained_variance | -81.2 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 50720 | -| policy_gradient_loss | -0.000644 | -| std | 0.348 | -| value_loss | 5.22e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5074 | -| time_elapsed | 38615 | -| total_timesteps | 649472 | -| train/ | | -| approx_kl | 0.00044851564 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.361 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | 9.15e-05 | -| n_updates | 50730 | -| policy_gradient_loss | 0.000351 | -| std | 0.347 | -| value_loss | 2.68e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5075 | -| time_elapsed | 38618 | -| total_timesteps | 649600 | -| train/ | | -| approx_kl | 0.031169046 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.358 | -| explained_variance | -8.63 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 50740 | -| policy_gradient_loss | -0.00641 | -| std | 0.346 | -| value_loss | 2.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5076 | -| time_elapsed | 38621 | -| total_timesteps | 649728 | -| train/ | | -| approx_kl | 0.036811814 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.357 | -| explained_variance | -143 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 50750 | -| policy_gradient_loss | -0.0102 | -| std | 0.346 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5077 | -| time_elapsed | 38624 | -| total_timesteps | 649856 | -| train/ | | -| approx_kl | 0.018102199 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.356 | -| explained_variance | -0.53 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 50760 | -| policy_gradient_loss | -0.00455 | -| std | 0.345 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 16 | -| iterations | 5078 | -| time_elapsed | 38627 | -| total_timesteps | 649984 | -| train/ | | -| approx_kl | 0.034744464 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | -0.355 | -| explained_variance | -0.0946 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 50770 | -| policy_gradient_loss | -0.0177 | -| std | 0.345 | -| value_loss | 4.48e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5079 | -| time_elapsed | 38631 | -| total_timesteps | 650112 | -| train/ | | -| approx_kl | 0.0024008267 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -0.00516 | -| learning_rate | 0.0003 | -| loss | -0.000672 | -| n_updates | 50780 | -| policy_gradient_loss | -0.000204 | -| std | 0.345 | -| value_loss | 1.16e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5080 | -| time_elapsed | 38639 | -| total_timesteps | 650240 | -| train/ | | -| approx_kl | 0.0066476 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -4.49 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 50790 | -| policy_gradient_loss | -0.00431 | -| std | 0.344 | -| value_loss | 0.00307 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5081 | -| time_elapsed | 38642 | -| total_timesteps | 650368 | -| train/ | | -| approx_kl | 0.058317438 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -50.2 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 50800 | -| policy_gradient_loss | -0.00532 | -| std | 0.344 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5082 | -| time_elapsed | 38645 | -| total_timesteps | 650496 | -| train/ | | -| approx_kl | 0.013800554 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -43.3 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 50810 | -| policy_gradient_loss | -0.00229 | -| std | 0.344 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5083 | -| time_elapsed | 38648 | -| total_timesteps | 650624 | -| train/ | | -| approx_kl | 0.029765055 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.351 | -| explained_variance | -0.378 | -| learning_rate | 0.0003 | -| loss | -0.00845 | -| n_updates | 50820 | -| policy_gradient_loss | -0.0084 | -| std | 0.344 | -| value_loss | 2.45e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5084 | -| time_elapsed | 38650 | -| total_timesteps | 650752 | -| train/ | | -| approx_kl | 0.0119989645 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 50830 | -| policy_gradient_loss | -0.00305 | -| std | 0.343 | -| value_loss | 1.87e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 16 | -| iterations | 5085 | -| time_elapsed | 38653 | -| total_timesteps | 650880 | -| train/ | | -| approx_kl | 0.010482902 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 50840 | -| policy_gradient_loss | -0.00275 | -| std | 0.343 | -| value_loss | 6.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5086 | -| time_elapsed | 38655 | -| total_timesteps | 651008 | -| train/ | | -| approx_kl | 0.011101047 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.349 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 50850 | -| policy_gradient_loss | -0.00812 | -| std | 0.343 | -| value_loss | 7.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5087 | -| time_elapsed | 38665 | -| total_timesteps | 651136 | -| train/ | | -| approx_kl | 0.013470488 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.349 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 50860 | -| policy_gradient_loss | -0.00466 | -| std | 0.343 | -| value_loss | 0.000112 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5088 | -| time_elapsed | 38667 | -| total_timesteps | 651264 | -| train/ | | -| approx_kl | 0.007852407 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -0.921 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 50870 | -| policy_gradient_loss | 0.000858 | -| std | 0.343 | -| value_loss | 2.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5089 | -| time_elapsed | 38670 | -| total_timesteps | 651392 | -| train/ | | -| approx_kl | 0.009495426 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -3.49 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 50880 | -| policy_gradient_loss | -0.00438 | -| std | 0.342 | -| value_loss | 2.03e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5090 | -| time_elapsed | 38674 | -| total_timesteps | 651520 | -| train/ | | -| approx_kl | 0.0036218618 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | -0.348 | -| explained_variance | -0.311 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 50890 | -| policy_gradient_loss | -0.000966 | -| std | 0.343 | -| value_loss | 1.19e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5091 | -| time_elapsed | 38678 | -| total_timesteps | 651648 | -| train/ | | -| approx_kl | 0.023749577 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.349 | -| explained_variance | -0.00318 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 50900 | -| policy_gradient_loss | -0.00429 | -| std | 0.343 | -| value_loss | 6.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5092 | -| time_elapsed | 38680 | -| total_timesteps | 651776 | -| train/ | | -| approx_kl | 0.012680093 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 50910 | -| policy_gradient_loss | -0.00341 | -| std | 0.343 | -| value_loss | 2.75e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 16 | -| iterations | 5093 | -| time_elapsed | 38684 | -| total_timesteps | 651904 | -| train/ | | -| approx_kl | 0.01031372 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | 0.000399 | -| learning_rate | 0.0003 | -| loss | -0.00516 | -| n_updates | 50920 | -| policy_gradient_loss | -0.00336 | -| std | 0.343 | -| value_loss | 2.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5094 | -| time_elapsed | 38687 | -| total_timesteps | 652032 | -| train/ | | -| approx_kl | 0.011040354 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | 0.00136 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 50930 | -| policy_gradient_loss | -0.0012 | -| std | 0.344 | -| value_loss | 1.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5095 | -| time_elapsed | 38694 | -| total_timesteps | 652160 | -| train/ | | -| approx_kl | 0.012102442 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -2.9 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 50940 | -| policy_gradient_loss | -0.0099 | -| std | 0.344 | -| value_loss | 0.00241 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5096 | -| time_elapsed | 38698 | -| total_timesteps | 652288 | -| train/ | | -| approx_kl | 0.024840277 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -235 | -| learning_rate | 0.0003 | -| loss | -0.00853 | -| n_updates | 50950 | -| policy_gradient_loss | -0.00411 | -| std | 0.344 | -| value_loss | 7.05e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5097 | -| time_elapsed | 38700 | -| total_timesteps | 652416 | -| train/ | | -| approx_kl | 3.878353e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -1.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 50960 | -| policy_gradient_loss | 0.00466 | -| std | 0.344 | -| value_loss | 3.79e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5098 | -| time_elapsed | 38703 | -| total_timesteps | 652544 | -| train/ | | -| approx_kl | 0.002090409 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.352 | -| explained_variance | -362 | -| learning_rate | 0.0003 | -| loss | -0.00693 | -| n_updates | 50970 | -| policy_gradient_loss | 5.53e-05 | -| std | 0.344 | -| value_loss | 1.81e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5099 | -| time_elapsed | 38707 | -| total_timesteps | 652672 | -| train/ | | -| approx_kl | 0.0011327183 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -3.23e+03 | -| learning_rate | 0.0003 | -| loss | -0.00889 | -| n_updates | 50980 | -| policy_gradient_loss | 0.00203 | -| std | 0.345 | -| value_loss | 3.47e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5100 | -| time_elapsed | 38710 | -| total_timesteps | 652800 | -| train/ | | -| approx_kl | 0.023569683 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.354 | -| explained_variance | -92.3 | -| learning_rate | 0.0003 | -| loss | -0.000888 | -| n_updates | 50990 | -| policy_gradient_loss | -0.00117 | -| std | 0.345 | -| value_loss | 2.15e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 16 | -| iterations | 5101 | -| time_elapsed | 38714 | -| total_timesteps | 652928 | -| train/ | | -| approx_kl | 0.020276353 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -0.353 | -| explained_variance | -8.83 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 51000 | -| policy_gradient_loss | -0.00236 | -| std | 0.344 | -| value_loss | 2.64e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5102 | -| time_elapsed | 38718 | -| total_timesteps | 653056 | -| train/ | | -| approx_kl | 0.0012967624 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.35 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.000874 | -| n_updates | 51010 | -| policy_gradient_loss | -0.000337 | -| std | 0.342 | -| value_loss | 2.55e-12 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5103 | -| time_elapsed | 38724 | -| total_timesteps | 653184 | -| train/ | | -| approx_kl | 0.031185841 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.343 | -| explained_variance | 0.623 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 51020 | -| policy_gradient_loss | -0.00788 | -| std | 0.34 | -| value_loss | 0.000535 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5104 | -| time_elapsed | 38729 | -| total_timesteps | 653312 | -| train/ | | -| approx_kl | 0.04749439 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | -0.34 | -| explained_variance | -1.98e+03 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 51030 | -| policy_gradient_loss | -0.00867 | -| std | 0.34 | -| value_loss | 8.47e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5105 | -| time_elapsed | 38732 | -| total_timesteps | 653440 | -| train/ | | -| approx_kl | 0.0067817904 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | -0.338 | -| explained_variance | -3.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 51040 | -| policy_gradient_loss | -0.000621 | -| std | 0.339 | -| value_loss | 4.36e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5106 | -| time_elapsed | 38736 | -| total_timesteps | 653568 | -| train/ | | -| approx_kl | 0.0013075024 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.335 | -| explained_variance | -3.98 | -| learning_rate | 0.0003 | -| loss | -9.54e-05 | -| n_updates | 51050 | -| policy_gradient_loss | 0.00012 | -| std | 0.337 | -| value_loss | 4.11e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5107 | -| time_elapsed | 38739 | -| total_timesteps | 653696 | -| train/ | | -| approx_kl | 0.011807896 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.331 | -| explained_variance | -3.69 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 51060 | -| policy_gradient_loss | -0.000979 | -| std | 0.337 | -| value_loss | 3.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5108 | -| time_elapsed | 38743 | -| total_timesteps | 653824 | -| train/ | | -| approx_kl | 0.031889006 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.329 | -| explained_variance | -0.735 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 51070 | -| policy_gradient_loss | -0.00243 | -| std | 0.336 | -| value_loss | 1.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 16 | -| iterations | 5109 | -| time_elapsed | 38747 | -| total_timesteps | 653952 | -| train/ | | -| approx_kl | 0.01166915 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.328 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 51080 | -| policy_gradient_loss | -0.00199 | -| std | 0.336 | -| value_loss | 1.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5110 | -| time_elapsed | 38751 | -| total_timesteps | 654080 | -| train/ | | -| approx_kl | 0.002648937 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.33 | -| explained_variance | 0.00413 | -| learning_rate | 0.0003 | -| loss | 1.12e-05 | -| n_updates | 51090 | -| policy_gradient_loss | -0.000277 | -| std | 0.337 | -| value_loss | 2.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5111 | -| time_elapsed | 38757 | -| total_timesteps | 654208 | -| train/ | | -| approx_kl | 0.01529194 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | -0.333 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 51100 | -| policy_gradient_loss | -0.00151 | -| std | 0.338 | -| value_loss | 0.000195 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5112 | -| time_elapsed | 38761 | -| total_timesteps | 654336 | -| train/ | | -| approx_kl | 0.009159101 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.333 | -| explained_variance | -317 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 51110 | -| policy_gradient_loss | -0.00149 | -| std | 0.337 | -| value_loss | 2.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5113 | -| time_elapsed | 38764 | -| total_timesteps | 654464 | -| train/ | | -| approx_kl | 0.022514772 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | -0.332 | -| explained_variance | -286 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 51120 | -| policy_gradient_loss | -0.00881 | -| std | 0.337 | -| value_loss | 7.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5114 | -| time_elapsed | 38767 | -| total_timesteps | 654592 | -| train/ | | -| approx_kl | 0.023588771 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.332 | -| explained_variance | -6.32 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 51130 | -| policy_gradient_loss | -0.0069 | -| std | 0.337 | -| value_loss | 2.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5115 | -| time_elapsed | 38770 | -| total_timesteps | 654720 | -| train/ | | -| approx_kl | 0.008860886 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.331 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 51140 | -| policy_gradient_loss | -0.00851 | -| std | 0.337 | -| value_loss | 1.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5116 | -| time_elapsed | 38773 | -| total_timesteps | 654848 | -| train/ | | -| approx_kl | 0.008606092 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.331 | -| explained_variance | 0.00501 | -| learning_rate | 0.0003 | -| loss | -0.000756 | -| n_updates | 51150 | -| policy_gradient_loss | -0.000999 | -| std | 0.337 | -| value_loss | 6.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 16 | -| iterations | 5117 | -| time_elapsed | 38777 | -| total_timesteps | 654976 | -| train/ | | -| approx_kl | 0.012829217 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | -0.33 | -| explained_variance | -0.000231 | -| learning_rate | 0.0003 | -| loss | -0.00826 | -| n_updates | 51160 | -| policy_gradient_loss | -0.00512 | -| std | 0.336 | -| value_loss | 4.14e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5118 | -| time_elapsed | 38780 | -| total_timesteps | 655104 | -| train/ | | -| approx_kl | 0.014156775 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.329 | -| explained_variance | -0.00579 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 51170 | -| policy_gradient_loss | -0.00318 | -| std | 0.336 | -| value_loss | 2.86e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5119 | -| time_elapsed | 38788 | -| total_timesteps | 655232 | -| train/ | | -| approx_kl | 0.021911968 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.327 | -| explained_variance | -6.12 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 51180 | -| policy_gradient_loss | -0.00584 | -| std | 0.336 | -| value_loss | 0.00212 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5120 | -| time_elapsed | 38791 | -| total_timesteps | 655360 | -| train/ | | -| approx_kl | 0.00019306969 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.326 | -| explained_variance | -246 | -| learning_rate | 0.0003 | -| loss | -0.000623 | -| n_updates | 51190 | -| policy_gradient_loss | 0.000726 | -| std | 0.335 | -| value_loss | 2.41e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5121 | -| time_elapsed | 38795 | -| total_timesteps | 655488 | -| train/ | | -| approx_kl | 0.002323273 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.325 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 51200 | -| policy_gradient_loss | 0.000572 | -| std | 0.335 | -| value_loss | 6.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5122 | -| time_elapsed | 38799 | -| total_timesteps | 655616 | -| train/ | | -| approx_kl | 0.06577032 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | -0.325 | -| explained_variance | -3.26 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 51210 | -| policy_gradient_loss | -0.00853 | -| std | 0.335 | -| value_loss | 3.27e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5123 | -| time_elapsed | 38803 | -| total_timesteps | 655744 | -| train/ | | -| approx_kl | 0.03305002 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.326 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 51220 | -| policy_gradient_loss | -0.00879 | -| std | 0.335 | -| value_loss | 1.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 16 | -| iterations | 5124 | -| time_elapsed | 38808 | -| total_timesteps | 655872 | -| train/ | | -| approx_kl | 0.03141086 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | -0.327 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 51230 | -| policy_gradient_loss | -0.014 | -| std | 0.336 | -| value_loss | 2.32e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5125 | -| time_elapsed | 38811 | -| total_timesteps | 656000 | -| train/ | | -| approx_kl | 0.006384395 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.327 | -| explained_variance | 0.0063 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 51240 | -| policy_gradient_loss | -0.000706 | -| std | 0.335 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5126 | -| time_elapsed | 38814 | -| total_timesteps | 656128 | -| train/ | | -| approx_kl | 0.0156031735 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.322 | -| explained_variance | -0.000532 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 51250 | -| policy_gradient_loss | -0.00562 | -| std | 0.333 | -| value_loss | 5.49e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5127 | -| time_elapsed | 38823 | -| total_timesteps | 656256 | -| train/ | | -| approx_kl | 0.019102212 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.319 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 51260 | -| policy_gradient_loss | -0.0099 | -| std | 0.333 | -| value_loss | 5.51e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5128 | -| time_elapsed | 38826 | -| total_timesteps | 656384 | -| train/ | | -| approx_kl | 0.0030197361 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.32 | -| explained_variance | -200 | -| learning_rate | 0.0003 | -| loss | -0.00055 | -| n_updates | 51270 | -| policy_gradient_loss | -0.000244 | -| std | 0.334 | -| value_loss | 2.86e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5129 | -| time_elapsed | 38828 | -| total_timesteps | 656512 | -| train/ | | -| approx_kl | 0.018492652 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.323 | -| explained_variance | -1.29e+03 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 51280 | -| policy_gradient_loss | -0.00293 | -| std | 0.335 | -| value_loss | 2.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5130 | -| time_elapsed | 38831 | -| total_timesteps | 656640 | -| train/ | | -| approx_kl | 0.040729806 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | -0.325 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 51290 | -| policy_gradient_loss | -0.00684 | -| std | 0.335 | -| value_loss | 6.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5131 | -| time_elapsed | 38834 | -| total_timesteps | 656768 | -| train/ | | -| approx_kl | 0.021128377 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.325 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 51300 | -| policy_gradient_loss | -0.0112 | -| std | 0.335 | -| value_loss | 2.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 16 | -| iterations | 5132 | -| time_elapsed | 38837 | -| total_timesteps | 656896 | -| train/ | | -| approx_kl | 0.013785313 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | -0.325 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.000998 | -| n_updates | 51310 | -| policy_gradient_loss | -0.000495 | -| std | 0.335 | -| value_loss | 2.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5133 | -| time_elapsed | 38840 | -| total_timesteps | 657024 | -| train/ | | -| approx_kl | 0.018806344 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.326 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 51320 | -| policy_gradient_loss | -0.00428 | -| std | 0.335 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5134 | -| time_elapsed | 38848 | -| total_timesteps | 657152 | -| train/ | | -| approx_kl | 0.031625673 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | -0.325 | -| explained_variance | 0.508 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 51330 | -| policy_gradient_loss | -0.00778 | -| std | 0.335 | -| value_loss | 0.00058 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5135 | -| time_elapsed | 38852 | -| total_timesteps | 657280 | -| train/ | | -| approx_kl | 0.019050734 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | -0.324 | -| explained_variance | -2.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 51340 | -| policy_gradient_loss | -0.00107 | -| std | 0.334 | -| value_loss | 8.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5136 | -| time_elapsed | 38856 | -| total_timesteps | 657408 | -| train/ | | -| approx_kl | 0.020427397 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.321 | -| explained_variance | -2.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 51350 | -| policy_gradient_loss | -0.00182 | -| std | 0.333 | -| value_loss | 2.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5137 | -| time_elapsed | 38860 | -| total_timesteps | 657536 | -| train/ | | -| approx_kl | 0.012886079 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.318 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.00985 | -| n_updates | 51360 | -| policy_gradient_loss | -0.00333 | -| std | 0.332 | -| value_loss | 2.28e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5138 | -| time_elapsed | 38862 | -| total_timesteps | 657664 | -| train/ | | -| approx_kl | 0.0001191902 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.316 | -| explained_variance | -80.5 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 51370 | -| policy_gradient_loss | 0.00148 | -| std | 0.332 | -| value_loss | 2.33e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5139 | -| time_elapsed | 38866 | -| total_timesteps | 657792 | -| train/ | | -| approx_kl | 0.002288749 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.315 | -| explained_variance | -5.02 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 51380 | -| policy_gradient_loss | 0.00011 | -| std | 0.332 | -| value_loss | 2.19e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 16 | -| iterations | 5140 | -| time_elapsed | 38870 | -| total_timesteps | 657920 | -| train/ | | -| approx_kl | 0.017502105 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | -0.316 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.000913 | -| n_updates | 51390 | -| policy_gradient_loss | -0.00055 | -| std | 0.332 | -| value_loss | 1.77e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5141 | -| time_elapsed | 38874 | -| total_timesteps | 658048 | -| train/ | | -| approx_kl | 0.0091691725 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.315 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00734 | -| n_updates | 51400 | -| policy_gradient_loss | -0.00312 | -| std | 0.331 | -| value_loss | 7.76e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5142 | -| time_elapsed | 38881 | -| total_timesteps | 658176 | -| train/ | | -| approx_kl | 0.007351371 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.314 | -| explained_variance | 0.142 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 51410 | -| policy_gradient_loss | -0.00713 | -| std | 0.331 | -| value_loss | 0.000685 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5143 | -| time_elapsed | 38884 | -| total_timesteps | 658304 | -| train/ | | -| approx_kl | 0.005733192 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.312 | -| explained_variance | -1.03e+03 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 51420 | -| policy_gradient_loss | -0.000568 | -| std | 0.33 | -| value_loss | 2.93e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5144 | -| time_elapsed | 38887 | -| total_timesteps | 658432 | -| train/ | | -| approx_kl | 0.058147375 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | -0.31 | -| explained_variance | -6.05e+03 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 51430 | -| policy_gradient_loss | -0.00376 | -| std | 0.33 | -| value_loss | 1.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5145 | -| time_elapsed | 38891 | -| total_timesteps | 658560 | -| train/ | | -| approx_kl | 0.01944009 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.309 | -| explained_variance | -6.76 | -| learning_rate | 0.0003 | -| loss | -0.00907 | -| n_updates | 51440 | -| policy_gradient_loss | -0.00462 | -| std | 0.33 | -| value_loss | 4.76e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5146 | -| time_elapsed | 38895 | -| total_timesteps | 658688 | -| train/ | | -| approx_kl | 0.0037032925 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.309 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 51450 | -| policy_gradient_loss | -0.00162 | -| std | 0.33 | -| value_loss | 8.14e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5147 | -| time_elapsed | 38898 | -| total_timesteps | 658816 | -| train/ | | -| approx_kl | 0.016205441 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.31 | -| explained_variance | -4.59 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 51460 | -| policy_gradient_loss | -0.00168 | -| std | 0.33 | -| value_loss | 2.32e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 16 | -| iterations | 5148 | -| time_elapsed | 38901 | -| total_timesteps | 658944 | -| train/ | | -| approx_kl | 0.0008845995 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.31 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 51470 | -| policy_gradient_loss | 0.000809 | -| std | 0.329 | -| value_loss | 1.7e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5149 | -| time_elapsed | 38904 | -| total_timesteps | 659072 | -| train/ | | -| approx_kl | 0.0013403771 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.308 | -| explained_variance | 0.00204 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 51480 | -| policy_gradient_loss | 0.000808 | -| std | 0.329 | -| value_loss | 9.72e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5150 | -| time_elapsed | 38910 | -| total_timesteps | 659200 | -| train/ | | -| approx_kl | 0.0013332777 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.307 | -| explained_variance | 0.291 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 51490 | -| policy_gradient_loss | 0.000543 | -| std | 0.329 | -| value_loss | 0.000537 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5151 | -| time_elapsed | 38914 | -| total_timesteps | 659328 | -| train/ | | -| approx_kl | 0.028095214 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.306 | -| explained_variance | -508 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 51500 | -| policy_gradient_loss | -0.00201 | -| std | 0.328 | -| value_loss | 7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5152 | -| time_elapsed | 38917 | -| total_timesteps | 659456 | -| train/ | | -| approx_kl | 0.025867743 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.303 | -| explained_variance | -857 | -| learning_rate | 0.0003 | -| loss | -0.00725 | -| n_updates | 51510 | -| policy_gradient_loss | -0.00368 | -| std | 0.327 | -| value_loss | 1.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5153 | -| time_elapsed | 38921 | -| total_timesteps | 659584 | -| train/ | | -| approx_kl | 0.011378359 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.3 | -| explained_variance | -3.81 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 51520 | -| policy_gradient_loss | 0.000997 | -| std | 0.326 | -| value_loss | 2.37e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5154 | -| time_elapsed | 38924 | -| total_timesteps | 659712 | -| train/ | | -| approx_kl | 0.0028229952 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.297 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | 0.000117 | -| n_updates | 51530 | -| policy_gradient_loss | 9.3e-05 | -| std | 0.326 | -| value_loss | 2.79e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5155 | -| time_elapsed | 38926 | -| total_timesteps | 659840 | -| train/ | | -| approx_kl | 0.021068538 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.298 | -| explained_variance | -0.00707 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 51540 | -| policy_gradient_loss | -0.00848 | -| std | 0.326 | -| value_loss | 6.21e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 16 | -| iterations | 5156 | -| time_elapsed | 38928 | -| total_timesteps | 659968 | -| train/ | | -| approx_kl | 0.0003777123 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.299 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | 0.00015 | -| n_updates | 51550 | -| policy_gradient_loss | 0.000154 | -| std | 0.326 | -| value_loss | 2.09e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5157 | -| time_elapsed | 38932 | -| total_timesteps | 660096 | -| train/ | | -| approx_kl | 0.009903736 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | -0.299 | -| explained_variance | 0.00338 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 51560 | -| policy_gradient_loss | -0.0014 | -| std | 0.326 | -| value_loss | 9.12e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5158 | -| time_elapsed | 38940 | -| total_timesteps | 660224 | -| train/ | | -| approx_kl | 0.00011924142 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.295 | -| explained_variance | 0.888 | -| learning_rate | 0.0003 | -| loss | -0.000252 | -| n_updates | 51570 | -| policy_gradient_loss | -0.000224 | -| std | 0.324 | -| value_loss | 0.000571 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5159 | -| time_elapsed | 38944 | -| total_timesteps | 660352 | -| train/ | | -| approx_kl | 0.02382913 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -1.55e+03 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 51580 | -| policy_gradient_loss | -0.00227 | -| std | 0.324 | -| value_loss | 7.7e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5160 | -| time_elapsed | 38947 | -| total_timesteps | 660480 | -| train/ | | -| approx_kl | 0.0471716 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -341 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 51590 | -| policy_gradient_loss | -0.00848 | -| std | 0.324 | -| value_loss | 3.03e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5161 | -| time_elapsed | 38951 | -| total_timesteps | 660608 | -| train/ | | -| approx_kl | 0.02211453 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -6.56 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 51600 | -| policy_gradient_loss | 7.91e-05 | -| std | 0.324 | -| value_loss | 7.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5162 | -| time_elapsed | 38954 | -| total_timesteps | 660736 | -| train/ | | -| approx_kl | 0.020020483 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -56.3 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 51610 | -| policy_gradient_loss | -0.00181 | -| std | 0.324 | -| value_loss | 6.69e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5163 | -| time_elapsed | 38958 | -| total_timesteps | 660864 | -| train/ | | -| approx_kl | 0.019547692 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.29 | -| explained_variance | -4.22 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 51620 | -| policy_gradient_loss | -0.00276 | -| std | 0.323 | -| value_loss | 3.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 16 | -| iterations | 5164 | -| time_elapsed | 38962 | -| total_timesteps | 660992 | -| train/ | | -| approx_kl | 0.013923392 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | -0.289 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 51630 | -| policy_gradient_loss | -0.00413 | -| std | 0.323 | -| value_loss | 4.98e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5165 | -| time_elapsed | 38966 | -| total_timesteps | 661120 | -| train/ | | -| approx_kl | 0.014522599 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | -0.289 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 51640 | -| policy_gradient_loss | -0.00396 | -| std | 0.323 | -| value_loss | 2.59e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5166 | -| time_elapsed | 38976 | -| total_timesteps | 661248 | -| train/ | | -| approx_kl | 0.02563382 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.29 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 51650 | -| policy_gradient_loss | -0.00165 | -| std | 0.324 | -| value_loss | 2.83e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5167 | -| time_elapsed | 38980 | -| total_timesteps | 661376 | -| train/ | | -| approx_kl | 0.01052461 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.293 | -| explained_variance | -2.27e+03 | -| learning_rate | 0.0003 | -| loss | -0.00828 | -| n_updates | 51660 | -| policy_gradient_loss | -0.00265 | -| std | 0.324 | -| value_loss | 3.09e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5168 | -| time_elapsed | 38984 | -| total_timesteps | 661504 | -| train/ | | -| approx_kl | 0.00014532125 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.293 | -| explained_variance | -3.13e+03 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 51670 | -| policy_gradient_loss | 0.00189 | -| std | 0.324 | -| value_loss | 9.67e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5169 | -| time_elapsed | 38987 | -| total_timesteps | 661632 | -| train/ | | -| approx_kl | 0.002216735 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.293 | -| explained_variance | -682 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 51680 | -| policy_gradient_loss | 9.05e-05 | -| std | 0.324 | -| value_loss | 2.43e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5170 | -| time_elapsed | 38990 | -| total_timesteps | 661760 | -| train/ | | -| approx_kl | 0.018916493 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -0.849 | -| learning_rate | 0.0003 | -| loss | -0.00036 | -| n_updates | 51690 | -| policy_gradient_loss | -0.0012 | -| std | 0.324 | -| value_loss | 2.98e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.793 | -| time/ | | -| fps | 16 | -| iterations | 5171 | -| time_elapsed | 38994 | -| total_timesteps | 661888 | -| train/ | | -| approx_kl | 0.0037067048 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.291 | -| explained_variance | -7.65 | -| learning_rate | 0.0003 | -| loss | -0.000777 | -| n_updates | 51700 | -| policy_gradient_loss | -0.000308 | -| std | 0.324 | -| value_loss | 1.34e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5172 | -| time_elapsed | 38997 | -| total_timesteps | 662016 | -| train/ | | -| approx_kl | 0.025336295 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 51710 | -| policy_gradient_loss | -0.00958 | -| std | 0.324 | -| value_loss | 5.49e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5173 | -| time_elapsed | 39006 | -| total_timesteps | 662144 | -| train/ | | -| approx_kl | 0.013618732 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.293 | -| explained_variance | 0.687 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 51720 | -| policy_gradient_loss | -0.0115 | -| std | 0.324 | -| value_loss | 0.000418 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5174 | -| time_elapsed | 39010 | -| total_timesteps | 662272 | -| train/ | | -| approx_kl | 0.012804774 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -142 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 51730 | -| policy_gradient_loss | -0.00101 | -| std | 0.324 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5175 | -| time_elapsed | 39014 | -| total_timesteps | 662400 | -| train/ | | -| approx_kl | 0.012678748 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.29 | -| explained_variance | -478 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 51740 | -| policy_gradient_loss | -0.00959 | -| std | 0.323 | -| value_loss | 5.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5176 | -| time_elapsed | 39015 | -| total_timesteps | 662528 | -| train/ | | -| approx_kl | 0.008483787 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | -0.289 | -| explained_variance | -6.01 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 51750 | -| policy_gradient_loss | -0.000848 | -| std | 0.323 | -| value_loss | 2.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5177 | -| time_elapsed | 39018 | -| total_timesteps | 662656 | -| train/ | | -| approx_kl | 0.0016100216 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.287 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 51760 | -| policy_gradient_loss | 0.000772 | -| std | 0.322 | -| value_loss | 6.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5178 | -| time_elapsed | 39020 | -| total_timesteps | 662784 | -| train/ | | -| approx_kl | 0.044576053 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | -0.286 | -| explained_variance | -1.64 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 51770 | -| policy_gradient_loss | -0.0194 | -| std | 0.322 | -| value_loss | 6.14e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 16 | -| iterations | 5179 | -| time_elapsed | 39022 | -| total_timesteps | 662912 | -| train/ | | -| approx_kl | 0.01711372 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | -0.286 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.00683 | -| n_updates | 51780 | -| policy_gradient_loss | -0.00513 | -| std | 0.322 | -| value_loss | 3.65e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5180 | -| time_elapsed | 39024 | -| total_timesteps | 663040 | -| train/ | | -| approx_kl | 0.01511894 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | -0.286 | -| explained_variance | 0.00517 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 51790 | -| policy_gradient_loss | -0.00209 | -| std | 0.323 | -| value_loss | 1.64e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5181 | -| time_elapsed | 39031 | -| total_timesteps | 663168 | -| train/ | | -| approx_kl | 0.019821329 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.288 | -| explained_variance | 0.702 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 51800 | -| policy_gradient_loss | -0.0098 | -| std | 0.323 | -| value_loss | 0.00402 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5182 | -| time_elapsed | 39034 | -| total_timesteps | 663296 | -| train/ | | -| approx_kl | 0.013106525 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.289 | -| explained_variance | -251 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 51810 | -| policy_gradient_loss | -0.00647 | -| std | 0.323 | -| value_loss | 7.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5183 | -| time_elapsed | 39038 | -| total_timesteps | 663424 | -| train/ | | -| approx_kl | 0.090784274 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | -0.29 | -| explained_variance | -2.54e+03 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 51820 | -| policy_gradient_loss | -0.00565 | -| std | 0.323 | -| value_loss | 5.98e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5184 | -| time_elapsed | 39042 | -| total_timesteps | 663552 | -| train/ | | -| approx_kl | 0.023870142 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.291 | -| explained_variance | -265 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 51830 | -| policy_gradient_loss | -0.000922 | -| std | 0.324 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5185 | -| time_elapsed | 39046 | -| total_timesteps | 663680 | -| train/ | | -| approx_kl | 0.008381202 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.294 | -| explained_variance | -226 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 51840 | -| policy_gradient_loss | -0.00582 | -| std | 0.325 | -| value_loss | 1.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 16 | -| iterations | 5186 | -| time_elapsed | 39049 | -| total_timesteps | 663808 | -| train/ | | -| approx_kl | 0.031061243 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | -0.296 | -| explained_variance | -13.5 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 51850 | -| policy_gradient_loss | -0.00659 | -| std | 0.325 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.78 | -| time/ | | -| fps | 17 | -| iterations | 5187 | -| time_elapsed | 39053 | -| total_timesteps | 663936 | -| train/ | | -| approx_kl | 0.0035430766 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.296 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 51860 | -| policy_gradient_loss | -0.000136 | -| std | 0.325 | -| value_loss | 1.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5188 | -| time_elapsed | 39057 | -| total_timesteps | 664064 | -| train/ | | -| approx_kl | 0.026018865 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | -0.295 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | 0.00494 | -| n_updates | 51870 | -| policy_gradient_loss | -7.74e-06 | -| std | 0.325 | -| value_loss | 1.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5189 | -| time_elapsed | 39063 | -| total_timesteps | 664192 | -| train/ | | -| approx_kl | 0.03888893 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.295 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 51880 | -| policy_gradient_loss | -0.00634 | -| std | 0.325 | -| value_loss | 0.000126 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5190 | -| time_elapsed | 39066 | -| total_timesteps | 664320 | -| train/ | | -| approx_kl | 0.005058716 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.294 | -| explained_variance | -82.3 | -| learning_rate | 0.0003 | -| loss | 0.000239 | -| n_updates | 51890 | -| policy_gradient_loss | 0.000162 | -| std | 0.325 | -| value_loss | 4.52e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5191 | -| time_elapsed | 39070 | -| total_timesteps | 664448 | -| train/ | | -| approx_kl | 0.02115359 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | -0.296 | -| explained_variance | -2.55 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 51900 | -| policy_gradient_loss | -0.016 | -| std | 0.325 | -| value_loss | 6.42e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5192 | -| time_elapsed | 39073 | -| total_timesteps | 664576 | -| train/ | | -| approx_kl | 0.014642501 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.296 | -| explained_variance | -0.54 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 51910 | -| policy_gradient_loss | -0.00279 | -| std | 0.325 | -| value_loss | 1.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5193 | -| time_elapsed | 39076 | -| total_timesteps | 664704 | -| train/ | | -| approx_kl | 0.016955703 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.295 | -| explained_variance | 0.000873 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 51920 | -| policy_gradient_loss | -0.00786 | -| std | 0.325 | -| value_loss | 2.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5194 | -| time_elapsed | 39080 | -| total_timesteps | 664832 | -| train/ | | -| approx_kl | 0.017167041 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.294 | -| explained_variance | 0.00251 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 51930 | -| policy_gradient_loss | -0.0124 | -| std | 0.325 | -| value_loss | 5.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5195 | -| time_elapsed | 39083 | -| total_timesteps | 664960 | -| train/ | | -| approx_kl | 0.020588614 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.294 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 51940 | -| policy_gradient_loss | -0.00434 | -| std | 0.324 | -| value_loss | 1.17e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5196 | -| time_elapsed | 39088 | -| total_timesteps | 665088 | -| train/ | | -| approx_kl | 1.8531922e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.000337 | -| n_updates | 51950 | -| policy_gradient_loss | -0.00013 | -| std | 0.323 | -| value_loss | 4.4e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5197 | -| time_elapsed | 39096 | -| total_timesteps | 665216 | -| train/ | | -| approx_kl | 0.009433307 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.288 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 51960 | -| policy_gradient_loss | -0.0146 | -| std | 0.322 | -| value_loss | 0.000231 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5198 | -| time_elapsed | 39099 | -| total_timesteps | 665344 | -| train/ | | -| approx_kl | 0.02280756 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.287 | -| explained_variance | -4.89 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 51970 | -| policy_gradient_loss | -0.0109 | -| std | 0.322 | -| value_loss | 1.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5199 | -| time_elapsed | 39103 | -| total_timesteps | 665472 | -| train/ | | -| approx_kl | 0.015230043 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.286 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | -0.00595 | -| n_updates | 51980 | -| policy_gradient_loss | -0.00277 | -| std | 0.322 | -| value_loss | 1.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5200 | -| time_elapsed | 39107 | -| total_timesteps | 665600 | -| train/ | | -| approx_kl | 0.008889316 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.287 | -| explained_variance | -0.452 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 51990 | -| policy_gradient_loss | -0.00158 | -| std | 0.323 | -| value_loss | 5.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5201 | -| time_elapsed | 39110 | -| total_timesteps | 665728 | -| train/ | | -| approx_kl | 0.01353741 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.288 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 52000 | -| policy_gradient_loss | -0.00495 | -| std | 0.323 | -| value_loss | 3.81e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5202 | -| time_elapsed | 39114 | -| total_timesteps | 665856 | -| train/ | | -| approx_kl | 0.010500114 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.289 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 52010 | -| policy_gradient_loss | -0.00102 | -| std | 0.324 | -| value_loss | 2.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5203 | -| time_elapsed | 39117 | -| total_timesteps | 665984 | -| train/ | | -| approx_kl | 0.010931359 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | 0.00471 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 52020 | -| policy_gradient_loss | -0.00116 | -| std | 0.324 | -| value_loss | 8.61e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5204 | -| time_elapsed | 39121 | -| total_timesteps | 666112 | -| train/ | | -| approx_kl | 0.0048352997 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -0.00179 | -| learning_rate | 0.0003 | -| loss | -0.000311 | -| n_updates | 52030 | -| policy_gradient_loss | -0.000171 | -| std | 0.324 | -| value_loss | 4.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5205 | -| time_elapsed | 39128 | -| total_timesteps | 666240 | -| train/ | | -| approx_kl | 0.012819447 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | 0.768 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 52040 | -| policy_gradient_loss | -0.0106 | -| std | 0.324 | -| value_loss | 0.000525 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5206 | -| time_elapsed | 39131 | -| total_timesteps | 666368 | -| train/ | | -| approx_kl | 0.006107307 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.292 | -| explained_variance | -206 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 52050 | -| policy_gradient_loss | -0.00553 | -| std | 0.324 | -| value_loss | 6.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5207 | -| time_elapsed | 39135 | -| total_timesteps | 666496 | -| train/ | | -| approx_kl | 0.010938557 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.293 | -| explained_variance | -264 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 52060 | -| policy_gradient_loss | -0.00514 | -| std | 0.325 | -| value_loss | 1.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5208 | -| time_elapsed | 39137 | -| total_timesteps | 666624 | -| train/ | | -| approx_kl | 0.0033828337 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.294 | -| explained_variance | -9.84 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 52070 | -| policy_gradient_loss | -0.000161 | -| std | 0.324 | -| value_loss | 9.92e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5209 | -| time_elapsed | 39141 | -| total_timesteps | 666752 | -| train/ | | -| approx_kl | 0.0009398144 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.291 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.000969 | -| n_updates | 52080 | -| policy_gradient_loss | 7.04e-05 | -| std | 0.323 | -| value_loss | 2.26e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 17 | -| iterations | 5210 | -| time_elapsed | 39145 | -| total_timesteps | 666880 | -| train/ | | -| approx_kl | 0.0029056938 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.287 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 52090 | -| policy_gradient_loss | -0.000293 | -| std | 0.321 | -| value_loss | 1.42e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5211 | -| time_elapsed | 39147 | -| total_timesteps | 667008 | -| train/ | | -| approx_kl | 0.015672622 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.282 | -| explained_variance | 0.000509 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 52100 | -| policy_gradient_loss | -0.003 | -| std | 0.321 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5212 | -| time_elapsed | 39156 | -| total_timesteps | 667136 | -| train/ | | -| approx_kl | 0.009415632 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.281 | -| explained_variance | 0.692 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 52110 | -| policy_gradient_loss | -0.00751 | -| std | 0.32 | -| value_loss | 0.000505 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5213 | -| time_elapsed | 39160 | -| total_timesteps | 667264 | -| train/ | | -| approx_kl | 0.017460693 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | -0.28 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 52120 | -| policy_gradient_loss | -0.000957 | -| std | 0.32 | -| value_loss | 3.97e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5214 | -| time_elapsed | 39164 | -| total_timesteps | 667392 | -| train/ | | -| approx_kl | 0.02119049 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -64.1 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 52130 | -| policy_gradient_loss | -0.00978 | -| std | 0.319 | -| value_loss | 1.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5215 | -| time_elapsed | 39168 | -| total_timesteps | 667520 | -| train/ | | -| approx_kl | 0.027841868 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -29.5 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 52140 | -| policy_gradient_loss | -0.00857 | -| std | 0.319 | -| value_loss | 3.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5216 | -| time_elapsed | 39171 | -| total_timesteps | 667648 | -| train/ | | -| approx_kl | 0.017120076 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -0.837 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 52150 | -| policy_gradient_loss | -0.00464 | -| std | 0.319 | -| value_loss | 4.28e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5217 | -| time_elapsed | 39175 | -| total_timesteps | 667776 | -| train/ | | -| approx_kl | 0.0044994284 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.278 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | 0.000383 | -| n_updates | 52160 | -| policy_gradient_loss | 0.000893 | -| std | 0.32 | -| value_loss | 2.52e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5218 | -| time_elapsed | 39178 | -| total_timesteps | 667904 | -| train/ | | -| approx_kl | 0.008354548 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.278 | -| explained_variance | 0.00295 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 52170 | -| policy_gradient_loss | -0.00128 | -| std | 0.319 | -| value_loss | 8.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5219 | -| time_elapsed | 39181 | -| total_timesteps | 668032 | -| train/ | | -| approx_kl | 0.0093576815 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.276 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 52180 | -| policy_gradient_loss | -0.00227 | -| std | 0.319 | -| value_loss | 5.24e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5220 | -| time_elapsed | 39188 | -| total_timesteps | 668160 | -| train/ | | -| approx_kl | 0.0032200688 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.276 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 52190 | -| policy_gradient_loss | -0.00353 | -| std | 0.319 | -| value_loss | 5.08e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5221 | -| time_elapsed | 39193 | -| total_timesteps | 668288 | -| train/ | | -| approx_kl | 0.0028491043 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -87.8 | -| learning_rate | 0.0003 | -| loss | -0.00343 | -| n_updates | 52200 | -| policy_gradient_loss | -2.68e-05 | -| std | 0.319 | -| value_loss | 2.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5222 | -| time_elapsed | 39196 | -| total_timesteps | 668416 | -| train/ | | -| approx_kl | 0.0014662747 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.278 | -| explained_variance | -49.7 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 52210 | -| policy_gradient_loss | 0.000817 | -| std | 0.319 | -| value_loss | 6.01e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5223 | -| time_elapsed | 39199 | -| total_timesteps | 668544 | -| train/ | | -| approx_kl | 0.025512611 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 52220 | -| policy_gradient_loss | -0.00783 | -| std | 0.319 | -| value_loss | 1.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5224 | -| time_elapsed | 39202 | -| total_timesteps | 668672 | -| train/ | | -| approx_kl | 0.011752108 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -0.0741 | -| learning_rate | 0.0003 | -| loss | -0.000756 | -| n_updates | 52230 | -| policy_gradient_loss | -0.00202 | -| std | 0.319 | -| value_loss | 3.44e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5225 | -| time_elapsed | 39206 | -| total_timesteps | 668800 | -| train/ | | -| approx_kl | 0.012496015 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.276 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 52240 | -| policy_gradient_loss | -0.00497 | -| std | 0.318 | -| value_loss | 1.81e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.785 | -| time/ | | -| fps | 17 | -| iterations | 5226 | -| time_elapsed | 39209 | -| total_timesteps | 668928 | -| train/ | | -| approx_kl | 0.015355378 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.273 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.000712 | -| n_updates | 52250 | -| policy_gradient_loss | -0.0015 | -| std | 0.318 | -| value_loss | 5.59e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5227 | -| time_elapsed | 39213 | -| total_timesteps | 669056 | -| train/ | | -| approx_kl | 0.0105214175 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.272 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 52260 | -| policy_gradient_loss | -0.00143 | -| std | 0.317 | -| value_loss | 9.28e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5228 | -| time_elapsed | 39218 | -| total_timesteps | 669184 | -| train/ | | -| approx_kl | 0.0020662816 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.27 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 52270 | -| policy_gradient_loss | -0.00101 | -| std | 0.316 | -| value_loss | 5.19e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5229 | -| time_elapsed | 39221 | -| total_timesteps | 669312 | -| train/ | | -| approx_kl | 0.02465408 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -828 | -| learning_rate | 0.0003 | -| loss | -0.00865 | -| n_updates | 52280 | -| policy_gradient_loss | -0.00372 | -| std | 0.316 | -| value_loss | 7.23e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5230 | -| time_elapsed | 39225 | -| total_timesteps | 669440 | -| train/ | | -| approx_kl | 5.220808e-05 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | 0.00164 | -| n_updates | 52290 | -| policy_gradient_loss | 0.0106 | -| std | 0.315 | -| value_loss | 2.08e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5231 | -| time_elapsed | 39228 | -| total_timesteps | 669568 | -| train/ | | -| approx_kl | 0.065586984 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -34.2 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 52300 | -| policy_gradient_loss | -0.0052 | -| std | 0.315 | -| value_loss | 6.78e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5232 | -| time_elapsed | 39232 | -| total_timesteps | 669696 | -| train/ | | -| approx_kl | 0.032602753 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -4.18 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 52310 | -| policy_gradient_loss | -0.00365 | -| std | 0.315 | -| value_loss | 3.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5233 | -| time_elapsed | 39234 | -| total_timesteps | 669824 | -| train/ | | -| approx_kl | 0.011497769 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.263 | -| explained_variance | -0.00764 | -| learning_rate | 0.0003 | -| loss | 0.000356 | -| n_updates | 52320 | -| policy_gradient_loss | -0.000521 | -| std | 0.315 | -| value_loss | 3.9e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5234 | -| time_elapsed | 39237 | -| total_timesteps | 669952 | -| train/ | | -| approx_kl | 0.01577235 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.00308 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 52330 | -| policy_gradient_loss | -0.00342 | -| std | 0.315 | -| value_loss | 5.45e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5235 | -| time_elapsed | 39239 | -| total_timesteps | 670080 | -| train/ | | -| approx_kl | 0.022738691 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 52340 | -| policy_gradient_loss | -0.00956 | -| std | 0.316 | -| value_loss | 7.1e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5236 | -| time_elapsed | 39243 | -| total_timesteps | 670208 | -| train/ | | -| approx_kl | 0.010305234 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 52350 | -| policy_gradient_loss | -0.0131 | -| std | 0.316 | -| value_loss | 0.0001 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5237 | -| time_elapsed | 39244 | -| total_timesteps | 670336 | -| train/ | | -| approx_kl | 0.03217443 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -1.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.00997 | -| n_updates | 52360 | -| policy_gradient_loss | -0.00502 | -| std | 0.316 | -| value_loss | 7.88e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5238 | -| time_elapsed | 39247 | -| total_timesteps | 670464 | -| train/ | | -| approx_kl | 0.00019611791 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -367 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 52370 | -| policy_gradient_loss | 0.00258 | -| std | 0.315 | -| value_loss | 2.36e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5239 | -| time_elapsed | 39250 | -| total_timesteps | 670592 | -| train/ | | -| approx_kl | 0.0024091373 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -8.8 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 52380 | -| policy_gradient_loss | 0.000193 | -| std | 0.315 | -| value_loss | 1.35e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5240 | -| time_elapsed | 39252 | -| total_timesteps | 670720 | -| train/ | | -| approx_kl | 0.0012916196 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 52390 | -| policy_gradient_loss | 0.0028 | -| std | 0.315 | -| value_loss | 1.33e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5241 | -| time_elapsed | 39256 | -| total_timesteps | 670848 | -| train/ | | -| approx_kl | 0.0014716866 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 52400 | -| policy_gradient_loss | 0.000478 | -| std | 0.315 | -| value_loss | 2.05e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5242 | -| time_elapsed | 39259 | -| total_timesteps | 670976 | -| train/ | | -| approx_kl | 0.0016894974 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 52410 | -| policy_gradient_loss | 0.000663 | -| std | 0.316 | -| value_loss | 1.41e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5243 | -| time_elapsed | 39262 | -| total_timesteps | 671104 | -| train/ | | -| approx_kl | 0.0012740227 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 52420 | -| policy_gradient_loss | 0.000228 | -| std | 0.316 | -| value_loss | 2.62e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5244 | -| time_elapsed | 39270 | -| total_timesteps | 671232 | -| train/ | | -| approx_kl | 0.01724818 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -4.07 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 52430 | -| policy_gradient_loss | -0.0124 | -| std | 0.316 | -| value_loss | 0.00141 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5245 | -| time_elapsed | 39273 | -| total_timesteps | 671360 | -| train/ | | -| approx_kl | 0.024195012 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -2.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 52440 | -| policy_gradient_loss | -0.0131 | -| std | 0.316 | -| value_loss | 1.99e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5246 | -| time_elapsed | 39276 | -| total_timesteps | 671488 | -| train/ | | -| approx_kl | 0.024828758 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -61.6 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 52450 | -| policy_gradient_loss | -0.00928 | -| std | 0.316 | -| value_loss | 8.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5247 | -| time_elapsed | 39280 | -| total_timesteps | 671616 | -| train/ | | -| approx_kl | 0.010370964 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -0.877 | -| learning_rate | 0.0003 | -| loss | 0.000724 | -| n_updates | 52460 | -| policy_gradient_loss | 0.000187 | -| std | 0.316 | -| value_loss | 1.12e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5248 | -| time_elapsed | 39283 | -| total_timesteps | 671744 | -| train/ | | -| approx_kl | 0.0049742474 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 52470 | -| policy_gradient_loss | -0.00105 | -| std | 0.317 | -| value_loss | 6.77e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5249 | -| time_elapsed | 39286 | -| total_timesteps | 671872 | -| train/ | | -| approx_kl | 0.01272831 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.271 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 52480 | -| policy_gradient_loss | -0.0027 | -| std | 0.318 | -| value_loss | 2.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5250 | -| time_elapsed | 39289 | -| total_timesteps | 672000 | -| train/ | | -| approx_kl | 0.020226873 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.274 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00063 | -| n_updates | 52490 | -| policy_gradient_loss | -0.00164 | -| std | 0.319 | -| value_loss | 1.78e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5251 | -| time_elapsed | 39292 | -| total_timesteps | 672128 | -| train/ | | -| approx_kl | 0.01161978 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | -0.275 | -| explained_variance | -0.00165 | -| learning_rate | 0.0003 | -| loss | -0.00574 | -| n_updates | 52500 | -| policy_gradient_loss | -0.00396 | -| std | 0.319 | -| value_loss | 1.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5252 | -| time_elapsed | 39299 | -| total_timesteps | 672256 | -| train/ | | -| approx_kl | 0.053757347 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.275 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 52510 | -| policy_gradient_loss | -0.0176 | -| std | 0.318 | -| value_loss | 1.2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5253 | -| time_elapsed | 39302 | -| total_timesteps | 672384 | -| train/ | | -| approx_kl | 0.014963532 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.275 | -| explained_variance | -1.96 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 52520 | -| policy_gradient_loss | -0.000164 | -| std | 0.319 | -| value_loss | 3.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5254 | -| time_elapsed | 39306 | -| total_timesteps | 672512 | -| train/ | | -| approx_kl | 0.020544501 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.276 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | -0.00532 | -| n_updates | 52530 | -| policy_gradient_loss | -0.00441 | -| std | 0.319 | -| value_loss | 1.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5255 | -| time_elapsed | 39309 | -| total_timesteps | 672640 | -| train/ | | -| approx_kl | 0.019520037 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -0.277 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 52540 | -| policy_gradient_loss | -0.00642 | -| std | 0.319 | -| value_loss | 2.33e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5256 | -| time_elapsed | 39313 | -| total_timesteps | 672768 | -| train/ | | -| approx_kl | 0.018212607 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | -0.276 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.000639 | -| n_updates | 52550 | -| policy_gradient_loss | -0.0012 | -| std | 0.318 | -| value_loss | 1.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5257 | -| time_elapsed | 39316 | -| total_timesteps | 672896 | -| train/ | | -| approx_kl | 0.012118897 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | -0.274 | -| explained_variance | -0.00305 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 52560 | -| policy_gradient_loss | -0.000346 | -| std | 0.318 | -| value_loss | 9.9e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5258 | -| time_elapsed | 39318 | -| total_timesteps | 673024 | -| train/ | | -| approx_kl | 9.4690826e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.273 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | -0.000322 | -| n_updates | 52570 | -| policy_gradient_loss | -0.000119 | -| std | 0.317 | -| value_loss | 2.18e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5259 | -| time_elapsed | 39327 | -| total_timesteps | 673152 | -| train/ | | -| approx_kl | 0.0023260913 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | -0.27 | -| explained_variance | 0.723 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 52580 | -| policy_gradient_loss | -0.0138 | -| std | 0.316 | -| value_loss | 0.00236 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5260 | -| time_elapsed | 39332 | -| total_timesteps | 673280 | -| train/ | | -| approx_kl | 0.011740085 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -382 | -| learning_rate | 0.0003 | -| loss | -0.000214 | -| n_updates | 52590 | -| policy_gradient_loss | -0.000229 | -| std | 0.316 | -| value_loss | 1.12e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5261 | -| time_elapsed | 39335 | -| total_timesteps | 673408 | -| train/ | | -| approx_kl | 0.02127511 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | -2.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 52600 | -| policy_gradient_loss | -0.0017 | -| std | 0.317 | -| value_loss | 4.86e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5262 | -| time_elapsed | 39337 | -| total_timesteps | 673536 | -| train/ | | -| approx_kl | 0.017401598 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -0.27 | -| explained_variance | -17.6 | -| learning_rate | 0.0003 | -| loss | -0.000891 | -| n_updates | 52610 | -| policy_gradient_loss | -0.000661 | -| std | 0.317 | -| value_loss | 3.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5263 | -| time_elapsed | 39341 | -| total_timesteps | 673664 | -| train/ | | -| approx_kl | 0.010918789 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.272 | -| explained_variance | -81 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 52620 | -| policy_gradient_loss | -0.00144 | -| std | 0.317 | -| value_loss | 2.86e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5264 | -| time_elapsed | 39344 | -| total_timesteps | 673792 | -| train/ | | -| approx_kl | 0.0019452716 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.271 | -| explained_variance | -4.07 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 52630 | -| policy_gradient_loss | 0.000322 | -| std | 0.317 | -| value_loss | 1.7e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5265 | -| time_elapsed | 39348 | -| total_timesteps | 673920 | -| train/ | | -| approx_kl | 0.0011924212 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.27 | -| explained_variance | -0.969 | -| learning_rate | 0.0003 | -| loss | -0.00595 | -| n_updates | 52640 | -| policy_gradient_loss | 0.00152 | -| std | 0.317 | -| value_loss | 4.92e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5266 | -| time_elapsed | 39350 | -| total_timesteps | 674048 | -| train/ | | -| approx_kl | 0.013683228 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.27 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 52650 | -| policy_gradient_loss | -0.00184 | -| std | 0.317 | -| value_loss | 3.87e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5267 | -| time_elapsed | 39356 | -| total_timesteps | 674176 | -| train/ | | -| approx_kl | 0.0046434025 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.272 | -| explained_variance | 0.244 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 52660 | -| policy_gradient_loss | -0.00829 | -| std | 0.318 | -| value_loss | 0.000647 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5268 | -| time_elapsed | 39360 | -| total_timesteps | 674304 | -| train/ | | -| approx_kl | 0.036099676 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.273 | -| explained_variance | -1.7e+03 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 52670 | -| policy_gradient_loss | -0.00588 | -| std | 0.318 | -| value_loss | 7.08e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5269 | -| time_elapsed | 39364 | -| total_timesteps | 674432 | -| train/ | | -| approx_kl | 0.0016006907 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.272 | -| explained_variance | -1.56e+03 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 52680 | -| policy_gradient_loss | 0.000349 | -| std | 0.317 | -| value_loss | 1.17e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5270 | -| time_elapsed | 39368 | -| total_timesteps | 674560 | -| train/ | | -| approx_kl | 0.0017765136 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.271 | -| explained_variance | -264 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 52690 | -| policy_gradient_loss | 0.00113 | -| std | 0.317 | -| value_loss | 1.91e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5271 | -| time_elapsed | 39371 | -| total_timesteps | 674688 | -| train/ | | -| approx_kl | 0.00083718775 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -0.000897 | -| n_updates | 52700 | -| policy_gradient_loss | 0.000211 | -| std | 0.316 | -| value_loss | 6.19e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5272 | -| time_elapsed | 39374 | -| total_timesteps | 674816 | -| train/ | | -| approx_kl | 0.019471744 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 52710 | -| policy_gradient_loss | 0.000684 | -| std | 0.315 | -| value_loss | 3.53e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5273 | -| time_elapsed | 39378 | -| total_timesteps | 674944 | -| train/ | | -| approx_kl | 0.028126225 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 52720 | -| policy_gradient_loss | -0.0137 | -| std | 0.315 | -| value_loss | 3.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5274 | -| time_elapsed | 39382 | -| total_timesteps | 675072 | -| train/ | | -| approx_kl | 0.008271826 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 52730 | -| policy_gradient_loss | -0.00585 | -| std | 0.315 | -| value_loss | 6.16e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5275 | -| time_elapsed | 39387 | -| total_timesteps | 675200 | -| train/ | | -| approx_kl | 0.011089148 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.263 | -| explained_variance | 0.598 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 52740 | -| policy_gradient_loss | -0.0141 | -| std | 0.314 | -| value_loss | 0.00731 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5276 | -| time_elapsed | 39391 | -| total_timesteps | 675328 | -| train/ | | -| approx_kl | 0.011042645 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.263 | -| explained_variance | -2.43e+03 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 52750 | -| policy_gradient_loss | -0.00108 | -| std | 0.315 | -| value_loss | 4.3e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5277 | -| time_elapsed | 39394 | -| total_timesteps | 675456 | -| train/ | | -| approx_kl | 0.04357417 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -782 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 52760 | -| policy_gradient_loss | -0.00339 | -| std | 0.316 | -| value_loss | 2.57e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5278 | -| time_elapsed | 39398 | -| total_timesteps | 675584 | -| train/ | | -| approx_kl | 0.024526834 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.00984 | -| n_updates | 52770 | -| policy_gradient_loss | -0.00688 | -| std | 0.316 | -| value_loss | 6.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5279 | -| time_elapsed | 39402 | -| total_timesteps | 675712 | -| train/ | | -| approx_kl | 0.013177125 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -8.2 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 52780 | -| policy_gradient_loss | -0.00748 | -| std | 0.316 | -| value_loss | 3.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5280 | -| time_elapsed | 39406 | -| total_timesteps | 675840 | -| train/ | | -| approx_kl | 0.011060813 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 52790 | -| policy_gradient_loss | -0.0019 | -| std | 0.316 | -| value_loss | 2.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5281 | -| time_elapsed | 39409 | -| total_timesteps | 675968 | -| train/ | | -| approx_kl | 0.018559143 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | 0.00675 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 52800 | -| policy_gradient_loss | -0.013 | -| std | 0.316 | -| value_loss | 3.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5282 | -| time_elapsed | 39413 | -| total_timesteps | 676096 | -| train/ | | -| approx_kl | 0.021330819 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 52810 | -| policy_gradient_loss | -0.00566 | -| std | 0.316 | -| value_loss | 2.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5283 | -| time_elapsed | 39423 | -| total_timesteps | 676224 | -| train/ | | -| approx_kl | 0.01781386 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 52820 | -| policy_gradient_loss | -0.0171 | -| std | 0.316 | -| value_loss | 0.000451 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5284 | -| time_elapsed | 39425 | -| total_timesteps | 676352 | -| train/ | | -| approx_kl | 0.027656056 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -529 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 52830 | -| policy_gradient_loss | -0.00594 | -| std | 0.316 | -| value_loss | 6.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5285 | -| time_elapsed | 39427 | -| total_timesteps | 676480 | -| train/ | | -| approx_kl | 0.045057893 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -209 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 52840 | -| policy_gradient_loss | -0.00506 | -| std | 0.315 | -| value_loss | 2.27e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5286 | -| time_elapsed | 39431 | -| total_timesteps | 676608 | -| train/ | | -| approx_kl | 0.0095772855 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -8.02 | -| learning_rate | 0.0003 | -| loss | -0.00774 | -| n_updates | 52850 | -| policy_gradient_loss | -0.00223 | -| std | 0.315 | -| value_loss | 3.91e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5287 | -| time_elapsed | 39434 | -| total_timesteps | 676736 | -| train/ | | -| approx_kl | 0.00030613877 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.531 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 52860 | -| policy_gradient_loss | 0.00103 | -| std | 0.315 | -| value_loss | 6.52e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5288 | -| time_elapsed | 39437 | -| total_timesteps | 676864 | -| train/ | | -| approx_kl | 0.0024921885 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 52870 | -| policy_gradient_loss | 0.000347 | -| std | 0.315 | -| value_loss | 5.71e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5289 | -| time_elapsed | 39441 | -| total_timesteps | 676992 | -| train/ | | -| approx_kl | 0.021586407 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | -0.262 | -| explained_variance | -0.000319 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 52880 | -| policy_gradient_loss | -0.000403 | -| std | 0.314 | -| value_loss | 2.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5290 | -| time_elapsed | 39444 | -| total_timesteps | 677120 | -| train/ | | -| approx_kl | 0.018372875 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.261 | -| explained_variance | -0.00775 | -| learning_rate | 0.0003 | -| loss | -0.00864 | -| n_updates | 52890 | -| policy_gradient_loss | -0.00826 | -| std | 0.314 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5291 | -| time_elapsed | 39454 | -| total_timesteps | 677248 | -| train/ | | -| approx_kl | 0.0059631257 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.26 | -| explained_variance | 0.861 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 52900 | -| policy_gradient_loss | -0.00976 | -| std | 0.314 | -| value_loss | 0.00147 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5292 | -| time_elapsed | 39457 | -| total_timesteps | 677376 | -| train/ | | -| approx_kl | 0.011756482 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | -0.259 | -| explained_variance | -225 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 52910 | -| policy_gradient_loss | -0.00126 | -| std | 0.314 | -| value_loss | 3.93e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5293 | -| time_elapsed | 39460 | -| total_timesteps | 677504 | -| train/ | | -| approx_kl | 0.0044678 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.26 | -| explained_variance | -3.21e+03 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 52920 | -| policy_gradient_loss | -0.000635 | -| std | 0.314 | -| value_loss | 2.55e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5294 | -| time_elapsed | 39465 | -| total_timesteps | 677632 | -| train/ | | -| approx_kl | 0.052567855 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | -0.262 | -| explained_variance | -18.5 | -| learning_rate | 0.0003 | -| loss | -0.000763 | -| n_updates | 52930 | -| policy_gradient_loss | -0.00324 | -| std | 0.315 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5295 | -| time_elapsed | 39469 | -| total_timesteps | 677760 | -| train/ | | -| approx_kl | 0.020987054 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.262 | -| explained_variance | -0.687 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 52940 | -| policy_gradient_loss | -0.0122 | -| std | 0.315 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5296 | -| time_elapsed | 39472 | -| total_timesteps | 677888 | -| train/ | | -| approx_kl | 0.0070214584 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.263 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | 0.000435 | -| n_updates | 52950 | -| policy_gradient_loss | -0.000323 | -| std | 0.316 | -| value_loss | 6.83e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5297 | -| time_elapsed | 39475 | -| total_timesteps | 678016 | -| train/ | | -| approx_kl | 0.014840418 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -0.00602 | -| learning_rate | 0.0003 | -| loss | -0.0088 | -| n_updates | 52960 | -| policy_gradient_loss | -0.00641 | -| std | 0.316 | -| value_loss | 3.81e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5298 | -| time_elapsed | 39483 | -| total_timesteps | 678144 | -| train/ | | -| approx_kl | 0.056336433 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 52970 | -| policy_gradient_loss | -0.0101 | -| std | 0.316 | -| value_loss | 4.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5299 | -| time_elapsed | 39486 | -| total_timesteps | 678272 | -| train/ | | -| approx_kl | 0.0055307546 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -69 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 52980 | -| policy_gradient_loss | -0.000342 | -| std | 0.316 | -| value_loss | 1.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5300 | -| time_elapsed | 39489 | -| total_timesteps | 678400 | -| train/ | | -| approx_kl | 0.036617704 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -32.2 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 52990 | -| policy_gradient_loss | -0.0119 | -| std | 0.316 | -| value_loss | 2.6e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5301 | -| time_elapsed | 39493 | -| total_timesteps | 678528 | -| train/ | | -| approx_kl | 0.0035292632 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -0.641 | -| learning_rate | 0.0003 | -| loss | -0.000452 | -| n_updates | 53000 | -| policy_gradient_loss | -0.000279 | -| std | 0.315 | -| value_loss | 7.27e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5302 | -| time_elapsed | 39497 | -| total_timesteps | 678656 | -| train/ | | -| approx_kl | 0.0069890604 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 53010 | -| policy_gradient_loss | 0.000294 | -| std | 0.315 | -| value_loss | 7.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5303 | -| time_elapsed | 39501 | -| total_timesteps | 678784 | -| train/ | | -| approx_kl | 0.013344621 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.263 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 53020 | -| policy_gradient_loss | -0.00364 | -| std | 0.315 | -| value_loss | 3.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5304 | -| time_elapsed | 39504 | -| total_timesteps | 678912 | -| train/ | | -| approx_kl | 0.018359741 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.00132 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 53030 | -| policy_gradient_loss | -0.00316 | -| std | 0.315 | -| value_loss | 1.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5305 | -| time_elapsed | 39508 | -| total_timesteps | 679040 | -| train/ | | -| approx_kl | 0.0121935075 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.265 | -| explained_variance | -0.00613 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 53040 | -| policy_gradient_loss | -0.0024 | -| std | 0.315 | -| value_loss | 1.08e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5306 | -| time_elapsed | 39515 | -| total_timesteps | 679168 | -| train/ | | -| approx_kl | 0.043032955 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 53050 | -| policy_gradient_loss | -0.0191 | -| std | 0.316 | -| value_loss | 0.000111 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5307 | -| time_elapsed | 39518 | -| total_timesteps | 679296 | -| train/ | | -| approx_kl | 0.03881158 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 53060 | -| policy_gradient_loss | -0.00352 | -| std | 0.316 | -| value_loss | 1.85e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5308 | -| time_elapsed | 39522 | -| total_timesteps | 679424 | -| train/ | | -| approx_kl | 0.035905432 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -1.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 53070 | -| policy_gradient_loss | -0.00784 | -| std | 0.316 | -| value_loss | 5.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5309 | -| time_elapsed | 39526 | -| total_timesteps | 679552 | -| train/ | | -| approx_kl | 0.022252008 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -93.9 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 53080 | -| policy_gradient_loss | -0.00379 | -| std | 0.316 | -| value_loss | 2.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5310 | -| time_elapsed | 39528 | -| total_timesteps | 679680 | -| train/ | | -| approx_kl | 0.020069607 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 53090 | -| policy_gradient_loss | -0.00494 | -| std | 0.316 | -| value_loss | 1.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5311 | -| time_elapsed | 39532 | -| total_timesteps | 679808 | -| train/ | | -| approx_kl | 0.013463338 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 53100 | -| policy_gradient_loss | -0.00357 | -| std | 0.317 | -| value_loss | 3.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.779 | -| time/ | | -| fps | 17 | -| iterations | 5312 | -| time_elapsed | 39534 | -| total_timesteps | 679936 | -| train/ | | -| approx_kl | 0.024947058 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | 0.0016 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 53110 | -| policy_gradient_loss | -0.0123 | -| std | 0.317 | -| value_loss | 9.41e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5313 | -| time_elapsed | 39537 | -| total_timesteps | 680064 | -| train/ | | -| approx_kl | 0.013480019 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 53120 | -| policy_gradient_loss | -0.00658 | -| std | 0.317 | -| value_loss | 6.02e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5314 | -| time_elapsed | 39543 | -| total_timesteps | 680192 | -| train/ | | -| approx_kl | 0.0136654535 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.27 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 53130 | -| policy_gradient_loss | -0.0156 | -| std | 0.317 | -| value_loss | 1.21e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5315 | -| time_elapsed | 39547 | -| total_timesteps | 680320 | -| train/ | | -| approx_kl | 0.02684224 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | -658 | -| learning_rate | 0.0003 | -| loss | -0.00979 | -| n_updates | 53140 | -| policy_gradient_loss | -0.00792 | -| std | 0.317 | -| value_loss | 2.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5316 | -| time_elapsed | 39550 | -| total_timesteps | 680448 | -| train/ | | -| approx_kl | 0.023509935 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -0.269 | -| explained_variance | -392 | -| learning_rate | 0.0003 | -| loss | -0.00996 | -| n_updates | 53150 | -| policy_gradient_loss | -0.00421 | -| std | 0.316 | -| value_loss | 7.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5317 | -| time_elapsed | 39553 | -| total_timesteps | 680576 | -| train/ | | -| approx_kl | 0.025379334 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | -0.268 | -| explained_variance | -3.22 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 53160 | -| policy_gradient_loss | -0.000676 | -| std | 0.316 | -| value_loss | 3.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5318 | -| time_elapsed | 39555 | -| total_timesteps | 680704 | -| train/ | | -| approx_kl | 0.039615527 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | -0.267 | -| explained_variance | -2.14 | -| learning_rate | 0.0003 | -| loss | -0.00897 | -| n_updates | 53170 | -| policy_gradient_loss | -0.00795 | -| std | 0.316 | -| value_loss | 1.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5319 | -| time_elapsed | 39558 | -| total_timesteps | 680832 | -| train/ | | -| approx_kl | 0.005676177 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.266 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 53180 | -| policy_gradient_loss | -0.00103 | -| std | 0.315 | -| value_loss | 1.9e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5320 | -| time_elapsed | 39561 | -| total_timesteps | 680960 | -| train/ | | -| approx_kl | 0.0052447952 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.264 | -| explained_variance | -0.000617 | -| learning_rate | 0.0003 | -| loss | -0.00027 | -| n_updates | 53190 | -| policy_gradient_loss | -0.000332 | -| std | 0.315 | -| value_loss | 1.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5321 | -| time_elapsed | 39563 | -| total_timesteps | 681088 | -| train/ | | -| approx_kl | 0.014246153 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.262 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | -0.00839 | -| n_updates | 53200 | -| policy_gradient_loss | -0.00423 | -| std | 0.314 | -| value_loss | 2.16e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5322 | -| time_elapsed | 39568 | -| total_timesteps | 681216 | -| train/ | | -| approx_kl | 0.030592043 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.261 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 53210 | -| policy_gradient_loss | -0.0163 | -| std | 0.314 | -| value_loss | 9.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5323 | -| time_elapsed | 39570 | -| total_timesteps | 681344 | -| train/ | | -| approx_kl | 0.016258756 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.259 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.00492 | -| n_updates | 53220 | -| policy_gradient_loss | -0.00297 | -| std | 0.313 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5324 | -| time_elapsed | 39572 | -| total_timesteps | 681472 | -| train/ | | -| approx_kl | 0.013633959 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.258 | -| explained_variance | -5.68e+03 | -| learning_rate | 0.0003 | -| loss | -0.00752 | -| n_updates | 53230 | -| policy_gradient_loss | -0.0026 | -| std | 0.313 | -| value_loss | 4.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5325 | -| time_elapsed | 39575 | -| total_timesteps | 681600 | -| train/ | | -| approx_kl | 0.023332693 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | -0.256 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 53240 | -| policy_gradient_loss | -0.00508 | -| std | 0.312 | -| value_loss | 1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5326 | -| time_elapsed | 39578 | -| total_timesteps | 681728 | -| train/ | | -| approx_kl | 0.016161568 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.255 | -| explained_variance | -0.407 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 53250 | -| policy_gradient_loss | -0.0063 | -| std | 0.312 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5327 | -| time_elapsed | 39582 | -| total_timesteps | 681856 | -| train/ | | -| approx_kl | 0.0011941097 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.256 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 53260 | -| policy_gradient_loss | 0.000384 | -| std | 0.313 | -| value_loss | 3.48e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5328 | -| time_elapsed | 39585 | -| total_timesteps | 681984 | -| train/ | | -| approx_kl | 0.0018977937 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.259 | -| explained_variance | 0.00381 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 53270 | -| policy_gradient_loss | 0.000292 | -| std | 0.314 | -| value_loss | 5.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5329 | -| time_elapsed | 39588 | -| total_timesteps | 682112 | -| train/ | | -| approx_kl | 0.031229012 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | -0.26 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 53280 | -| policy_gradient_loss | -0.0151 | -| std | 0.314 | -| value_loss | 1.52e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5330 | -| time_elapsed | 39594 | -| total_timesteps | 682240 | -| train/ | | -| approx_kl | 0.04298089 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.259 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 53290 | -| policy_gradient_loss | -0.0112 | -| std | 0.313 | -| value_loss | 0.00354 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5331 | -| time_elapsed | 39598 | -| total_timesteps | 682368 | -| train/ | | -| approx_kl | 0.0274799 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | -0.256 | -| explained_variance | -744 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 53300 | -| policy_gradient_loss | -0.0151 | -| std | 0.312 | -| value_loss | 0.000163 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5332 | -| time_elapsed | 39602 | -| total_timesteps | 682496 | -| train/ | | -| approx_kl | 0.01918402 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | -0.253 | -| explained_variance | -461 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 53310 | -| policy_gradient_loss | -0.0115 | -| std | 0.311 | -| value_loss | 0.000161 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5333 | -| time_elapsed | 39607 | -| total_timesteps | 682624 | -| train/ | | -| approx_kl | 0.010115651 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | -0.252 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | 0.000248 | -| n_updates | 53320 | -| policy_gradient_loss | 8.98e-05 | -| std | 0.311 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5334 | -| time_elapsed | 39610 | -| total_timesteps | 682752 | -| train/ | | -| approx_kl | 0.011455102 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.251 | -| explained_variance | -1.8 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 53330 | -| policy_gradient_loss | -0.00287 | -| std | 0.311 | -| value_loss | 1.5e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5335 | -| time_elapsed | 39614 | -| total_timesteps | 682880 | -| train/ | | -| approx_kl | 0.0069904686 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.249 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 53340 | -| policy_gradient_loss | -0.00154 | -| std | 0.31 | -| value_loss | 5.67e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5336 | -| time_elapsed | 39618 | -| total_timesteps | 683008 | -| train/ | | -| approx_kl | 0.0055174553 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.248 | -| explained_variance | 0.00558 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 53350 | -| policy_gradient_loss | -0.00199 | -| std | 0.31 | -| value_loss | 4.93e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5337 | -| time_elapsed | 39625 | -| total_timesteps | 683136 | -| train/ | | -| approx_kl | 0.009832213 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.248 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 53360 | -| policy_gradient_loss | 0.000707 | -| std | 0.31 | -| value_loss | 0.000212 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5338 | -| time_elapsed | 39628 | -| total_timesteps | 683264 | -| train/ | | -| approx_kl | 0.017926147 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.246 | -| explained_variance | -87.6 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 53370 | -| policy_gradient_loss | -0.00331 | -| std | 0.309 | -| value_loss | 7.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5339 | -| time_elapsed | 39632 | -| total_timesteps | 683392 | -| train/ | | -| approx_kl | 0.005163276 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.245 | -| explained_variance | -155 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 53380 | -| policy_gradient_loss | -0.000367 | -| std | 0.309 | -| value_loss | 3.91e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5340 | -| time_elapsed | 39635 | -| total_timesteps | 683520 | -| train/ | | -| approx_kl | 6.9125555e-05 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.247 | -| explained_variance | -18.3 | -| learning_rate | 0.0003 | -| loss | -0.000193 | -| n_updates | 53390 | -| policy_gradient_loss | 0.000375 | -| std | 0.311 | -| value_loss | 2.01e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5341 | -| time_elapsed | 39638 | -| total_timesteps | 683648 | -| train/ | | -| approx_kl | 0.007057117 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.251 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 53400 | -| policy_gradient_loss | -0.000449 | -| std | 0.311 | -| value_loss | 4.53e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5342 | -| time_elapsed | 39641 | -| total_timesteps | 683776 | -| train/ | | -| approx_kl | 0.0041652815 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.251 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 53410 | -| policy_gradient_loss | -0.000175 | -| std | 0.311 | -| value_loss | 9.43e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.776 | -| time/ | | -| fps | 17 | -| iterations | 5343 | -| time_elapsed | 39645 | -| total_timesteps | 683904 | -| train/ | | -| approx_kl | 0.0057856357 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.251 | -| explained_variance | -0.00419 | -| learning_rate | 0.0003 | -| loss | -0.00725 | -| n_updates | 53420 | -| policy_gradient_loss | -0.00116 | -| std | 0.311 | -| value_loss | 1.16e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5344 | -| time_elapsed | 39648 | -| total_timesteps | 684032 | -| train/ | | -| approx_kl | 0.021093184 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | -0.251 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 53430 | -| policy_gradient_loss | -1.49e-05 | -| std | 0.311 | -| value_loss | 2.33e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5345 | -| time_elapsed | 39654 | -| total_timesteps | 684160 | -| train/ | | -| approx_kl | 0.13897622 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | -0.252 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0283 | -| n_updates | 53440 | -| policy_gradient_loss | -0.0243 | -| std | 0.311 | -| value_loss | 0.000434 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5346 | -| time_elapsed | 39657 | -| total_timesteps | 684288 | -| train/ | | -| approx_kl | 0.019241711 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.251 | -| explained_variance | -490 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 53450 | -| policy_gradient_loss | -0.00438 | -| std | 0.311 | -| value_loss | 9.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5347 | -| time_elapsed | 39660 | -| total_timesteps | 684416 | -| train/ | | -| approx_kl | 0.0055977404 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | -0.25 | -| explained_variance | -803 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 53460 | -| policy_gradient_loss | -0.00106 | -| std | 0.31 | -| value_loss | 3.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5348 | -| time_elapsed | 39664 | -| total_timesteps | 684544 | -| train/ | | -| approx_kl | 0.0009447946 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.248 | -| explained_variance | -340 | -| learning_rate | 0.0003 | -| loss | -0.00064 | -| n_updates | 53470 | -| policy_gradient_loss | -6.9e-05 | -| std | 0.309 | -| value_loss | 3.37e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5349 | -| time_elapsed | 39667 | -| total_timesteps | 684672 | -| train/ | | -| approx_kl | 0.026349425 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | -0.244 | -| explained_variance | -1.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 53480 | -| policy_gradient_loss | -0.00361 | -| std | 0.308 | -| value_loss | 2.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5350 | -| time_elapsed | 39671 | -| total_timesteps | 684800 | -| train/ | | -| approx_kl | 0.04004276 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | -0.242 | -| explained_variance | -393 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 53490 | -| policy_gradient_loss | -0.0085 | -| std | 0.308 | -| value_loss | 1.71e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5351 | -| time_elapsed | 39674 | -| total_timesteps | 684928 | -| train/ | | -| approx_kl | 0.001924796 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.241 | -| explained_variance | -9.74 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 53500 | -| policy_gradient_loss | 0.000603 | -| std | 0.308 | -| value_loss | 2.97e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5352 | -| time_elapsed | 39678 | -| total_timesteps | 685056 | -| train/ | | -| approx_kl | 0.01541092 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | -0.24 | -| explained_variance | -0.674 | -| learning_rate | 0.0003 | -| loss | 0.00546 | -| n_updates | 53510 | -| policy_gradient_loss | 0.00317 | -| std | 0.307 | -| value_loss | 4.4e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5353 | -| time_elapsed | 39685 | -| total_timesteps | 685184 | -| train/ | | -| approx_kl | 0.022562977 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.238 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 53520 | -| policy_gradient_loss | -0.0153 | -| std | 0.307 | -| value_loss | 0.000553 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5354 | -| time_elapsed | 39689 | -| total_timesteps | 685312 | -| train/ | | -| approx_kl | 0.02020099 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | -0.236 | -| explained_variance | -17.9 | -| learning_rate | 0.0003 | -| loss | -0.00601 | -| n_updates | 53530 | -| policy_gradient_loss | -0.00392 | -| std | 0.306 | -| value_loss | 4.81e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5355 | -| time_elapsed | 39692 | -| total_timesteps | 685440 | -| train/ | | -| approx_kl | 0.006066058 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.235 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 53540 | -| policy_gradient_loss | -0.00121 | -| std | 0.306 | -| value_loss | 2.14e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5356 | -| time_elapsed | 39696 | -| total_timesteps | 685568 | -| train/ | | -| approx_kl | 0.0006792452 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.235 | -| explained_variance | -0.7 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 53550 | -| policy_gradient_loss | 0.00165 | -| std | 0.306 | -| value_loss | 6.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5357 | -| time_elapsed | 39699 | -| total_timesteps | 685696 | -| train/ | | -| approx_kl | 0.014786452 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | -0.236 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 53560 | -| policy_gradient_loss | 0.000625 | -| std | 0.307 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5358 | -| time_elapsed | 39703 | -| total_timesteps | 685824 | -| train/ | | -| approx_kl | 0.011576787 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.238 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 53570 | -| policy_gradient_loss | -0.00357 | -| std | 0.307 | -| value_loss | 1.62e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5359 | -| time_elapsed | 39707 | -| total_timesteps | 685952 | -| train/ | | -| approx_kl | 0.00093594706 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.238 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.000448 | -| n_updates | 53580 | -| policy_gradient_loss | -6.48e-05 | -| std | 0.307 | -| value_loss | 4.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5360 | -| time_elapsed | 39710 | -| total_timesteps | 686080 | -| train/ | | -| approx_kl | 0.008130704 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.236 | -| explained_variance | -0.0695 | -| learning_rate | 0.0003 | -| loss | 0.00336 | -| n_updates | 53590 | -| policy_gradient_loss | 0.000164 | -| std | 0.306 | -| value_loss | 1.63e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5361 | -| time_elapsed | 39717 | -| total_timesteps | 686208 | -| train/ | | -| approx_kl | 0.0402458 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.235 | -| explained_variance | 0.326 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 53600 | -| policy_gradient_loss | -0.0188 | -| std | 0.306 | -| value_loss | 0.00142 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5362 | -| time_elapsed | 39720 | -| total_timesteps | 686336 | -| train/ | | -| approx_kl | 0.02565591 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.235 | -| explained_variance | -1.21e+03 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 53610 | -| policy_gradient_loss | -0.00592 | -| std | 0.306 | -| value_loss | 1.39e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5363 | -| time_elapsed | 39725 | -| total_timesteps | 686464 | -| train/ | | -| approx_kl | 0.02038042 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | -0.234 | -| explained_variance | -1.3e+03 | -| learning_rate | 0.0003 | -| loss | 0.000222 | -| n_updates | 53620 | -| policy_gradient_loss | 3.62e-05 | -| std | 0.305 | -| value_loss | 4.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5364 | -| time_elapsed | 39728 | -| total_timesteps | 686592 | -| train/ | | -| approx_kl | 0.014145907 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.231 | -| explained_variance | -71 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 53630 | -| policy_gradient_loss | -0.00495 | -| std | 0.305 | -| value_loss | 7.29e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5365 | -| time_elapsed | 39732 | -| total_timesteps | 686720 | -| train/ | | -| approx_kl | 0.0060558994 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.229 | -| explained_variance | -5.66 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 53640 | -| policy_gradient_loss | -0.00105 | -| std | 0.304 | -| value_loss | 1.23e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5366 | -| time_elapsed | 39733 | -| total_timesteps | 686848 | -| train/ | | -| approx_kl | 0.02623473 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | -0.229 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 53650 | -| policy_gradient_loss | -0.00389 | -| std | 0.304 | -| value_loss | 7.69e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5367 | -| time_elapsed | 39736 | -| total_timesteps | 686976 | -| train/ | | -| approx_kl | 0.010295739 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.229 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 53660 | -| policy_gradient_loss | -0.00281 | -| std | 0.304 | -| value_loss | 2.82e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5368 | -| time_elapsed | 39738 | -| total_timesteps | 687104 | -| train/ | | -| approx_kl | 0.0068214964 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | -0.228 | -| explained_variance | -0.00438 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 53670 | -| policy_gradient_loss | -0.00163 | -| std | 0.304 | -| value_loss | 3.06e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5369 | -| time_elapsed | 39745 | -| total_timesteps | 687232 | -| train/ | | -| approx_kl | 0.007424246 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.227 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | -0.0265 | -| n_updates | 53680 | -| policy_gradient_loss | -0.0161 | -| std | 0.303 | -| value_loss | 0.00327 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5370 | -| time_elapsed | 39749 | -| total_timesteps | 687360 | -| train/ | | -| approx_kl | 0.0017430885 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.225 | -| explained_variance | -264 | -| learning_rate | 0.0003 | -| loss | -0.000282 | -| n_updates | 53690 | -| policy_gradient_loss | -0.000142 | -| std | 0.303 | -| value_loss | 5.71e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5371 | -| time_elapsed | 39753 | -| total_timesteps | 687488 | -| train/ | | -| approx_kl | 0.017663674 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | -0.223 | -| explained_variance | -32.2 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 53700 | -| policy_gradient_loss | -0.0069 | -| std | 0.302 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5372 | -| time_elapsed | 39756 | -| total_timesteps | 687616 | -| train/ | | -| approx_kl | 0.01165131 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.222 | -| explained_variance | -0.949 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 53710 | -| policy_gradient_loss | -0.00163 | -| std | 0.302 | -| value_loss | 1.72e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5373 | -| time_elapsed | 39760 | -| total_timesteps | 687744 | -| train/ | | -| approx_kl | 0.0048545846 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.219 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | -0.000438 | -| n_updates | 53720 | -| policy_gradient_loss | -0.0003 | -| std | 0.301 | -| value_loss | 9.6e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.771 | -| time/ | | -| fps | 17 | -| iterations | 5374 | -| time_elapsed | 39764 | -| total_timesteps | 687872 | -| train/ | | -| approx_kl | 0.017860144 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.217 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 53730 | -| policy_gradient_loss | -0.00943 | -| std | 0.3 | -| value_loss | 2.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5375 | -| time_elapsed | 39767 | -| total_timesteps | 688000 | -| train/ | | -| approx_kl | 0.0051818346 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | -0.216 | -| explained_variance | -0.000216 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 53740 | -| policy_gradient_loss | -0.000422 | -| std | 0.301 | -| value_loss | 1.85e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5376 | -| time_elapsed | 39769 | -| total_timesteps | 688128 | -| train/ | | -| approx_kl | 0.0060480773 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.218 | -| explained_variance | -0.0012 | -| learning_rate | 0.0003 | -| loss | -0.000327 | -| n_updates | 53750 | -| policy_gradient_loss | 0.000121 | -| std | 0.301 | -| value_loss | 4.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5377 | -| time_elapsed | 39776 | -| total_timesteps | 688256 | -| train/ | | -| approx_kl | 0.013419984 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.217 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | -0.0277 | -| n_updates | 53760 | -| policy_gradient_loss | -0.0182 | -| std | 0.3 | -| value_loss | 0.000226 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5378 | -| time_elapsed | 39780 | -| total_timesteps | 688384 | -| train/ | | -| approx_kl | 0.016546845 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.216 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 53770 | -| policy_gradient_loss | -0.00267 | -| std | 0.3 | -| value_loss | 2.9e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5379 | -| time_elapsed | 39783 | -| total_timesteps | 688512 | -| train/ | | -| approx_kl | 0.0037796767 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.215 | -| explained_variance | -4.14 | -| learning_rate | 0.0003 | -| loss | -0.000564 | -| n_updates | 53780 | -| policy_gradient_loss | -0.000322 | -| std | 0.299 | -| value_loss | 3.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5380 | -| time_elapsed | 39786 | -| total_timesteps | 688640 | -| train/ | | -| approx_kl | 0.012794921 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | -0.211 | -| explained_variance | -0.333 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 53790 | -| policy_gradient_loss | -0.00227 | -| std | 0.299 | -| value_loss | 4.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5381 | -| time_elapsed | 39791 | -| total_timesteps | 688768 | -| train/ | | -| approx_kl | 0.005560518 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.209 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.000283 | -| n_updates | 53800 | -| policy_gradient_loss | -0.000287 | -| std | 0.298 | -| value_loss | 5.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5382 | -| time_elapsed | 39795 | -| total_timesteps | 688896 | -| train/ | | -| approx_kl | 0.0024622246 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.206 | -| explained_variance | -0.00145 | -| learning_rate | 0.0003 | -| loss | -0.000666 | -| n_updates | 53810 | -| policy_gradient_loss | -0.000333 | -| std | 0.296 | -| value_loss | 1.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5383 | -| time_elapsed | 39798 | -| total_timesteps | 689024 | -| train/ | | -| approx_kl | 0.016259868 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.201 | -| explained_variance | -0.00539 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 53820 | -| policy_gradient_loss | -0.00927 | -| std | 0.295 | -| value_loss | 2.09e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5384 | -| time_elapsed | 39804 | -| total_timesteps | 689152 | -| train/ | | -| approx_kl | 0.0009040283 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.198 | -| explained_variance | 0.384 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 53830 | -| policy_gradient_loss | -0.00607 | -| std | 0.295 | -| value_loss | 0.00788 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5385 | -| time_elapsed | 39808 | -| total_timesteps | 689280 | -| train/ | | -| approx_kl | 0.05647753 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | -0.196 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 53840 | -| policy_gradient_loss | -0.0104 | -| std | 0.294 | -| value_loss | 5.49e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5386 | -| time_elapsed | 39811 | -| total_timesteps | 689408 | -| train/ | | -| approx_kl | 0.018236078 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.195 | -| explained_variance | -184 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 53850 | -| policy_gradient_loss | -0.00674 | -| std | 0.294 | -| value_loss | 3.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5387 | -| time_elapsed | 39815 | -| total_timesteps | 689536 | -| train/ | | -| approx_kl | 0.036105275 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | -0.196 | -| explained_variance | -54.6 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 53860 | -| policy_gradient_loss | -0.00986 | -| std | 0.294 | -| value_loss | 2e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5388 | -| time_elapsed | 39817 | -| total_timesteps | 689664 | -| train/ | | -| approx_kl | 0.0127031 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.196 | -| explained_variance | -0.989 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 53870 | -| policy_gradient_loss | -0.00283 | -| std | 0.294 | -| value_loss | 8.99e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5389 | -| time_elapsed | 39820 | -| total_timesteps | 689792 | -| train/ | | -| approx_kl | 0.013623735 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.195 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 53880 | -| policy_gradient_loss | -0.00275 | -| std | 0.294 | -| value_loss | 2.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5390 | -| time_elapsed | 39823 | -| total_timesteps | 689920 | -| train/ | | -| approx_kl | 0.010046221 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.194 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 53890 | -| policy_gradient_loss | 0.000321 | -| std | 0.293 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5391 | -| time_elapsed | 39825 | -| total_timesteps | 690048 | -| train/ | | -| approx_kl | 0.012942892 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | -0.192 | -| explained_variance | -0.073 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 53900 | -| policy_gradient_loss | -0.00209 | -| std | 0.293 | -| value_loss | 3.37e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5392 | -| time_elapsed | 39832 | -| total_timesteps | 690176 | -| train/ | | -| approx_kl | 0.0014926153 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.191 | -| explained_variance | 0.495 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 53910 | -| policy_gradient_loss | -0.0129 | -| std | 0.293 | -| value_loss | 0.0142 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5393 | -| time_elapsed | 39836 | -| total_timesteps | 690304 | -| train/ | | -| approx_kl | 0.04722306 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | -0.191 | -| explained_variance | -96.1 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 53920 | -| policy_gradient_loss | -0.0113 | -| std | 0.293 | -| value_loss | 0.00036 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5394 | -| time_elapsed | 39841 | -| total_timesteps | 690432 | -| train/ | | -| approx_kl | 0.018748093 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.191 | -| explained_variance | -62 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 53930 | -| policy_gradient_loss | -0.00109 | -| std | 0.294 | -| value_loss | 7.15e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5395 | -| time_elapsed | 39844 | -| total_timesteps | 690560 | -| train/ | | -| approx_kl | 0.0005261046 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.195 | -| explained_variance | -46 | -| learning_rate | 0.0003 | -| loss | -0.000504 | -| n_updates | 53940 | -| policy_gradient_loss | 4.48e-05 | -| std | 0.294 | -| value_loss | 4.35e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5396 | -| time_elapsed | 39848 | -| total_timesteps | 690688 | -| train/ | | -| approx_kl | 0.006598375 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.198 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | 0.000967 | -| n_updates | 53950 | -| policy_gradient_loss | 0.000974 | -| std | 0.295 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5397 | -| time_elapsed | 39852 | -| total_timesteps | 690816 | -| train/ | | -| approx_kl | 0.011640135 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.198 | -| explained_variance | -0.827 | -| learning_rate | 0.0003 | -| loss | 1.15e-05 | -| n_updates | 53960 | -| policy_gradient_loss | -0.000266 | -| std | 0.295 | -| value_loss | 3.88e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5398 | -| time_elapsed | 39855 | -| total_timesteps | 690944 | -| train/ | | -| approx_kl | 0.0042287973 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.196 | -| explained_variance | 0.00413 | -| learning_rate | 0.0003 | -| loss | -0.000984 | -| n_updates | 53970 | -| policy_gradient_loss | -0.000379 | -| std | 0.294 | -| value_loss | 5.35e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5399 | -| time_elapsed | 39859 | -| total_timesteps | 691072 | -| train/ | | -| approx_kl | 0.012512615 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.192 | -| explained_variance | 0.00791 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 53980 | -| policy_gradient_loss | -0.00191 | -| std | 0.292 | -| value_loss | 3.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5400 | -| time_elapsed | 39865 | -| total_timesteps | 691200 | -| train/ | | -| approx_kl | 0.007061381 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.188 | -| explained_variance | 0.258 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 53990 | -| policy_gradient_loss | -0.00861 | -| std | 0.292 | -| value_loss | 0.00272 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5401 | -| time_elapsed | 39868 | -| total_timesteps | 691328 | -| train/ | | -| approx_kl | 0.014362719 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.186 | -| explained_variance | -82.4 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 54000 | -| policy_gradient_loss | -0.00082 | -| std | 0.291 | -| value_loss | 7.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5402 | -| time_elapsed | 39871 | -| total_timesteps | 691456 | -| train/ | | -| approx_kl | 0.013064705 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.183 | -| explained_variance | -47.3 | -| learning_rate | 0.0003 | -| loss | -0.000731 | -| n_updates | 54010 | -| policy_gradient_loss | -0.000724 | -| std | 0.29 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5403 | -| time_elapsed | 39876 | -| total_timesteps | 691584 | -| train/ | | -| approx_kl | 0.002037671 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.18 | -| explained_variance | -4.46 | -| learning_rate | 0.0003 | -| loss | -0.000209 | -| n_updates | 54020 | -| policy_gradient_loss | -0.000111 | -| std | 0.289 | -| value_loss | 5.47e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5404 | -| time_elapsed | 39880 | -| total_timesteps | 691712 | -| train/ | | -| approx_kl | 0.00615177 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.179 | -| explained_variance | -0.569 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 54030 | -| policy_gradient_loss | -0.00439 | -| std | 0.289 | -| value_loss | 4e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5405 | -| time_elapsed | 39884 | -| total_timesteps | 691840 | -| train/ | | -| approx_kl | 0.0042537097 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.179 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -9.84e-05 | -| n_updates | 54040 | -| policy_gradient_loss | -5.75e-05 | -| std | 0.289 | -| value_loss | 1.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.775 | -| time/ | | -| fps | 17 | -| iterations | 5406 | -| time_elapsed | 39888 | -| total_timesteps | 691968 | -| train/ | | -| approx_kl | 0.015110651 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.178 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 54050 | -| policy_gradient_loss | -0.000216 | -| std | 0.289 | -| value_loss | 2.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5407 | -| time_elapsed | 39891 | -| total_timesteps | 692096 | -| train/ | | -| approx_kl | 0.008622307 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | -0.177 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.000688 | -| n_updates | 54060 | -| policy_gradient_loss | -0.000681 | -| std | 0.289 | -| value_loss | 4e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5408 | -| time_elapsed | 39899 | -| total_timesteps | 692224 | -| train/ | | -| approx_kl | 0.00057550473 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.175 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 54070 | -| policy_gradient_loss | -0.00666 | -| std | 0.288 | -| value_loss | 0.000614 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5409 | -| time_elapsed | 39902 | -| total_timesteps | 692352 | -| train/ | | -| approx_kl | 0.012986593 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | -0.172 | -| explained_variance | -34.5 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 54080 | -| policy_gradient_loss | -0.00501 | -| std | 0.287 | -| value_loss | 9.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5410 | -| time_elapsed | 39907 | -| total_timesteps | 692480 | -| train/ | | -| approx_kl | 0.021364529 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.17 | -| explained_variance | -24.6 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 54090 | -| policy_gradient_loss | -0.00376 | -| std | 0.287 | -| value_loss | 2.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5411 | -| time_elapsed | 39910 | -| total_timesteps | 692608 | -| train/ | | -| approx_kl | 0.02927031 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.169 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 54100 | -| policy_gradient_loss | -0.00627 | -| std | 0.287 | -| value_loss | 1.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5412 | -| time_elapsed | 39913 | -| total_timesteps | 692736 | -| train/ | | -| approx_kl | 0.01713098 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | -0.169 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -0.00486 | -| n_updates | 54110 | -| policy_gradient_loss | -0.00469 | -| std | 0.286 | -| value_loss | 6.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5413 | -| time_elapsed | 39918 | -| total_timesteps | 692864 | -| train/ | | -| approx_kl | 0.012062514 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.168 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.00249 | -| n_updates | 54120 | -| policy_gradient_loss | 1.51e-05 | -| std | 0.286 | -| value_loss | 4.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5414 | -| time_elapsed | 39922 | -| total_timesteps | 692992 | -| train/ | | -| approx_kl | 0.018955177 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | -0.168 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 54130 | -| policy_gradient_loss | -0.00325 | -| std | 0.286 | -| value_loss | 2.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5415 | -| time_elapsed | 39926 | -| total_timesteps | 693120 | -| train/ | | -| approx_kl | 0.01909702 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.168 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 54140 | -| policy_gradient_loss | -0.00258 | -| std | 0.286 | -| value_loss | 1.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5416 | -| time_elapsed | 39935 | -| total_timesteps | 693248 | -| train/ | | -| approx_kl | 0.045971874 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.167 | -| explained_variance | 0.562 | -| learning_rate | 0.0003 | -| loss | -0.03 | -| n_updates | 54150 | -| policy_gradient_loss | -0.0211 | -| std | 0.286 | -| value_loss | 0.0012 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5417 | -| time_elapsed | 39938 | -| total_timesteps | 693376 | -| train/ | | -| approx_kl | 0.004923403 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.167 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 54160 | -| policy_gradient_loss | -0.00179 | -| std | 0.286 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5418 | -| time_elapsed | 39941 | -| total_timesteps | 693504 | -| train/ | | -| approx_kl | 0.011263574 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | -0.167 | -| explained_variance | -69 | -| learning_rate | 0.0003 | -| loss | -0.000688 | -| n_updates | 54170 | -| policy_gradient_loss | -0.00078 | -| std | 0.286 | -| value_loss | 4.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5419 | -| time_elapsed | 39943 | -| total_timesteps | 693632 | -| train/ | | -| approx_kl | 0.025579406 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | -0.166 | -| explained_variance | -2.66 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 54180 | -| policy_gradient_loss | -0.00688 | -| std | 0.285 | -| value_loss | 7.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5420 | -| time_elapsed | 39947 | -| total_timesteps | 693760 | -| train/ | | -| approx_kl | 0.026104964 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | -0.164 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.00404 | -| n_updates | 54190 | -| policy_gradient_loss | 0.000362 | -| std | 0.285 | -| value_loss | 2.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.769 | -| time/ | | -| fps | 17 | -| iterations | 5421 | -| time_elapsed | 39951 | -| total_timesteps | 693888 | -| train/ | | -| approx_kl | 0.010956749 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.164 | -| explained_variance | -7.61e-05 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 54200 | -| policy_gradient_loss | -0.00145 | -| std | 0.285 | -| value_loss | 5.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5422 | -| time_elapsed | 39955 | -| total_timesteps | 694016 | -| train/ | | -| approx_kl | 0.029645706 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | -0.164 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | -0.00861 | -| n_updates | 54210 | -| policy_gradient_loss | -0.00872 | -| std | 0.285 | -| value_loss | 2.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5423 | -| time_elapsed | 39966 | -| total_timesteps | 694144 | -| train/ | | -| approx_kl | 0.016975863 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.163 | -| explained_variance | -2.02 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 54220 | -| policy_gradient_loss | -0.0161 | -| std | 0.285 | -| value_loss | 0.00253 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5424 | -| time_elapsed | 39970 | -| total_timesteps | 694272 | -| train/ | | -| approx_kl | 0.022939712 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.162 | -| explained_variance | -221 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 54230 | -| policy_gradient_loss | -0.00574 | -| std | 0.284 | -| value_loss | 6.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5425 | -| time_elapsed | 39973 | -| total_timesteps | 694400 | -| train/ | | -| approx_kl | 0.017767837 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | -0.161 | -| explained_variance | -477 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 54240 | -| policy_gradient_loss | -0.000383 | -| std | 0.284 | -| value_loss | 1.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5426 | -| time_elapsed | 39975 | -| total_timesteps | 694528 | -| train/ | | -| approx_kl | 0.013382734 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.158 | -| explained_variance | -581 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 54250 | -| policy_gradient_loss | -0.00111 | -| std | 0.283 | -| value_loss | 5.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5427 | -| time_elapsed | 39979 | -| total_timesteps | 694656 | -| train/ | | -| approx_kl | 0.013439508 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -48.1 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 54260 | -| policy_gradient_loss | -0.00168 | -| std | 0.282 | -| value_loss | 7.39e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5428 | -| time_elapsed | 39983 | -| total_timesteps | 694784 | -| train/ | | -| approx_kl | 0.0033375411 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.152 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 54270 | -| policy_gradient_loss | -5.48e-05 | -| std | 0.282 | -| value_loss | 1.47e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.77 | -| time/ | | -| fps | 17 | -| iterations | 5429 | -| time_elapsed | 39986 | -| total_timesteps | 694912 | -| train/ | | -| approx_kl | 0.0014884602 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.151 | -| explained_variance | -0.771 | -| learning_rate | 0.0003 | -| loss | -0.00586 | -| n_updates | 54280 | -| policy_gradient_loss | 0.00176 | -| std | 0.282 | -| value_loss | 1.22e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5430 | -| time_elapsed | 39990 | -| total_timesteps | 695040 | -| train/ | | -| approx_kl | 0.0027357554 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.151 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 54290 | -| policy_gradient_loss | 0.000827 | -| std | 0.281 | -| value_loss | 6.12e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5431 | -| time_elapsed | 39999 | -| total_timesteps | 695168 | -| train/ | | -| approx_kl | 0.01629596 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.151 | -| explained_variance | 0.729 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 54300 | -| policy_gradient_loss | -0.00348 | -| std | 0.282 | -| value_loss | 0.00322 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5432 | -| time_elapsed | 40003 | -| total_timesteps | 695296 | -| train/ | | -| approx_kl | 0.010160981 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.152 | -| explained_variance | -4.47 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 54310 | -| policy_gradient_loss | -0.00165 | -| std | 0.282 | -| value_loss | 3.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5433 | -| time_elapsed | 40006 | -| total_timesteps | 695424 | -| train/ | | -| approx_kl | 0.020837571 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 54320 | -| policy_gradient_loss | -0.00841 | -| std | 0.282 | -| value_loss | 2.14e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5434 | -| time_elapsed | 40010 | -| total_timesteps | 695552 | -| train/ | | -| approx_kl | 0.00094028516 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 54330 | -| policy_gradient_loss | 0.00146 | -| std | 0.282 | -| value_loss | 1.12e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5435 | -| time_elapsed | 40013 | -| total_timesteps | 695680 | -| train/ | | -| approx_kl | 0.0151881315 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 54340 | -| policy_gradient_loss | 0.00127 | -| std | 0.282 | -| value_loss | 3.19e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5436 | -| time_elapsed | 40016 | -| total_timesteps | 695808 | -| train/ | | -| approx_kl | 0.02880878 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 54350 | -| policy_gradient_loss | -0.00399 | -| std | 0.282 | -| value_loss | 5.25e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5437 | -| time_elapsed | 40021 | -| total_timesteps | 695936 | -| train/ | | -| approx_kl | 0.0137883015 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 54360 | -| policy_gradient_loss | 9.41e-05 | -| std | 0.282 | -| value_loss | 5.84e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5438 | -| time_elapsed | 40025 | -| total_timesteps | 696064 | -| train/ | | -| approx_kl | 0.011860237 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.155 | -| explained_variance | -0.0949 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 54370 | -| policy_gradient_loss | -0.000981 | -| std | 0.282 | -| value_loss | 1.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5439 | -| time_elapsed | 40030 | -| total_timesteps | 696192 | -| train/ | | -| approx_kl | 0.14491749 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.154 | -| explained_variance | -4.15 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 54380 | -| policy_gradient_loss | -0.013 | -| std | 0.282 | -| value_loss | 0.00207 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5440 | -| time_elapsed | 40034 | -| total_timesteps | 696320 | -| train/ | | -| approx_kl | 6.544916e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.153 | -| explained_variance | -234 | -| learning_rate | 0.0003 | -| loss | -0.000194 | -| n_updates | 54390 | -| policy_gradient_loss | -5.78e-05 | -| std | 0.281 | -| value_loss | 4.46e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5441 | -| time_elapsed | 40037 | -| total_timesteps | 696448 | -| train/ | | -| approx_kl | 0.015282214 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | -0.149 | -| explained_variance | -220 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 54400 | -| policy_gradient_loss | -0.00147 | -| std | 0.28 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5442 | -| time_elapsed | 40041 | -| total_timesteps | 696576 | -| train/ | | -| approx_kl | 0.024891559 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | -0.145 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 54410 | -| policy_gradient_loss | -0.00835 | -| std | 0.279 | -| value_loss | 3.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5443 | -| time_elapsed | 40044 | -| total_timesteps | 696704 | -| train/ | | -| approx_kl | 0.014503427 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.143 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 54420 | -| policy_gradient_loss | -0.0064 | -| std | 0.279 | -| value_loss | 1.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5444 | -| time_elapsed | 40048 | -| total_timesteps | 696832 | -| train/ | | -| approx_kl | 0.016765982 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | -0.14 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 54430 | -| policy_gradient_loss | -0.00241 | -| std | 0.278 | -| value_loss | 9.92e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5445 | -| time_elapsed | 40052 | -| total_timesteps | 696960 | -| train/ | | -| approx_kl | 0.01704771 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | -0.139 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 54440 | -| policy_gradient_loss | -0.00762 | -| std | 0.278 | -| value_loss | 1.18e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5446 | -| time_elapsed | 40054 | -| total_timesteps | 697088 | -| train/ | | -| approx_kl | 0.013864532 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | -0.138 | -| explained_variance | 0.00327 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 54450 | -| policy_gradient_loss | -0.00364 | -| std | 0.278 | -| value_loss | 7.03e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5447 | -| time_elapsed | 40062 | -| total_timesteps | 697216 | -| train/ | | -| approx_kl | 0.03328793 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.137 | -| explained_variance | 0.81 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 54460 | -| policy_gradient_loss | -0.012 | -| std | 0.277 | -| value_loss | 0.0017 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5448 | -| time_elapsed | 40066 | -| total_timesteps | 697344 | -| train/ | | -| approx_kl | 0.007904923 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.135 | -| explained_variance | -4.96 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 54470 | -| policy_gradient_loss | -0.00167 | -| std | 0.277 | -| value_loss | 1.94e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5449 | -| time_elapsed | 40068 | -| total_timesteps | 697472 | -| train/ | | -| approx_kl | 0.08293233 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | -0.134 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 54480 | -| policy_gradient_loss | -0.008 | -| std | 0.277 | -| value_loss | 9.88e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5450 | -| time_elapsed | 40072 | -| total_timesteps | 697600 | -| train/ | | -| approx_kl | 0.013599483 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.133 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.00995 | -| n_updates | 54490 | -| policy_gradient_loss | -0.0064 | -| std | 0.276 | -| value_loss | 5.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5451 | -| time_elapsed | 40075 | -| total_timesteps | 697728 | -| train/ | | -| approx_kl | 0.018995749 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.132 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.00405 | -| n_updates | 54500 | -| policy_gradient_loss | -0.00423 | -| std | 0.276 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5452 | -| time_elapsed | 40078 | -| total_timesteps | 697856 | -| train/ | | -| approx_kl | 0.010390436 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | -0.13 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.000127 | -| n_updates | 54510 | -| policy_gradient_loss | -0.000581 | -| std | 0.275 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5453 | -| time_elapsed | 40081 | -| total_timesteps | 697984 | -| train/ | | -| approx_kl | 0.0026047146 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.127 | -| explained_variance | 0.00118 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 54520 | -| policy_gradient_loss | -0.00315 | -| std | 0.274 | -| value_loss | 1.84e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5454 | -| time_elapsed | 40084 | -| total_timesteps | 698112 | -| train/ | | -| approx_kl | 0.011036621 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | -0.0083 | -| learning_rate | 0.0003 | -| loss | 0.000852 | -| n_updates | 54530 | -| policy_gradient_loss | -0.000281 | -| std | 0.274 | -| value_loss | 1.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5455 | -| time_elapsed | 40092 | -| total_timesteps | 698240 | -| train/ | | -| approx_kl | 0.025829025 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | 0.684 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 54540 | -| policy_gradient_loss | -0.0195 | -| std | 0.274 | -| value_loss | 0.00427 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5456 | -| time_elapsed | 40095 | -| total_timesteps | 698368 | -| train/ | | -| approx_kl | 0.008069108 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | -131 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 54550 | -| policy_gradient_loss | -0.000957 | -| std | 0.274 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5457 | -| time_elapsed | 40099 | -| total_timesteps | 698496 | -| train/ | | -| approx_kl | 0.114712775 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | -0.126 | -| explained_variance | -754 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 54560 | -| policy_gradient_loss | -0.0031 | -| std | 0.275 | -| value_loss | 4.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5458 | -| time_elapsed | 40103 | -| total_timesteps | 698624 | -| train/ | | -| approx_kl | 0.0016253078 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.127 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 54570 | -| policy_gradient_loss | 0.00127 | -| std | 0.275 | -| value_loss | 2.23e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5459 | -| time_elapsed | 40106 | -| total_timesteps | 698752 | -| train/ | | -| approx_kl | 0.041639782 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | -0.128 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 54580 | -| policy_gradient_loss | -0.0133 | -| std | 0.275 | -| value_loss | 2.36e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5460 | -| time_elapsed | 40110 | -| total_timesteps | 698880 | -| train/ | | -| approx_kl | 0.01711297 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -0.127 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 54590 | -| policy_gradient_loss | -0.00371 | -| std | 0.275 | -| value_loss | 6.22e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5461 | -| time_elapsed | 40113 | -| total_timesteps | 699008 | -| train/ | | -| approx_kl | 0.012107959 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | -0.126 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 54600 | -| policy_gradient_loss | 0.000268 | -| std | 0.274 | -| value_loss | 1.41e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5462 | -| time_elapsed | 40122 | -| total_timesteps | 699136 | -| train/ | | -| approx_kl | 0.3067552 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.126 | -| explained_variance | -3.53 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 54610 | -| policy_gradient_loss | -0.0201 | -| std | 0.274 | -| value_loss | 0.0021 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5463 | -| time_elapsed | 40126 | -| total_timesteps | 699264 | -| train/ | | -| approx_kl | 0.018676678 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.126 | -| explained_variance | -236 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 54620 | -| policy_gradient_loss | -0.00375 | -| std | 0.274 | -| value_loss | 5.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5464 | -| time_elapsed | 40130 | -| total_timesteps | 699392 | -| train/ | | -| approx_kl | 0.021319235 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | -396 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 54630 | -| policy_gradient_loss | -0.00586 | -| std | 0.274 | -| value_loss | 2.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5465 | -| time_elapsed | 40134 | -| total_timesteps | 699520 | -| train/ | | -| approx_kl | 0.015384187 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | -269 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 54640 | -| policy_gradient_loss | -0.00978 | -| std | 0.274 | -| value_loss | 1.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5466 | -| time_elapsed | 40139 | -| total_timesteps | 699648 | -| train/ | | -| approx_kl | 0.029240534 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | -109 | -| learning_rate | 0.0003 | -| loss | -0.00722 | -| n_updates | 54650 | -| policy_gradient_loss | -0.00544 | -| std | 0.274 | -| value_loss | 1.08e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5467 | -| time_elapsed | 40143 | -| total_timesteps | 699776 | -| train/ | | -| approx_kl | 0.01486153 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | -0.126 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.000614 | -| n_updates | 54660 | -| policy_gradient_loss | -0.00129 | -| std | 0.275 | -| value_loss | 8.81e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.772 | -| time/ | | -| fps | 17 | -| iterations | 5468 | -| time_elapsed | 40145 | -| total_timesteps | 699904 | -| train/ | | -| approx_kl | 0.008369036 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.127 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 54670 | -| policy_gradient_loss | -0.00131 | -| std | 0.275 | -| value_loss | 1.49e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5469 | -| time_elapsed | 40149 | -| total_timesteps | 700032 | -| train/ | | -| approx_kl | 0.007216265 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.125 | -| explained_variance | -0.00701 | -| learning_rate | 0.0003 | -| loss | -0.000964 | -| n_updates | 54680 | -| policy_gradient_loss | -0.000563 | -| std | 0.274 | -| value_loss | 2.63e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5470 | -| time_elapsed | 40159 | -| total_timesteps | 700160 | -| train/ | | -| approx_kl | 0.023735004 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.123 | -| explained_variance | 0.721 | -| learning_rate | 0.0003 | -| loss | -0.0309 | -| n_updates | 54690 | -| policy_gradient_loss | -0.0232 | -| std | 0.273 | -| value_loss | 0.000447 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5471 | -| time_elapsed | 40163 | -| total_timesteps | 700288 | -| train/ | | -| approx_kl | 0.012725266 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.122 | -| explained_variance | -4.74 | -| learning_rate | 0.0003 | -| loss | -0.000313 | -| n_updates | 54700 | -| policy_gradient_loss | -0.000329 | -| std | 0.273 | -| value_loss | 5.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5472 | -| time_elapsed | 40166 | -| total_timesteps | 700416 | -| train/ | | -| approx_kl | 0.033489797 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -9.87 | -| learning_rate | 0.0003 | -| loss | -0.00489 | -| n_updates | 54710 | -| policy_gradient_loss | -0.00623 | -| std | 0.272 | -| value_loss | 3.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5473 | -| time_elapsed | 40169 | -| total_timesteps | 700544 | -| train/ | | -| approx_kl | 0.011825134 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -0.119 | -| explained_variance | -0.897 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 54720 | -| policy_gradient_loss | -0.00103 | -| std | 0.273 | -| value_loss | 1.14e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5474 | -| time_elapsed | 40173 | -| total_timesteps | 700672 | -| train/ | | -| approx_kl | 4.0000305e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | -2.97e-05 | -| n_updates | 54730 | -| policy_gradient_loss | -9.29e-06 | -| std | 0.273 | -| value_loss | 8.85e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5475 | -| time_elapsed | 40176 | -| total_timesteps | 700800 | -| train/ | | -| approx_kl | 0.0018437449 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.121 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | -0.000194 | -| n_updates | 54740 | -| policy_gradient_loss | -7.63e-05 | -| std | 0.273 | -| value_loss | 1.09e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.767 | -| time/ | | -| fps | 17 | -| iterations | 5476 | -| time_elapsed | 40179 | -| total_timesteps | 700928 | -| train/ | | -| approx_kl | 0.0235828 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 54750 | -| policy_gradient_loss | -0.005 | -| std | 0.273 | -| value_loss | 8.15e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5477 | -| time_elapsed | 40183 | -| total_timesteps | 701056 | -| train/ | | -| approx_kl | 0.019408284 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -0.119 | -| explained_variance | 0.00729 | -| learning_rate | 0.0003 | -| loss | -0.00879 | -| n_updates | 54760 | -| policy_gradient_loss | -0.0055 | -| std | 0.273 | -| value_loss | 3.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5478 | -| time_elapsed | 40188 | -| total_timesteps | 701184 | -| train/ | | -| approx_kl | 0.38438594 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 54770 | -| policy_gradient_loss | -0.0168 | -| std | 0.273 | -| value_loss | 0.000219 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5479 | -| time_elapsed | 40191 | -| total_timesteps | 701312 | -| train/ | | -| approx_kl | 0.04125832 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | -0.122 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | -0.0315 | -| n_updates | 54780 | -| policy_gradient_loss | -0.0199 | -| std | 0.273 | -| value_loss | 7.29e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5480 | -| time_elapsed | 40195 | -| total_timesteps | 701440 | -| train/ | | -| approx_kl | 0.0065629985 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | -0.122 | -| explained_variance | -99.1 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 54790 | -| policy_gradient_loss | -0.000934 | -| std | 0.273 | -| value_loss | 3.54e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5481 | -| time_elapsed | 40198 | -| total_timesteps | 701568 | -| train/ | | -| approx_kl | 0.022412589 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | -0.122 | -| explained_variance | -32.5 | -| learning_rate | 0.0003 | -| loss | 0.00278 | -| n_updates | 54800 | -| policy_gradient_loss | 0.000799 | -| std | 0.273 | -| value_loss | 1.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5482 | -| time_elapsed | 40202 | -| total_timesteps | 701696 | -| train/ | | -| approx_kl | 0.016813679 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.122 | -| explained_variance | -120 | -| learning_rate | 0.0003 | -| loss | -0.00925 | -| n_updates | 54810 | -| policy_gradient_loss | -0.00308 | -| std | 0.273 | -| value_loss | 7.68e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5483 | -| time_elapsed | 40205 | -| total_timesteps | 701824 | -| train/ | | -| approx_kl | 0.00032475358 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.121 | -| explained_variance | -58.5 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 54820 | -| policy_gradient_loss | 0.00279 | -| std | 0.273 | -| value_loss | 1.71e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.764 | -| time/ | | -| fps | 17 | -| iterations | 5484 | -| time_elapsed | 40207 | -| total_timesteps | 701952 | -| train/ | | -| approx_kl | 0.01967443 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -3.35 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 54830 | -| policy_gradient_loss | -0.00255 | -| std | 0.273 | -| value_loss | 2.27e-11 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5485 | -| time_elapsed | 40210 | -| total_timesteps | 702080 | -| train/ | | -| approx_kl | 1.1954922e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -0.465 | -| learning_rate | 0.0003 | -| loss | -3.25e-05 | -| n_updates | 54840 | -| policy_gradient_loss | 9.77e-05 | -| std | 0.273 | -| value_loss | 3e-12 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5486 | -| time_elapsed | 40216 | -| total_timesteps | 702208 | -| train/ | | -| approx_kl | 0.01790328 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 54850 | -| policy_gradient_loss | -0.015 | -| std | 0.273 | -| value_loss | 0.00202 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5487 | -| time_elapsed | 40220 | -| total_timesteps | 702336 | -| train/ | | -| approx_kl | 0.05967968 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | -0.121 | -| explained_variance | -2.14e+03 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 54860 | -| policy_gradient_loss | -0.00797 | -| std | 0.273 | -| value_loss | 1.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5488 | -| time_elapsed | 40225 | -| total_timesteps | 702464 | -| train/ | | -| approx_kl | 0.075332396 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | -0.121 | -| explained_variance | -2.27e+03 | -| learning_rate | 0.0003 | -| loss | -0.00987 | -| n_updates | 54870 | -| policy_gradient_loss | -0.00914 | -| std | 0.273 | -| value_loss | 6.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5489 | -| time_elapsed | 40228 | -| total_timesteps | 702592 | -| train/ | | -| approx_kl | 0.028936008 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.121 | -| explained_variance | -450 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 54880 | -| policy_gradient_loss | -0.0114 | -| std | 0.273 | -| value_loss | 4.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5490 | -| time_elapsed | 40231 | -| total_timesteps | 702720 | -| train/ | | -| approx_kl | 0.02880214 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.121 | -| explained_variance | -17.9 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 54890 | -| policy_gradient_loss | -0.00276 | -| std | 0.273 | -| value_loss | 2.1e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5491 | -| time_elapsed | 40235 | -| total_timesteps | 702848 | -| train/ | | -| approx_kl | 0.02289413 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -0.799 | -| learning_rate | 0.0003 | -| loss | -4.15e-05 | -| n_updates | 54900 | -| policy_gradient_loss | -0.00216 | -| std | 0.273 | -| value_loss | 7.74e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5492 | -| time_elapsed | 40238 | -| total_timesteps | 702976 | -| train/ | | -| approx_kl | 0.017825589 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.12 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 54910 | -| policy_gradient_loss | -0.00816 | -| std | 0.273 | -| value_loss | 7.46e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5493 | -| time_elapsed | 40242 | -| total_timesteps | 703104 | -| train/ | | -| approx_kl | 0.008395689 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | -0.119 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 54920 | -| policy_gradient_loss | -0.00138 | -| std | 0.272 | -| value_loss | 2.62e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5494 | -| time_elapsed | 40248 | -| total_timesteps | 703232 | -| train/ | | -| approx_kl | 0.05488502 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.116 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | 0.00512 | -| n_updates | 54930 | -| policy_gradient_loss | -0.0138 | -| std | 0.272 | -| value_loss | 0.000102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5495 | -| time_elapsed | 40252 | -| total_timesteps | 703360 | -| train/ | | -| approx_kl | 0.025760327 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.115 | -| explained_variance | -28.9 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 54940 | -| policy_gradient_loss | -0.00713 | -| std | 0.271 | -| value_loss | 6.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5496 | -| time_elapsed | 40257 | -| total_timesteps | 703488 | -| train/ | | -| approx_kl | 0.009723647 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.114 | -| explained_variance | -71.2 | -| learning_rate | 0.0003 | -| loss | -0.000137 | -| n_updates | 54950 | -| policy_gradient_loss | -0.00052 | -| std | 0.271 | -| value_loss | 4.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5497 | -| time_elapsed | 40260 | -| total_timesteps | 703616 | -| train/ | | -| approx_kl | 0.030521309 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | -0.112 | -| explained_variance | -16.2 | -| learning_rate | 0.0003 | -| loss | -0.00701 | -| n_updates | 54960 | -| policy_gradient_loss | -0.00439 | -| std | 0.271 | -| value_loss | 2.83e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5498 | -| time_elapsed | 40264 | -| total_timesteps | 703744 | -| train/ | | -| approx_kl | 0.009371877 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.111 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | -0.00562 | -| n_updates | 54970 | -| policy_gradient_loss | -0.00152 | -| std | 0.27 | -| value_loss | 1.23e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5499 | -| time_elapsed | 40267 | -| total_timesteps | 703872 | -| train/ | | -| approx_kl | 0.0069976286 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | -0.111 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -0.00617 | -| n_updates | 54980 | -| policy_gradient_loss | -0.00121 | -| std | 0.27 | -| value_loss | 2.39e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5500 | -| time_elapsed | 40271 | -| total_timesteps | 704000 | -| train/ | | -| approx_kl | 0.006163077 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.109 | -| explained_variance | -0.0662 | -| learning_rate | 0.0003 | -| loss | -0.000595 | -| n_updates | 54990 | -| policy_gradient_loss | -0.000362 | -| std | 0.269 | -| value_loss | 8.63e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5501 | -| time_elapsed | 40274 | -| total_timesteps | 704128 | -| train/ | | -| approx_kl | 0.0050863964 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.106 | -| explained_variance | -0.00289 | -| learning_rate | 0.0003 | -| loss | -0.000729 | -| n_updates | 55000 | -| policy_gradient_loss | -0.00068 | -| std | 0.269 | -| value_loss | 5.62e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5502 | -| time_elapsed | 40281 | -| total_timesteps | 704256 | -| train/ | | -| approx_kl | 0.030319303 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.105 | -| explained_variance | 0.755 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 55010 | -| policy_gradient_loss | -0.000406 | -| std | 0.269 | -| value_loss | 0.000477 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5503 | -| time_elapsed | 40284 | -| total_timesteps | 704384 | -| train/ | | -| approx_kl | 26.565443 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.103 | -| explained_variance | -781 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 55020 | -| policy_gradient_loss | -0.00453 | -| std | 0.268 | -| value_loss | 2.33e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5504 | -| time_elapsed | 40289 | -| total_timesteps | 704512 | -| train/ | | -| approx_kl | 0.65974396 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.0996 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 55030 | -| policy_gradient_loss | -0.0107 | -| std | 0.267 | -| value_loss | 9.37e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5505 | -| time_elapsed | 40293 | -| total_timesteps | 704640 | -| train/ | | -| approx_kl | 0.07250324 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | -0.0972 | -| explained_variance | -83.9 | -| learning_rate | 0.0003 | -| loss | -0.00526 | -| n_updates | 55040 | -| policy_gradient_loss | -0.00482 | -| std | 0.266 | -| value_loss | 6.27e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5506 | -| time_elapsed | 40297 | -| total_timesteps | 704768 | -| train/ | | -| approx_kl | 0.033485744 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | -0.095 | -| explained_variance | -1.75 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 55050 | -| policy_gradient_loss | -0.0119 | -| std | 0.266 | -| value_loss | 5.06e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5507 | -| time_elapsed | 40299 | -| total_timesteps | 704896 | -| train/ | | -| approx_kl | 0.00049409084 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0922 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 55060 | -| policy_gradient_loss | -0.000519 | -| std | 0.264 | -| value_loss | 2.52e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5508 | -| time_elapsed | 40303 | -| total_timesteps | 705024 | -| train/ | | -| approx_kl | 0.0042762863 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.0849 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 55070 | -| policy_gradient_loss | -0.00412 | -| std | 0.262 | -| value_loss | 2.16e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5509 | -| time_elapsed | 40311 | -| total_timesteps | 705152 | -| train/ | | -| approx_kl | 0.121073045 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.0798 | -| explained_variance | 0.781 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 55080 | -| policy_gradient_loss | -0.0174 | -| std | 0.262 | -| value_loss | 0.00207 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5510 | -| time_elapsed | 40316 | -| total_timesteps | 705280 | -| train/ | | -| approx_kl | 0.04769114 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | -0.0785 | -| explained_variance | -266 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 55090 | -| policy_gradient_loss | -0.00697 | -| std | 0.262 | -| value_loss | 1.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5511 | -| time_elapsed | 40320 | -| total_timesteps | 705408 | -| train/ | | -| approx_kl | 0.015797164 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.0786 | -| explained_variance | -252 | -| learning_rate | 0.0003 | -| loss | -0.00476 | -| n_updates | 55100 | -| policy_gradient_loss | -0.00135 | -| std | 0.262 | -| value_loss | 7.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5512 | -| time_elapsed | 40324 | -| total_timesteps | 705536 | -| train/ | | -| approx_kl | 0.017121835 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | -0.08 | -| explained_variance | -23.1 | -| learning_rate | 0.0003 | -| loss | 0.000566 | -| n_updates | 55110 | -| policy_gradient_loss | 0.000463 | -| std | 0.262 | -| value_loss | 1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5513 | -| time_elapsed | 40327 | -| total_timesteps | 705664 | -| train/ | | -| approx_kl | 0.018051824 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | -0.0812 | -| explained_variance | -0.922 | -| learning_rate | 0.0003 | -| loss | 0.0082 | -| n_updates | 55120 | -| policy_gradient_loss | 0.00439 | -| std | 0.262 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5514 | -| time_elapsed | 40330 | -| total_timesteps | 705792 | -| train/ | | -| approx_kl | 7.959735e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0824 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.000594 | -| n_updates | 55130 | -| policy_gradient_loss | -8.17e-05 | -| std | 0.263 | -| value_loss | 4.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5515 | -| time_elapsed | 40333 | -| total_timesteps | 705920 | -| train/ | | -| approx_kl | 0.006846649 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | -0.0858 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 55140 | -| policy_gradient_loss | 0.000102 | -| std | 0.264 | -| value_loss | 1.19e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5516 | -| time_elapsed | 40335 | -| total_timesteps | 706048 | -| train/ | | -| approx_kl | 0.02420983 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | -0.0864 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 55150 | -| policy_gradient_loss | -0.00972 | -| std | 0.264 | -| value_loss | 8.17e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5517 | -| time_elapsed | 40340 | -| total_timesteps | 706176 | -| train/ | | -| approx_kl | 0.08480118 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.0877 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 55160 | -| policy_gradient_loss | -0.0158 | -| std | 0.265 | -| value_loss | 0.000534 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5518 | -| time_elapsed | 40343 | -| total_timesteps | 706304 | -| train/ | | -| approx_kl | 0.016311862 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | -0.0893 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | 0.000136 | -| n_updates | 55170 | -| policy_gradient_loss | -0.000484 | -| std | 0.265 | -| value_loss | 4.66e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5519 | -| time_elapsed | 40346 | -| total_timesteps | 706432 | -| train/ | | -| approx_kl | 2.4456065e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0881 | -| explained_variance | -20.1 | -| learning_rate | 0.0003 | -| loss | -0.00026 | -| n_updates | 55180 | -| policy_gradient_loss | -2.89e-06 | -| std | 0.264 | -| value_loss | 2.06e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5520 | -| time_elapsed | 40350 | -| total_timesteps | 706560 | -| train/ | | -| approx_kl | 0.019993458 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.0848 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 55190 | -| policy_gradient_loss | -0.00375 | -| std | 0.263 | -| value_loss | 5.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5521 | -| time_elapsed | 40353 | -| total_timesteps | 706688 | -| train/ | | -| approx_kl | 0.023738394 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.0827 | -| explained_variance | -0.313 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 55200 | -| policy_gradient_loss | -0.00592 | -| std | 0.263 | -| value_loss | 2.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5522 | -| time_elapsed | 40357 | -| total_timesteps | 706816 | -| train/ | | -| approx_kl | 0.021561231 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | -0.0822 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 55210 | -| policy_gradient_loss | -0.00124 | -| std | 0.263 | -| value_loss | 4.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.765 | -| time/ | | -| fps | 17 | -| iterations | 5523 | -| time_elapsed | 40360 | -| total_timesteps | 706944 | -| train/ | | -| approx_kl | 0.016976122 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.0827 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 55220 | -| policy_gradient_loss | -0.00213 | -| std | 0.263 | -| value_loss | 5.6e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5524 | -| time_elapsed | 40364 | -| total_timesteps | 707072 | -| train/ | | -| approx_kl | 0.0095220385 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | -0.0836 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 55230 | -| policy_gradient_loss | -0.00295 | -| std | 0.263 | -| value_loss | 4.92e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5525 | -| time_elapsed | 40370 | -| total_timesteps | 707200 | -| train/ | | -| approx_kl | 0.17431445 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | -0.0839 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | -0.0342 | -| n_updates | 55240 | -| policy_gradient_loss | -0.0226 | -| std | 0.263 | -| value_loss | 0.0003 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5526 | -| time_elapsed | 40374 | -| total_timesteps | 707328 | -| train/ | | -| approx_kl | 0.02964293 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.0848 | -| explained_variance | -14.4 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 55250 | -| policy_gradient_loss | -0.0128 | -| std | 0.264 | -| value_loss | 7.52e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5527 | -| time_elapsed | 40377 | -| total_timesteps | 707456 | -| train/ | | -| approx_kl | 0.0036993292 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.0846 | -| explained_variance | -41.3 | -| learning_rate | 0.0003 | -| loss | -0.00027 | -| n_updates | 55260 | -| policy_gradient_loss | -0.000146 | -| std | 0.263 | -| value_loss | 5.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5528 | -| time_elapsed | 40380 | -| total_timesteps | 707584 | -| train/ | | -| approx_kl | 0.035511594 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | -0.0815 | -| explained_variance | -4.55 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 55270 | -| policy_gradient_loss | -0.00753 | -| std | 0.262 | -| value_loss | 3.98e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5529 | -| time_elapsed | 40383 | -| total_timesteps | 707712 | -| train/ | | -| approx_kl | 0.015754268 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.0793 | -| explained_variance | -0.408 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 55280 | -| policy_gradient_loss | -0.00238 | -| std | 0.262 | -| value_loss | 4.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5530 | -| time_elapsed | 40387 | -| total_timesteps | 707840 | -| train/ | | -| approx_kl | 0.030597772 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | -0.0789 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 55290 | -| policy_gradient_loss | -0.0122 | -| std | 0.262 | -| value_loss | 3.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.766 | -| time/ | | -| fps | 17 | -| iterations | 5531 | -| time_elapsed | 40390 | -| total_timesteps | 707968 | -| train/ | | -| approx_kl | 0.022736486 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | -0.0787 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00671 | -| n_updates | 55300 | -| policy_gradient_loss | -0.00588 | -| std | 0.262 | -| value_loss | 2.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5532 | -| time_elapsed | 40393 | -| total_timesteps | 708096 | -| train/ | | -| approx_kl | 0.016277911 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | -0.0796 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 55310 | -| policy_gradient_loss | -0.00284 | -| std | 0.262 | -| value_loss | 8.43e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5533 | -| time_elapsed | 40399 | -| total_timesteps | 708224 | -| train/ | | -| approx_kl | 0.039529733 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.0812 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 55320 | -| policy_gradient_loss | -0.0172 | -| std | 0.263 | -| value_loss | 0.000177 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5534 | -| time_elapsed | 40402 | -| total_timesteps | 708352 | -| train/ | | -| approx_kl | 0.03180676 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.0823 | -| explained_variance | -7.19 | -| learning_rate | 0.0003 | -| loss | -0.00699 | -| n_updates | 55330 | -| policy_gradient_loss | -0.00577 | -| std | 0.263 | -| value_loss | 2.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5535 | -| time_elapsed | 40404 | -| total_timesteps | 708480 | -| train/ | | -| approx_kl | 0.028588336 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.0836 | -| explained_variance | -31.1 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 55340 | -| policy_gradient_loss | -0.0105 | -| std | 0.263 | -| value_loss | 3.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5536 | -| time_elapsed | 40408 | -| total_timesteps | 708608 | -| train/ | | -| approx_kl | 0.006592238 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.0848 | -| explained_variance | -2.99 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 55350 | -| policy_gradient_loss | -0.000301 | -| std | 0.264 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5537 | -| time_elapsed | 40411 | -| total_timesteps | 708736 | -| train/ | | -| approx_kl | 0.0056527825 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | -0.0866 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.000464 | -| n_updates | 55360 | -| policy_gradient_loss | -0.000255 | -| std | 0.264 | -| value_loss | 9.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5538 | -| time_elapsed | 40414 | -| total_timesteps | 708864 | -| train/ | | -| approx_kl | 0.014708163 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.0892 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 55370 | -| policy_gradient_loss | -0.00549 | -| std | 0.265 | -| value_loss | 9.88e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5539 | -| time_elapsed | 40416 | -| total_timesteps | 708992 | -| train/ | | -| approx_kl | 0.03625769 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | -0.0906 | -| explained_variance | 0.00309 | -| learning_rate | 0.0003 | -| loss | -0.00997 | -| n_updates | 55380 | -| policy_gradient_loss | -0.00941 | -| std | 0.265 | -| value_loss | 3.01e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5540 | -| time_elapsed | 40420 | -| total_timesteps | 709120 | -| train/ | | -| approx_kl | 0.00732541 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.0919 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.000412 | -| n_updates | 55390 | -| policy_gradient_loss | -0.000236 | -| std | 0.265 | -| value_loss | 7.46e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5541 | -| time_elapsed | 40430 | -| total_timesteps | 709248 | -| train/ | | -| approx_kl | 0.14009312 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.0927 | -| explained_variance | -9.2 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 55400 | -| policy_gradient_loss | -0.0177 | -| std | 0.266 | -| value_loss | 0.00262 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5542 | -| time_elapsed | 40435 | -| total_timesteps | 709376 | -| train/ | | -| approx_kl | 0.014013399 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.0932 | -| explained_variance | -212 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 55410 | -| policy_gradient_loss | -0.00824 | -| std | 0.266 | -| value_loss | 1.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5543 | -| time_elapsed | 40438 | -| total_timesteps | 709504 | -| train/ | | -| approx_kl | 0.018364664 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.0937 | -| explained_variance | -328 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 55420 | -| policy_gradient_loss | -0.00424 | -| std | 0.266 | -| value_loss | 4.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5544 | -| time_elapsed | 40440 | -| total_timesteps | 709632 | -| train/ | | -| approx_kl | 0.017991398 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.0928 | -| explained_variance | -27 | -| learning_rate | 0.0003 | -| loss | -0.000611 | -| n_updates | 55430 | -| policy_gradient_loss | -0.000559 | -| std | 0.265 | -| value_loss | 3.34e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5545 | -| time_elapsed | 40443 | -| total_timesteps | 709760 | -| train/ | | -| approx_kl | 0.0025293576 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.0897 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 55440 | -| policy_gradient_loss | -0.000145 | -| std | 0.264 | -| value_loss | 1.26e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 17 | -| iterations | 5546 | -| time_elapsed | 40445 | -| total_timesteps | 709888 | -| train/ | | -| approx_kl | 0.0076676584 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | -0.0868 | -| explained_variance | 0.000526 | -| learning_rate | 0.0003 | -| loss | 2.21e-05 | -| n_updates | 55450 | -| policy_gradient_loss | -0.00035 | -| std | 0.264 | -| value_loss | 1.18e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5547 | -| time_elapsed | 40448 | -| total_timesteps | 710016 | -| train/ | | -| approx_kl | 0.01712545 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.0853 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 55460 | -| policy_gradient_loss | -0.00384 | -| std | 0.263 | -| value_loss | 1.32e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5548 | -| time_elapsed | 40457 | -| total_timesteps | 710144 | -| train/ | | -| approx_kl | 0.09747541 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | -0.0835 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 55470 | -| policy_gradient_loss | -0.00455 | -| std | 0.263 | -| value_loss | 0.000171 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5549 | -| time_elapsed | 40460 | -| total_timesteps | 710272 | -| train/ | | -| approx_kl | 0.028080598 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.0817 | -| explained_variance | -206 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 55480 | -| policy_gradient_loss | -0.00214 | -| std | 0.263 | -| value_loss | 3.23e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5550 | -| time_elapsed | 40463 | -| total_timesteps | 710400 | -| train/ | | -| approx_kl | 0.0257255 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | -0.0817 | -| explained_variance | -214 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 55490 | -| policy_gradient_loss | -0.014 | -| std | 0.262 | -| value_loss | 1.13e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5551 | -| time_elapsed | 40466 | -| total_timesteps | 710528 | -| train/ | | -| approx_kl | 0.017718654 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | -0.0814 | -| explained_variance | -8.56 | -| learning_rate | 0.0003 | -| loss | -0.00052 | -| n_updates | 55500 | -| policy_gradient_loss | -0.000839 | -| std | 0.263 | -| value_loss | 1.19e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5552 | -| time_elapsed | 40468 | -| total_timesteps | 710656 | -| train/ | | -| approx_kl | 0.0350389 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | -0.082 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | -0.00941 | -| n_updates | 55510 | -| policy_gradient_loss | -0.00986 | -| std | 0.263 | -| value_loss | 1.93e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5553 | -| time_elapsed | 40472 | -| total_timesteps | 710784 | -| train/ | | -| approx_kl | 0.011702061 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.0829 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.000909 | -| n_updates | 55520 | -| policy_gradient_loss | -0.00148 | -| std | 0.263 | -| value_loss | 1.91e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 17 | -| iterations | 5554 | -| time_elapsed | 40476 | -| total_timesteps | 710912 | -| train/ | | -| approx_kl | 0.017353099 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.0834 | -| explained_variance | -0.0641 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 55530 | -| policy_gradient_loss | -0.00424 | -| std | 0.263 | -| value_loss | 1.23e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5555 | -| time_elapsed | 40480 | -| total_timesteps | 711040 | -| train/ | | -| approx_kl | 0.021165056 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | -0.0836 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 55540 | -| policy_gradient_loss | -0.00495 | -| std | 0.263 | -| value_loss | 1.67e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5556 | -| time_elapsed | 40488 | -| total_timesteps | 711168 | -| train/ | | -| approx_kl | 0.04089547 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | -0.0845 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0317 | -| n_updates | 55550 | -| policy_gradient_loss | -0.0167 | -| std | 0.263 | -| value_loss | 5.48e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5557 | -| time_elapsed | 40492 | -| total_timesteps | 711296 | -| train/ | | -| approx_kl | 0.021238806 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | -0.0852 | -| explained_variance | -26.2 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 55560 | -| policy_gradient_loss | -0.0111 | -| std | 0.264 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5558 | -| time_elapsed | 40496 | -| total_timesteps | 711424 | -| train/ | | -| approx_kl | 0.016578674 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.0856 | -| explained_variance | -743 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 55570 | -| policy_gradient_loss | -0.00758 | -| std | 0.264 | -| value_loss | 1.71e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5559 | -| time_elapsed | 40500 | -| total_timesteps | 711552 | -| train/ | | -| approx_kl | 0.05455631 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | -0.086 | -| explained_variance | -597 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 55580 | -| policy_gradient_loss | -0.0109 | -| std | 0.264 | -| value_loss | 9.75e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5560 | -| time_elapsed | 40503 | -| total_timesteps | 711680 | -| train/ | | -| approx_kl | 0.0032116594 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.0851 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 55590 | -| policy_gradient_loss | -0.000552 | -| std | 0.263 | -| value_loss | 1.89e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5561 | -| time_elapsed | 40507 | -| total_timesteps | 711808 | -| train/ | | -| approx_kl | 0.007386199 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.0819 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.000338 | -| n_updates | 55600 | -| policy_gradient_loss | -0.000462 | -| std | 0.262 | -| value_loss | 1.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5562 | -| time_elapsed | 40510 | -| total_timesteps | 711936 | -| train/ | | -| approx_kl | 0.037991825 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.0811 | -| explained_variance | -71.9 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 55610 | -| policy_gradient_loss | -0.00901 | -| std | 0.262 | -| value_loss | 5.96e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5563 | -| time_elapsed | 40513 | -| total_timesteps | 712064 | -| train/ | | -| approx_kl | 0.022171991 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | -0.0805 | -| explained_variance | -0.655 | -| learning_rate | 0.0003 | -| loss | -0.000997 | -| n_updates | 55620 | -| policy_gradient_loss | -0.00246 | -| std | 0.262 | -| value_loss | 1.33e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5564 | -| time_elapsed | 40519 | -| total_timesteps | 712192 | -| train/ | | -| approx_kl | 0.07906221 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | -0.0799 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0311 | -| n_updates | 55630 | -| policy_gradient_loss | -0.0223 | -| std | 0.262 | -| value_loss | 4.08e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5565 | -| time_elapsed | 40521 | -| total_timesteps | 712320 | -| train/ | | -| approx_kl | 0.05559134 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | -0.0803 | -| explained_variance | -21.9 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 55640 | -| policy_gradient_loss | -0.0053 | -| std | 0.262 | -| value_loss | 5.69e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5566 | -| time_elapsed | 40524 | -| total_timesteps | 712448 | -| train/ | | -| approx_kl | 0.008439671 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | -0.0801 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 55650 | -| policy_gradient_loss | -0.00225 | -| std | 0.262 | -| value_loss | 2.23e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5567 | -| time_elapsed | 40527 | -| total_timesteps | 712576 | -| train/ | | -| approx_kl | 0.00093906466 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.08 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 55660 | -| policy_gradient_loss | 0.00261 | -| std | 0.262 | -| value_loss | 9.04e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5568 | -| time_elapsed | 40531 | -| total_timesteps | 712704 | -| train/ | | -| approx_kl | 0.0031033824 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | -0.08 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 55670 | -| policy_gradient_loss | 0.00138 | -| std | 0.262 | -| value_loss | 6.32e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5569 | -| time_elapsed | 40534 | -| total_timesteps | 712832 | -| train/ | | -| approx_kl | 0.0016247681 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.0794 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.000197 | -| n_updates | 55680 | -| policy_gradient_loss | 0.000896 | -| std | 0.262 | -| value_loss | 5.03e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.756 | -| time/ | | -| fps | 17 | -| iterations | 5570 | -| time_elapsed | 40537 | -| total_timesteps | 712960 | -| train/ | | -| approx_kl | 0.011064056 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | -0.0787 | -| explained_variance | -0.00565 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 55690 | -| policy_gradient_loss | -0.00312 | -| std | 0.262 | -| value_loss | 4.98e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5571 | -| time_elapsed | 40541 | -| total_timesteps | 713088 | -| train/ | | -| approx_kl | 0.015959159 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | -0.0793 | -| explained_variance | -0.00216 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 55700 | -| policy_gradient_loss | -0.00329 | -| std | 0.262 | -| value_loss | 2.21e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5572 | -| time_elapsed | 40548 | -| total_timesteps | 713216 | -| train/ | | -| approx_kl | 0.17904712 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | -0.08 | -| explained_variance | 0.923 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 55710 | -| policy_gradient_loss | -0.0174 | -| std | 0.262 | -| value_loss | 0.000426 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5573 | -| time_elapsed | 40552 | -| total_timesteps | 713344 | -| train/ | | -| approx_kl | 0.0069609587 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | -0.0806 | -| explained_variance | -6.29e+03 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 55720 | -| policy_gradient_loss | -0.00102 | -| std | 0.262 | -| value_loss | 1.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5574 | -| time_elapsed | 40556 | -| total_timesteps | 713472 | -| train/ | | -| approx_kl | 0.0013940018 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0814 | -| explained_variance | -4.39e+03 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 55730 | -| policy_gradient_loss | 0.000443 | -| std | 0.263 | -| value_loss | 5.96e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5575 | -| time_elapsed | 40559 | -| total_timesteps | 713600 | -| train/ | | -| approx_kl | 0.0025858874 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0834 | -| explained_variance | -215 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 55740 | -| policy_gradient_loss | 0.000211 | -| std | 0.263 | -| value_loss | 2.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5576 | -| time_elapsed | 40561 | -| total_timesteps | 713728 | -| train/ | | -| approx_kl | 0.002019667 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0854 | -| explained_variance | -1.61 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 55750 | -| policy_gradient_loss | 0.00206 | -| std | 0.264 | -| value_loss | 1.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5577 | -| time_elapsed | 40565 | -| total_timesteps | 713856 | -| train/ | | -| approx_kl | 0.027954543 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | -0.0865 | -| explained_variance | -0.756 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 55760 | -| policy_gradient_loss | 0.00575 | -| std | 0.264 | -| value_loss | 3.94e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.747 | -| time/ | | -| fps | 17 | -| iterations | 5578 | -| time_elapsed | 40568 | -| total_timesteps | 713984 | -| train/ | | -| approx_kl | 0.010368234 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.0866 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.00215 | -| n_updates | 55770 | -| policy_gradient_loss | 1.81e-05 | -| std | 0.264 | -| value_loss | 9.16e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5579 | -| time_elapsed | 40573 | -| total_timesteps | 714112 | -| train/ | | -| approx_kl | 0.0019951435 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.0857 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 55780 | -| policy_gradient_loss | -0.00034 | -| std | 0.263 | -| value_loss | 4.3e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5580 | -| time_elapsed | 40582 | -| total_timesteps | 714240 | -| train/ | | -| approx_kl | 0.035250105 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | -0.0839 | -| explained_variance | -4.74 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 55790 | -| policy_gradient_loss | -0.00867 | -| std | 0.263 | -| value_loss | 0.00166 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5581 | -| time_elapsed | 40586 | -| total_timesteps | 714368 | -| train/ | | -| approx_kl | 0.026889052 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | -0.0832 | -| explained_variance | -3.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 55800 | -| policy_gradient_loss | -0.00172 | -| std | 0.263 | -| value_loss | 1.05e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5582 | -| time_elapsed | 40590 | -| total_timesteps | 714496 | -| train/ | | -| approx_kl | 0.04182647 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.0808 | -| explained_variance | -539 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 55810 | -| policy_gradient_loss | -0.00868 | -| std | 0.262 | -| value_loss | 4.74e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5583 | -| time_elapsed | 40592 | -| total_timesteps | 714624 | -| train/ | | -| approx_kl | 0.003759889 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.0792 | -| explained_variance | -8.83 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 55820 | -| policy_gradient_loss | 9.36e-05 | -| std | 0.262 | -| value_loss | 7.82e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5584 | -| time_elapsed | 40595 | -| total_timesteps | 714752 | -| train/ | | -| approx_kl | 0.02437102 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | -0.0777 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 55830 | -| policy_gradient_loss | -0.00117 | -| std | 0.261 | -| value_loss | 3e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.746 | -| time/ | | -| fps | 17 | -| iterations | 5585 | -| time_elapsed | 40597 | -| total_timesteps | 714880 | -| train/ | | -| approx_kl | 0.0025395504 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0769 | -| explained_variance | -0.00691 | -| learning_rate | 0.0003 | -| loss | -0.000835 | -| n_updates | 55840 | -| policy_gradient_loss | -0.000152 | -| std | 0.262 | -| value_loss | 3.28e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5586 | -| time_elapsed | 40599 | -| total_timesteps | 715008 | -| train/ | | -| approx_kl | 0.0139499195 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.0786 | -| explained_variance | 0.00257 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 55850 | -| policy_gradient_loss | -0.00348 | -| std | 0.262 | -| value_loss | 2.56e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5587 | -| time_elapsed | 40606 | -| total_timesteps | 715136 | -| train/ | | -| approx_kl | 0.041106164 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | -0.0797 | -| explained_variance | 0.692 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 55860 | -| policy_gradient_loss | -0.00493 | -| std | 0.262 | -| value_loss | 0.00342 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5588 | -| time_elapsed | 40609 | -| total_timesteps | 715264 | -| train/ | | -| approx_kl | 0.13243225 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | -0.0784 | -| explained_variance | -3.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 55870 | -| policy_gradient_loss | -0.0159 | -| std | 0.262 | -| value_loss | 1.3e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5589 | -| time_elapsed | 40612 | -| total_timesteps | 715392 | -| train/ | | -| approx_kl | 0.040712446 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | -0.0786 | -| explained_variance | -3.6e+03 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 55880 | -| policy_gradient_loss | -0.00177 | -| std | 0.262 | -| value_loss | 4.9e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5590 | -| time_elapsed | 40616 | -| total_timesteps | 715520 | -| train/ | | -| approx_kl | 0.0112542175 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | -0.0805 | -| explained_variance | -7.32 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 55890 | -| policy_gradient_loss | -0.00244 | -| std | 0.262 | -| value_loss | 1.14e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5591 | -| time_elapsed | 40620 | -| total_timesteps | 715648 | -| train/ | | -| approx_kl | 0.0006262935 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0814 | -| explained_variance | -373 | -| learning_rate | 0.0003 | -| loss | -0.000688 | -| n_updates | 55900 | -| policy_gradient_loss | 0.000711 | -| std | 0.262 | -| value_loss | 7.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5592 | -| time_elapsed | 40625 | -| total_timesteps | 715776 | -| train/ | | -| approx_kl | 0.015996631 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | -0.0807 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.000997 | -| n_updates | 55910 | -| policy_gradient_loss | 0.000579 | -| std | 0.262 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.734 | -| time/ | | -| fps | 17 | -| iterations | 5593 | -| time_elapsed | 40630 | -| total_timesteps | 715904 | -| train/ | | -| approx_kl | 0.017003084 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | -0.0804 | -| explained_variance | -4.65 | -| learning_rate | 0.0003 | -| loss | 8.22e-05 | -| n_updates | 55920 | -| policy_gradient_loss | -0.000772 | -| std | 0.262 | -| value_loss | 3.62e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5594 | -| time_elapsed | 40633 | -| total_timesteps | 716032 | -| train/ | | -| approx_kl | 0.0075790733 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | -0.0798 | -| explained_variance | 0.00488 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 55930 | -| policy_gradient_loss | -0.00081 | -| std | 0.262 | -| value_loss | 1.71e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5595 | -| time_elapsed | 40641 | -| total_timesteps | 716160 | -| train/ | | -| approx_kl | 0.05081851 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.0795 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.027 | -| n_updates | 55940 | -| policy_gradient_loss | -0.0168 | -| std | 0.262 | -| value_loss | 4.75e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5596 | -| time_elapsed | 40645 | -| total_timesteps | 716288 | -| train/ | | -| approx_kl | 0.0009427741 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0796 | -| explained_variance | -35.5 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 55950 | -| policy_gradient_loss | 0.00273 | -| std | 0.262 | -| value_loss | 1.59e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5597 | -| time_elapsed | 40649 | -| total_timesteps | 716416 | -| train/ | | -| approx_kl | 0.0029793177 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0797 | -| explained_variance | -78.6 | -| learning_rate | 0.0003 | -| loss | -0.00803 | -| n_updates | 55960 | -| policy_gradient_loss | 0.000744 | -| std | 0.262 | -| value_loss | 4.76e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5598 | -| time_elapsed | 40652 | -| total_timesteps | 716544 | -| train/ | | -| approx_kl | 9.732321e-05 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.0784 | -| explained_variance | -2.46 | -| learning_rate | 0.0003 | -| loss | -0.000787 | -| n_updates | 55970 | -| policy_gradient_loss | 0.000218 | -| std | 0.261 | -| value_loss | 3.11e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5599 | -| time_elapsed | 40653 | -| total_timesteps | 716672 | -| train/ | | -| approx_kl | 0.015134694 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.0733 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 55980 | -| policy_gradient_loss | -0.00323 | -| std | 0.26 | -| value_loss | 3.75e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5600 | -| time_elapsed | 40657 | -| total_timesteps | 716800 | -| train/ | | -| approx_kl | 0.011407074 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | -0.0706 | -| explained_variance | -0.00363 | -| learning_rate | 0.0003 | -| loss | 0.000489 | -| n_updates | 55990 | -| policy_gradient_loss | -0.000676 | -| std | 0.259 | -| value_loss | 2.26e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.737 | -| time/ | | -| fps | 17 | -| iterations | 5601 | -| time_elapsed | 40661 | -| total_timesteps | 716928 | -| train/ | | -| approx_kl | 0.02285208 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | -0.0696 | -| explained_variance | -0.075 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 56000 | -| policy_gradient_loss | -0.00556 | -| std | 0.259 | -| value_loss | 4.32e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5602 | -| time_elapsed | 40665 | -| total_timesteps | 717056 | -| train/ | | -| approx_kl | 0.012460599 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | -0.0692 | -| explained_variance | -0.00846 | -| learning_rate | 0.0003 | -| loss | -0.000192 | -| n_updates | 56010 | -| policy_gradient_loss | -0.00146 | -| std | 0.259 | -| value_loss | 2.79e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5603 | -| time_elapsed | 40670 | -| total_timesteps | 717184 | -| train/ | | -| approx_kl | 0.06687999 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | -0.0678 | -| explained_variance | 0.728 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 56020 | -| policy_gradient_loss | -0.00186 | -| std | 0.258 | -| value_loss | 0.00457 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5604 | -| time_elapsed | 40674 | -| total_timesteps | 717312 | -| train/ | | -| approx_kl | 0.045507893 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | -0.0647 | -| explained_variance | -827 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 56030 | -| policy_gradient_loss | -0.0102 | -| std | 0.258 | -| value_loss | 5.41e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5605 | -| time_elapsed | 40677 | -| total_timesteps | 717440 | -| train/ | | -| approx_kl | 0.02956938 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.0634 | -| explained_variance | -1.36e+03 | -| learning_rate | 0.0003 | -| loss | -0.00838 | -| n_updates | 56040 | -| policy_gradient_loss | -0.00346 | -| std | 0.258 | -| value_loss | 1.81e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5606 | -| time_elapsed | 40679 | -| total_timesteps | 717568 | -| train/ | | -| approx_kl | 7.71787e-06 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | -0.0635 | -| explained_variance | -66.7 | -| learning_rate | 0.0003 | -| loss | 0.000232 | -| n_updates | 56050 | -| policy_gradient_loss | 0.00325 | -| std | 0.258 | -| value_loss | 6.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5607 | -| time_elapsed | 40682 | -| total_timesteps | 717696 | -| train/ | | -| approx_kl | 0.031398848 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | -0.0639 | -| explained_variance | -22.4 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 56060 | -| policy_gradient_loss | -0.0136 | -| std | 0.258 | -| value_loss | 3.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5608 | -| time_elapsed | 40685 | -| total_timesteps | 717824 | -| train/ | | -| approx_kl | 0.012891555 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | -0.0641 | -| explained_variance | -2.89 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 56070 | -| policy_gradient_loss | -0.000847 | -| std | 0.258 | -| value_loss | 9.1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.736 | -| time/ | | -| fps | 17 | -| iterations | 5609 | -| time_elapsed | 40688 | -| total_timesteps | 717952 | -| train/ | | -| approx_kl | 0.016515031 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.0629 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 56080 | -| policy_gradient_loss | -0.00208 | -| std | 0.258 | -| value_loss | 5.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5610 | -| time_elapsed | 40692 | -| total_timesteps | 718080 | -| train/ | | -| approx_kl | 0.023478359 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | -0.0633 | -| explained_variance | -0.00608 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 56090 | -| policy_gradient_loss | -0.0145 | -| std | 0.258 | -| value_loss | 4.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5611 | -| time_elapsed | 40697 | -| total_timesteps | 718208 | -| train/ | | -| approx_kl | 0.046663698 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.0641 | -| explained_variance | -8 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 56100 | -| policy_gradient_loss | -0.0144 | -| std | 0.258 | -| value_loss | 0.005 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5612 | -| time_elapsed | 40700 | -| total_timesteps | 718336 | -| train/ | | -| approx_kl | 0.00124428 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0645 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 56110 | -| policy_gradient_loss | -3.42e-05 | -| std | 0.258 | -| value_loss | 4.05e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5613 | -| time_elapsed | 40704 | -| total_timesteps | 718464 | -| train/ | | -| approx_kl | 0.00222197 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0637 | -| explained_variance | -33.2 | -| learning_rate | 0.0003 | -| loss | 7.94e-05 | -| n_updates | 56120 | -| policy_gradient_loss | 4.8e-05 | -| std | 0.258 | -| value_loss | 7.51e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5614 | -| time_elapsed | 40707 | -| total_timesteps | 718592 | -| train/ | | -| approx_kl | 0.013614308 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.0625 | -| explained_variance | -0.0786 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 56130 | -| policy_gradient_loss | -0.00566 | -| std | 0.257 | -| value_loss | 4.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5615 | -| time_elapsed | 40710 | -| total_timesteps | 718720 | -| train/ | | -| approx_kl | 0.008503644 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | -0.0613 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | 0.00164 | -| n_updates | 56140 | -| policy_gradient_loss | 0.000199 | -| std | 0.257 | -| value_loss | 3.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5616 | -| time_elapsed | 40713 | -| total_timesteps | 718848 | -| train/ | | -| approx_kl | 0.017921971 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | -0.0595 | -| explained_variance | 0.00689 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 56150 | -| policy_gradient_loss | -0.00476 | -| std | 0.257 | -| value_loss | 1.78e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.743 | -| time/ | | -| fps | 17 | -| iterations | 5617 | -| time_elapsed | 40716 | -| total_timesteps | 718976 | -| train/ | | -| approx_kl | 0.006325569 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | -0.0582 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 56160 | -| policy_gradient_loss | -0.0014 | -| std | 0.256 | -| value_loss | 9.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5618 | -| time_elapsed | 40718 | -| total_timesteps | 719104 | -| train/ | | -| approx_kl | 0.010706709 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.0572 | -| explained_variance | 0.00339 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 56170 | -| policy_gradient_loss | -0.00169 | -| std | 0.256 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5619 | -| time_elapsed | 40726 | -| total_timesteps | 719232 | -| train/ | | -| approx_kl | 0.065338135 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | -0.0577 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 56180 | -| policy_gradient_loss | -0.0147 | -| std | 0.256 | -| value_loss | 0.00301 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5620 | -| time_elapsed | 40729 | -| total_timesteps | 719360 | -| train/ | | -| approx_kl | 0.0042114104 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.0584 | -| explained_variance | -137 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 56190 | -| policy_gradient_loss | 4.75e-05 | -| std | 0.257 | -| value_loss | 6.35e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5621 | -| time_elapsed | 40732 | -| total_timesteps | 719488 | -| train/ | | -| approx_kl | 0.022311406 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | -0.0591 | -| explained_variance | -233 | -| learning_rate | 0.0003 | -| loss | -0.000368 | -| n_updates | 56200 | -| policy_gradient_loss | -0.000785 | -| std | 0.257 | -| value_loss | 4.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5622 | -| time_elapsed | 40735 | -| total_timesteps | 719616 | -| train/ | | -| approx_kl | 0.050655358 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | -0.0597 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.00513 | -| n_updates | 56210 | -| policy_gradient_loss | -0.00706 | -| std | 0.257 | -| value_loss | 2.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5623 | -| time_elapsed | 40739 | -| total_timesteps | 719744 | -| train/ | | -| approx_kl | 0.01663804 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.0594 | -| explained_variance | -0.735 | -| learning_rate | 0.0003 | -| loss | -0.000725 | -| n_updates | 56220 | -| policy_gradient_loss | -0.0015 | -| std | 0.257 | -| value_loss | 4.75e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.739 | -| time/ | | -| fps | 17 | -| iterations | 5624 | -| time_elapsed | 40743 | -| total_timesteps | 719872 | -| train/ | | -| approx_kl | 0.02550485 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.0583 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 56230 | -| policy_gradient_loss | -0.00958 | -| std | 0.256 | -| value_loss | 6.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5625 | -| time_elapsed | 40747 | -| total_timesteps | 720000 | -| train/ | | -| approx_kl | 0.008432044 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.0583 | -| explained_variance | -0.00723 | -| learning_rate | 0.0003 | -| loss | 0.000116 | -| n_updates | 56240 | -| policy_gradient_loss | -0.00028 | -| std | 0.257 | -| value_loss | 8.99e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5626 | -| time_elapsed | 40750 | -| total_timesteps | 720128 | -| train/ | | -| approx_kl | 0.0076671564 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.0603 | -| explained_variance | 0.00309 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 56250 | -| policy_gradient_loss | 0.000184 | -| std | 0.257 | -| value_loss | 1.33e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5627 | -| time_elapsed | 40757 | -| total_timesteps | 720256 | -| train/ | | -| approx_kl | 0.018318264 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | -0.0615 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 56260 | -| policy_gradient_loss | -0.0135 | -| std | 0.257 | -| value_loss | 0.00196 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5628 | -| time_elapsed | 40761 | -| total_timesteps | 720384 | -| train/ | | -| approx_kl | 0.0246775 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.0612 | -| explained_variance | -3.17e+03 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 56270 | -| policy_gradient_loss | -0.0103 | -| std | 0.257 | -| value_loss | 4.91e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5629 | -| time_elapsed | 40764 | -| total_timesteps | 720512 | -| train/ | | -| approx_kl | 0.03657054 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | -0.0611 | -| explained_variance | -2.81e+03 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 56280 | -| policy_gradient_loss | -0.0019 | -| std | 0.257 | -| value_loss | 2.21e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5630 | -| time_elapsed | 40768 | -| total_timesteps | 720640 | -| train/ | | -| approx_kl | 0.08251956 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | -0.0623 | -| explained_variance | -27.5 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 56290 | -| policy_gradient_loss | -0.0121 | -| std | 0.258 | -| value_loss | 3.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5631 | -| time_elapsed | 40770 | -| total_timesteps | 720768 | -| train/ | | -| approx_kl | 0.029287152 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.0635 | -| explained_variance | -128 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 56300 | -| policy_gradient_loss | -0.00632 | -| std | 0.258 | -| value_loss | 3.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 17 | -| iterations | 5632 | -| time_elapsed | 40772 | -| total_timesteps | 720896 | -| train/ | | -| approx_kl | 0.008076841 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | -0.0649 | -| explained_variance | -3.95 | -| learning_rate | 0.0003 | -| loss | 0.000574 | -| n_updates | 56310 | -| policy_gradient_loss | -0.000165 | -| std | 0.259 | -| value_loss | 1.82e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5633 | -| time_elapsed | 40774 | -| total_timesteps | 721024 | -| train/ | | -| approx_kl | 0.023305053 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | -0.0666 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 56320 | -| policy_gradient_loss | -0.0109 | -| std | 0.259 | -| value_loss | 1.68e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5634 | -| time_elapsed | 40783 | -| total_timesteps | 721152 | -| train/ | | -| approx_kl | 0.06524076 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.0671 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0353 | -| n_updates | 56330 | -| policy_gradient_loss | -0.0205 | -| std | 0.259 | -| value_loss | 8.7e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5635 | -| time_elapsed | 40787 | -| total_timesteps | 721280 | -| train/ | | -| approx_kl | 0.04368301 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | -0.0671 | -| explained_variance | -43.9 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 56340 | -| policy_gradient_loss | -0.00942 | -| std | 0.259 | -| value_loss | 1.51e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5636 | -| time_elapsed | 40791 | -| total_timesteps | 721408 | -| train/ | | -| approx_kl | 0.0010876134 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0666 | -| explained_variance | -120 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 56350 | -| policy_gradient_loss | 0.00264 | -| std | 0.259 | -| value_loss | 4.89e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5637 | -| time_elapsed | 40795 | -| total_timesteps | 721536 | -| train/ | | -| approx_kl | 0.0028983261 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0664 | -| explained_variance | -8.26 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 56360 | -| policy_gradient_loss | 0.000251 | -| std | 0.259 | -| value_loss | 4.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5638 | -| time_elapsed | 40798 | -| total_timesteps | 721664 | -| train/ | | -| approx_kl | 0.0020677499 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.066 | -| explained_variance | -0.568 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 56370 | -| policy_gradient_loss | 0.00114 | -| std | 0.258 | -| value_loss | 2.33e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5639 | -| time_elapsed | 40802 | -| total_timesteps | 721792 | -| train/ | | -| approx_kl | 0.0076509244 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.0652 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -2.61e-05 | -| n_updates | 56380 | -| policy_gradient_loss | 0.0014 | -| std | 0.258 | -| value_loss | 4.26e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.76 | -| time/ | | -| fps | 17 | -| iterations | 5640 | -| time_elapsed | 40807 | -| total_timesteps | 721920 | -| train/ | | -| approx_kl | 0.0030793473 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | -0.0624 | -| explained_variance | -0.000475 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 56390 | -| policy_gradient_loss | -0.000764 | -| std | 0.257 | -| value_loss | 1.06e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5641 | -| time_elapsed | 40811 | -| total_timesteps | 722048 | -| train/ | | -| approx_kl | 0.0019603367 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | -0.0566 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.000107 | -| n_updates | 56400 | -| policy_gradient_loss | 9.32e-05 | -| std | 0.256 | -| value_loss | 1.5e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5642 | -| time_elapsed | 40818 | -| total_timesteps | 722176 | -| train/ | | -| approx_kl | 0.04196647 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | -0.0542 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 56410 | -| policy_gradient_loss | -0.0153 | -| std | 0.255 | -| value_loss | 0.00326 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5643 | -| time_elapsed | 40822 | -| total_timesteps | 722304 | -| train/ | | -| approx_kl | 0.022352979 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.0529 | -| explained_variance | -4.41e+03 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 56420 | -| policy_gradient_loss | -0.00152 | -| std | 0.255 | -| value_loss | 1.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5644 | -| time_elapsed | 40826 | -| total_timesteps | 722432 | -| train/ | | -| approx_kl | 0.015577132 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.0496 | -| explained_variance | -8.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 56430 | -| policy_gradient_loss | -0.00101 | -| std | 0.254 | -| value_loss | 3.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5645 | -| time_elapsed | 40829 | -| total_timesteps | 722560 | -| train/ | | -| approx_kl | 0.020146297 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | -0.0458 | -| explained_variance | -28.4 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 56440 | -| policy_gradient_loss | -0.00183 | -| std | 0.253 | -| value_loss | 2.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5646 | -| time_elapsed | 40831 | -| total_timesteps | 722688 | -| train/ | | -| approx_kl | 0.009563971 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.0455 | -| explained_variance | -245 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 56450 | -| policy_gradient_loss | -0.000485 | -| std | 0.254 | -| value_loss | 2.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5647 | -| time_elapsed | 40835 | -| total_timesteps | 722816 | -| train/ | | -| approx_kl | 0.013500992 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | -0.0478 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.000494 | -| n_updates | 56460 | -| policy_gradient_loss | -0.00044 | -| std | 0.254 | -| value_loss | 1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.763 | -| time/ | | -| fps | 17 | -| iterations | 5648 | -| time_elapsed | 40838 | -| total_timesteps | 722944 | -| train/ | | -| approx_kl | 0.017123312 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.0459 | -| explained_variance | -0.454 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 56470 | -| policy_gradient_loss | -0.00768 | -| std | 0.253 | -| value_loss | 4.23e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5649 | -| time_elapsed | 40840 | -| total_timesteps | 723072 | -| train/ | | -| approx_kl | 0.021916926 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | -0.0443 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | 0.00258 | -| n_updates | 56480 | -| policy_gradient_loss | -2.44e-05 | -| std | 0.253 | -| value_loss | 9.51e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5650 | -| time_elapsed | 40846 | -| total_timesteps | 723200 | -| train/ | | -| approx_kl | 0.030967575 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.0429 | -| explained_variance | 0.663 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 56490 | -| policy_gradient_loss | -0.0161 | -| std | 0.252 | -| value_loss | 0.00109 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5651 | -| time_elapsed | 40849 | -| total_timesteps | 723328 | -| train/ | | -| approx_kl | 0.0047691083 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.0419 | -| explained_variance | -40.6 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 56500 | -| policy_gradient_loss | -4.7e-05 | -| std | 0.252 | -| value_loss | 7.35e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5652 | -| time_elapsed | 40853 | -| total_timesteps | 723456 | -| train/ | | -| approx_kl | 0.0021467935 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.042 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 56510 | -| policy_gradient_loss | 0.00121 | -| std | 0.252 | -| value_loss | 3.61e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5653 | -| time_elapsed | 40856 | -| total_timesteps | 723584 | -| train/ | | -| approx_kl | 1.9231811e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0423 | -| explained_variance | -44.6 | -| learning_rate | 0.0003 | -| loss | -0.00016 | -| n_updates | 56520 | -| policy_gradient_loss | 0.000442 | -| std | 0.253 | -| value_loss | 5.31e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5654 | -| time_elapsed | 40858 | -| total_timesteps | 723712 | -| train/ | | -| approx_kl | 0.022768008 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.0448 | -| explained_variance | -3.28 | -| learning_rate | 0.0003 | -| loss | 0.000265 | -| n_updates | 56530 | -| policy_gradient_loss | -0.000529 | -| std | 0.253 | -| value_loss | 8.4e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5655 | -| time_elapsed | 40861 | -| total_timesteps | 723840 | -| train/ | | -| approx_kl | 0.012275744 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | -0.0467 | -| explained_variance | -0.262 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 56540 | -| policy_gradient_loss | -0.00229 | -| std | 0.254 | -| value_loss | 8.69e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.757 | -| time/ | | -| fps | 17 | -| iterations | 5656 | -| time_elapsed | 40864 | -| total_timesteps | 723968 | -| train/ | | -| approx_kl | 0.01959946 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | -0.0474 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 56550 | -| policy_gradient_loss | -0.00514 | -| std | 0.254 | -| value_loss | 4.88e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5657 | -| time_elapsed | 40868 | -| total_timesteps | 724096 | -| train/ | | -| approx_kl | 0.02608443 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | -0.0467 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 56560 | -| policy_gradient_loss | -0.0115 | -| std | 0.253 | -| value_loss | 1.11e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5658 | -| time_elapsed | 40875 | -| total_timesteps | 724224 | -| train/ | | -| approx_kl | 0.1657442 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | -0.0452 | -| explained_variance | 0.732 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 56570 | -| policy_gradient_loss | -0.0111 | -| std | 0.253 | -| value_loss | 0.00484 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5659 | -| time_elapsed | 40878 | -| total_timesteps | 724352 | -| train/ | | -| approx_kl | 0.027404731 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | -0.0434 | -| explained_variance | -1.39e+03 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 56580 | -| policy_gradient_loss | -0.0131 | -| std | 0.252 | -| value_loss | 1.46e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5660 | -| time_elapsed | 40883 | -| total_timesteps | 724480 | -| train/ | | -| approx_kl | 0.06845073 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | -0.042 | -| explained_variance | -877 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 56590 | -| policy_gradient_loss | -0.00712 | -| std | 0.252 | -| value_loss | 3.68e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5661 | -| time_elapsed | 40886 | -| total_timesteps | 724608 | -| train/ | | -| approx_kl | 0.09916486 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | -0.0415 | -| explained_variance | -20.5 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 56600 | -| policy_gradient_loss | -0.00662 | -| std | 0.252 | -| value_loss | 8.32e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5662 | -| time_elapsed | 40890 | -| total_timesteps | 724736 | -| train/ | | -| approx_kl | 0.013295766 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | -0.0404 | -| explained_variance | -0.899 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 56610 | -| policy_gradient_loss | -0.00248 | -| std | 0.252 | -| value_loss | 1.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5663 | -| time_elapsed | 40893 | -| total_timesteps | 724864 | -| train/ | | -| approx_kl | 0.017075641 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | -0.0377 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 56620 | -| policy_gradient_loss | -0.0026 | -| std | 0.251 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.749 | -| time/ | | -| fps | 17 | -| iterations | 5664 | -| time_elapsed | 40896 | -| total_timesteps | 724992 | -| train/ | | -| approx_kl | 0.0059834444 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.0353 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 56630 | -| policy_gradient_loss | -0.00121 | -| std | 0.25 | -| value_loss | 3.32e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5665 | -| time_elapsed | 40900 | -| total_timesteps | 725120 | -| train/ | | -| approx_kl | 0.017062578 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | -0.0331 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 56640 | -| policy_gradient_loss | -0.00572 | -| std | 0.25 | -| value_loss | 2.06e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5666 | -| time_elapsed | 40909 | -| total_timesteps | 725248 | -| train/ | | -| approx_kl | 1.1032006 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | -0.0317 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 56650 | -| policy_gradient_loss | -0.00979 | -| std | 0.25 | -| value_loss | 0.000505 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5667 | -| time_elapsed | 40913 | -| total_timesteps | 725376 | -| train/ | | -| approx_kl | 0.061523944 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | -0.0303 | -| explained_variance | -53 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 56660 | -| policy_gradient_loss | -0.00502 | -| std | 0.249 | -| value_loss | 2.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5668 | -| time_elapsed | 40917 | -| total_timesteps | 725504 | -| train/ | | -| approx_kl | 0.014594809 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.0299 | -| explained_variance | -95.1 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 56670 | -| policy_gradient_loss | -0.00252 | -| std | 0.249 | -| value_loss | 5.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5669 | -| time_elapsed | 40921 | -| total_timesteps | 725632 | -| train/ | | -| approx_kl | 0.0014973865 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0277 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.00064 | -| n_updates | 56680 | -| policy_gradient_loss | -0.000302 | -| std | 0.248 | -| value_loss | 1.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5670 | -| time_elapsed | 40924 | -| total_timesteps | 725760 | -| train/ | | -| approx_kl | 0.015661642 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | -0.0231 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 56690 | -| policy_gradient_loss | -0.00344 | -| std | 0.247 | -| value_loss | 9.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.752 | -| time/ | | -| fps | 17 | -| iterations | 5671 | -| time_elapsed | 40926 | -| total_timesteps | 725888 | -| train/ | | -| approx_kl | 0.0005458514 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0214 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | -0.00022 | -| n_updates | 56700 | -| policy_gradient_loss | -7.59e-06 | -| std | 0.247 | -| value_loss | 1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5672 | -| time_elapsed | 40929 | -| total_timesteps | 726016 | -| train/ | | -| approx_kl | 0.013250104 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | -0.0217 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 56710 | -| policy_gradient_loss | -0.000936 | -| std | 0.247 | -| value_loss | 6.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5673 | -| time_elapsed | 40938 | -| total_timesteps | 726144 | -| train/ | | -| approx_kl | 0.03698689 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | -0.0212 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.0261 | -| n_updates | 56720 | -| policy_gradient_loss | -0.0214 | -| std | 0.247 | -| value_loss | 5.62e-05 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5674 | -| time_elapsed | 40943 | -| total_timesteps | 726272 | -| train/ | | -| approx_kl | 1.108996 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.0202 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.0251 | -| n_updates | 56730 | -| policy_gradient_loss | -0.0111 | -| std | 0.247 | -| value_loss | 1.91e-07 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5675 | -| time_elapsed | 40947 | -| total_timesteps | 726400 | -| train/ | | -| approx_kl | 0.00012582308 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0201 | -| explained_variance | -7.43 | -| learning_rate | 0.0003 | -| loss | 6.96e-05 | -| n_updates | 56740 | -| policy_gradient_loss | 0.000109 | -| std | 0.247 | -| value_loss | 3.09e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5676 | -| time_elapsed | 40950 | -| total_timesteps | 726528 | -| train/ | | -| approx_kl | 0.012417772 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | -0.0209 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 56750 | -| policy_gradient_loss | 0.000197 | -| std | 0.247 | -| value_loss | 1.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5677 | -| time_elapsed | 40954 | -| total_timesteps | 726656 | -| train/ | | -| approx_kl | 0.016009824 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | -0.022 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 56760 | -| policy_gradient_loss | -0.0081 | -| std | 0.247 | -| value_loss | 8.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5678 | -| time_elapsed | 40957 | -| total_timesteps | 726784 | -| train/ | | -| approx_kl | 0.01699819 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | -0.0225 | -| explained_variance | -0.0922 | -| learning_rate | 0.0003 | -| loss | -0.00647 | -| n_updates | 56770 | -| policy_gradient_loss | -0.00553 | -| std | 0.248 | -| value_loss | 8.61e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.759 | -| time/ | | -| fps | 17 | -| iterations | 5679 | -| time_elapsed | 40961 | -| total_timesteps | 726912 | -| train/ | | -| approx_kl | 0.015610812 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.0229 | -| explained_variance | -0.00507 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 56780 | -| policy_gradient_loss | -0.00338 | -| std | 0.248 | -| value_loss | 7.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5680 | -| time_elapsed | 40964 | -| total_timesteps | 727040 | -| train/ | | -| approx_kl | 0.016213354 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.0235 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 56790 | -| policy_gradient_loss | -0.00714 | -| std | 0.248 | -| value_loss | 4.77e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5681 | -| time_elapsed | 40970 | -| total_timesteps | 727168 | -| train/ | | -| approx_kl | 0.013641476 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.0228 | -| explained_variance | 0.595 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 56800 | -| policy_gradient_loss | -0.00966 | -| std | 0.247 | -| value_loss | 0.00482 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5682 | -| time_elapsed | 40973 | -| total_timesteps | 727296 | -| train/ | | -| approx_kl | 0.49536172 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | -0.0215 | -| explained_variance | -16.8 | -| learning_rate | 0.0003 | -| loss | -0.00993 | -| n_updates | 56810 | -| policy_gradient_loss | -0.0049 | -| std | 0.247 | -| value_loss | 4.03e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5683 | -| time_elapsed | 40976 | -| total_timesteps | 727424 | -| train/ | | -| approx_kl | 0.011451509 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | -0.0209 | -| explained_variance | -20.8 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 56820 | -| policy_gradient_loss | -0.00309 | -| std | 0.247 | -| value_loss | 5.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5684 | -| time_elapsed | 40979 | -| total_timesteps | 727552 | -| train/ | | -| approx_kl | 0.036299147 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | -0.0205 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 56830 | -| policy_gradient_loss | -0.00723 | -| std | 0.247 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5685 | -| time_elapsed | 40982 | -| total_timesteps | 727680 | -| train/ | | -| approx_kl | 0.0153928865 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | -0.02 | -| explained_variance | -0.433 | -| learning_rate | 0.0003 | -| loss | 0.000423 | -| n_updates | 56840 | -| policy_gradient_loss | -0.000652 | -| std | 0.247 | -| value_loss | 7.84e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5686 | -| time_elapsed | 40985 | -| total_timesteps | 727808 | -| train/ | | -| approx_kl | 0.0138722835 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | -0.0193 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.00545 | -| n_updates | 56850 | -| policy_gradient_loss | -0.00346 | -| std | 0.247 | -| value_loss | 5e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5687 | -| time_elapsed | 40989 | -| total_timesteps | 727936 | -| train/ | | -| approx_kl | 0.017809052 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | -0.0188 | -| explained_variance | 0.00119 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 56860 | -| policy_gradient_loss | -0.00151 | -| std | 0.247 | -| value_loss | 6.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5688 | -| time_elapsed | 40992 | -| total_timesteps | 728064 | -| train/ | | -| approx_kl | 0.0060586617 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | -0.0187 | -| explained_variance | -0.00204 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 56870 | -| policy_gradient_loss | -0.004 | -| std | 0.247 | -| value_loss | 5.37e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5689 | -| time_elapsed | 40997 | -| total_timesteps | 728192 | -| train/ | | -| approx_kl | 2.3379292 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | -0.0189 | -| explained_variance | 0.942 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 56880 | -| policy_gradient_loss | -0.0106 | -| std | 0.247 | -| value_loss | 0.000434 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5690 | -| time_elapsed | 41000 | -| total_timesteps | 728320 | -| train/ | | -| approx_kl | 0.004133647 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.0184 | -| explained_variance | -2.99 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 56890 | -| policy_gradient_loss | -5.66e-06 | -| std | 0.246 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5691 | -| time_elapsed | 41002 | -| total_timesteps | 728448 | -| train/ | | -| approx_kl | 0.0019355449 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0186 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 56900 | -| policy_gradient_loss | 0.000852 | -| std | 0.247 | -| value_loss | 4.9e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5692 | -| time_elapsed | 41005 | -| total_timesteps | 728576 | -| train/ | | -| approx_kl | 0.022699043 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | -0.0194 | -| explained_variance | -0.49 | -| learning_rate | 0.0003 | -| loss | 0.00412 | -| n_updates | 56910 | -| policy_gradient_loss | 0.00151 | -| std | 0.247 | -| value_loss | 5.32e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5693 | -| time_elapsed | 41008 | -| total_timesteps | 728704 | -| train/ | | -| approx_kl | 0.0011614459 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | -0.0218 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 56920 | -| policy_gradient_loss | -0.000674 | -| std | 0.248 | -| value_loss | 1.25e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5694 | -| time_elapsed | 41012 | -| total_timesteps | 728832 | -| train/ | | -| approx_kl | 0.01301302 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | -0.0252 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 56930 | -| policy_gradient_loss | -0.000796 | -| std | 0.248 | -| value_loss | 3.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.758 | -| time/ | | -| fps | 17 | -| iterations | 5695 | -| time_elapsed | 41015 | -| total_timesteps | 728960 | -| train/ | | -| approx_kl | 0.024942072 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | -0.0263 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 56940 | -| policy_gradient_loss | -0.0101 | -| std | 0.249 | -| value_loss | 1.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5696 | -| time_elapsed | 41018 | -| total_timesteps | 729088 | -| train/ | | -| approx_kl | 0.005994114 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | -0.0274 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00076 | -| n_updates | 56950 | -| policy_gradient_loss | -0.000288 | -| std | 0.249 | -| value_loss | 3.58e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5697 | -| time_elapsed | 41025 | -| total_timesteps | 729216 | -| train/ | | -| approx_kl | 6.0404286 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | -0.0295 | -| explained_variance | -2.46 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 56960 | -| policy_gradient_loss | -0.00404 | -| std | 0.249 | -| value_loss | 0.0032 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5698 | -| time_elapsed | 41029 | -| total_timesteps | 729344 | -| train/ | | -| approx_kl | 0.030154303 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | -0.03 | -| explained_variance | -414 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 56970 | -| policy_gradient_loss | -0.00737 | -| std | 0.249 | -| value_loss | 8.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5699 | -| time_elapsed | 41032 | -| total_timesteps | 729472 | -| train/ | | -| approx_kl | 0.0081752045 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | -0.0306 | -| explained_variance | -186 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 56980 | -| policy_gradient_loss | 0.00116 | -| std | 0.25 | -| value_loss | 3.19e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5700 | -| time_elapsed | 41035 | -| total_timesteps | 729600 | -| train/ | | -| approx_kl | 0.022580456 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | -0.0311 | -| explained_variance | -6.09 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 56990 | -| policy_gradient_loss | -0.0031 | -| std | 0.25 | -| value_loss | 1.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5701 | -| time_elapsed | 41039 | -| total_timesteps | 729728 | -| train/ | | -| approx_kl | 0.015869914 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | -0.0304 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.000481 | -| n_updates | 57000 | -| policy_gradient_loss | -0.00115 | -| std | 0.249 | -| value_loss | 3.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5702 | -| time_elapsed | 41042 | -| total_timesteps | 729856 | -| train/ | | -| approx_kl | 0.03767253 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | -0.0298 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 57010 | -| policy_gradient_loss | -0.014 | -| std | 0.249 | -| value_loss | 4.99e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.754 | -| time/ | | -| fps | 17 | -| iterations | 5703 | -| time_elapsed | 41045 | -| total_timesteps | 729984 | -| train/ | | -| approx_kl | 0.014833834 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | -0.0297 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 57020 | -| policy_gradient_loss | -0.00351 | -| std | 0.249 | -| value_loss | 4.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5704 | -| time_elapsed | 41048 | -| total_timesteps | 730112 | -| train/ | | -| approx_kl | 0.018293224 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | -0.0301 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.000183 | -| n_updates | 57030 | -| policy_gradient_loss | -0.00184 | -| std | 0.249 | -| value_loss | 1.06e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5705 | -| time_elapsed | 41058 | -| total_timesteps | 730240 | -| train/ | | -| approx_kl | 0.39697006 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | -0.0301 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 57040 | -| policy_gradient_loss | -0.00882 | -| std | 0.249 | -| value_loss | 0.00181 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5706 | -| time_elapsed | 41061 | -| total_timesteps | 730368 | -| train/ | | -| approx_kl | 0.051088862 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | -0.0291 | -| explained_variance | -278 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 57050 | -| policy_gradient_loss | -0.0126 | -| std | 0.249 | -| value_loss | 4.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5707 | -| time_elapsed | 41064 | -| total_timesteps | 730496 | -| train/ | | -| approx_kl | 0.03458164 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | -0.0283 | -| explained_variance | -595 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 57060 | -| policy_gradient_loss | -0.0134 | -| std | 0.249 | -| value_loss | 2.52e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5708 | -| time_elapsed | 41067 | -| total_timesteps | 730624 | -| train/ | | -| approx_kl | 0.04198139 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | -0.0281 | -| explained_variance | -32.3 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 57070 | -| policy_gradient_loss | -0.00561 | -| std | 0.249 | -| value_loss | 1.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5709 | -| time_elapsed | 41071 | -| total_timesteps | 730752 | -| train/ | | -| approx_kl | 0.013931091 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.0287 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | 0.000956 | -| n_updates | 57080 | -| policy_gradient_loss | -0.00109 | -| std | 0.249 | -| value_loss | 4.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.753 | -| time/ | | -| fps | 17 | -| iterations | 5710 | -| time_elapsed | 41075 | -| total_timesteps | 730880 | -| train/ | | -| approx_kl | 0.024896871 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | -0.0298 | -| explained_variance | -2.9 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 57090 | -| policy_gradient_loss | -0.00962 | -| std | 0.249 | -| value_loss | 4.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5711 | -| time_elapsed | 41079 | -| total_timesteps | 731008 | -| train/ | | -| approx_kl | 0.037932083 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | -0.0294 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 57100 | -| policy_gradient_loss | -0.00976 | -| std | 0.249 | -| value_loss | 3.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5712 | -| time_elapsed | 41089 | -| total_timesteps | 731136 | -| train/ | | -| approx_kl | 0.028938785 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | -0.029 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | -0.0299 | -| n_updates | 57110 | -| policy_gradient_loss | -0.0213 | -| std | 0.249 | -| value_loss | 0.00326 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5713 | -| time_elapsed | 41092 | -| total_timesteps | 731264 | -| train/ | | -| approx_kl | 0.55680317 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | -0.0289 | -| explained_variance | -255 | -| learning_rate | 0.0003 | -| loss | -0.0265 | -| n_updates | 57120 | -| policy_gradient_loss | -0.0176 | -| std | 0.249 | -| value_loss | 3.74e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5714 | -| time_elapsed | 41095 | -| total_timesteps | 731392 | -| train/ | | -| approx_kl | 0.007053649 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | -0.0288 | -| explained_variance | -29.2 | -| learning_rate | 0.0003 | -| loss | -0.00953 | -| n_updates | 57130 | -| policy_gradient_loss | -0.00705 | -| std | 0.249 | -| value_loss | 8.85e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5715 | -| time_elapsed | 41099 | -| total_timesteps | 731520 | -| train/ | | -| approx_kl | 0.03516685 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | -0.0283 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 57140 | -| policy_gradient_loss | -0.0118 | -| std | 0.249 | -| value_loss | 0.000163 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5716 | -| time_elapsed | 41101 | -| total_timesteps | 731648 | -| train/ | | -| approx_kl | 0.021807626 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.0275 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00091 | -| n_updates | 57150 | -| policy_gradient_loss | -0.00224 | -| std | 0.248 | -| value_loss | 9.19e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5717 | -| time_elapsed | 41104 | -| total_timesteps | 731776 | -| train/ | | -| approx_kl | 0.02389411 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | -0.0257 | -| explained_variance | -0.00799 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 57160 | -| policy_gradient_loss | -0.00953 | -| std | 0.248 | -| value_loss | 5.79e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.761 | -| time/ | | -| fps | 17 | -| iterations | 5718 | -| time_elapsed | 41107 | -| total_timesteps | 731904 | -| train/ | | -| approx_kl | 0.0046416856 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | -0.0246 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | -0.000809 | -| n_updates | 57170 | -| policy_gradient_loss | -0.000523 | -| std | 0.248 | -| value_loss | 1.25e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5719 | -| time_elapsed | 41110 | -| total_timesteps | 732032 | -| train/ | | -| approx_kl | 0.011470573 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.0219 | -| explained_variance | -0.00556 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 57180 | -| policy_gradient_loss | -0.00144 | -| std | 0.247 | -| value_loss | 1.49e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5720 | -| time_elapsed | 41118 | -| total_timesteps | 732160 | -| train/ | | -| approx_kl | 0.24901898 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.0215 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 57190 | -| policy_gradient_loss | -0.018 | -| std | 0.247 | -| value_loss | 0.00145 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5721 | -| time_elapsed | 41121 | -| total_timesteps | 732288 | -| train/ | | -| approx_kl | 0.026377864 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | -0.0223 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 57200 | -| policy_gradient_loss | -0.00175 | -| std | 0.248 | -| value_loss | 2.47e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5722 | -| time_elapsed | 41123 | -| total_timesteps | 732416 | -| train/ | | -| approx_kl | 0.00026749307 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0252 | -| explained_variance | -331 | -| learning_rate | 0.0003 | -| loss | -0.000475 | -| n_updates | 57210 | -| policy_gradient_loss | -0.000171 | -| std | 0.249 | -| value_loss | 8.07e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5723 | -| time_elapsed | 41126 | -| total_timesteps | 732544 | -| train/ | | -| approx_kl | 0.037025724 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | -0.0289 | -| explained_variance | -3.21 | -| learning_rate | 0.0003 | -| loss | -0.00816 | -| n_updates | 57220 | -| policy_gradient_loss | -0.00864 | -| std | 0.249 | -| value_loss | 9.96e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5724 | -| time_elapsed | 41130 | -| total_timesteps | 732672 | -| train/ | | -| approx_kl | 0.0063360734 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | -0.0292 | -| explained_variance | -0.474 | -| learning_rate | 0.0003 | -| loss | 0.000208 | -| n_updates | 57230 | -| policy_gradient_loss | 0.000111 | -| std | 0.249 | -| value_loss | 2.28e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5725 | -| time_elapsed | 41133 | -| total_timesteps | 732800 | -| train/ | | -| approx_kl | 0.047498755 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | -0.0281 | -| explained_variance | -0.585 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 57240 | -| policy_gradient_loss | -0.0139 | -| std | 0.249 | -| value_loss | 2.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.773 | -| time/ | | -| fps | 17 | -| iterations | 5726 | -| time_elapsed | 41135 | -| total_timesteps | 732928 | -| train/ | | -| approx_kl | 0.007994738 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | -0.0273 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 57250 | -| policy_gradient_loss | -0.00248 | -| std | 0.249 | -| value_loss | 6.53e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5727 | -| time_elapsed | 41138 | -| total_timesteps | 733056 | -| train/ | | -| approx_kl | 0.01553312 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | -0.0267 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00477 | -| n_updates | 57260 | -| policy_gradient_loss | -0.00255 | -| std | 0.248 | -| value_loss | 3.71e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5728 | -| time_elapsed | 41142 | -| total_timesteps | 733184 | -| train/ | | -| approx_kl | 1.3052248 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | -0.0264 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 57270 | -| policy_gradient_loss | -0.0151 | -| std | 0.248 | -| value_loss | 0.00401 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5729 | -| time_elapsed | 41145 | -| total_timesteps | 733312 | -| train/ | | -| approx_kl | 0.014426761 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | -0.0258 | -| explained_variance | -201 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 57280 | -| policy_gradient_loss | -0.000937 | -| std | 0.248 | -| value_loss | 1.89e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5730 | -| time_elapsed | 41150 | -| total_timesteps | 733440 | -| train/ | | -| approx_kl | 0.044098955 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | -0.0237 | -| explained_variance | -312 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 57290 | -| policy_gradient_loss | -0.0138 | -| std | 0.248 | -| value_loss | 5.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5731 | -| time_elapsed | 41154 | -| total_timesteps | 733568 | -| train/ | | -| approx_kl | 0.034027472 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | -0.0226 | -| explained_variance | -3.3 | -| learning_rate | 0.0003 | -| loss | 0.000585 | -| n_updates | 57300 | -| policy_gradient_loss | -0.00148 | -| std | 0.247 | -| value_loss | 4.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5732 | -| time_elapsed | 41157 | -| total_timesteps | 733696 | -| train/ | | -| approx_kl | 0.03211918 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | -0.0227 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 57310 | -| policy_gradient_loss | -0.00625 | -| std | 0.248 | -| value_loss | 2.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5733 | -| time_elapsed | 41161 | -| total_timesteps | 733824 | -| train/ | | -| approx_kl | 0.014408004 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | -0.0233 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 57320 | -| policy_gradient_loss | -0.00261 | -| std | 0.248 | -| value_loss | 3.69e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.777 | -| time/ | | -| fps | 17 | -| iterations | 5734 | -| time_elapsed | 41165 | -| total_timesteps | 733952 | -| train/ | | -| approx_kl | 0.01793277 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.0247 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 57330 | -| policy_gradient_loss | -0.00389 | -| std | 0.248 | -| value_loss | 2.42e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5735 | -| time_elapsed | 41169 | -| total_timesteps | 734080 | -| train/ | | -| approx_kl | 5.409494e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.0249 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -1.51e-05 | -| n_updates | 57340 | -| policy_gradient_loss | -4.76e-06 | -| std | 0.248 | -| value_loss | 2.1e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5736 | -| time_elapsed | 41175 | -| total_timesteps | 734208 | -| train/ | | -| approx_kl | 0.0029660212 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | -0.0239 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 57350 | -| policy_gradient_loss | -0.0127 | -| std | 0.248 | -| value_loss | 0.00254 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5737 | -| time_elapsed | 41179 | -| total_timesteps | 734336 | -| train/ | | -| approx_kl | 0.020020328 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | -0.0223 | -| explained_variance | -91.5 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 57360 | -| policy_gradient_loss | -0.00185 | -| std | 0.247 | -| value_loss | 2.74e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5738 | -| time_elapsed | 41183 | -| total_timesteps | 734464 | -| train/ | | -| approx_kl | 1.1750963e-05 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | -0.0233 | -| explained_variance | -42.6 | -| learning_rate | 0.0003 | -| loss | -0.00037 | -| n_updates | 57370 | -| policy_gradient_loss | 0.000508 | -| std | 0.248 | -| value_loss | 4.39e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5739 | -| time_elapsed | 41187 | -| total_timesteps | 734592 | -| train/ | | -| approx_kl | 0.01919644 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | -0.0265 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 57380 | -| policy_gradient_loss | -0.00365 | -| std | 0.249 | -| value_loss | 4.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5740 | -| time_elapsed | 41191 | -| total_timesteps | 734720 | -| train/ | | -| approx_kl | 0.020213239 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | -0.0283 | -| explained_variance | -0.68 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 57390 | -| policy_gradient_loss | -0.00985 | -| std | 0.249 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5741 | -| time_elapsed | 41194 | -| total_timesteps | 734848 | -| train/ | | -| approx_kl | 0.0061747828 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | -0.0285 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 57400 | -| policy_gradient_loss | -0.000758 | -| std | 0.249 | -| value_loss | 1.62e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.774 | -| time/ | | -| fps | 17 | -| iterations | 5742 | -| time_elapsed | 41198 | -| total_timesteps | 734976 | -| train/ | | -| approx_kl | 0.010340521 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | -0.0277 | -| explained_variance | -0.646 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 57410 | -| policy_gradient_loss | -0.00264 | -| std | 0.249 | -| value_loss | 2.84e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5743 | -| time_elapsed | 41201 | -| total_timesteps | 735104 | -| train/ | | -| approx_kl | 0.0016262932 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.0274 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | -0.00752 | -| n_updates | 57420 | -| policy_gradient_loss | 0.00307 | -| std | 0.249 | -| value_loss | 1.75e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5744 | -| time_elapsed | 41209 | -| total_timesteps | 735232 | -| train/ | | -| approx_kl | 0.04043138 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | -0.0264 | -| explained_variance | 0.94 | -| learning_rate | 0.0003 | -| loss | -0.000274 | -| n_updates | 57430 | -| policy_gradient_loss | -0.00101 | -| std | 0.248 | -| value_loss | 0.000986 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5745 | -| time_elapsed | 41212 | -| total_timesteps | 735360 | -| train/ | | -| approx_kl | 0.05993302 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | -0.0247 | -| explained_variance | -1.2e+03 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 57440 | -| policy_gradient_loss | -0.00261 | -| std | 0.248 | -| value_loss | 1.87e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5746 | -| time_elapsed | 41216 | -| total_timesteps | 735488 | -| train/ | | -| approx_kl | 0.0031705596 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.0245 | -| explained_variance | -745 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 57450 | -| policy_gradient_loss | 0.000498 | -| std | 0.248 | -| value_loss | 4.68e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5747 | -| time_elapsed | 41220 | -| total_timesteps | 735616 | -| train/ | | -| approx_kl | 0.07512498 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | -0.0245 | -| explained_variance | -136 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 57460 | -| policy_gradient_loss | -0.0105 | -| std | 0.248 | -| value_loss | 3.03e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5748 | -| time_elapsed | 41224 | -| total_timesteps | 735744 | -| train/ | | -| approx_kl | 0.021881454 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.0222 | -| explained_variance | -61.4 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 57470 | -| policy_gradient_loss | -0.00124 | -| std | 0.247 | -| value_loss | 6.78e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5749 | -| time_elapsed | 41227 | -| total_timesteps | 735872 | -| train/ | | -| approx_kl | 0.01710569 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | -0.0194 | -| explained_variance | -33.7 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 57480 | -| policy_gradient_loss | -0.007 | -| std | 0.247 | -| value_loss | 1.81e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5750 | -| time_elapsed | 41230 | -| total_timesteps | 736000 | -| train/ | | -| approx_kl | 0.022415817 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | -0.0185 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 57490 | -| policy_gradient_loss | -0.00554 | -| std | 0.246 | -| value_loss | 6.82e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5751 | -| time_elapsed | 41233 | -| total_timesteps | 736128 | -| train/ | | -| approx_kl | 0.0067714495 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | -0.018 | -| explained_variance | -0.0943 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 57500 | -| policy_gradient_loss | -0.000923 | -| std | 0.246 | -| value_loss | 4.84e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5752 | -| time_elapsed | 41241 | -| total_timesteps | 736256 | -| train/ | | -| approx_kl | 0.50169027 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | -0.018 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 57510 | -| policy_gradient_loss | -0.0128 | -| std | 0.246 | -| value_loss | 0.00112 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5753 | -| time_elapsed | 41244 | -| total_timesteps | 736384 | -| train/ | | -| approx_kl | 0.006734791 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | -0.0183 | -| explained_variance | -87.7 | -| learning_rate | 0.0003 | -| loss | -0.000621 | -| n_updates | 57520 | -| policy_gradient_loss | -0.000216 | -| std | 0.246 | -| value_loss | 5.19e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5754 | -| time_elapsed | 41247 | -| total_timesteps | 736512 | -| train/ | | -| approx_kl | 0.028943539 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | -0.0163 | -| explained_variance | -133 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 57530 | -| policy_gradient_loss | -0.00516 | -| std | 0.246 | -| value_loss | 5.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5755 | -| time_elapsed | 41251 | -| total_timesteps | 736640 | -| train/ | | -| approx_kl | 0.004916738 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | -0.0148 | -| explained_variance | -6.25 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 57540 | -| policy_gradient_loss | -0.000414 | -| std | 0.245 | -| value_loss | 3.66e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5756 | -| time_elapsed | 41255 | -| total_timesteps | 736768 | -| train/ | | -| approx_kl | 0.0014082226 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | -0.0137 | -| explained_variance | -6.06 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 57550 | -| policy_gradient_loss | 0.00106 | -| std | 0.245 | -| value_loss | 4.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5757 | -| time_elapsed | 41258 | -| total_timesteps | 736896 | -| train/ | | -| approx_kl | 0.009361099 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | -0.0121 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 57560 | -| policy_gradient_loss | 0.00127 | -| std | 0.245 | -| value_loss | 2.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5758 | -| time_elapsed | 41261 | -| total_timesteps | 737024 | -| train/ | | -| approx_kl | 0.011508143 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | -0.0111 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 57570 | -| policy_gradient_loss | -0.00614 | -| std | 0.245 | -| value_loss | 2.52e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5759 | -| time_elapsed | 41271 | -| total_timesteps | 737152 | -| train/ | | -| approx_kl | 0.01624979 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | -0.0102 | -| explained_variance | -12.3 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 57580 | -| policy_gradient_loss | -0.0162 | -| std | 0.244 | -| value_loss | 0.0086 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5760 | -| time_elapsed | 41275 | -| total_timesteps | 737280 | -| train/ | | -| approx_kl | 0.025652345 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | -0.00892 | -| explained_variance | -3.74e+03 | -| learning_rate | 0.0003 | -| loss | -0.000763 | -| n_updates | 57590 | -| policy_gradient_loss | -0.000934 | -| std | 0.244 | -| value_loss | 3.5e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5761 | -| time_elapsed | 41279 | -| total_timesteps | 737408 | -| train/ | | -| approx_kl | 0.0005679778 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.00624 | -| explained_variance | -1.06e+04 | -| learning_rate | 0.0003 | -| loss | -0.000324 | -| n_updates | 57600 | -| policy_gradient_loss | -0.000115 | -| std | 0.243 | -| value_loss | 5.99e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5762 | -| time_elapsed | 41282 | -| total_timesteps | 737536 | -| train/ | | -| approx_kl | 0.03630188 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | -0.00233 | -| explained_variance | -171 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 57610 | -| policy_gradient_loss | -0.0111 | -| std | 0.242 | -| value_loss | 3.88e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5763 | -| time_elapsed | 41286 | -| total_timesteps | 737664 | -| train/ | | -| approx_kl | 0.04609346 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | -0.000713 | -| explained_variance | -89.3 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 57620 | -| policy_gradient_loss | -0.00453 | -| std | 0.242 | -| value_loss | 7.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5764 | -| time_elapsed | 41290 | -| total_timesteps | 737792 | -| train/ | | -| approx_kl | 0.018936869 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | -0.000413 | -| explained_variance | -3.57 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 57630 | -| policy_gradient_loss | -0.00296 | -| std | 0.242 | -| value_loss | 6.72e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.797 | -| time/ | | -| fps | 17 | -| iterations | 5765 | -| time_elapsed | 41293 | -| total_timesteps | 737920 | -| train/ | | -| approx_kl | 0.012407664 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.000264 | -| explained_variance | -0.542 | -| learning_rate | 0.0003 | -| loss | -0.000512 | -| n_updates | 57640 | -| policy_gradient_loss | -0.00107 | -| std | 0.242 | -| value_loss | 4.52e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5766 | -| time_elapsed | 41297 | -| total_timesteps | 738048 | -| train/ | | -| approx_kl | 0.024197131 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 0.00122 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 57650 | -| policy_gradient_loss | -0.00206 | -| std | 0.242 | -| value_loss | 8.81e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5767 | -| time_elapsed | 41304 | -| total_timesteps | 738176 | -| train/ | | -| approx_kl | 0.030055791 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.00131 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 57660 | -| policy_gradient_loss | -0.0157 | -| std | 0.242 | -| value_loss | 0.00355 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5768 | -| time_elapsed | 41308 | -| total_timesteps | 738304 | -| train/ | | -| approx_kl | 0.007884517 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 0.00121 | -| explained_variance | -855 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 57670 | -| policy_gradient_loss | -0.00742 | -| std | 0.242 | -| value_loss | 7.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5769 | -| time_elapsed | 41311 | -| total_timesteps | 738432 | -| train/ | | -| approx_kl | 0.030103806 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.000578 | -| explained_variance | -1.56e+03 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 57680 | -| policy_gradient_loss | -0.00649 | -| std | 0.242 | -| value_loss | 3.38e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5770 | -| time_elapsed | 41314 | -| total_timesteps | 738560 | -| train/ | | -| approx_kl | 0.0077686817 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.00112 | -| explained_variance | -232 | -| learning_rate | 0.0003 | -| loss | -0.000204 | -| n_updates | 57690 | -| policy_gradient_loss | -3.86e-05 | -| std | 0.241 | -| value_loss | 2.51e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5771 | -| time_elapsed | 41317 | -| total_timesteps | 738688 | -| train/ | | -| approx_kl | 0.018174909 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.0032 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 57700 | -| policy_gradient_loss | -0.00769 | -| std | 0.241 | -| value_loss | 1.62e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5772 | -| time_elapsed | 41320 | -| total_timesteps | 738816 | -| train/ | | -| approx_kl | 0.013270646 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 0.00349 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 57710 | -| policy_gradient_loss | -0.00132 | -| std | 0.241 | -| value_loss | 3.99e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.788 | -| time/ | | -| fps | 17 | -| iterations | 5773 | -| time_elapsed | 41324 | -| total_timesteps | 738944 | -| train/ | | -| approx_kl | 0.0107794395 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.00288 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 57720 | -| policy_gradient_loss | -0.00135 | -| std | 0.241 | -| value_loss | 5.25e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5774 | -| time_elapsed | 41327 | -| total_timesteps | 739072 | -| train/ | | -| approx_kl | 0.016969763 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.00187 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 57730 | -| policy_gradient_loss | -0.00234 | -| std | 0.242 | -| value_loss | 2.12e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5775 | -| time_elapsed | 41332 | -| total_timesteps | 739200 | -| train/ | | -| approx_kl | 0.46139568 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.00112 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0271 | -| n_updates | 57740 | -| policy_gradient_loss | -0.0162 | -| std | 0.242 | -| value_loss | 9.29e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5776 | -| time_elapsed | 41336 | -| total_timesteps | 739328 | -| train/ | | -| approx_kl | 0.045127586 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 0.00134 | -| explained_variance | -4.85 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 57750 | -| policy_gradient_loss | -0.00514 | -| std | 0.242 | -| value_loss | 1.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5777 | -| time_elapsed | 41340 | -| total_timesteps | 739456 | -| train/ | | -| approx_kl | 0.016247608 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.00262 | -| explained_variance | -9.19 | -| learning_rate | 0.0003 | -| loss | -0.000845 | -| n_updates | 57760 | -| policy_gradient_loss | -0.000727 | -| std | 0.241 | -| value_loss | 1.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5778 | -| time_elapsed | 41344 | -| total_timesteps | 739584 | -| train/ | | -| approx_kl | 0.01651065 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.00424 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -0.00431 | -| n_updates | 57770 | -| policy_gradient_loss | -0.00292 | -| std | 0.241 | -| value_loss | 8.54e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5779 | -| time_elapsed | 41348 | -| total_timesteps | 739712 | -| train/ | | -| approx_kl | 0.013115944 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.0037 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 57780 | -| policy_gradient_loss | -0.00258 | -| std | 0.241 | -| value_loss | 7.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5780 | -| time_elapsed | 41352 | -| total_timesteps | 739840 | -| train/ | | -| approx_kl | 0.008225188 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.00306 | -| explained_variance | -0.00117 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 57790 | -| policy_gradient_loss | -0.00185 | -| std | 0.241 | -| value_loss | 3.86e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.783 | -| time/ | | -| fps | 17 | -| iterations | 5781 | -| time_elapsed | 41356 | -| total_timesteps | 739968 | -| train/ | | -| approx_kl | 0.0111871045 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 0.00379 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 57800 | -| policy_gradient_loss | -0.00556 | -| std | 0.241 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5782 | -| time_elapsed | 41360 | -| total_timesteps | 740096 | -| train/ | | -| approx_kl | 0.013371367 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.00435 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 57810 | -| policy_gradient_loss | -0.00165 | -| std | 0.241 | -| value_loss | 8.08e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5783 | -| time_elapsed | 41365 | -| total_timesteps | 740224 | -| train/ | | -| approx_kl | 0.020986792 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 0.00553 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 57820 | -| policy_gradient_loss | -0.0157 | -| std | 0.241 | -| value_loss | 0.00191 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5784 | -| time_elapsed | 41368 | -| total_timesteps | 740352 | -| train/ | | -| approx_kl | 0.0073505654 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.0059 | -| explained_variance | -211 | -| learning_rate | 0.0003 | -| loss | 7.67e-05 | -| n_updates | 57830 | -| policy_gradient_loss | 0.0002 | -| std | 0.241 | -| value_loss | 7.11e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5785 | -| time_elapsed | 41372 | -| total_timesteps | 740480 | -| train/ | | -| approx_kl | 0.055271983 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.00464 | -| explained_variance | -488 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 57840 | -| policy_gradient_loss | -0.00472 | -| std | 0.241 | -| value_loss | 3.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5786 | -| time_elapsed | 41376 | -| total_timesteps | 740608 | -| train/ | | -| approx_kl | 0.0044525955 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.00353 | -| explained_variance | -27.7 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 57850 | -| policy_gradient_loss | 0.00152 | -| std | 0.241 | -| value_loss | 3.53e-08 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5787 | -| time_elapsed | 41379 | -| total_timesteps | 740736 | -| train/ | | -| approx_kl | 0.000107883476 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | 0.00282 | -| explained_variance | -0.609 | -| learning_rate | 0.0003 | -| loss | -0.000393 | -| n_updates | 57860 | -| policy_gradient_loss | 0.000261 | -| std | 0.242 | -| value_loss | 3.09e-09 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5788 | -| time_elapsed | 41383 | -| total_timesteps | 740864 | -| train/ | | -| approx_kl | 0.034483574 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | -0.000298 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 57870 | -| policy_gradient_loss | -0.0205 | -| std | 0.242 | -| value_loss | 5.77e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.778 | -| time/ | | -| fps | 17 | -| iterations | 5789 | -| time_elapsed | 41387 | -| total_timesteps | 740992 | -| train/ | | -| approx_kl | 0.014473423 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | -0.00173 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 57880 | -| policy_gradient_loss | -0.000181 | -| std | 0.242 | -| value_loss | 7.82e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5790 | -| time_elapsed | 41390 | -| total_timesteps | 741120 | -| train/ | | -| approx_kl | 0.008440601 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | -0.00145 | -| explained_variance | -0.0041 | -| learning_rate | 0.0003 | -| loss | 0.00248 | -| n_updates | 57890 | -| policy_gradient_loss | 0.000238 | -| std | 0.242 | -| value_loss | 2.17e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5791 | -| time_elapsed | 41399 | -| total_timesteps | 741248 | -| train/ | | -| approx_kl | 0.028926024 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | -0.00073 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.0278 | -| n_updates | 57900 | -| policy_gradient_loss | -0.0213 | -| std | 0.242 | -| value_loss | 0.000147 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5792 | -| time_elapsed | 41403 | -| total_timesteps | 741376 | -| train/ | | -| approx_kl | 0.02040271 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | -0.000588 | -| explained_variance | -353 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 57910 | -| policy_gradient_loss | -0.0022 | -| std | 0.242 | -| value_loss | 9.42e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5793 | -| time_elapsed | 41406 | -| total_timesteps | 741504 | -| train/ | | -| approx_kl | 0.0005684602 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | -0.00122 | -| explained_variance | -131 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 57920 | -| policy_gradient_loss | 0.00422 | -| std | 0.242 | -| value_loss | 1.94e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5794 | -| time_elapsed | 41408 | -| total_timesteps | 741632 | -| train/ | | -| approx_kl | 0.003792718 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | -0.00115 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 57930 | -| policy_gradient_loss | 0.000187 | -| std | 0.242 | -| value_loss | 2.62e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5795 | -| time_elapsed | 41411 | -| total_timesteps | 741760 | -| train/ | | -| approx_kl | 0.047426455 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | -0.00153 | -| explained_variance | -37.9 | -| learning_rate | 0.0003 | -| loss | -0.00753 | -| n_updates | 57940 | -| policy_gradient_loss | -0.00762 | -| std | 0.242 | -| value_loss | 5.06e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.781 | -| time/ | | -| fps | 17 | -| iterations | 5796 | -| time_elapsed | 41414 | -| total_timesteps | 741888 | -| train/ | | -| approx_kl | 0.017602054 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | -0.00131 | -| explained_variance | -1.83 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 57950 | -| policy_gradient_loss | -0.00375 | -| std | 0.242 | -| value_loss | 7.3e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5797 | -| time_elapsed | 41418 | -| total_timesteps | 742016 | -| train/ | | -| approx_kl | 0.020330954 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | -0.000129 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 57960 | -| policy_gradient_loss | -0.00499 | -| std | 0.242 | -| value_loss | 5.61e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5798 | -| time_elapsed | 41426 | -| total_timesteps | 742144 | -| train/ | | -| approx_kl | 0.10582326 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.000818 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0319 | -| n_updates | 57970 | -| policy_gradient_loss | -0.0227 | -| std | 0.242 | -| value_loss | 3.12e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5799 | -| time_elapsed | 41429 | -| total_timesteps | 742272 | -| train/ | | -| approx_kl | 0.025544345 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.00146 | -| explained_variance | -3.65 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 57980 | -| policy_gradient_loss | -0.00702 | -| std | 0.242 | -| value_loss | 5.81e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5800 | -| time_elapsed | 41433 | -| total_timesteps | 742400 | -| train/ | | -| approx_kl | 0.023392204 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.00187 | -| explained_variance | -9.93 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 57990 | -| policy_gradient_loss | -0.00145 | -| std | 0.241 | -| value_loss | 4e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5801 | -| time_elapsed | 41436 | -| total_timesteps | 742528 | -| train/ | | -| approx_kl | 0.012077399 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.00263 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 58000 | -| policy_gradient_loss | -0.00406 | -| std | 0.241 | -| value_loss | 1.59e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5802 | -| time_elapsed | 41440 | -| total_timesteps | 742656 | -| train/ | | -| approx_kl | 0.02435654 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.00294 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 58010 | -| policy_gradient_loss | -0.00817 | -| std | 0.241 | -| value_loss | 1.15e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5803 | -| time_elapsed | 41443 | -| total_timesteps | 742784 | -| train/ | | -| approx_kl | 0.011132903 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 0.00355 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.000417 | -| n_updates | 58020 | -| policy_gradient_loss | -0.000513 | -| std | 0.241 | -| value_loss | 9.91e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 17 | -| iterations | 5804 | -| time_elapsed | 41447 | -| total_timesteps | 742912 | -| train/ | | -| approx_kl | 0.013825012 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.00417 | -| explained_variance | -0.00972 | -| learning_rate | 0.0003 | -| loss | 0.00134 | -| n_updates | 58030 | -| policy_gradient_loss | -0.00107 | -| std | 0.241 | -| value_loss | 6.71e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5805 | -| time_elapsed | 41451 | -| total_timesteps | 743040 | -| train/ | | -| approx_kl | 0.0013751248 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 0.00714 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 58040 | -| policy_gradient_loss | -0.00144 | -| std | 0.239 | -| value_loss | 3.46e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5806 | -| time_elapsed | 41458 | -| total_timesteps | 743168 | -| train/ | | -| approx_kl | 0.0036407053 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.0142 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 58050 | -| policy_gradient_loss | -0.0109 | -| std | 0.238 | -| value_loss | 0.00303 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5807 | -| time_elapsed | 41461 | -| total_timesteps | 743296 | -| train/ | | -| approx_kl | 0.019962143 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.0188 | -| explained_variance | -7.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 58060 | -| policy_gradient_loss | -0.00296 | -| std | 0.237 | -| value_loss | 3.58e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5808 | -| time_elapsed | 41465 | -| total_timesteps | 743424 | -| train/ | | -| approx_kl | 0.0002739583 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 0.0199 | -| explained_variance | -2.87e+03 | -| learning_rate | 0.0003 | -| loss | -0.000988 | -| n_updates | 58070 | -| policy_gradient_loss | 0.00158 | -| std | 0.237 | -| value_loss | 1.31e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5809 | -| time_elapsed | 41469 | -| total_timesteps | 743552 | -| train/ | | -| approx_kl | 0.08190781 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 0.0189 | -| explained_variance | -105 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 58080 | -| policy_gradient_loss | -0.00263 | -| std | 0.238 | -| value_loss | 7.59e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5810 | -| time_elapsed | 41472 | -| total_timesteps | 743680 | -| train/ | | -| approx_kl | 0.010671987 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 0.0171 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.00989 | -| n_updates | 58090 | -| policy_gradient_loss | -0.00262 | -| std | 0.238 | -| value_loss | 2.04e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5811 | -| time_elapsed | 41475 | -| total_timesteps | 743808 | -| train/ | | -| approx_kl | 0.00026539853 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.0167 | -| explained_variance | -1.85 | -| learning_rate | 0.0003 | -| loss | -0.000322 | -| n_updates | 58100 | -| policy_gradient_loss | 0.000578 | -| std | 0.238 | -| value_loss | 7.04e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.79 | -| time/ | | -| fps | 17 | -| iterations | 5812 | -| time_elapsed | 41478 | -| total_timesteps | 743936 | -| train/ | | -| approx_kl | 0.006913549 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.0188 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 58110 | -| policy_gradient_loss | -0.00152 | -| std | 0.237 | -| value_loss | 1.15e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5813 | -| time_elapsed | 41481 | -| total_timesteps | 744064 | -| train/ | | -| approx_kl | 0.01573313 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.0205 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.00259 | -| n_updates | 58120 | -| policy_gradient_loss | 0.00153 | -| std | 0.237 | -| value_loss | 2.48e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5814 | -| time_elapsed | 41488 | -| total_timesteps | 744192 | -| train/ | | -| approx_kl | 0.07809769 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.0216 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 58130 | -| policy_gradient_loss | -0.00686 | -| std | 0.237 | -| value_loss | 3.82e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5815 | -| time_elapsed | 41492 | -| total_timesteps | 744320 | -| train/ | | -| approx_kl | 0.009697451 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 0.0221 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 58140 | -| policy_gradient_loss | -0.00313 | -| std | 0.237 | -| value_loss | 2.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5816 | -| time_elapsed | 41495 | -| total_timesteps | 744448 | -| train/ | | -| approx_kl | 0.017961396 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.0221 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | 0.000242 | -| n_updates | 58150 | -| policy_gradient_loss | -0.000667 | -| std | 0.237 | -| value_loss | 4.79e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5817 | -| time_elapsed | 41499 | -| total_timesteps | 744576 | -| train/ | | -| approx_kl | 0.0494701 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.0215 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 58160 | -| policy_gradient_loss | -0.0127 | -| std | 0.237 | -| value_loss | 1.6e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5818 | -| time_elapsed | 41503 | -| total_timesteps | 744704 | -| train/ | | -| approx_kl | 0.010576177 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.0215 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 58170 | -| policy_gradient_loss | -0.00204 | -| std | 0.237 | -| value_loss | 8.1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5819 | -| time_elapsed | 41507 | -| total_timesteps | 744832 | -| train/ | | -| approx_kl | 0.016650302 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.0213 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.000278 | -| n_updates | 58180 | -| policy_gradient_loss | -0.00139 | -| std | 0.237 | -| value_loss | 5.37e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.792 | -| time/ | | -| fps | 17 | -| iterations | 5820 | -| time_elapsed | 41511 | -| total_timesteps | 744960 | -| train/ | | -| approx_kl | 0.0040082987 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.021 | -| explained_variance | -0.0901 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 58190 | -| policy_gradient_loss | -0.0016 | -| std | 0.237 | -| value_loss | 2.19e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5821 | -| time_elapsed | 41513 | -| total_timesteps | 745088 | -| train/ | | -| approx_kl | 0.0023650667 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.0196 | -| explained_variance | 0.00372 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 58200 | -| policy_gradient_loss | 4.36e-05 | -| std | 0.238 | -| value_loss | 6.85e-10 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5822 | -| time_elapsed | 41522 | -| total_timesteps | 745216 | -| train/ | | -| approx_kl | 7.2396774 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.017 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 58210 | -| policy_gradient_loss | -0.0105 | -| std | 0.238 | -| value_loss | 0.000713 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5823 | -| time_elapsed | 41524 | -| total_timesteps | 745344 | -| train/ | | -| approx_kl | 0.03164737 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.0161 | -| explained_variance | -604 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 58220 | -| policy_gradient_loss | -0.0116 | -| std | 0.238 | -| value_loss | 2.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5824 | -| time_elapsed | 41527 | -| total_timesteps | 745472 | -| train/ | | -| approx_kl | 0.051582877 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 0.016 | -| explained_variance | -1.06e+04 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 58230 | -| policy_gradient_loss | -0.00441 | -| std | 0.238 | -| value_loss | 8.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5825 | -| time_elapsed | 41530 | -| total_timesteps | 745600 | -| train/ | | -| approx_kl | 0.060354497 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 0.0157 | -| explained_variance | -25.8 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 58240 | -| policy_gradient_loss | -0.00742 | -| std | 0.238 | -| value_loss | 1.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5826 | -| time_elapsed | 41533 | -| total_timesteps | 745728 | -| train/ | | -| approx_kl | 0.014115782 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.016 | -| explained_variance | -0.657 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 58250 | -| policy_gradient_loss | -0.00418 | -| std | 0.238 | -| value_loss | 6.68e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5827 | -| time_elapsed | 41535 | -| total_timesteps | 745856 | -| train/ | | -| approx_kl | 0.021992143 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.017 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | -0.00827 | -| n_updates | 58260 | -| policy_gradient_loss | -0.00857 | -| std | 0.238 | -| value_loss | 2.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.795 | -| time/ | | -| fps | 17 | -| iterations | 5828 | -| time_elapsed | 41547 | -| total_timesteps | 745984 | -| train/ | | -| approx_kl | 0.012835093 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.0174 | -| explained_variance | 0.00597 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 58270 | -| policy_gradient_loss | -0.0059 | -| std | 0.238 | -| value_loss | 6.33e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5829 | -| time_elapsed | 41550 | -| total_timesteps | 746112 | -| train/ | | -| approx_kl | 0.0018784753 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0173 | -| explained_variance | -0.244 | -| learning_rate | 0.0003 | -| loss | -1.21e-05 | -| n_updates | 58280 | -| policy_gradient_loss | 1.17e-05 | -| std | 0.238 | -| value_loss | 1.91e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5830 | -| time_elapsed | 41559 | -| total_timesteps | 746240 | -| train/ | | -| approx_kl | 0.5406659 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 0.0191 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | 0.00552 | -| n_updates | 58290 | -| policy_gradient_loss | 0.00757 | -| std | 0.237 | -| value_loss | 0.00299 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5831 | -| time_elapsed | 41562 | -| total_timesteps | 746368 | -| train/ | | -| approx_kl | 0.01473753 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 0.0196 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | 0.00693 | -| n_updates | 58300 | -| policy_gradient_loss | 0.00682 | -| std | 0.237 | -| value_loss | 0.000162 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5832 | -| time_elapsed | 41565 | -| total_timesteps | 746496 | -| train/ | | -| approx_kl | 0.015672313 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.0197 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 58310 | -| policy_gradient_loss | -0.0035 | -| std | 0.237 | -| value_loss | 0.000113 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5833 | -| time_elapsed | 41568 | -| total_timesteps | 746624 | -| train/ | | -| approx_kl | 0.05974508 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 0.0203 | -| explained_variance | -2.46 | -| learning_rate | 0.0003 | -| loss | -0.0269 | -| n_updates | 58320 | -| policy_gradient_loss | -0.0252 | -| std | 0.237 | -| value_loss | 0.00138 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5834 | -| time_elapsed | 41572 | -| total_timesteps | 746752 | -| train/ | | -| approx_kl | 0.009013804 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.0209 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 58330 | -| policy_gradient_loss | -0.00534 | -| std | 0.237 | -| value_loss | 0.000162 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 17 | -| iterations | 5835 | -| time_elapsed | 41575 | -| total_timesteps | 746880 | -| train/ | | -| approx_kl | 0.017327847 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.0212 | -| explained_variance | -2.78 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 58340 | -| policy_gradient_loss | -0.00072 | -| std | 0.237 | -| value_loss | 0.000566 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5836 | -| time_elapsed | 41579 | -| total_timesteps | 747008 | -| train/ | | -| approx_kl | 0.0049932385 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 0.0207 | -| explained_variance | -5.7 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 58350 | -| policy_gradient_loss | -0.00449 | -| std | 0.237 | -| value_loss | 1.55e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5837 | -| time_elapsed | 41588 | -| total_timesteps | 747136 | -| train/ | | -| approx_kl | 0.26364064 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 0.0207 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 58360 | -| policy_gradient_loss | -0.0116 | -| std | 0.237 | -| value_loss | 0.00289 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5838 | -| time_elapsed | 41592 | -| total_timesteps | 747264 | -| train/ | | -| approx_kl | 0.0144921215 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.0215 | -| explained_variance | -0.897 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 58370 | -| policy_gradient_loss | -0.00384 | -| std | 0.237 | -| value_loss | 0.000157 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5839 | -| time_elapsed | 41594 | -| total_timesteps | 747392 | -| train/ | | -| approx_kl | 0.035941985 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 0.0227 | -| explained_variance | -4.94 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 58380 | -| policy_gradient_loss | -0.0119 | -| std | 0.236 | -| value_loss | 0.000174 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5840 | -| time_elapsed | 41597 | -| total_timesteps | 747520 | -| train/ | | -| approx_kl | 0.011512309 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.0235 | -| explained_variance | -2.81 | -| learning_rate | 0.0003 | -| loss | -0.00876 | -| n_updates | 58390 | -| policy_gradient_loss | -0.00618 | -| std | 0.236 | -| value_loss | 0.000142 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5841 | -| time_elapsed | 41600 | -| total_timesteps | 747648 | -| train/ | | -| approx_kl | 0.011732039 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.0234 | -| explained_variance | -2.08 | -| learning_rate | 0.0003 | -| loss | -0.000494 | -| n_updates | 58400 | -| policy_gradient_loss | -0.00146 | -| std | 0.236 | -| value_loss | 0.000392 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5842 | -| time_elapsed | 41603 | -| total_timesteps | 747776 | -| train/ | | -| approx_kl | 0.014802368 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.023 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00656 | -| n_updates | 58410 | -| policy_gradient_loss | -0.00507 | -| std | 0.236 | -| value_loss | 0.000174 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 17 | -| iterations | 5843 | -| time_elapsed | 41605 | -| total_timesteps | 747904 | -| train/ | | -| approx_kl | 0.019746765 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.0234 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 58420 | -| policy_gradient_loss | -0.00508 | -| std | 0.236 | -| value_loss | 0.000168 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5844 | -| time_elapsed | 41607 | -| total_timesteps | 748032 | -| train/ | | -| approx_kl | 0.021935033 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.0236 | -| explained_variance | -3.53 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 58430 | -| policy_gradient_loss | -0.00773 | -| std | 0.236 | -| value_loss | 0.000162 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5845 | -| time_elapsed | 41613 | -| total_timesteps | 748160 | -| train/ | | -| approx_kl | 0.19519134 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.0242 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 58440 | -| policy_gradient_loss | -0.00297 | -| std | 0.236 | -| value_loss | 0.000531 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5846 | -| time_elapsed | 41615 | -| total_timesteps | 748288 | -| train/ | | -| approx_kl | 0.02128998 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.0258 | -| explained_variance | -1.94 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 58450 | -| policy_gradient_loss | -0.0174 | -| std | 0.236 | -| value_loss | 4.57e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5847 | -| time_elapsed | 41618 | -| total_timesteps | 748416 | -| train/ | | -| approx_kl | 0.0074545206 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.0268 | -| explained_variance | -2.73 | -| learning_rate | 0.0003 | -| loss | -0.000135 | -| n_updates | 58460 | -| policy_gradient_loss | -0.000326 | -| std | 0.235 | -| value_loss | 5.96e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5848 | -| time_elapsed | 41620 | -| total_timesteps | 748544 | -| train/ | | -| approx_kl | 0.023081312 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.0273 | -| explained_variance | -1.95 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 58470 | -| policy_gradient_loss | -0.0109 | -| std | 0.236 | -| value_loss | 0.000346 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5849 | -| time_elapsed | 41623 | -| total_timesteps | 748672 | -| train/ | | -| approx_kl | 0.020151785 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0266 | -| explained_variance | -4.23 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 58480 | -| policy_gradient_loss | -0.006 | -| std | 0.236 | -| value_loss | 0.000158 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5850 | -| time_elapsed | 41626 | -| total_timesteps | 748800 | -| train/ | | -| approx_kl | 0.019494008 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 0.0259 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -0.0066 | -| n_updates | 58490 | -| policy_gradient_loss | -0.00579 | -| std | 0.236 | -| value_loss | 3.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.814 | -| time/ | | -| fps | 17 | -| iterations | 5851 | -| time_elapsed | 41630 | -| total_timesteps | 748928 | -| train/ | | -| approx_kl | 0.010400854 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.0256 | -| explained_variance | 0.492 | -| learning_rate | 0.0003 | -| loss | 0.00262 | -| n_updates | 58500 | -| policy_gradient_loss | 2.36e-05 | -| std | 0.236 | -| value_loss | 0.000555 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 17 | -| iterations | 5852 | -| time_elapsed | 41633 | -| total_timesteps | 749056 | -| train/ | | -| approx_kl | 0.019321041 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.026 | -| explained_variance | -4.11 | -| learning_rate | 0.0003 | -| loss | -0.000213 | -| n_updates | 58510 | -| policy_gradient_loss | -0.00275 | -| std | 0.236 | -| value_loss | 0.000861 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 17 | -| iterations | 5853 | -| time_elapsed | 41638 | -| total_timesteps | 749184 | -| train/ | | -| approx_kl | 0.016368613 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.0266 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 58520 | -| policy_gradient_loss | -0.00729 | -| std | 0.236 | -| value_loss | 0.000953 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 17 | -| iterations | 5854 | -| time_elapsed | 41642 | -| total_timesteps | 749312 | -| train/ | | -| approx_kl | 0.005032134 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.027 | -| explained_variance | -2.64 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 58530 | -| policy_gradient_loss | -0.000746 | -| std | 0.235 | -| value_loss | 0.00038 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 17 | -| iterations | 5855 | -| time_elapsed | 41644 | -| total_timesteps | 749440 | -| train/ | | -| approx_kl | 0.031088855 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 0.0279 | -| explained_variance | -0.846 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 58540 | -| policy_gradient_loss | -0.0101 | -| std | 0.235 | -| value_loss | 7.59e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 17 | -| iterations | 5856 | -| time_elapsed | 41646 | -| total_timesteps | 749568 | -| train/ | | -| approx_kl | 0.032357797 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.028 | -| explained_variance | -0.812 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 58550 | -| policy_gradient_loss | -0.00927 | -| std | 0.235 | -| value_loss | 0.000145 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 17 | -| iterations | 5857 | -| time_elapsed | 41649 | -| total_timesteps | 749696 | -| train/ | | -| approx_kl | 0.023993753 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.029 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.0078 | -| n_updates | 58560 | -| policy_gradient_loss | -0.00722 | -| std | 0.235 | -| value_loss | 4.86e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 18 | -| iterations | 5858 | -| time_elapsed | 41653 | -| total_timesteps | 749824 | -| train/ | | -| approx_kl | 0.015303424 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0307 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 58570 | -| policy_gradient_loss | -0.00797 | -| std | 0.234 | -| value_loss | 9.42e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 18 | -| iterations | 5859 | -| time_elapsed | 41656 | -| total_timesteps | 749952 | -| train/ | | -| approx_kl | 0.0062353592 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 0.031 | -| explained_variance | -1.84 | -| learning_rate | 0.0003 | -| loss | -0.000709 | -| n_updates | 58580 | -| policy_gradient_loss | -6.66e-05 | -| std | 0.235 | -| value_loss | 0.00015 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5860 | -| time_elapsed | 41660 | -| total_timesteps | 750080 | -| train/ | | -| approx_kl | 0.008126105 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.0296 | -| explained_variance | -3.83 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 58590 | -| policy_gradient_loss | -0.00496 | -| std | 0.235 | -| value_loss | 0.000141 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5861 | -| time_elapsed | 41666 | -| total_timesteps | 750208 | -| train/ | | -| approx_kl | 0.08788913 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.0289 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 58600 | -| policy_gradient_loss | -0.0146 | -| std | 0.235 | -| value_loss | 0.00147 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5862 | -| time_elapsed | 41671 | -| total_timesteps | 750336 | -| train/ | | -| approx_kl | 0.007037087 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.0273 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | -0.00056 | -| n_updates | 58610 | -| policy_gradient_loss | -0.000543 | -| std | 0.236 | -| value_loss | 0.000405 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5863 | -| time_elapsed | 41674 | -| total_timesteps | 750464 | -| train/ | | -| approx_kl | 0.0152448835 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.0246 | -| explained_variance | -1.88 | -| learning_rate | 0.0003 | -| loss | 0.00172 | -| n_updates | 58620 | -| policy_gradient_loss | -0.000783 | -| std | 0.237 | -| value_loss | 0.000266 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5864 | -| time_elapsed | 41678 | -| total_timesteps | 750592 | -| train/ | | -| approx_kl | 0.00085967174 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.0224 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.00025 | -| n_updates | 58630 | -| policy_gradient_loss | -0.000257 | -| std | 0.237 | -| value_loss | 0.000252 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5865 | -| time_elapsed | 41680 | -| total_timesteps | 750720 | -| train/ | | -| approx_kl | 0.004677732 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.0224 | -| explained_variance | -1.8 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 58640 | -| policy_gradient_loss | -0.00143 | -| std | 0.237 | -| value_loss | 0.000101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5866 | -| time_elapsed | 41683 | -| total_timesteps | 750848 | -| train/ | | -| approx_kl | 0.027205132 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.0215 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 58650 | -| policy_gradient_loss | -0.0166 | -| std | 0.237 | -| value_loss | 0.000447 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 18 | -| iterations | 5867 | -| time_elapsed | 41686 | -| total_timesteps | 750976 | -| train/ | | -| approx_kl | 0.008277336 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.0216 | -| explained_variance | -3.25 | -| learning_rate | 0.0003 | -| loss | 0.00134 | -| n_updates | 58660 | -| policy_gradient_loss | -4.79e-05 | -| std | 0.237 | -| value_loss | 0.000374 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5868 | -| time_elapsed | 41689 | -| total_timesteps | 751104 | -| train/ | | -| approx_kl | 0.00068135094 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0227 | -| explained_variance | 0.254 | -| learning_rate | 0.0003 | -| loss | -0.000278 | -| n_updates | 58670 | -| policy_gradient_loss | -8.42e-05 | -| std | 0.237 | -| value_loss | 7.97e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5869 | -| time_elapsed | 41697 | -| total_timesteps | 751232 | -| train/ | | -| approx_kl | 0.5093389 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.0228 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.000232 | -| n_updates | 58680 | -| policy_gradient_loss | 0.00625 | -| std | 0.236 | -| value_loss | 0.000633 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5870 | -| time_elapsed | 41699 | -| total_timesteps | 751360 | -| train/ | | -| approx_kl | 0.032661784 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.0231 | -| explained_variance | -2.69 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 58690 | -| policy_gradient_loss | -0.00986 | -| std | 0.236 | -| value_loss | 0.000101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5871 | -| time_elapsed | 41702 | -| total_timesteps | 751488 | -| train/ | | -| approx_kl | 0.009259882 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.0236 | -| explained_variance | -3.87 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 58700 | -| policy_gradient_loss | -0.00275 | -| std | 0.236 | -| value_loss | 8.92e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5872 | -| time_elapsed | 41705 | -| total_timesteps | 751616 | -| train/ | | -| approx_kl | 0.011396978 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 0.0235 | -| explained_variance | -3.65 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 58710 | -| policy_gradient_loss | -0.00124 | -| std | 0.237 | -| value_loss | 9.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5873 | -| time_elapsed | 41708 | -| total_timesteps | 751744 | -| train/ | | -| approx_kl | 0.006345806 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.0211 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 58720 | -| policy_gradient_loss | -0.00258 | -| std | 0.237 | -| value_loss | 3.59e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5874 | -| time_elapsed | 41712 | -| total_timesteps | 751872 | -| train/ | | -| approx_kl | 0.017187111 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.0197 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | 0.00305 | -| n_updates | 58730 | -| policy_gradient_loss | 0.000283 | -| std | 0.237 | -| value_loss | 3.07e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5875 | -| time_elapsed | 41716 | -| total_timesteps | 752000 | -| train/ | | -| approx_kl | 0.016761873 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.0201 | -| explained_variance | -2.89 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 58740 | -| policy_gradient_loss | -0.0123 | -| std | 0.237 | -| value_loss | 3.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5876 | -| time_elapsed | 41720 | -| total_timesteps | 752128 | -| train/ | | -| approx_kl | 0.018878544 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.0202 | -| explained_variance | -0.992 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 58750 | -| policy_gradient_loss | -0.00369 | -| std | 0.237 | -| value_loss | 3.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5877 | -| time_elapsed | 41727 | -| total_timesteps | 752256 | -| train/ | | -| approx_kl | 0.014561684 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.0207 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 58760 | -| policy_gradient_loss | -0.0145 | -| std | 0.237 | -| value_loss | 0.00101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5878 | -| time_elapsed | 41730 | -| total_timesteps | 752384 | -| train/ | | -| approx_kl | 0.039515205 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.0212 | -| explained_variance | -0.898 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 58770 | -| policy_gradient_loss | -0.0173 | -| std | 0.237 | -| value_loss | 6.27e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5879 | -| time_elapsed | 41733 | -| total_timesteps | 752512 | -| train/ | | -| approx_kl | 0.0019606645 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.0196 | -| explained_variance | -2.57 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 58780 | -| policy_gradient_loss | -0.000892 | -| std | 0.238 | -| value_loss | 0.000103 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5880 | -| time_elapsed | 41736 | -| total_timesteps | 752640 | -| train/ | | -| approx_kl | 0.006851073 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 0.0159 | -| explained_variance | -4.64 | -| learning_rate | 0.0003 | -| loss | -0.00816 | -| n_updates | 58790 | -| policy_gradient_loss | -0.00537 | -| std | 0.238 | -| value_loss | 3.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5881 | -| time_elapsed | 41739 | -| total_timesteps | 752768 | -| train/ | | -| approx_kl | 0.010858318 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 0.0148 | -| explained_variance | 0.252 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 58800 | -| policy_gradient_loss | 3.56e-05 | -| std | 0.238 | -| value_loss | 1.3e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 18 | -| iterations | 5882 | -| time_elapsed | 41742 | -| total_timesteps | 752896 | -| train/ | | -| approx_kl | 0.02132324 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.0166 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 58810 | -| policy_gradient_loss | -0.00768 | -| std | 0.238 | -| value_loss | 0.000158 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5883 | -| time_elapsed | 41746 | -| total_timesteps | 753024 | -| train/ | | -| approx_kl | 0.02408317 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 0.0181 | -| explained_variance | -1.54 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 58820 | -| policy_gradient_loss | -0.00504 | -| std | 0.237 | -| value_loss | 7.44e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5884 | -| time_elapsed | 41753 | -| total_timesteps | 753152 | -| train/ | | -| approx_kl | 0.021735191 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 0.0197 | -| explained_variance | -0.0978 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 58830 | -| policy_gradient_loss | -0.0145 | -| std | 0.237 | -| value_loss | 0.00232 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5885 | -| time_elapsed | 41757 | -| total_timesteps | 753280 | -| train/ | | -| approx_kl | 0.024665346 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.0209 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 58840 | -| policy_gradient_loss | -0.0151 | -| std | 0.237 | -| value_loss | 0.00026 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5886 | -| time_elapsed | 41760 | -| total_timesteps | 753408 | -| train/ | | -| approx_kl | 0.02034679 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.0219 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | -0.00954 | -| n_updates | 58850 | -| policy_gradient_loss | -0.00893 | -| std | 0.237 | -| value_loss | 2.31e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5887 | -| time_elapsed | 41763 | -| total_timesteps | 753536 | -| train/ | | -| approx_kl | 0.009462908 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.0222 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 58860 | -| policy_gradient_loss | -0.000894 | -| std | 0.237 | -| value_loss | 0.000134 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5888 | -| time_elapsed | 41766 | -| total_timesteps | 753664 | -| train/ | | -| approx_kl | 0.0056263655 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.0231 | -| explained_variance | -3.8 | -| learning_rate | 0.0003 | -| loss | -0.000756 | -| n_updates | 58870 | -| policy_gradient_loss | 9.27e-05 | -| std | 0.236 | -| value_loss | 4.8e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5889 | -| time_elapsed | 41770 | -| total_timesteps | 753792 | -| train/ | | -| approx_kl | 0.017228477 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.0253 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 58880 | -| policy_gradient_loss | -0.00599 | -| std | 0.236 | -| value_loss | 8.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 18 | -| iterations | 5890 | -| time_elapsed | 41772 | -| total_timesteps | 753920 | -| train/ | | -| approx_kl | 0.009840855 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 0.0258 | -| explained_variance | -3.01 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 58890 | -| policy_gradient_loss | -0.000828 | -| std | 0.236 | -| value_loss | 0.000112 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5891 | -| time_elapsed | 41775 | -| total_timesteps | 754048 | -| train/ | | -| approx_kl | 0.0061686696 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.0266 | -| explained_variance | -3.66 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 58900 | -| policy_gradient_loss | 0.000109 | -| std | 0.235 | -| value_loss | 0.000112 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5892 | -| time_elapsed | 41780 | -| total_timesteps | 754176 | -| train/ | | -| approx_kl | 0.04836219 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.0292 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 58910 | -| policy_gradient_loss | -0.0155 | -| std | 0.235 | -| value_loss | 0.00123 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5893 | -| time_elapsed | 41784 | -| total_timesteps | 754304 | -| train/ | | -| approx_kl | 0.024565667 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.0294 | -| explained_variance | -0.92 | -| learning_rate | 0.0003 | -| loss | -0.00729 | -| n_updates | 58920 | -| policy_gradient_loss | -0.00634 | -| std | 0.235 | -| value_loss | 7.05e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5894 | -| time_elapsed | 41787 | -| total_timesteps | 754432 | -| train/ | | -| approx_kl | 0.027618444 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0291 | -| explained_variance | -9.02 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 58930 | -| policy_gradient_loss | -0.0155 | -| std | 0.235 | -| value_loss | 1.45e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5895 | -| time_elapsed | 41791 | -| total_timesteps | 754560 | -| train/ | | -| approx_kl | 0.014202281 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.0287 | -| explained_variance | -0.437 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 58940 | -| policy_gradient_loss | -0.00338 | -| std | 0.235 | -| value_loss | 5.82e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5896 | -| time_elapsed | 41795 | -| total_timesteps | 754688 | -| train/ | | -| approx_kl | 0.015831431 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.0273 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | 0.00072 | -| n_updates | 58950 | -| policy_gradient_loss | -0.0012 | -| std | 0.236 | -| value_loss | 1.99e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5897 | -| time_elapsed | 41799 | -| total_timesteps | 754816 | -| train/ | | -| approx_kl | 0.021545827 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0259 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.00948 | -| n_updates | 58960 | -| policy_gradient_loss | -0.00809 | -| std | 0.236 | -| value_loss | 3.78e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 18 | -| iterations | 5898 | -| time_elapsed | 41802 | -| total_timesteps | 754944 | -| train/ | | -| approx_kl | 0.016317418 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.0259 | -| explained_variance | -1.57 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 58970 | -| policy_gradient_loss | -0.00897 | -| std | 0.236 | -| value_loss | 2.8e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5899 | -| time_elapsed | 41806 | -| total_timesteps | 755072 | -| train/ | | -| approx_kl | 0.018320052 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.026 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 58980 | -| policy_gradient_loss | -0.00184 | -| std | 0.236 | -| value_loss | 9.29e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5900 | -| time_elapsed | 41812 | -| total_timesteps | 755200 | -| train/ | | -| approx_kl | 0.5654646 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.0249 | -| explained_variance | 0.876 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 58990 | -| policy_gradient_loss | -0.0158 | -| std | 0.236 | -| value_loss | 0.000566 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5901 | -| time_elapsed | 41815 | -| total_timesteps | 755328 | -| train/ | | -| approx_kl | 0.013286794 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0242 | -| explained_variance | 0.708 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 59000 | -| policy_gradient_loss | 0.000392 | -| std | 0.236 | -| value_loss | 4.89e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5902 | -| time_elapsed | 41819 | -| total_timesteps | 755456 | -| train/ | | -| approx_kl | 0.013855243 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.0253 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.00421 | -| n_updates | 59010 | -| policy_gradient_loss | 0.0026 | -| std | 0.236 | -| value_loss | 0.00025 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5903 | -| time_elapsed | 41823 | -| total_timesteps | 755584 | -| train/ | | -| approx_kl | 0.019173253 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.0272 | -| explained_variance | -4.55 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 59020 | -| policy_gradient_loss | -0.00529 | -| std | 0.235 | -| value_loss | 4.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5904 | -| time_elapsed | 41826 | -| total_timesteps | 755712 | -| train/ | | -| approx_kl | 0.004633865 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.0281 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 59030 | -| policy_gradient_loss | -0.00028 | -| std | 0.235 | -| value_loss | 5.02e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5905 | -| time_elapsed | 41830 | -| total_timesteps | 755840 | -| train/ | | -| approx_kl | 0.010507135 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.0278 | -| explained_variance | -3.61 | -| learning_rate | 0.0003 | -| loss | -0.00947 | -| n_updates | 59040 | -| policy_gradient_loss | -0.00243 | -| std | 0.235 | -| value_loss | 0.000172 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 18 | -| iterations | 5906 | -| time_elapsed | 41833 | -| total_timesteps | 755968 | -| train/ | | -| approx_kl | 0.004529084 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.0275 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | -0.00752 | -| n_updates | 59050 | -| policy_gradient_loss | -0.000438 | -| std | 0.236 | -| value_loss | 5.06e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5907 | -| time_elapsed | 41837 | -| total_timesteps | 756096 | -| train/ | | -| approx_kl | 0.0019200654 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0261 | -| explained_variance | -2.51 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 59060 | -| policy_gradient_loss | 0.0016 | -| std | 0.236 | -| value_loss | 0.000132 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5908 | -| time_elapsed | 41846 | -| total_timesteps | 756224 | -| train/ | | -| approx_kl | 0.022834674 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.0256 | -| explained_variance | 0.863 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 59070 | -| policy_gradient_loss | -0.0134 | -| std | 0.236 | -| value_loss | 0.000547 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5909 | -| time_elapsed | 41850 | -| total_timesteps | 756352 | -| train/ | | -| approx_kl | 0.014409223 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.0262 | -| explained_variance | 0.405 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 59080 | -| policy_gradient_loss | -0.00378 | -| std | 0.236 | -| value_loss | 1.69e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5910 | -| time_elapsed | 41854 | -| total_timesteps | 756480 | -| train/ | | -| approx_kl | 0.009105654 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.0277 | -| explained_variance | -2.28 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 59090 | -| policy_gradient_loss | -0.00183 | -| std | 0.235 | -| value_loss | 6.91e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5911 | -| time_elapsed | 41858 | -| total_timesteps | 756608 | -| train/ | | -| approx_kl | 0.01192338 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.0286 | -| explained_variance | -0.618 | -| learning_rate | 0.0003 | -| loss | 0.00175 | -| n_updates | 59100 | -| policy_gradient_loss | 0.00171 | -| std | 0.235 | -| value_loss | 3.01e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5912 | -| time_elapsed | 41860 | -| total_timesteps | 756736 | -| train/ | | -| approx_kl | 0.012449428 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.0284 | -| explained_variance | -3.03 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 59110 | -| policy_gradient_loss | -0.00252 | -| std | 0.235 | -| value_loss | 4.64e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5913 | -| time_elapsed | 41863 | -| total_timesteps | 756864 | -| train/ | | -| approx_kl | 0.0006345846 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0285 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | 0.000151 | -| n_updates | 59120 | -| policy_gradient_loss | 0.000146 | -| std | 0.235 | -| value_loss | 4.19e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5914 | -| time_elapsed | 41867 | -| total_timesteps | 756992 | -| train/ | | -| approx_kl | 0.016051214 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.0288 | -| explained_variance | -3.19 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 59130 | -| policy_gradient_loss | -0.00608 | -| std | 0.235 | -| value_loss | 5.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5915 | -| time_elapsed | 41870 | -| total_timesteps | 757120 | -| train/ | | -| approx_kl | 0.009402741 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.0285 | -| explained_variance | -0.765 | -| learning_rate | 0.0003 | -| loss | 0.00188 | -| n_updates | 59140 | -| policy_gradient_loss | 0.000559 | -| std | 0.235 | -| value_loss | 1.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5916 | -| time_elapsed | 41878 | -| total_timesteps | 757248 | -| train/ | | -| approx_kl | 0.042418484 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | 0.0274 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 59150 | -| policy_gradient_loss | -0.013 | -| std | 0.236 | -| value_loss | 9.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5917 | -| time_elapsed | 41883 | -| total_timesteps | 757376 | -| train/ | | -| approx_kl | 0.012554751 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0261 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 59160 | -| policy_gradient_loss | -0.0116 | -| std | 0.236 | -| value_loss | 2.09e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5918 | -| time_elapsed | 41886 | -| total_timesteps | 757504 | -| train/ | | -| approx_kl | 0.016269231 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.0261 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.00981 | -| n_updates | 59170 | -| policy_gradient_loss | -0.00504 | -| std | 0.236 | -| value_loss | 1.47e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5919 | -| time_elapsed | 41889 | -| total_timesteps | 757632 | -| train/ | | -| approx_kl | 0.027362775 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0257 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 59180 | -| policy_gradient_loss | -0.0112 | -| std | 0.236 | -| value_loss | 2.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5920 | -| time_elapsed | 41893 | -| total_timesteps | 757760 | -| train/ | | -| approx_kl | 0.014924521 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.0246 | -| explained_variance | 0.326 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 59190 | -| policy_gradient_loss | -0.000505 | -| std | 0.236 | -| value_loss | 1.45e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 18 | -| iterations | 5921 | -| time_elapsed | 41896 | -| total_timesteps | 757888 | -| train/ | | -| approx_kl | 0.00900546 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.0243 | -| explained_variance | -6.96 | -| learning_rate | 0.0003 | -| loss | 0.000819 | -| n_updates | 59200 | -| policy_gradient_loss | 0.000648 | -| std | 0.236 | -| value_loss | 7.25e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5922 | -| time_elapsed | 41901 | -| total_timesteps | 758016 | -| train/ | | -| approx_kl | 0.015112274 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 0.0245 | -| explained_variance | -3.56 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 59210 | -| policy_gradient_loss | 0.000879 | -| std | 0.236 | -| value_loss | 6.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5923 | -| time_elapsed | 41910 | -| total_timesteps | 758144 | -| train/ | | -| approx_kl | 0.009852989 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 0.025 | -| explained_variance | -254 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 59220 | -| policy_gradient_loss | -0.0158 | -| std | 0.236 | -| value_loss | 0.00521 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5924 | -| time_elapsed | 41913 | -| total_timesteps | 758272 | -| train/ | | -| approx_kl | 0.02713781 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.0251 | -| explained_variance | -3.87 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 59230 | -| policy_gradient_loss | -0.00963 | -| std | 0.236 | -| value_loss | 3.6e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5925 | -| time_elapsed | 41917 | -| total_timesteps | 758400 | -| train/ | | -| approx_kl | 0.004709276 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.0252 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | -0.000621 | -| n_updates | 59240 | -| policy_gradient_loss | 0.00033 | -| std | 0.236 | -| value_loss | 1.87e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5926 | -| time_elapsed | 41921 | -| total_timesteps | 758528 | -| train/ | | -| approx_kl | 0.023346888 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 0.0256 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 59250 | -| policy_gradient_loss | -0.00567 | -| std | 0.236 | -| value_loss | 3.46e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5927 | -| time_elapsed | 41925 | -| total_timesteps | 758656 | -| train/ | | -| approx_kl | 0.0032491158 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.0257 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 59260 | -| policy_gradient_loss | -8.76e-05 | -| std | 0.236 | -| value_loss | 7.14e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5928 | -| time_elapsed | 41929 | -| total_timesteps | 758784 | -| train/ | | -| approx_kl | 0.0004933267 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0271 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -0.000498 | -| n_updates | 59270 | -| policy_gradient_loss | -0.000184 | -| std | 0.235 | -| value_loss | 1.06e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 18 | -| iterations | 5929 | -| time_elapsed | 41933 | -| total_timesteps | 758912 | -| train/ | | -| approx_kl | 0.008315515 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.0319 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 59280 | -| policy_gradient_loss | 0.000826 | -| std | 0.234 | -| value_loss | 8.73e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5930 | -| time_elapsed | 41936 | -| total_timesteps | 759040 | -| train/ | | -| approx_kl | 0.01419499 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 0.0352 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | -0.00034 | -| n_updates | 59290 | -| policy_gradient_loss | -0.000477 | -| std | 0.233 | -| value_loss | 3.84e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5931 | -| time_elapsed | 41944 | -| total_timesteps | 759168 | -| train/ | | -| approx_kl | 0.039746724 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.0372 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 59300 | -| policy_gradient_loss | -0.0175 | -| std | 0.233 | -| value_loss | 0.000515 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5932 | -| time_elapsed | 41948 | -| total_timesteps | 759296 | -| train/ | | -| approx_kl | 0.021710934 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.0374 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 59310 | -| policy_gradient_loss | -0.0121 | -| std | 0.233 | -| value_loss | 2.41e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5933 | -| time_elapsed | 41952 | -| total_timesteps | 759424 | -| train/ | | -| approx_kl | 0.011592485 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.0372 | -| explained_variance | -3.16 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 59320 | -| policy_gradient_loss | -0.000816 | -| std | 0.233 | -| value_loss | 3.44e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5934 | -| time_elapsed | 41956 | -| total_timesteps | 759552 | -| train/ | | -| approx_kl | 0.02956047 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.0368 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 59330 | -| policy_gradient_loss | -0.0139 | -| std | 0.233 | -| value_loss | 1.53e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5935 | -| time_elapsed | 41960 | -| total_timesteps | 759680 | -| train/ | | -| approx_kl | 0.02396847 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.0366 | -| explained_variance | 0.0557 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 59340 | -| policy_gradient_loss | -0.00645 | -| std | 0.233 | -| value_loss | 2.28e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5936 | -| time_elapsed | 41963 | -| total_timesteps | 759808 | -| train/ | | -| approx_kl | 0.013877541 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.0361 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 59350 | -| policy_gradient_loss | -0.00527 | -| std | 0.233 | -| value_loss | 2.73e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 18 | -| iterations | 5937 | -| time_elapsed | 41967 | -| total_timesteps | 759936 | -| train/ | | -| approx_kl | 0.0003053844 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0361 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.000124 | -| n_updates | 59360 | -| policy_gradient_loss | 3.07e-05 | -| std | 0.233 | -| value_loss | 1.78e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5938 | -| time_elapsed | 41970 | -| total_timesteps | 760064 | -| train/ | | -| approx_kl | 0.034817282 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.0366 | -| explained_variance | -2.17 | -| learning_rate | 0.0003 | -| loss | -0.00894 | -| n_updates | 59370 | -| policy_gradient_loss | -0.00919 | -| std | 0.233 | -| value_loss | 2.84e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5939 | -| time_elapsed | 41977 | -| total_timesteps | 760192 | -| train/ | | -| approx_kl | 0.47796875 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.0361 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0278 | -| n_updates | 59380 | -| policy_gradient_loss | -0.0183 | -| std | 0.233 | -| value_loss | 2.63e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5940 | -| time_elapsed | 41982 | -| total_timesteps | 760320 | -| train/ | | -| approx_kl | 0.017781379 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.0354 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.00788 | -| n_updates | 59390 | -| policy_gradient_loss | -0.00645 | -| std | 0.234 | -| value_loss | 2.19e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5941 | -| time_elapsed | 41985 | -| total_timesteps | 760448 | -| train/ | | -| approx_kl | 0.0055316878 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.0351 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 59400 | -| policy_gradient_loss | -0.000908 | -| std | 0.234 | -| value_loss | 2.94e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5942 | -| time_elapsed | 41988 | -| total_timesteps | 760576 | -| train/ | | -| approx_kl | 0.024248963 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 0.0356 | -| explained_variance | -4.67 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 59410 | -| policy_gradient_loss | -0.0105 | -| std | 0.233 | -| value_loss | 7.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5943 | -| time_elapsed | 41992 | -| total_timesteps | 760704 | -| train/ | | -| approx_kl | 0.020824004 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.0361 | -| explained_variance | -3.16 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 59420 | -| policy_gradient_loss | -0.00764 | -| std | 0.233 | -| value_loss | 2.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5944 | -| time_elapsed | 41996 | -| total_timesteps | 760832 | -| train/ | | -| approx_kl | 0.018463047 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 0.0364 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 59430 | -| policy_gradient_loss | -0.013 | -| std | 0.233 | -| value_loss | 6.21e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 18 | -| iterations | 5945 | -| time_elapsed | 42001 | -| total_timesteps | 760960 | -| train/ | | -| approx_kl | 4.1071326e-07 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0364 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -2.99e-05 | -| n_updates | 59440 | -| policy_gradient_loss | 6.06e-05 | -| std | 0.233 | -| value_loss | 1.2e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5946 | -| time_elapsed | 42005 | -| total_timesteps | 761088 | -| train/ | | -| approx_kl | 0.004576222 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.0368 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -8.31e-05 | -| n_updates | 59450 | -| policy_gradient_loss | -8.38e-05 | -| std | 0.234 | -| value_loss | 1.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5947 | -| time_elapsed | 42012 | -| total_timesteps | 761216 | -| train/ | | -| approx_kl | 0.010451549 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.0348 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 59460 | -| policy_gradient_loss | -0.0162 | -| std | 0.234 | -| value_loss | 0.000646 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5948 | -| time_elapsed | 42015 | -| total_timesteps | 761344 | -| train/ | | -| approx_kl | 0.0125242155 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.0334 | -| explained_variance | -2.7 | -| learning_rate | 0.0003 | -| loss | 0.000266 | -| n_updates | 59470 | -| policy_gradient_loss | -2.47e-05 | -| std | 0.234 | -| value_loss | 3.91e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5949 | -| time_elapsed | 42018 | -| total_timesteps | 761472 | -| train/ | | -| approx_kl | 0.015699577 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.0328 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 59480 | -| policy_gradient_loss | -0.00611 | -| std | 0.234 | -| value_loss | 3.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5950 | -| time_elapsed | 42021 | -| total_timesteps | 761600 | -| train/ | | -| approx_kl | 0.016207328 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.0324 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 59490 | -| policy_gradient_loss | -0.00342 | -| std | 0.234 | -| value_loss | 4.76e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5951 | -| time_elapsed | 42024 | -| total_timesteps | 761728 | -| train/ | | -| approx_kl | 0.01725938 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 0.0315 | -| explained_variance | -5.26 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 59500 | -| policy_gradient_loss | -0.00331 | -| std | 0.235 | -| value_loss | 8.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5952 | -| time_elapsed | 42028 | -| total_timesteps | 761856 | -| train/ | | -| approx_kl | 0.011270452 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.0297 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 59510 | -| policy_gradient_loss | -0.00248 | -| std | 0.235 | -| value_loss | 8.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 18 | -| iterations | 5953 | -| time_elapsed | 42032 | -| total_timesteps | 761984 | -| train/ | | -| approx_kl | 0.021343894 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0281 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.000169 | -| n_updates | 59520 | -| policy_gradient_loss | -0.00264 | -| std | 0.235 | -| value_loss | 3.84e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5954 | -| time_elapsed | 42036 | -| total_timesteps | 762112 | -| train/ | | -| approx_kl | 0.009414969 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.0276 | -| explained_variance | -2.17 | -| learning_rate | 0.0003 | -| loss | 0.00024 | -| n_updates | 59530 | -| policy_gradient_loss | -0.000704 | -| std | 0.235 | -| value_loss | 2.81e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5955 | -| time_elapsed | 42042 | -| total_timesteps | 762240 | -| train/ | | -| approx_kl | 0.30293664 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 0.0278 | -| explained_variance | 0.654 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 59540 | -| policy_gradient_loss | -0.012 | -| std | 0.235 | -| value_loss | 0.000547 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5956 | -| time_elapsed | 42046 | -| total_timesteps | 762368 | -| train/ | | -| approx_kl | 0.009240411 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.029 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 59550 | -| policy_gradient_loss | -0.00199 | -| std | 0.235 | -| value_loss | 7.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5957 | -| time_elapsed | 42050 | -| total_timesteps | 762496 | -| train/ | | -| approx_kl | 0.015144588 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.0297 | -| explained_variance | -2.6 | -| learning_rate | 0.0003 | -| loss | 0.00642 | -| n_updates | 59560 | -| policy_gradient_loss | 0.000877 | -| std | 0.235 | -| value_loss | 1.18e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5958 | -| time_elapsed | 42052 | -| total_timesteps | 762624 | -| train/ | | -| approx_kl | 0.01935821 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.0305 | -| explained_variance | -0.543 | -| learning_rate | 0.0003 | -| loss | -0.00784 | -| n_updates | 59570 | -| policy_gradient_loss | -0.00636 | -| std | 0.235 | -| value_loss | 4.55e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5959 | -| time_elapsed | 42055 | -| total_timesteps | 762752 | -| train/ | | -| approx_kl | 0.017611707 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.0314 | -| explained_variance | 0.305 | -| learning_rate | 0.0003 | -| loss | -0.000224 | -| n_updates | 59580 | -| policy_gradient_loss | -0.00212 | -| std | 0.234 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5960 | -| time_elapsed | 42056 | -| total_timesteps | 762880 | -| train/ | | -| approx_kl | 0.018624054 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.0328 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.0081 | -| n_updates | 59590 | -| policy_gradient_loss | -0.00705 | -| std | 0.234 | -| value_loss | 2.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5961 | -| time_elapsed | 42058 | -| total_timesteps | 763008 | -| train/ | | -| approx_kl | 0.015737234 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.0337 | -| explained_variance | -4.13 | -| learning_rate | 0.0003 | -| loss | -0.00062 | -| n_updates | 59600 | -| policy_gradient_loss | -0.00149 | -| std | 0.234 | -| value_loss | 2.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5962 | -| time_elapsed | 42068 | -| total_timesteps | 763136 | -| train/ | | -| approx_kl | 0.020834986 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.0323 | -| explained_variance | 0.611 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 59610 | -| policy_gradient_loss | -0.0135 | -| std | 0.234 | -| value_loss | 0.000464 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5963 | -| time_elapsed | 42070 | -| total_timesteps | 763264 | -| train/ | | -| approx_kl | 0.03296848 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.032 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 59620 | -| policy_gradient_loss | -0.00568 | -| std | 0.234 | -| value_loss | 2.42e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5964 | -| time_elapsed | 42073 | -| total_timesteps | 763392 | -| train/ | | -| approx_kl | 0.0053624418 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.0325 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 59630 | -| policy_gradient_loss | -0.00295 | -| std | 0.234 | -| value_loss | 1.67e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5965 | -| time_elapsed | 42076 | -| total_timesteps | 763520 | -| train/ | | -| approx_kl | 0.008359352 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 0.0314 | -| explained_variance | -4.03 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 59640 | -| policy_gradient_loss | -0.00223 | -| std | 0.235 | -| value_loss | 5.98e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5966 | -| time_elapsed | 42079 | -| total_timesteps | 763648 | -| train/ | | -| approx_kl | 0.022785995 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.0306 | -| explained_variance | -0.366 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 59650 | -| policy_gradient_loss | -0.0105 | -| std | 0.235 | -| value_loss | 1.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5967 | -| time_elapsed | 42081 | -| total_timesteps | 763776 | -| train/ | | -| approx_kl | 0.017149076 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.0306 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.000991 | -| n_updates | 59660 | -| policy_gradient_loss | -0.00318 | -| std | 0.235 | -| value_loss | 1.26e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 18 | -| iterations | 5968 | -| time_elapsed | 42085 | -| total_timesteps | 763904 | -| train/ | | -| approx_kl | 0.0049409107 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.0323 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | -0.000489 | -| n_updates | 59670 | -| policy_gradient_loss | -0.000241 | -| std | 0.234 | -| value_loss | 2.58e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5969 | -| time_elapsed | 42088 | -| total_timesteps | 764032 | -| train/ | | -| approx_kl | 0.015428353 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.0356 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | 9.68e-05 | -| n_updates | 59680 | -| policy_gradient_loss | -0.0017 | -| std | 0.233 | -| value_loss | 9.21e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5970 | -| time_elapsed | 42096 | -| total_timesteps | 764160 | -| train/ | | -| approx_kl | 0.16553114 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.0365 | -| explained_variance | -34.1 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 59690 | -| policy_gradient_loss | -0.0108 | -| std | 0.233 | -| value_loss | 0.0019 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5971 | -| time_elapsed | 42101 | -| total_timesteps | 764288 | -| train/ | | -| approx_kl | 0.016360473 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.0368 | -| explained_variance | -0.21 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 59700 | -| policy_gradient_loss | -0.00338 | -| std | 0.233 | -| value_loss | 1.37e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5972 | -| time_elapsed | 42105 | -| total_timesteps | 764416 | -| train/ | | -| approx_kl | 0.0064402362 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.0376 | -| explained_variance | -0.337 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 59710 | -| policy_gradient_loss | -0.00236 | -| std | 0.233 | -| value_loss | 1.7e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5973 | -| time_elapsed | 42109 | -| total_timesteps | 764544 | -| train/ | | -| approx_kl | 0.007881964 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.0386 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 59720 | -| policy_gradient_loss | -0.000443 | -| std | 0.233 | -| value_loss | 1.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5974 | -| time_elapsed | 42112 | -| total_timesteps | 764672 | -| train/ | | -| approx_kl | 0.011526102 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 0.0388 | -| explained_variance | -0.912 | -| learning_rate | 0.0003 | -| loss | 0.000222 | -| n_updates | 59730 | -| policy_gradient_loss | -0.000357 | -| std | 0.233 | -| value_loss | 9.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5975 | -| time_elapsed | 42115 | -| total_timesteps | 764800 | -| train/ | | -| approx_kl | 0.02661243 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.0401 | -| explained_variance | -4.58 | -| learning_rate | 0.0003 | -| loss | -0.00926 | -| n_updates | 59740 | -| policy_gradient_loss | -0.00752 | -| std | 0.232 | -| value_loss | 6.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 18 | -| iterations | 5976 | -| time_elapsed | 42118 | -| total_timesteps | 764928 | -| train/ | | -| approx_kl | 0.009082505 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 0.0402 | -| explained_variance | -2.11 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 59750 | -| policy_gradient_loss | -0.00101 | -| std | 0.232 | -| value_loss | 4.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5977 | -| time_elapsed | 42121 | -| total_timesteps | 765056 | -| train/ | | -| approx_kl | 0.020388449 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 0.0413 | -| explained_variance | -0.779 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 59760 | -| policy_gradient_loss | -0.00898 | -| std | 0.232 | -| value_loss | 2.38e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5978 | -| time_elapsed | 42128 | -| total_timesteps | 765184 | -| train/ | | -| approx_kl | 0.0037023649 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 0.0418 | -| explained_variance | -209 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 59770 | -| policy_gradient_loss | -0.00938 | -| std | 0.232 | -| value_loss | 0.00174 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5979 | -| time_elapsed | 42132 | -| total_timesteps | 765312 | -| train/ | | -| approx_kl | 0.014808727 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.042 | -| explained_variance | -0.785 | -| learning_rate | 0.0003 | -| loss | 0.00247 | -| n_updates | 59780 | -| policy_gradient_loss | 0.000409 | -| std | 0.232 | -| value_loss | 1.13e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5980 | -| time_elapsed | 42135 | -| total_timesteps | 765440 | -| train/ | | -| approx_kl | 0.010173865 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.0419 | -| explained_variance | -7.45 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 59790 | -| policy_gradient_loss | -0.00417 | -| std | 0.232 | -| value_loss | 7.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5981 | -| time_elapsed | 42139 | -| total_timesteps | 765568 | -| train/ | | -| approx_kl | 0.021550138 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 0.0408 | -| explained_variance | -3.98 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 59800 | -| policy_gradient_loss | -0.00723 | -| std | 0.232 | -| value_loss | 1.29e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5982 | -| time_elapsed | 42144 | -| total_timesteps | 765696 | -| train/ | | -| approx_kl | 0.00806074 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | 0.0405 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00793 | -| n_updates | 59810 | -| policy_gradient_loss | -0.00115 | -| std | 0.232 | -| value_loss | 1.61e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5983 | -| time_elapsed | 42147 | -| total_timesteps | 765824 | -| train/ | | -| approx_kl | 0.0059672906 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | 0.0402 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | -0.000482 | -| n_updates | 59820 | -| policy_gradient_loss | -0.00033 | -| std | 0.233 | -| value_loss | 6.48e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 18 | -| iterations | 5984 | -| time_elapsed | 42150 | -| total_timesteps | 765952 | -| train/ | | -| approx_kl | 0.0008711256 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0422 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 59830 | -| policy_gradient_loss | -0.000972 | -| std | 0.231 | -| value_loss | 4.08e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5985 | -| time_elapsed | 42153 | -| total_timesteps | 766080 | -| train/ | | -| approx_kl | 0.015454942 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.0513 | -| explained_variance | -0.781 | -| learning_rate | 0.0003 | -| loss | -0.00362 | -| n_updates | 59840 | -| policy_gradient_loss | -0.00395 | -| std | 0.229 | -| value_loss | 3.37e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5986 | -| time_elapsed | 42161 | -| total_timesteps | 766208 | -| train/ | | -| approx_kl | 0.01741779 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 0.0559 | -| explained_variance | -7.34 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 59850 | -| policy_gradient_loss | -0.0151 | -| std | 0.229 | -| value_loss | 0.000738 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5987 | -| time_elapsed | 42165 | -| total_timesteps | 766336 | -| train/ | | -| approx_kl | 0.010255546 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.0578 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 59860 | -| policy_gradient_loss | -0.00247 | -| std | 0.228 | -| value_loss | 4.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5988 | -| time_elapsed | 42168 | -| total_timesteps | 766464 | -| train/ | | -| approx_kl | 0.011088101 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.0583 | -| explained_variance | 0.259 | -| learning_rate | 0.0003 | -| loss | 0.0053 | -| n_updates | 59870 | -| policy_gradient_loss | 0.00343 | -| std | 0.228 | -| value_loss | 7.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5989 | -| time_elapsed | 42172 | -| total_timesteps | 766592 | -| train/ | | -| approx_kl | 0.017681658 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.0579 | -| explained_variance | -6.02 | -| learning_rate | 0.0003 | -| loss | -0.00602 | -| n_updates | 59880 | -| policy_gradient_loss | -0.00564 | -| std | 0.228 | -| value_loss | 6.64e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5990 | -| time_elapsed | 42176 | -| total_timesteps | 766720 | -| train/ | | -| approx_kl | 0.02879109 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 0.0581 | -| explained_variance | -0.649 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 59890 | -| policy_gradient_loss | -0.00757 | -| std | 0.228 | -| value_loss | 1.54e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5991 | -| time_elapsed | 42180 | -| total_timesteps | 766848 | -| train/ | | -| approx_kl | 0.014395025 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.0589 | -| explained_variance | -4.05 | -| learning_rate | 0.0003 | -| loss | -0.00557 | -| n_updates | 59900 | -| policy_gradient_loss | -0.00452 | -| std | 0.228 | -| value_loss | 4.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 18 | -| iterations | 5992 | -| time_elapsed | 42184 | -| total_timesteps | 766976 | -| train/ | | -| approx_kl | 0.013347546 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.0603 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 59910 | -| policy_gradient_loss | -0.00226 | -| std | 0.228 | -| value_loss | 9.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5993 | -| time_elapsed | 42187 | -| total_timesteps | 767104 | -| train/ | | -| approx_kl | 0.0114117265 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.0605 | -| explained_variance | -2.98 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 59920 | -| policy_gradient_loss | -0.00118 | -| std | 0.228 | -| value_loss | 6.52e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5994 | -| time_elapsed | 42196 | -| total_timesteps | 767232 | -| train/ | | -| approx_kl | 0.041293535 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.0593 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | -0.00543 | -| n_updates | 59930 | -| policy_gradient_loss | -0.00433 | -| std | 0.228 | -| value_loss | 0.000848 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5995 | -| time_elapsed | 42198 | -| total_timesteps | 767360 | -| train/ | | -| approx_kl | 0.020982804 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 0.0573 | -| explained_variance | -0.678 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 59940 | -| policy_gradient_loss | -0.0075 | -| std | 0.229 | -| value_loss | 1.16e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5996 | -| time_elapsed | 42201 | -| total_timesteps | 767488 | -| train/ | | -| approx_kl | 0.014856648 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.0569 | -| explained_variance | 0.0622 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 59950 | -| policy_gradient_loss | -0.00515 | -| std | 0.229 | -| value_loss | 8.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5997 | -| time_elapsed | 42204 | -| total_timesteps | 767616 | -| train/ | | -| approx_kl | 0.023411978 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.0565 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 59960 | -| policy_gradient_loss | -0.0107 | -| std | 0.229 | -| value_loss | 3.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5998 | -| time_elapsed | 42207 | -| total_timesteps | 767744 | -| train/ | | -| approx_kl | 0.015938397 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.0562 | -| explained_variance | -4.19 | -| learning_rate | 0.0003 | -| loss | -0.000219 | -| n_updates | 59970 | -| policy_gradient_loss | -0.00137 | -| std | 0.229 | -| value_loss | 2.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 18 | -| iterations | 5999 | -| time_elapsed | 42211 | -| total_timesteps | 767872 | -| train/ | | -| approx_kl | 0.010328127 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.0556 | -| explained_variance | -0.543 | -| learning_rate | 0.0003 | -| loss | -0.00982 | -| n_updates | 59980 | -| policy_gradient_loss | -0.00678 | -| std | 0.229 | -| value_loss | 2.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6000 | -| time_elapsed | 42213 | -| total_timesteps | 768000 | -| train/ | | -| approx_kl | 0.013707893 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.0552 | -| explained_variance | -0.936 | -| learning_rate | 0.0003 | -| loss | -0.00759 | -| n_updates | 59990 | -| policy_gradient_loss | -0.00597 | -| std | 0.229 | -| value_loss | 3.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6001 | -| time_elapsed | 42216 | -| total_timesteps | 768128 | -| train/ | | -| approx_kl | 0.011457357 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.0543 | -| explained_variance | -3.19 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 60000 | -| policy_gradient_loss | -0.0017 | -| std | 0.229 | -| value_loss | 2.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6002 | -| time_elapsed | 42223 | -| total_timesteps | 768256 | -| train/ | | -| approx_kl | 0.012123795 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 0.054 | -| explained_variance | -6.17 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 60010 | -| policy_gradient_loss | -0.014 | -| std | 0.229 | -| value_loss | 0.000454 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6003 | -| time_elapsed | 42226 | -| total_timesteps | 768384 | -| train/ | | -| approx_kl | 0.01973126 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.0539 | -| explained_variance | -0.869 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 60020 | -| policy_gradient_loss | -0.00548 | -| std | 0.229 | -| value_loss | 3.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6004 | -| time_elapsed | 42230 | -| total_timesteps | 768512 | -| train/ | | -| approx_kl | 0.014296665 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.0525 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 60030 | -| policy_gradient_loss | -0.00164 | -| std | 0.23 | -| value_loss | 5.83e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6005 | -| time_elapsed | 42233 | -| total_timesteps | 768640 | -| train/ | | -| approx_kl | 0.0198154 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 0.0505 | -| explained_variance | -0.849 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 60040 | -| policy_gradient_loss | -0.00576 | -| std | 0.23 | -| value_loss | 3.88e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6006 | -| time_elapsed | 42237 | -| total_timesteps | 768768 | -| train/ | | -| approx_kl | 0.004175915 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.0493 | -| explained_variance | -1.84 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 60050 | -| policy_gradient_loss | -0.00388 | -| std | 0.231 | -| value_loss | 2.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 18 | -| iterations | 6007 | -| time_elapsed | 42240 | -| total_timesteps | 768896 | -| train/ | | -| approx_kl | 0.013937615 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 0.0471 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.00269 | -| n_updates | 60060 | -| policy_gradient_loss | -0.00117 | -| std | 0.231 | -| value_loss | 3.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6008 | -| time_elapsed | 42244 | -| total_timesteps | 769024 | -| train/ | | -| approx_kl | 0.016301744 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.046 | -| explained_variance | -2.75 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 60070 | -| policy_gradient_loss | -0.00811 | -| std | 0.231 | -| value_loss | 7.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6009 | -| time_elapsed | 42253 | -| total_timesteps | 769152 | -| train/ | | -| approx_kl | 0.012852697 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.0464 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 60080 | -| policy_gradient_loss | -0.0112 | -| std | 0.231 | -| value_loss | 0.000719 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6010 | -| time_elapsed | 42255 | -| total_timesteps | 769280 | -| train/ | | -| approx_kl | 0.014354063 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.047 | -| explained_variance | -2.47 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 60090 | -| policy_gradient_loss | -0.00243 | -| std | 0.231 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6011 | -| time_elapsed | 42259 | -| total_timesteps | 769408 | -| train/ | | -| approx_kl | 0.011666044 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 0.0471 | -| explained_variance | -0.744 | -| learning_rate | 0.0003 | -| loss | 0.000535 | -| n_updates | 60100 | -| policy_gradient_loss | -0.00028 | -| std | 0.231 | -| value_loss | 3.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6012 | -| time_elapsed | 42262 | -| total_timesteps | 769536 | -| train/ | | -| approx_kl | 0.015081657 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.0472 | -| explained_variance | -4.4 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 60110 | -| policy_gradient_loss | -0.00378 | -| std | 0.231 | -| value_loss | 3.93e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6013 | -| time_elapsed | 42264 | -| total_timesteps | 769664 | -| train/ | | -| approx_kl | 0.0049163005 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.0475 | -| explained_variance | -0.437 | -| learning_rate | 0.0003 | -| loss | -0.000897 | -| n_updates | 60120 | -| policy_gradient_loss | 0.000737 | -| std | 0.231 | -| value_loss | 2.94e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6014 | -| time_elapsed | 42268 | -| total_timesteps | 769792 | -| train/ | | -| approx_kl | 0.010168971 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 0.0464 | -| explained_variance | 0.804 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 60130 | -| policy_gradient_loss | -0.000765 | -| std | 0.231 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 18 | -| iterations | 6015 | -| time_elapsed | 42271 | -| total_timesteps | 769920 | -| train/ | | -| approx_kl | 0.009811981 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.0449 | -| explained_variance | -0.639 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 60140 | -| policy_gradient_loss | -0.00181 | -| std | 0.231 | -| value_loss | 3.73e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6016 | -| time_elapsed | 42274 | -| total_timesteps | 770048 | -| train/ | | -| approx_kl | 0.0025939485 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.0427 | -| explained_variance | -4.06 | -| learning_rate | 0.0003 | -| loss | -0.000884 | -| n_updates | 60150 | -| policy_gradient_loss | -0.000333 | -| std | 0.233 | -| value_loss | 1.04e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6017 | -| time_elapsed | 42279 | -| total_timesteps | 770176 | -| train/ | | -| approx_kl | 0.019477248 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.0367 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | -0.00876 | -| n_updates | 60160 | -| policy_gradient_loss | -0.00556 | -| std | 0.234 | -| value_loss | 0.000493 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6018 | -| time_elapsed | 42282 | -| total_timesteps | 770304 | -| train/ | | -| approx_kl | 0.0061079254 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.0332 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | -0.000817 | -| n_updates | 60170 | -| policy_gradient_loss | -0.000459 | -| std | 0.234 | -| value_loss | 4.3e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6019 | -| time_elapsed | 42284 | -| total_timesteps | 770432 | -| train/ | | -| approx_kl | 0.00093608536 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 0.0318 | -| explained_variance | -1.95 | -| learning_rate | 0.0003 | -| loss | -0.000564 | -| n_updates | 60180 | -| policy_gradient_loss | -0.000229 | -| std | 0.235 | -| value_loss | 1.37e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6020 | -| time_elapsed | 42287 | -| total_timesteps | 770560 | -| train/ | | -| approx_kl | 0.0031242333 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.0294 | -| explained_variance | -9.95 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 60190 | -| policy_gradient_loss | -0.00207 | -| std | 0.235 | -| value_loss | 1.94e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6021 | -| time_elapsed | 42291 | -| total_timesteps | 770688 | -| train/ | | -| approx_kl | 0.008328413 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.0288 | -| explained_variance | -0.446 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 60200 | -| policy_gradient_loss | -0.00121 | -| std | 0.235 | -| value_loss | 8.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6022 | -| time_elapsed | 42293 | -| total_timesteps | 770816 | -| train/ | | -| approx_kl | 0.012342904 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.0296 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 60210 | -| policy_gradient_loss | -0.004 | -| std | 0.235 | -| value_loss | 3.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 18 | -| iterations | 6023 | -| time_elapsed | 42296 | -| total_timesteps | 770944 | -| train/ | | -| approx_kl | 0.01068148 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.0305 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 60220 | -| policy_gradient_loss | -0.00161 | -| std | 0.235 | -| value_loss | 1.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6024 | -| time_elapsed | 42300 | -| total_timesteps | 771072 | -| train/ | | -| approx_kl | 0.013032152 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.0307 | -| explained_variance | -2.55 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 60230 | -| policy_gradient_loss | -0.000294 | -| std | 0.235 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6025 | -| time_elapsed | 42306 | -| total_timesteps | 771200 | -| train/ | | -| approx_kl | 0.12971464 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.0288 | -| explained_variance | 0.855 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 60240 | -| policy_gradient_loss | -0.0104 | -| std | 0.235 | -| value_loss | 4.13e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6026 | -| time_elapsed | 42309 | -| total_timesteps | 771328 | -| train/ | | -| approx_kl | 0.03221376 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 0.0276 | -| explained_variance | -0.67 | -| learning_rate | 0.0003 | -| loss | -0.00982 | -| n_updates | 60250 | -| policy_gradient_loss | -0.0107 | -| std | 0.235 | -| value_loss | 3.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6027 | -| time_elapsed | 42312 | -| total_timesteps | 771456 | -| train/ | | -| approx_kl | 0.005409881 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.0277 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 60260 | -| policy_gradient_loss | -0.000559 | -| std | 0.235 | -| value_loss | 8.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6028 | -| time_elapsed | 42316 | -| total_timesteps | 771584 | -| train/ | | -| approx_kl | 0.016273541 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 0.0287 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 60270 | -| policy_gradient_loss | -0.00726 | -| std | 0.235 | -| value_loss | 1.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6029 | -| time_elapsed | 42319 | -| total_timesteps | 771712 | -| train/ | | -| approx_kl | 0.022863727 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 0.0291 | -| explained_variance | -3.13 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 60280 | -| policy_gradient_loss | -0.0116 | -| std | 0.235 | -| value_loss | 2.22e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6030 | -| time_elapsed | 42323 | -| total_timesteps | 771840 | -| train/ | | -| approx_kl | 0.0175222 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 0.0294 | -| explained_variance | -0.624 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 60290 | -| policy_gradient_loss | -0.00605 | -| std | 0.235 | -| value_loss | 6.29e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6031 | -| time_elapsed | 42325 | -| total_timesteps | 771968 | -| train/ | | -| approx_kl | 0.013593266 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.0301 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 60300 | -| policy_gradient_loss | -0.00185 | -| std | 0.235 | -| value_loss | 9.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6032 | -| time_elapsed | 42330 | -| total_timesteps | 772096 | -| train/ | | -| approx_kl | 0.019146614 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.0299 | -| explained_variance | -6.51 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 60310 | -| policy_gradient_loss | -0.00945 | -| std | 0.235 | -| value_loss | 3.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6033 | -| time_elapsed | 42338 | -| total_timesteps | 772224 | -| train/ | | -| approx_kl | 0.003558698 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.0295 | -| explained_variance | -201 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 60320 | -| policy_gradient_loss | -0.0129 | -| std | 0.235 | -| value_loss | 0.000412 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6034 | -| time_elapsed | 42340 | -| total_timesteps | 772352 | -| train/ | | -| approx_kl | 0.005147841 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.0299 | -| explained_variance | -2.79 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 60330 | -| policy_gradient_loss | -8.32e-05 | -| std | 0.235 | -| value_loss | 1.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6035 | -| time_elapsed | 42342 | -| total_timesteps | 772480 | -| train/ | | -| approx_kl | 0.009579819 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 0.0318 | -| explained_variance | -2.47 | -| learning_rate | 0.0003 | -| loss | -0.00633 | -| n_updates | 60340 | -| policy_gradient_loss | -0.00195 | -| std | 0.234 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6036 | -| time_elapsed | 42345 | -| total_timesteps | 772608 | -| train/ | | -| approx_kl | 0.007340471 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.0316 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 60350 | -| policy_gradient_loss | -0.000417 | -| std | 0.235 | -| value_loss | 3.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6037 | -| time_elapsed | 42347 | -| total_timesteps | 772736 | -| train/ | | -| approx_kl | 0.008969843 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.0298 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 60360 | -| policy_gradient_loss | -0.0017 | -| std | 0.235 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6038 | -| time_elapsed | 42350 | -| total_timesteps | 772864 | -| train/ | | -| approx_kl | 0.010013657 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.0291 | -| explained_variance | -2.94 | -| learning_rate | 0.0003 | -| loss | 0.000474 | -| n_updates | 60370 | -| policy_gradient_loss | -0.000138 | -| std | 0.235 | -| value_loss | 1.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 18 | -| iterations | 6039 | -| time_elapsed | 42353 | -| total_timesteps | 772992 | -| train/ | | -| approx_kl | 0.024460176 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0309 | -| explained_variance | -0.756 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 60380 | -| policy_gradient_loss | -0.00581 | -| std | 0.234 | -| value_loss | 1.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6040 | -| time_elapsed | 42355 | -| total_timesteps | 773120 | -| train/ | | -| approx_kl | 0.02279412 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.0325 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 60390 | -| policy_gradient_loss | -0.00547 | -| std | 0.234 | -| value_loss | 3.45e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6041 | -| time_elapsed | 42364 | -| total_timesteps | 773248 | -| train/ | | -| approx_kl | 0.0013296665 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 0.0329 | -| explained_variance | -988 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 60400 | -| policy_gradient_loss | -0.00117 | -| std | 0.234 | -| value_loss | 0.000389 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6042 | -| time_elapsed | 42368 | -| total_timesteps | 773376 | -| train/ | | -| approx_kl | 0.009154893 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.0309 | -| explained_variance | 0.516 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 60410 | -| policy_gradient_loss | -0.00326 | -| std | 0.235 | -| value_loss | 5.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6043 | -| time_elapsed | 42371 | -| total_timesteps | 773504 | -| train/ | | -| approx_kl | 0.011521234 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.0298 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.00629 | -| n_updates | 60420 | -| policy_gradient_loss | -0.00498 | -| std | 0.235 | -| value_loss | 9.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6044 | -| time_elapsed | 42373 | -| total_timesteps | 773632 | -| train/ | | -| approx_kl | 0.00920763 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.0299 | -| explained_variance | -5.64 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 60430 | -| policy_gradient_loss | -0.000107 | -| std | 0.235 | -| value_loss | 7.71e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6045 | -| time_elapsed | 42377 | -| total_timesteps | 773760 | -| train/ | | -| approx_kl | 0.010920266 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.0312 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 60440 | -| policy_gradient_loss | 7.82e-05 | -| std | 0.234 | -| value_loss | 3.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.798 | -| time/ | | -| fps | 18 | -| iterations | 6046 | -| time_elapsed | 42379 | -| total_timesteps | 773888 | -| train/ | | -| approx_kl | 0.011561353 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.0341 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 60450 | -| policy_gradient_loss | -0.000605 | -| std | 0.234 | -| value_loss | 1.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6047 | -| time_elapsed | 42382 | -| total_timesteps | 774016 | -| train/ | | -| approx_kl | 0.018033018 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.0359 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 60460 | -| policy_gradient_loss | -0.00627 | -| std | 0.233 | -| value_loss | 2.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6048 | -| time_elapsed | 42390 | -| total_timesteps | 774144 | -| train/ | | -| approx_kl | 0.002224844 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.0369 | -| explained_variance | -475 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 60470 | -| policy_gradient_loss | -0.00645 | -| std | 0.233 | -| value_loss | 0.000256 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6049 | -| time_elapsed | 42395 | -| total_timesteps | 774272 | -| train/ | | -| approx_kl | 0.030270666 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.037 | -| explained_variance | -3.88 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 60480 | -| policy_gradient_loss | -0.0105 | -| std | 0.233 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6050 | -| time_elapsed | 42398 | -| total_timesteps | 774400 | -| train/ | | -| approx_kl | 0.0042565605 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.0365 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | -0.000283 | -| n_updates | 60490 | -| policy_gradient_loss | -0.000169 | -| std | 0.234 | -| value_loss | 1.38e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6051 | -| time_elapsed | 42401 | -| total_timesteps | 774528 | -| train/ | | -| approx_kl | 0.008007333 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.0349 | -| explained_variance | -5.12 | -| learning_rate | 0.0003 | -| loss | -0.000559 | -| n_updates | 60500 | -| policy_gradient_loss | -0.000245 | -| std | 0.234 | -| value_loss | 8.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6052 | -| time_elapsed | 42406 | -| total_timesteps | 774656 | -| train/ | | -| approx_kl | 0.009184167 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.035 | -| explained_variance | -0.315 | -| learning_rate | 0.0003 | -| loss | 0.00077 | -| n_updates | 60510 | -| policy_gradient_loss | -0.000351 | -| std | 0.234 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6053 | -| time_elapsed | 42408 | -| total_timesteps | 774784 | -| train/ | | -| approx_kl | 0.0034523043 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 0.0359 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 60520 | -| policy_gradient_loss | -0.00107 | -| std | 0.233 | -| value_loss | 6.33e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.787 | -| time/ | | -| fps | 18 | -| iterations | 6054 | -| time_elapsed | 42411 | -| total_timesteps | 774912 | -| train/ | | -| approx_kl | 0.012541672 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.0379 | -| explained_variance | -1.52 | -| learning_rate | 0.0003 | -| loss | -0.00611 | -| n_updates | 60530 | -| policy_gradient_loss | -0.00248 | -| std | 0.233 | -| value_loss | 8.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6055 | -| time_elapsed | 42414 | -| total_timesteps | 775040 | -| train/ | | -| approx_kl | 0.020639392 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.0403 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | 0.00503 | -| n_updates | 60540 | -| policy_gradient_loss | 0.00234 | -| std | 0.232 | -| value_loss | 7.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6056 | -| time_elapsed | 42422 | -| total_timesteps | 775168 | -| train/ | | -| approx_kl | 0.010831678 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.0412 | -| explained_variance | -2.2e+03 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 60550 | -| policy_gradient_loss | -0.0106 | -| std | 0.232 | -| value_loss | 0.000236 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6057 | -| time_elapsed | 42426 | -| total_timesteps | 775296 | -| train/ | | -| approx_kl | 0.019647302 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.042 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 60560 | -| policy_gradient_loss | -0.00129 | -| std | 0.232 | -| value_loss | 5.19e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6058 | -| time_elapsed | 42428 | -| total_timesteps | 775424 | -| train/ | | -| approx_kl | 0.025697019 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.0426 | -| explained_variance | -6.01 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 60570 | -| policy_gradient_loss | -0.00872 | -| std | 0.232 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6059 | -| time_elapsed | 42432 | -| total_timesteps | 775552 | -| train/ | | -| approx_kl | 0.012666615 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.0438 | -| explained_variance | -0.748 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 60580 | -| policy_gradient_loss | -0.00302 | -| std | 0.231 | -| value_loss | 3.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6060 | -| time_elapsed | 42435 | -| total_timesteps | 775680 | -| train/ | | -| approx_kl | 0.00972268 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.0442 | -| explained_variance | -2.46 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 60590 | -| policy_gradient_loss | -0.000796 | -| std | 0.232 | -| value_loss | 1.31e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6061 | -| time_elapsed | 42438 | -| total_timesteps | 775808 | -| train/ | | -| approx_kl | 0.048908222 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 0.0416 | -| explained_variance | 0.325 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 60600 | -| policy_gradient_loss | -0.0145 | -| std | 0.232 | -| value_loss | 4.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.784 | -| time/ | | -| fps | 18 | -| iterations | 6062 | -| time_elapsed | 42442 | -| total_timesteps | 775936 | -| train/ | | -| approx_kl | 0.039473183 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.0403 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.0235 | -| n_updates | 60610 | -| policy_gradient_loss | -0.0175 | -| std | 0.233 | -| value_loss | 6.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6063 | -| time_elapsed | 42444 | -| total_timesteps | 776064 | -| train/ | | -| approx_kl | 0.0061906674 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.04 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | -0.000193 | -| n_updates | 60620 | -| policy_gradient_loss | -0.000289 | -| std | 0.232 | -| value_loss | 5.08e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6064 | -| time_elapsed | 42450 | -| total_timesteps | 776192 | -| train/ | | -| approx_kl | 0.0042979443 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.0408 | -| explained_variance | -3.92e+03 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 60630 | -| policy_gradient_loss | -0.0122 | -| std | 0.232 | -| value_loss | 0.000194 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6065 | -| time_elapsed | 42454 | -| total_timesteps | 776320 | -| train/ | | -| approx_kl | 0.029402414 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 0.0414 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 60640 | -| policy_gradient_loss | -0.0154 | -| std | 0.232 | -| value_loss | 5.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6066 | -| time_elapsed | 42458 | -| total_timesteps | 776448 | -| train/ | | -| approx_kl | 0.020484474 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.0417 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 60650 | -| policy_gradient_loss | -0.00669 | -| std | 0.232 | -| value_loss | 6.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6067 | -| time_elapsed | 42461 | -| total_timesteps | 776576 | -| train/ | | -| approx_kl | 0.017882098 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.0413 | -| explained_variance | -5.28 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 60660 | -| policy_gradient_loss | -0.00791 | -| std | 0.232 | -| value_loss | 2.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6068 | -| time_elapsed | 42465 | -| total_timesteps | 776704 | -| train/ | | -| approx_kl | 0.021577701 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.041 | -| explained_variance | -1.85 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 60670 | -| policy_gradient_loss | -0.00777 | -| std | 0.232 | -| value_loss | 3.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6069 | -| time_elapsed | 42469 | -| total_timesteps | 776832 | -| train/ | | -| approx_kl | 0.004638279 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.042 | -| explained_variance | -2.61 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 60680 | -| policy_gradient_loss | -0.000247 | -| std | 0.232 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.768 | -| time/ | | -| fps | 18 | -| iterations | 6070 | -| time_elapsed | 42473 | -| total_timesteps | 776960 | -| train/ | | -| approx_kl | 0.002514379 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.0454 | -| explained_variance | -8.71 | -| learning_rate | 0.0003 | -| loss | -0.000385 | -| n_updates | 60690 | -| policy_gradient_loss | -0.000203 | -| std | 0.231 | -| value_loss | 6.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6071 | -| time_elapsed | 42476 | -| total_timesteps | 777088 | -| train/ | | -| approx_kl | 0.015533738 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.0482 | -| explained_variance | -4.49 | -| learning_rate | 0.0003 | -| loss | -0.00849 | -| n_updates | 60700 | -| policy_gradient_loss | -0.00632 | -| std | 0.23 | -| value_loss | 1.64e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6072 | -| time_elapsed | 42483 | -| total_timesteps | 777216 | -| train/ | | -| approx_kl | 0.1678134 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.0488 | -| explained_variance | -5.35e+03 | -| learning_rate | 0.0003 | -| loss | -0.000265 | -| n_updates | 60710 | -| policy_gradient_loss | 0.000416 | -| std | 0.231 | -| value_loss | 0.000158 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6073 | -| time_elapsed | 42487 | -| total_timesteps | 777344 | -| train/ | | -| approx_kl | 0.024844006 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0471 | -| explained_variance | -6.06 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 60720 | -| policy_gradient_loss | -0.00759 | -| std | 0.231 | -| value_loss | 1.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6074 | -| time_elapsed | 42491 | -| total_timesteps | 777472 | -| train/ | | -| approx_kl | 0.015890932 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.0452 | -| explained_variance | -8.03 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 60730 | -| policy_gradient_loss | -0.00196 | -| std | 0.232 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6075 | -| time_elapsed | 42494 | -| total_timesteps | 777600 | -| train/ | | -| approx_kl | 0.0010441095 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.0442 | -| explained_variance | -9.92 | -| learning_rate | 0.0003 | -| loss | -0.000648 | -| n_updates | 60740 | -| policy_gradient_loss | -0.00027 | -| std | 0.231 | -| value_loss | 6.18e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6076 | -| time_elapsed | 42497 | -| total_timesteps | 777728 | -| train/ | | -| approx_kl | 0.014175103 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.047 | -| explained_variance | -9.19 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 60750 | -| policy_gradient_loss | -0.0034 | -| std | 0.23 | -| value_loss | 5.78e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6077 | -| time_elapsed | 42500 | -| total_timesteps | 777856 | -| train/ | | -| approx_kl | 0.02190494 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.0494 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 60760 | -| policy_gradient_loss | -0.00575 | -| std | 0.23 | -| value_loss | 4.73e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6078 | -| time_elapsed | 42502 | -| total_timesteps | 777984 | -| train/ | | -| approx_kl | 0.03278294 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 0.0499 | -| explained_variance | -5.64 | -| learning_rate | 0.0003 | -| loss | 0.00309 | -| n_updates | 60770 | -| policy_gradient_loss | -0.00236 | -| std | 0.23 | -| value_loss | 1.43e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6079 | -| time_elapsed | 42505 | -| total_timesteps | 778112 | -| train/ | | -| approx_kl | 0.006884757 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.0502 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.000255 | -| n_updates | 60780 | -| policy_gradient_loss | -8.47e-05 | -| std | 0.23 | -| value_loss | 1.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6080 | -| time_elapsed | 42515 | -| total_timesteps | 778240 | -| train/ | | -| approx_kl | 0.015188053 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.0508 | -| explained_variance | -6.78e+03 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 60790 | -| policy_gradient_loss | -0.00687 | -| std | 0.23 | -| value_loss | 0.000104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6081 | -| time_elapsed | 42519 | -| total_timesteps | 778368 | -| train/ | | -| approx_kl | 0.035294797 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.051 | -| explained_variance | -4.12 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 60800 | -| policy_gradient_loss | -0.00996 | -| std | 0.23 | -| value_loss | 4.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6082 | -| time_elapsed | 42522 | -| total_timesteps | 778496 | -| train/ | | -| approx_kl | 0.009210528 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 0.0496 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 60810 | -| policy_gradient_loss | -0.000583 | -| std | 0.231 | -| value_loss | 2.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6083 | -| time_elapsed | 42526 | -| total_timesteps | 778624 | -| train/ | | -| approx_kl | 0.015176649 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.0469 | -| explained_variance | -13.8 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 60820 | -| policy_gradient_loss | -0.00489 | -| std | 0.231 | -| value_loss | 1.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6084 | -| time_elapsed | 42529 | -| total_timesteps | 778752 | -| train/ | | -| approx_kl | 0.017130187 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.0456 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 60830 | -| policy_gradient_loss | -0.00409 | -| std | 0.231 | -| value_loss | 3.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.75 | -| time/ | | -| fps | 18 | -| iterations | 6085 | -| time_elapsed | 42532 | -| total_timesteps | 778880 | -| train/ | | -| approx_kl | 0.018281266 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0452 | -| explained_variance | -11.5 | -| learning_rate | 0.0003 | -| loss | -0.00443 | -| n_updates | 60840 | -| policy_gradient_loss | -0.004 | -| std | 0.231 | -| value_loss | 3.9e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6086 | -| time_elapsed | 42533 | -| total_timesteps | 779008 | -| train/ | | -| approx_kl | 0.0014925646 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0443 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.000224 | -| n_updates | 60850 | -| policy_gradient_loss | -6.93e-05 | -| std | 0.232 | -| value_loss | 2.52e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6087 | -| time_elapsed | 42542 | -| total_timesteps | 779136 | -| train/ | | -| approx_kl | 0.0119795045 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.0431 | -| explained_variance | -5.1e+03 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 60860 | -| policy_gradient_loss | -0.00807 | -| std | 0.232 | -| value_loss | 9.73e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6088 | -| time_elapsed | 42545 | -| total_timesteps | 779264 | -| train/ | | -| approx_kl | 0.13077495 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.0427 | -| explained_variance | -7.2 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 60870 | -| policy_gradient_loss | -0.0112 | -| std | 0.232 | -| value_loss | 5.95e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6089 | -| time_elapsed | 42549 | -| total_timesteps | 779392 | -| train/ | | -| approx_kl | 0.00051551964 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0427 | -| explained_variance | -3.71 | -| learning_rate | 0.0003 | -| loss | -9.93e-05 | -| n_updates | 60880 | -| policy_gradient_loss | -4.31e-05 | -| std | 0.232 | -| value_loss | 1.13e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6090 | -| time_elapsed | 42551 | -| total_timesteps | 779520 | -| train/ | | -| approx_kl | 0.0070753116 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.0423 | -| explained_variance | -4.11 | -| learning_rate | 0.0003 | -| loss | 0.000525 | -| n_updates | 60890 | -| policy_gradient_loss | 4.06e-05 | -| std | 0.232 | -| value_loss | 8.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6091 | -| time_elapsed | 42555 | -| total_timesteps | 779648 | -| train/ | | -| approx_kl | 0.007738346 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 0.0411 | -| explained_variance | -10.3 | -| learning_rate | 0.0003 | -| loss | -0.000933 | -| n_updates | 60900 | -| policy_gradient_loss | -0.000846 | -| std | 0.232 | -| value_loss | 7.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6092 | -| time_elapsed | 42559 | -| total_timesteps | 779776 | -| train/ | | -| approx_kl | 0.012454786 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.0406 | -| explained_variance | -8.5 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 60910 | -| policy_gradient_loss | 0.000484 | -| std | 0.232 | -| value_loss | 5.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.741 | -| time/ | | -| fps | 18 | -| iterations | 6093 | -| time_elapsed | 42562 | -| total_timesteps | 779904 | -| train/ | | -| approx_kl | 0.026411125 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.0422 | -| explained_variance | -5.46 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 60920 | -| policy_gradient_loss | -0.0106 | -| std | 0.232 | -| value_loss | 6.19e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6094 | -| time_elapsed | 42566 | -| total_timesteps | 780032 | -| train/ | | -| approx_kl | 0.007117633 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.0428 | -| explained_variance | -4.88 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 60930 | -| policy_gradient_loss | -0.00534 | -| std | 0.232 | -| value_loss | 1.22e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6095 | -| time_elapsed | 42573 | -| total_timesteps | 780160 | -| train/ | | -| approx_kl | 39.595863 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.044 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 60940 | -| policy_gradient_loss | 0.0845 | -| std | 0.231 | -| value_loss | 0.0195 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6096 | -| time_elapsed | 42576 | -| total_timesteps | 780288 | -| train/ | | -| approx_kl | 64.18245 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 0.0447 | -| explained_variance | -0.000761 | -| learning_rate | 0.0003 | -| loss | 0.492 | -| n_updates | 60950 | -| policy_gradient_loss | 0.258 | -| std | 0.231 | -| value_loss | 0.498 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6097 | -| time_elapsed | 42580 | -| total_timesteps | 780416 | -| train/ | | -| approx_kl | 0.018033646 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 0.0448 | -| explained_variance | 0.00614 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 60960 | -| policy_gradient_loss | -0.009 | -| std | 0.231 | -| value_loss | 0.00257 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6098 | -| time_elapsed | 42584 | -| total_timesteps | 780544 | -| train/ | | -| approx_kl | 0.017957801 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.0449 | -| explained_variance | -0.00914 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 60970 | -| policy_gradient_loss | -0.00237 | -| std | 0.231 | -| value_loss | 0.00195 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6099 | -| time_elapsed | 42586 | -| total_timesteps | 780672 | -| train/ | | -| approx_kl | 0.019213779 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.0452 | -| explained_variance | -0.00365 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 60980 | -| policy_gradient_loss | -0.00317 | -| std | 0.231 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6100 | -| time_elapsed | 42590 | -| total_timesteps | 780800 | -| train/ | | -| approx_kl | 0.0045125624 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.0459 | -| explained_variance | -0.00526 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 60990 | -| policy_gradient_loss | -0.000664 | -| std | 0.231 | -| value_loss | 0.000723 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6101 | -| time_elapsed | 42593 | -| total_timesteps | 780928 | -| train/ | | -| approx_kl | 0.009396207 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.0473 | -| explained_variance | -0.00996 | -| learning_rate | 0.0003 | -| loss | 0.00065 | -| n_updates | 61000 | -| policy_gradient_loss | -0.000186 | -| std | 0.23 | -| value_loss | 0.000482 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6102 | -| time_elapsed | 42596 | -| total_timesteps | 781056 | -| train/ | | -| approx_kl | 0.008302186 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.0497 | -| explained_variance | -0.00877 | -| learning_rate | 0.0003 | -| loss | -0.000567 | -| n_updates | 61010 | -| policy_gradient_loss | 0.000969 | -| std | 0.23 | -| value_loss | 0.000456 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6103 | -| time_elapsed | 42600 | -| total_timesteps | 781184 | -| train/ | | -| approx_kl | 12.744279 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.051 | -| explained_variance | 0.00889 | -| learning_rate | 0.0003 | -| loss | 0.211 | -| n_updates | 61020 | -| policy_gradient_loss | 0.166 | -| std | 0.23 | -| value_loss | 0.0237 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6104 | -| time_elapsed | 42603 | -| total_timesteps | 781312 | -| train/ | | -| approx_kl | 0.015434541 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 0.0512 | -| explained_variance | 0.00115 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 61030 | -| policy_gradient_loss | -0.00561 | -| std | 0.23 | -| value_loss | 0.00102 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6105 | -| time_elapsed | 42606 | -| total_timesteps | 781440 | -| train/ | | -| approx_kl | 0.010591381 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.051 | -| explained_variance | -0.00109 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 61040 | -| policy_gradient_loss | -0.00091 | -| std | 0.23 | -| value_loss | 0.000213 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6106 | -| time_elapsed | 42609 | -| total_timesteps | 781568 | -| train/ | | -| approx_kl | 0.022460647 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 0.0501 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.00191 | -| n_updates | 61050 | -| policy_gradient_loss | -0.00122 | -| std | 0.23 | -| value_loss | 0.000171 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6107 | -| time_elapsed | 42610 | -| total_timesteps | 781696 | -| train/ | | -| approx_kl | 0.003169661 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.0494 | -| explained_variance | -0.00739 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 61060 | -| policy_gradient_loss | -0.00171 | -| std | 0.23 | -| value_loss | 9.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6108 | -| time_elapsed | 42614 | -| total_timesteps | 781824 | -| train/ | | -| approx_kl | 0.013510425 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.049 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | -0.000907 | -| n_updates | 61070 | -| policy_gradient_loss | -0.000491 | -| std | 0.23 | -| value_loss | 7.4e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6109 | -| time_elapsed | 42618 | -| total_timesteps | 781952 | -| train/ | | -| approx_kl | 0.024516145 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.0496 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 61080 | -| policy_gradient_loss | -0.00472 | -| std | 0.23 | -| value_loss | 3.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6110 | -| time_elapsed | 42621 | -| total_timesteps | 782080 | -| train/ | | -| approx_kl | 0.014629878 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.0501 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 61090 | -| policy_gradient_loss | -0.00655 | -| std | 0.23 | -| value_loss | 1.77e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6111 | -| time_elapsed | 42627 | -| total_timesteps | 782208 | -| train/ | | -| approx_kl | 2.7482524 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.0504 | -| explained_variance | 0.0212 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 61100 | -| policy_gradient_loss | 0.0655 | -| std | 0.23 | -| value_loss | 0.00696 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6112 | -| time_elapsed | 42631 | -| total_timesteps | 782336 | -| train/ | | -| approx_kl | 0.005479171 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.0498 | -| explained_variance | 0.00408 | -| learning_rate | 0.0003 | -| loss | -0.000235 | -| n_updates | 61110 | -| policy_gradient_loss | -0.000128 | -| std | 0.23 | -| value_loss | 5.46e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6113 | -| time_elapsed | 42635 | -| total_timesteps | 782464 | -| train/ | | -| approx_kl | 0.0013757055 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0504 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.000392 | -| n_updates | 61120 | -| policy_gradient_loss | -0.00017 | -| std | 0.23 | -| value_loss | 2.26e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6114 | -| time_elapsed | 42637 | -| total_timesteps | 782592 | -| train/ | | -| approx_kl | 0.02987501 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.0546 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 61130 | -| policy_gradient_loss | -0.00771 | -| std | 0.229 | -| value_loss | 5.04e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6115 | -| time_elapsed | 42640 | -| total_timesteps | 782720 | -| train/ | | -| approx_kl | 0.0027068383 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.0582 | -| explained_variance | -0.00115 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 61140 | -| policy_gradient_loss | -0.00137 | -| std | 0.228 | -| value_loss | 1.2e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6116 | -| time_elapsed | 42644 | -| total_timesteps | 782848 | -| train/ | | -| approx_kl | 0.0062221973 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.0607 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.000846 | -| n_updates | 61150 | -| policy_gradient_loss | -0.000572 | -| std | 0.228 | -| value_loss | 6.68e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.762 | -| time/ | | -| fps | 18 | -| iterations | 6117 | -| time_elapsed | 42648 | -| total_timesteps | 782976 | -| train/ | | -| approx_kl | 0.03277707 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.062 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -0.00567 | -| n_updates | 61160 | -| policy_gradient_loss | -0.00861 | -| std | 0.227 | -| value_loss | 2.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6118 | -| time_elapsed | 42651 | -| total_timesteps | 783104 | -| train/ | | -| approx_kl | 0.020422533 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.0624 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 61170 | -| policy_gradient_loss | -0.00774 | -| std | 0.227 | -| value_loss | 1.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6119 | -| time_elapsed | 42661 | -| total_timesteps | 783232 | -| train/ | | -| approx_kl | 0.03675094 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 0.0628 | -| explained_variance | -5.89 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 61180 | -| policy_gradient_loss | -0.0136 | -| std | 0.227 | -| value_loss | 0.00013 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6120 | -| time_elapsed | 42664 | -| total_timesteps | 783360 | -| train/ | | -| approx_kl | 0.021765664 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.0628 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 61190 | -| policy_gradient_loss | -0.00468 | -| std | 0.227 | -| value_loss | 3.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6121 | -| time_elapsed | 42668 | -| total_timesteps | 783488 | -| train/ | | -| approx_kl | 0.008480882 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.0612 | -| explained_variance | -3.55 | -| learning_rate | 0.0003 | -| loss | 3.95e-06 | -| n_updates | 61200 | -| policy_gradient_loss | -0.000246 | -| std | 0.228 | -| value_loss | 2.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6122 | -| time_elapsed | 42671 | -| total_timesteps | 783616 | -| train/ | | -| approx_kl | 0.016252182 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.0586 | -| explained_variance | -2.51 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 61210 | -| policy_gradient_loss | -0.00354 | -| std | 0.228 | -| value_loss | 3.2e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6123 | -| time_elapsed | 42674 | -| total_timesteps | 783744 | -| train/ | | -| approx_kl | 0.0011570384 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0595 | -| explained_variance | -0.721 | -| learning_rate | 0.0003 | -| loss | -0.000998 | -| n_updates | 61220 | -| policy_gradient_loss | -0.00042 | -| std | 0.227 | -| value_loss | 1.62e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.751 | -| time/ | | -| fps | 18 | -| iterations | 6124 | -| time_elapsed | 42677 | -| total_timesteps | 783872 | -| train/ | | -| approx_kl | 0.005332253 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.0654 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 61230 | -| policy_gradient_loss | -0.000791 | -| std | 0.226 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6125 | -| time_elapsed | 42680 | -| total_timesteps | 784000 | -| train/ | | -| approx_kl | 0.009494001 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 0.069 | -| explained_variance | -0.0689 | -| learning_rate | 0.0003 | -| loss | 0.000636 | -| n_updates | 61240 | -| policy_gradient_loss | -0.000326 | -| std | 0.226 | -| value_loss | 1.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6126 | -| time_elapsed | 42683 | -| total_timesteps | 784128 | -| train/ | | -| approx_kl | 0.012598366 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.0698 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | -0.00591 | -| n_updates | 61250 | -| policy_gradient_loss | -0.00434 | -| std | 0.226 | -| value_loss | 1.61e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6127 | -| time_elapsed | 42690 | -| total_timesteps | 784256 | -| train/ | | -| approx_kl | 0.04576091 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.0696 | -| explained_variance | -518 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 61260 | -| policy_gradient_loss | -0.00526 | -| std | 0.226 | -| value_loss | 0.00012 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6128 | -| time_elapsed | 42694 | -| total_timesteps | 784384 | -| train/ | | -| approx_kl | 0.008698859 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.0693 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 61270 | -| policy_gradient_loss | -0.000804 | -| std | 0.226 | -| value_loss | 3.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6129 | -| time_elapsed | 42697 | -| total_timesteps | 784512 | -| train/ | | -| approx_kl | 0.012377594 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.0688 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 61280 | -| policy_gradient_loss | -0.00243 | -| std | 0.226 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6130 | -| time_elapsed | 42701 | -| total_timesteps | 784640 | -| train/ | | -| approx_kl | 0.0086118225 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.0686 | -| explained_variance | 0.0535 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 61290 | -| policy_gradient_loss | -0.00674 | -| std | 0.226 | -| value_loss | 0.00174 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6131 | -| time_elapsed | 42705 | -| total_timesteps | 784768 | -| train/ | | -| approx_kl | 0.019210879 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.0693 | -| explained_variance | 0.483 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 61300 | -| policy_gradient_loss | -0.00976 | -| std | 0.226 | -| value_loss | 5.8e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.74 | -| time/ | | -| fps | 18 | -| iterations | 6132 | -| time_elapsed | 42708 | -| total_timesteps | 784896 | -| train/ | | -| approx_kl | 0.01890824 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.0697 | -| explained_variance | 0.386 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 61310 | -| policy_gradient_loss | -0.0036 | -| std | 0.226 | -| value_loss | 4.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6133 | -| time_elapsed | 42711 | -| total_timesteps | 785024 | -| train/ | | -| approx_kl | 0.013906601 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.0699 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | 0.000484 | -| n_updates | 61320 | -| policy_gradient_loss | -0.000887 | -| std | 0.226 | -| value_loss | 3.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6134 | -| time_elapsed | 42720 | -| total_timesteps | 785152 | -| train/ | | -| approx_kl | 0.02638216 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0705 | -| explained_variance | -19 | -| learning_rate | 0.0003 | -| loss | -0.00713 | -| n_updates | 61330 | -| policy_gradient_loss | -0.00464 | -| std | 0.225 | -| value_loss | 0.000118 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6135 | -| time_elapsed | 42723 | -| total_timesteps | 785280 | -| train/ | | -| approx_kl | 0.005707875 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.0726 | -| explained_variance | -0.593 | -| learning_rate | 0.0003 | -| loss | -0.000507 | -| n_updates | 61340 | -| policy_gradient_loss | -0.000419 | -| std | 0.224 | -| value_loss | 1.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6136 | -| time_elapsed | 42726 | -| total_timesteps | 785408 | -| train/ | | -| approx_kl | 0.01535772 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.0768 | -| explained_variance | -0.654 | -| learning_rate | 0.0003 | -| loss | 0.00517 | -| n_updates | 61350 | -| policy_gradient_loss | 0.00283 | -| std | 0.224 | -| value_loss | 9.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6137 | -| time_elapsed | 42729 | -| total_timesteps | 785536 | -| train/ | | -| approx_kl | 0.011344878 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.0789 | -| explained_variance | -2.05 | -| learning_rate | 0.0003 | -| loss | -0.000373 | -| n_updates | 61360 | -| policy_gradient_loss | -0.00103 | -| std | 0.223 | -| value_loss | 1.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6138 | -| time_elapsed | 42732 | -| total_timesteps | 785664 | -| train/ | | -| approx_kl | 0.0054349434 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.0798 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 61370 | -| policy_gradient_loss | -0.00446 | -| std | 0.223 | -| value_loss | 7.48e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6139 | -| time_elapsed | 42735 | -| total_timesteps | 785792 | -| train/ | | -| approx_kl | 0.0059954775 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 0.0792 | -| explained_variance | 0.234 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 61380 | -| policy_gradient_loss | -0.000317 | -| std | 0.224 | -| value_loss | 3.48e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.733 | -| time/ | | -| fps | 18 | -| iterations | 6140 | -| time_elapsed | 42738 | -| total_timesteps | 785920 | -| train/ | | -| approx_kl | 0.012331614 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.076 | -| explained_variance | 0.298 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 61390 | -| policy_gradient_loss | -0.00219 | -| std | 0.225 | -| value_loss | 3.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6141 | -| time_elapsed | 42742 | -| total_timesteps | 786048 | -| train/ | | -| approx_kl | 0.016576998 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.0745 | -| explained_variance | -2.58 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 61400 | -| policy_gradient_loss | -0.0152 | -| std | 0.225 | -| value_loss | 9.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6142 | -| time_elapsed | 42748 | -| total_timesteps | 786176 | -| train/ | | -| approx_kl | 0.05929211 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 0.0736 | -| explained_variance | -86.4 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 61410 | -| policy_gradient_loss | -0.00287 | -| std | 0.225 | -| value_loss | 0.000106 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6143 | -| time_elapsed | 42751 | -| total_timesteps | 786304 | -| train/ | | -| approx_kl | 0.000608284 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.0723 | -| explained_variance | 0.476 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 61420 | -| policy_gradient_loss | 0.00289 | -| std | 0.225 | -| value_loss | 2.85e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6144 | -| time_elapsed | 42754 | -| total_timesteps | 786432 | -| train/ | | -| approx_kl | 0.02648396 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.0713 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 61430 | -| policy_gradient_loss | -0.0158 | -| std | 0.225 | -| value_loss | 1.19e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6145 | -| time_elapsed | 42758 | -| total_timesteps | 786560 | -| train/ | | -| approx_kl | 0.0084242895 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.0704 | -| explained_variance | -0.598 | -| learning_rate | 0.0003 | -| loss | 1.27e-05 | -| n_updates | 61440 | -| policy_gradient_loss | 0.000601 | -| std | 0.226 | -| value_loss | 6.13e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6146 | -| time_elapsed | 42761 | -| total_timesteps | 786688 | -| train/ | | -| approx_kl | 0.02237773 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.0697 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 61450 | -| policy_gradient_loss | 0.00016 | -| std | 0.226 | -| value_loss | 1.36e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6147 | -| time_elapsed | 42764 | -| total_timesteps | 786816 | -| train/ | | -| approx_kl | 0.01680173 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 0.0699 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 61460 | -| policy_gradient_loss | -0.00166 | -| std | 0.226 | -| value_loss | 2.06e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.724 | -| time/ | | -| fps | 18 | -| iterations | 6148 | -| time_elapsed | 42768 | -| total_timesteps | 786944 | -| train/ | | -| approx_kl | 0.0052708713 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 0.0711 | -| explained_variance | -4.61 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 61470 | -| policy_gradient_loss | 0.000197 | -| std | 0.225 | -| value_loss | 1.06e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6149 | -| time_elapsed | 42770 | -| total_timesteps | 787072 | -| train/ | | -| approx_kl | 0.013850289 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.0743 | -| explained_variance | 0.267 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 61480 | -| policy_gradient_loss | -0.0046 | -| std | 0.224 | -| value_loss | 1.96e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6150 | -| time_elapsed | 42776 | -| total_timesteps | 787200 | -| train/ | | -| approx_kl | 0.0019643302 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 0.076 | -| explained_variance | -584 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 61490 | -| policy_gradient_loss | 0.00189 | -| std | 0.224 | -| value_loss | 0.0001 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6151 | -| time_elapsed | 42778 | -| total_timesteps | 787328 | -| train/ | | -| approx_kl | 0.0072812443 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.0774 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 61500 | -| policy_gradient_loss | 0.00478 | -| std | 0.224 | -| value_loss | 5.11e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6152 | -| time_elapsed | 42780 | -| total_timesteps | 787456 | -| train/ | | -| approx_kl | 0.0111950915 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.0788 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 61510 | -| policy_gradient_loss | -0.000449 | -| std | 0.224 | -| value_loss | 1.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6153 | -| time_elapsed | 42784 | -| total_timesteps | 787584 | -| train/ | | -| approx_kl | 0.025168447 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 0.0794 | -| explained_variance | 0.0754 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 61520 | -| policy_gradient_loss | -0.0118 | -| std | 0.224 | -| value_loss | 8.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6154 | -| time_elapsed | 42787 | -| total_timesteps | 787712 | -| train/ | | -| approx_kl | 0.01562332 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.0793 | -| explained_variance | -2.14 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 61530 | -| policy_gradient_loss | -0.00967 | -| std | 0.223 | -| value_loss | 1.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6155 | -| time_elapsed | 42790 | -| total_timesteps | 787840 | -| train/ | | -| approx_kl | 0.030466102 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.0794 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 61540 | -| policy_gradient_loss | -0.00632 | -| std | 0.224 | -| value_loss | 4.95e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.718 | -| time/ | | -| fps | 18 | -| iterations | 6156 | -| time_elapsed | 42793 | -| total_timesteps | 787968 | -| train/ | | -| approx_kl | 0.0029745707 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.0789 | -| explained_variance | -0.665 | -| learning_rate | 0.0003 | -| loss | -0.000214 | -| n_updates | 61550 | -| policy_gradient_loss | 3.22e-05 | -| std | 0.224 | -| value_loss | 3e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6157 | -| time_elapsed | 42797 | -| total_timesteps | 788096 | -| train/ | | -| approx_kl | 0.014153515 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.0785 | -| explained_variance | -2.11 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 61560 | -| policy_gradient_loss | -0.00253 | -| std | 0.224 | -| value_loss | 1.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6158 | -| time_elapsed | 42805 | -| total_timesteps | 788224 | -| train/ | | -| approx_kl | 0.069005206 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 0.079 | -| explained_variance | -60.7 | -| learning_rate | 0.0003 | -| loss | -0.00738 | -| n_updates | 61570 | -| policy_gradient_loss | -0.00527 | -| std | 0.224 | -| value_loss | 9.98e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6159 | -| time_elapsed | 42808 | -| total_timesteps | 788352 | -| train/ | | -| approx_kl | 0.0075977463 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 0.0787 | -| explained_variance | -0.408 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 61580 | -| policy_gradient_loss | -0.000593 | -| std | 0.224 | -| value_loss | 1.33e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6160 | -| time_elapsed | 42810 | -| total_timesteps | 788480 | -| train/ | | -| approx_kl | 0.02940305 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 0.0781 | -| explained_variance | -0.426 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 61590 | -| policy_gradient_loss | -0.00741 | -| std | 0.224 | -| value_loss | 1.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6161 | -| time_elapsed | 42813 | -| total_timesteps | 788608 | -| train/ | | -| approx_kl | 0.01779105 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.0785 | -| explained_variance | -1.97 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 61600 | -| policy_gradient_loss | -0.00657 | -| std | 0.224 | -| value_loss | 1.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6162 | -| time_elapsed | 42817 | -| total_timesteps | 788736 | -| train/ | | -| approx_kl | 0.014637165 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.0782 | -| explained_variance | -3.24 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 61610 | -| policy_gradient_loss | -0.00192 | -| std | 0.224 | -| value_loss | 9.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6163 | -| time_elapsed | 42820 | -| total_timesteps | 788864 | -| train/ | | -| approx_kl | 0.023756372 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.0774 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 61620 | -| policy_gradient_loss | -0.00155 | -| std | 0.224 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.716 | -| time/ | | -| fps | 18 | -| iterations | 6164 | -| time_elapsed | 42824 | -| total_timesteps | 788992 | -| train/ | | -| approx_kl | 0.025140611 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.0766 | -| explained_variance | 0.317 | -| learning_rate | 0.0003 | -| loss | -0.00591 | -| n_updates | 61630 | -| policy_gradient_loss | -0.00575 | -| std | 0.224 | -| value_loss | 2.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6165 | -| time_elapsed | 42826 | -| total_timesteps | 789120 | -| train/ | | -| approx_kl | 0.00570716 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | 0.0767 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.000293 | -| n_updates | 61640 | -| policy_gradient_loss | -0.000304 | -| std | 0.224 | -| value_loss | 2.08e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6166 | -| time_elapsed | 42834 | -| total_timesteps | 789248 | -| train/ | | -| approx_kl | 0.046476793 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.0791 | -| explained_variance | -82.4 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 61650 | -| policy_gradient_loss | -0.00812 | -| std | 0.223 | -| value_loss | 9.4e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6167 | -| time_elapsed | 42837 | -| total_timesteps | 789376 | -| train/ | | -| approx_kl | 0.030277506 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.0802 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 61660 | -| policy_gradient_loss | -0.00921 | -| std | 0.223 | -| value_loss | 7.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6168 | -| time_elapsed | 42840 | -| total_timesteps | 789504 | -| train/ | | -| approx_kl | 0.012435699 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 0.0798 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 61670 | -| policy_gradient_loss | -0.00273 | -| std | 0.223 | -| value_loss | 1.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6169 | -| time_elapsed | 42842 | -| total_timesteps | 789632 | -| train/ | | -| approx_kl | 0.007765089 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.0795 | -| explained_variance | -3.54 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 61680 | -| policy_gradient_loss | -0.000864 | -| std | 0.224 | -| value_loss | 4.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6170 | -| time_elapsed | 42846 | -| total_timesteps | 789760 | -| train/ | | -| approx_kl | 0.0023491331 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 0.0795 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.000402 | -| n_updates | 61690 | -| policy_gradient_loss | 6.59e-05 | -| std | 0.223 | -| value_loss | 3.85e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.71 | -| time/ | | -| fps | 18 | -| iterations | 6171 | -| time_elapsed | 42850 | -| total_timesteps | 789888 | -| train/ | | -| approx_kl | 0.011474957 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.0796 | -| explained_variance | -3.34 | -| learning_rate | 0.0003 | -| loss | 0.000994 | -| n_updates | 61700 | -| policy_gradient_loss | 0.00014 | -| std | 0.224 | -| value_loss | 1.92e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6172 | -| time_elapsed | 42853 | -| total_timesteps | 790016 | -| train/ | | -| approx_kl | 0.014850523 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.0779 | -| explained_variance | -0.787 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 61710 | -| policy_gradient_loss | -0.00364 | -| std | 0.224 | -| value_loss | 5.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6173 | -| time_elapsed | 42863 | -| total_timesteps | 790144 | -| train/ | | -| approx_kl | 0.061860017 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 0.0772 | -| explained_variance | -543 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 61720 | -| policy_gradient_loss | -0.0134 | -| std | 0.224 | -| value_loss | 9.05e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6174 | -| time_elapsed | 42867 | -| total_timesteps | 790272 | -| train/ | | -| approx_kl | 0.005670905 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.0772 | -| explained_variance | -0.272 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 61730 | -| policy_gradient_loss | -0.00373 | -| std | 0.224 | -| value_loss | 1.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6175 | -| time_elapsed | 42870 | -| total_timesteps | 790400 | -| train/ | | -| approx_kl | 0.004527908 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | 0.0782 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | -0.000444 | -| n_updates | 61740 | -| policy_gradient_loss | -0.000171 | -| std | 0.223 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6176 | -| time_elapsed | 42873 | -| total_timesteps | 790528 | -| train/ | | -| approx_kl | 0.015128186 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.081 | -| explained_variance | -0.602 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 61750 | -| policy_gradient_loss | -0.00596 | -| std | 0.223 | -| value_loss | 8.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6177 | -| time_elapsed | 42876 | -| total_timesteps | 790656 | -| train/ | | -| approx_kl | 0.023096584 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.0818 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 61760 | -| policy_gradient_loss | -0.00396 | -| std | 0.223 | -| value_loss | 3.55e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6178 | -| time_elapsed | 42880 | -| total_timesteps | 790784 | -| train/ | | -| approx_kl | 0.0045437166 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.0811 | -| explained_variance | 0.262 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 61770 | -| policy_gradient_loss | -0.00272 | -| std | 0.223 | -| value_loss | 1.43e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.702 | -| time/ | | -| fps | 18 | -| iterations | 6179 | -| time_elapsed | 42883 | -| total_timesteps | 790912 | -| train/ | | -| approx_kl | 0.0109660765 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.0809 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 61780 | -| policy_gradient_loss | -0.00768 | -| std | 0.223 | -| value_loss | 8.54e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6180 | -| time_elapsed | 42886 | -| total_timesteps | 791040 | -| train/ | | -| approx_kl | 0.011082057 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.0801 | -| explained_variance | 0.13 | -| learning_rate | 0.0003 | -| loss | 0.000749 | -| n_updates | 61790 | -| policy_gradient_loss | -0.000158 | -| std | 0.224 | -| value_loss | 3.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6181 | -| time_elapsed | 42892 | -| total_timesteps | 791168 | -| train/ | | -| approx_kl | 0.016180394 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.0782 | -| explained_variance | -72.9 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 61800 | -| policy_gradient_loss | -0.0165 | -| std | 0.224 | -| value_loss | 9.03e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6182 | -| time_elapsed | 42895 | -| total_timesteps | 791296 | -| train/ | | -| approx_kl | 0.00924281 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.0781 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.000718 | -| n_updates | 61810 | -| policy_gradient_loss | 0.000769 | -| std | 0.224 | -| value_loss | 1.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6183 | -| time_elapsed | 42899 | -| total_timesteps | 791424 | -| train/ | | -| approx_kl | 0.00718478 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.079 | -| explained_variance | -0.549 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 61820 | -| policy_gradient_loss | 0.000831 | -| std | 0.223 | -| value_loss | 2.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6184 | -| time_elapsed | 42902 | -| total_timesteps | 791552 | -| train/ | | -| approx_kl | 0.004348707 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.081 | -| explained_variance | -3.56 | -| learning_rate | 0.0003 | -| loss | -0.000381 | -| n_updates | 61830 | -| policy_gradient_loss | 0.00252 | -| std | 0.223 | -| value_loss | 2.98e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6185 | -| time_elapsed | 42905 | -| total_timesteps | 791680 | -| train/ | | -| approx_kl | 0.0008964981 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0847 | -| explained_variance | -0.578 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 61840 | -| policy_gradient_loss | -0.000317 | -| std | 0.221 | -| value_loss | 1.23e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6186 | -| time_elapsed | 42908 | -| total_timesteps | 791808 | -| train/ | | -| approx_kl | 0.01990246 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 0.091 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 61850 | -| policy_gradient_loss | -0.00792 | -| std | 0.22 | -| value_loss | 4.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.688 | -| time/ | | -| fps | 18 | -| iterations | 6187 | -| time_elapsed | 42912 | -| total_timesteps | 791936 | -| train/ | | -| approx_kl | 0.009440163 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 0.0943 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | 0.000921 | -| n_updates | 61860 | -| policy_gradient_loss | -0.000344 | -| std | 0.22 | -| value_loss | 3.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6188 | -| time_elapsed | 42915 | -| total_timesteps | 792064 | -| train/ | | -| approx_kl | 0.009833999 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.0956 | -| explained_variance | -4.22 | -| learning_rate | 0.0003 | -| loss | 0.000468 | -| n_updates | 61870 | -| policy_gradient_loss | -1.15e-05 | -| std | 0.22 | -| value_loss | 2.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6189 | -| time_elapsed | 42922 | -| total_timesteps | 792192 | -| train/ | | -| approx_kl | 0.016054586 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.0947 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 61880 | -| policy_gradient_loss | -0.0119 | -| std | 0.22 | -| value_loss | 8.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6190 | -| time_elapsed | 42924 | -| total_timesteps | 792320 | -| train/ | | -| approx_kl | 0.013941035 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.0946 | -| explained_variance | -5.51 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 61890 | -| policy_gradient_loss | -0.00619 | -| std | 0.22 | -| value_loss | 5.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6191 | -| time_elapsed | 42927 | -| total_timesteps | 792448 | -| train/ | | -| approx_kl | 0.011167716 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.0941 | -| explained_variance | -0.596 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 61900 | -| policy_gradient_loss | -0.0011 | -| std | 0.22 | -| value_loss | 3.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6192 | -| time_elapsed | 42932 | -| total_timesteps | 792576 | -| train/ | | -| approx_kl | 0.01838605 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.0929 | -| explained_variance | -0.756 | -| learning_rate | 0.0003 | -| loss | -0.0259 | -| n_updates | 61910 | -| policy_gradient_loss | -0.0095 | -| std | 0.221 | -| value_loss | 4.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6193 | -| time_elapsed | 42935 | -| total_timesteps | 792704 | -| train/ | | -| approx_kl | 0.009186698 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.0914 | -| explained_variance | 0.271 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 61920 | -| policy_gradient_loss | 0.000141 | -| std | 0.221 | -| value_loss | 5.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6194 | -| time_elapsed | 42938 | -| total_timesteps | 792832 | -| train/ | | -| approx_kl | 0.008414067 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.0892 | -| explained_variance | -14.9 | -| learning_rate | 0.0003 | -| loss | -0.00636 | -| n_updates | 61930 | -| policy_gradient_loss | -0.00452 | -| std | 0.221 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.685 | -| time/ | | -| fps | 18 | -| iterations | 6195 | -| time_elapsed | 42942 | -| total_timesteps | 792960 | -| train/ | | -| approx_kl | 0.012240801 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.0887 | -| explained_variance | -0.00896 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 61940 | -| policy_gradient_loss | -0.00305 | -| std | 0.221 | -| value_loss | 4.4e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6196 | -| time_elapsed | 42945 | -| total_timesteps | 793088 | -| train/ | | -| approx_kl | 0.0012390222 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.0888 | -| explained_variance | -0.66 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 61950 | -| policy_gradient_loss | 0.000817 | -| std | 0.221 | -| value_loss | 9.36e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6197 | -| time_elapsed | 42950 | -| total_timesteps | 793216 | -| train/ | | -| approx_kl | 0.010309548 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 0.0897 | -| explained_variance | -39.8 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 61960 | -| policy_gradient_loss | -0.00922 | -| std | 0.221 | -| value_loss | 8.61e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6198 | -| time_elapsed | 42954 | -| total_timesteps | 793344 | -| train/ | | -| approx_kl | 0.008663851 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.0896 | -| explained_variance | -3.94 | -| learning_rate | 0.0003 | -| loss | 0.000864 | -| n_updates | 61970 | -| policy_gradient_loss | 0.00157 | -| std | 0.221 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6199 | -| time_elapsed | 42957 | -| total_timesteps | 793472 | -| train/ | | -| approx_kl | 0.010610904 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.0892 | -| explained_variance | -0.538 | -| learning_rate | 0.0003 | -| loss | -0.000691 | -| n_updates | 61980 | -| policy_gradient_loss | -0.000635 | -| std | 0.221 | -| value_loss | 3.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6200 | -| time_elapsed | 42960 | -| total_timesteps | 793600 | -| train/ | | -| approx_kl | 0.007815627 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.09 | -| explained_variance | -0.946 | -| learning_rate | 0.0003 | -| loss | -0.000389 | -| n_updates | 61990 | -| policy_gradient_loss | 0.000547 | -| std | 0.221 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6201 | -| time_elapsed | 42964 | -| total_timesteps | 793728 | -| train/ | | -| approx_kl | 0.015718007 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.0909 | -| explained_variance | -4.02 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 62000 | -| policy_gradient_loss | -0.00196 | -| std | 0.221 | -| value_loss | 5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6202 | -| time_elapsed | 42967 | -| total_timesteps | 793856 | -| train/ | | -| approx_kl | 0.013011074 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.0916 | -| explained_variance | -1.43 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 62010 | -| policy_gradient_loss | -0.00208 | -| std | 0.221 | -| value_loss | 2.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.676 | -| time/ | | -| fps | 18 | -| iterations | 6203 | -| time_elapsed | 42970 | -| total_timesteps | 793984 | -| train/ | | -| approx_kl | 0.007812753 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.091 | -| explained_variance | -2.2 | -| learning_rate | 0.0003 | -| loss | 0.00062 | -| n_updates | 62020 | -| policy_gradient_loss | -0.000191 | -| std | 0.221 | -| value_loss | 2.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6204 | -| time_elapsed | 42973 | -| total_timesteps | 794112 | -| train/ | | -| approx_kl | 0.026532106 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.0888 | -| explained_variance | -0.972 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 62030 | -| policy_gradient_loss | -0.00943 | -| std | 0.222 | -| value_loss | 1.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6205 | -| time_elapsed | 42980 | -| total_timesteps | 794240 | -| train/ | | -| approx_kl | 0.037298296 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.0878 | -| explained_variance | -210 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 62040 | -| policy_gradient_loss | -0.00489 | -| std | 0.222 | -| value_loss | 7.79e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6206 | -| time_elapsed | 42984 | -| total_timesteps | 794368 | -| train/ | | -| approx_kl | 0.015364994 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.087 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 62050 | -| policy_gradient_loss | -0.00696 | -| std | 0.222 | -| value_loss | 8.82e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6207 | -| time_elapsed | 42987 | -| total_timesteps | 794496 | -| train/ | | -| approx_kl | 0.0036754995 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.0881 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 62060 | -| policy_gradient_loss | -0.000799 | -| std | 0.221 | -| value_loss | 1.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6208 | -| time_elapsed | 42991 | -| total_timesteps | 794624 | -| train/ | | -| approx_kl | 0.016762812 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.0913 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 62070 | -| policy_gradient_loss | -0.00609 | -| std | 0.221 | -| value_loss | 2.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6209 | -| time_elapsed | 42995 | -| total_timesteps | 794752 | -| train/ | | -| approx_kl | 0.0079151075 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.0937 | -| explained_variance | -2.94 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 62080 | -| policy_gradient_loss | 0.000525 | -| std | 0.22 | -| value_loss | 2.71e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.67 | -| time/ | | -| fps | 18 | -| iterations | 6210 | -| time_elapsed | 42999 | -| total_timesteps | 794880 | -| train/ | | -| approx_kl | 0.006914344 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.0953 | -| explained_variance | 0.0662 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 62090 | -| policy_gradient_loss | -0.00111 | -| std | 0.22 | -| value_loss | 3.45e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6211 | -| time_elapsed | 43003 | -| total_timesteps | 795008 | -| train/ | | -| approx_kl | 0.01970151 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.0954 | -| explained_variance | -2.4 | -| learning_rate | 0.0003 | -| loss | -0.00635 | -| n_updates | 62100 | -| policy_gradient_loss | -0.00647 | -| std | 0.22 | -| value_loss | 1.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6212 | -| time_elapsed | 43013 | -| total_timesteps | 795136 | -| train/ | | -| approx_kl | 0.040410843 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.0951 | -| explained_variance | -281 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 62110 | -| policy_gradient_loss | -0.00586 | -| std | 0.22 | -| value_loss | 7.71e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6213 | -| time_elapsed | 43017 | -| total_timesteps | 795264 | -| train/ | | -| approx_kl | 0.0070479466 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.0947 | -| explained_variance | -0.911 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 62120 | -| policy_gradient_loss | -0.00237 | -| std | 0.22 | -| value_loss | 7.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6214 | -| time_elapsed | 43021 | -| total_timesteps | 795392 | -| train/ | | -| approx_kl | 0.010306023 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.0944 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.032 | -| n_updates | 62130 | -| policy_gradient_loss | -0.00637 | -| std | 0.22 | -| value_loss | 1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6215 | -| time_elapsed | 43025 | -| total_timesteps | 795520 | -| train/ | | -| approx_kl | 0.0011579827 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.094 | -| explained_variance | -2.66 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 62140 | -| policy_gradient_loss | 0.0014 | -| std | 0.22 | -| value_loss | 1.14e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6216 | -| time_elapsed | 43028 | -| total_timesteps | 795648 | -| train/ | | -| approx_kl | 0.009039959 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.0931 | -| explained_variance | -2.61 | -| learning_rate | 0.0003 | -| loss | -0.00516 | -| n_updates | 62150 | -| policy_gradient_loss | -0.00325 | -| std | 0.221 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6217 | -| time_elapsed | 43031 | -| total_timesteps | 795776 | -| train/ | | -| approx_kl | 0.0143200345 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 0.0924 | -| explained_variance | -0.83 | -| learning_rate | 0.0003 | -| loss | -0.00405 | -| n_updates | 62160 | -| policy_gradient_loss | -0.00279 | -| std | 0.221 | -| value_loss | 8.89e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.669 | -| time/ | | -| fps | 18 | -| iterations | 6218 | -| time_elapsed | 43035 | -| total_timesteps | 795904 | -| train/ | | -| approx_kl | 0.0050210273 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.0916 | -| explained_variance | -4.48 | -| learning_rate | 0.0003 | -| loss | -0.000993 | -| n_updates | 62170 | -| policy_gradient_loss | -0.000283 | -| std | 0.221 | -| value_loss | 2.18e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6219 | -| time_elapsed | 43038 | -| total_timesteps | 796032 | -| train/ | | -| approx_kl | 0.000513501 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0919 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | -0.000257 | -| n_updates | 62180 | -| policy_gradient_loss | 9.05e-05 | -| std | 0.22 | -| value_loss | 7.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6220 | -| time_elapsed | 43044 | -| total_timesteps | 796160 | -| train/ | | -| approx_kl | 0.013273492 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.0933 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 62190 | -| policy_gradient_loss | -0.000851 | -| std | 0.22 | -| value_loss | 7.5e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6221 | -| time_elapsed | 43047 | -| total_timesteps | 796288 | -| train/ | | -| approx_kl | 0.017962 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 0.0927 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 62200 | -| policy_gradient_loss | -0.00476 | -| std | 0.221 | -| value_loss | 7.99e-07 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6222 | -| time_elapsed | 43050 | -| total_timesteps | 796416 | -| train/ | | -| approx_kl | 0.0032484261 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.0927 | -| explained_variance | -2.42 | -| learning_rate | 0.0003 | -| loss | -5.21e-06 | -| n_updates | 62210 | -| policy_gradient_loss | 1.08e-05 | -| std | 0.22 | -| value_loss | 2.74e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6223 | -| time_elapsed | 43052 | -| total_timesteps | 796544 | -| train/ | | -| approx_kl | 0.00489212 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 0.0929 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 62220 | -| policy_gradient_loss | -0.00314 | -| std | 0.221 | -| value_loss | 3.21e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6224 | -| time_elapsed | 43055 | -| total_timesteps | 796672 | -| train/ | | -| approx_kl | 0.027689165 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.0926 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 62230 | -| policy_gradient_loss | -0.00685 | -| std | 0.221 | -| value_loss | 6.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6225 | -| time_elapsed | 43057 | -| total_timesteps | 796800 | -| train/ | | -| approx_kl | 0.018821843 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.0924 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 62240 | -| policy_gradient_loss | -0.00679 | -| std | 0.221 | -| value_loss | 0.00102 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.659 | -| time/ | | -| fps | 18 | -| iterations | 6226 | -| time_elapsed | 43058 | -| total_timesteps | 796928 | -| train/ | | -| approx_kl | 0.006075917 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.0924 | -| explained_variance | -0.593 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 62250 | -| policy_gradient_loss | -0.00211 | -| std | 0.221 | -| value_loss | 2.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6227 | -| time_elapsed | 43060 | -| total_timesteps | 797056 | -| train/ | | -| approx_kl | 0.023744695 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.0928 | -| explained_variance | 0.563 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 62260 | -| policy_gradient_loss | -0.0158 | -| std | 0.22 | -| value_loss | 5.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6228 | -| time_elapsed | 43064 | -| total_timesteps | 797184 | -| train/ | | -| approx_kl | 0.038343366 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 0.093 | -| explained_variance | -4.76 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 62270 | -| policy_gradient_loss | -0.00576 | -| std | 0.22 | -| value_loss | 8.14e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6229 | -| time_elapsed | 43068 | -| total_timesteps | 797312 | -| train/ | | -| approx_kl | 0.018373128 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.0928 | -| explained_variance | -0.742 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 62280 | -| policy_gradient_loss | -0.00446 | -| std | 0.221 | -| value_loss | 1.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6230 | -| time_elapsed | 43071 | -| total_timesteps | 797440 | -| train/ | | -| approx_kl | 0.0036958898 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.0914 | -| explained_variance | -0.0752 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 62290 | -| policy_gradient_loss | -0.0012 | -| std | 0.221 | -| value_loss | 2.82e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6231 | -| time_elapsed | 43074 | -| total_timesteps | 797568 | -| train/ | | -| approx_kl | 0.01094142 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.0897 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 62300 | -| policy_gradient_loss | -0.00139 | -| std | 0.221 | -| value_loss | 4.43e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6232 | -| time_elapsed | 43078 | -| total_timesteps | 797696 | -| train/ | | -| approx_kl | 0.0076367636 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.0887 | -| explained_variance | 0.0262 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 62310 | -| policy_gradient_loss | -0.0048 | -| std | 0.221 | -| value_loss | 0.00639 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6233 | -| time_elapsed | 43080 | -| total_timesteps | 797824 | -| train/ | | -| approx_kl | 0.012503022 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.0885 | -| explained_variance | 0.00332 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 62320 | -| policy_gradient_loss | -0.00296 | -| std | 0.221 | -| value_loss | 9.21e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.658 | -| time/ | | -| fps | 18 | -| iterations | 6234 | -| time_elapsed | 43081 | -| total_timesteps | 797952 | -| train/ | | -| approx_kl | 0.017007202 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.0888 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 62330 | -| policy_gradient_loss | -0.00258 | -| std | 0.221 | -| value_loss | 3.34e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6235 | -| time_elapsed | 43084 | -| total_timesteps | 798080 | -| train/ | | -| approx_kl | 0.010168938 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.0889 | -| explained_variance | 0.244 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 62340 | -| policy_gradient_loss | -0.00166 | -| std | 0.221 | -| value_loss | 2.15e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6236 | -| time_elapsed | 43088 | -| total_timesteps | 798208 | -| train/ | | -| approx_kl | 0.000670312 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 0.0889 | -| explained_variance | -0.742 | -| learning_rate | 0.0003 | -| loss | -0.000117 | -| n_updates | 62350 | -| policy_gradient_loss | 0.000278 | -| std | 0.221 | -| value_loss | 0.000184 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6237 | -| time_elapsed | 43090 | -| total_timesteps | 798336 | -| train/ | | -| approx_kl | 0.0054339035 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 0.0879 | -| explained_variance | -0.553 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 62360 | -| policy_gradient_loss | -0.0015 | -| std | 0.222 | -| value_loss | 0.000132 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6238 | -| time_elapsed | 43093 | -| total_timesteps | 798464 | -| train/ | | -| approx_kl | 0.011946093 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.0867 | -| explained_variance | 0.429 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 62370 | -| policy_gradient_loss | -0.0125 | -| std | 0.222 | -| value_loss | 4.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6239 | -| time_elapsed | 43095 | -| total_timesteps | 798592 | -| train/ | | -| approx_kl | 0.019288708 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.0862 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 62380 | -| policy_gradient_loss | -0.00219 | -| std | 0.222 | -| value_loss | 1.53e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6240 | -| time_elapsed | 43098 | -| total_timesteps | 798720 | -| train/ | | -| approx_kl | 0.015958715 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.0852 | -| explained_variance | 0.323 | -| learning_rate | 0.0003 | -| loss | -0.00947 | -| n_updates | 62390 | -| policy_gradient_loss | -0.00461 | -| std | 0.222 | -| value_loss | 6.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6241 | -| time_elapsed | 43101 | -| total_timesteps | 798848 | -| train/ | | -| approx_kl | 0.008432432 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.0849 | -| explained_variance | 0.0983 | -| learning_rate | 0.0003 | -| loss | 0.0027 | -| n_updates | 62400 | -| policy_gradient_loss | 0.000217 | -| std | 0.222 | -| value_loss | 4.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.651 | -| time/ | | -| fps | 18 | -| iterations | 6242 | -| time_elapsed | 43105 | -| total_timesteps | 798976 | -| train/ | | -| approx_kl | 0.004114446 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 0.0866 | -| explained_variance | -6.33 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 62410 | -| policy_gradient_loss | -0.00233 | -| std | 0.222 | -| value_loss | 1.89e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6243 | -| time_elapsed | 43109 | -| total_timesteps | 799104 | -| train/ | | -| approx_kl | 0.0106479395 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.0882 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 62420 | -| policy_gradient_loss | -0.00182 | -| std | 0.221 | -| value_loss | 1.73e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6244 | -| time_elapsed | 43117 | -| total_timesteps | 799232 | -| train/ | | -| approx_kl | 0.015573369 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 0.0892 | -| explained_variance | -56.6 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 62430 | -| policy_gradient_loss | -0.000841 | -| std | 0.221 | -| value_loss | 6.17e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6245 | -| time_elapsed | 43121 | -| total_timesteps | 799360 | -| train/ | | -| approx_kl | 0.0162262 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 0.0885 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 62440 | -| policy_gradient_loss | 0.000348 | -| std | 0.221 | -| value_loss | 2.35e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6246 | -| time_elapsed | 43126 | -| total_timesteps | 799488 | -| train/ | | -| approx_kl | 0.013593245 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.0889 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | 0.000721 | -| n_updates | 62450 | -| policy_gradient_loss | -0.000624 | -| std | 0.221 | -| value_loss | 1.91e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6247 | -| time_elapsed | 43128 | -| total_timesteps | 799616 | -| train/ | | -| approx_kl | 0.03198801 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.0907 | -| explained_variance | 0.0266 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 62460 | -| policy_gradient_loss | -0.0158 | -| std | 0.221 | -| value_loss | 0.000285 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6248 | -| time_elapsed | 43133 | -| total_timesteps | 799744 | -| train/ | | -| approx_kl | 0.011630025 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.0918 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | 0.000539 | -| n_updates | 62470 | -| policy_gradient_loss | -0.001 | -| std | 0.221 | -| value_loss | 3.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6249 | -| time_elapsed | 43138 | -| total_timesteps | 799872 | -| train/ | | -| approx_kl | 0.014231949 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.0929 | -| explained_variance | -0.46 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 62480 | -| policy_gradient_loss | -0.000511 | -| std | 0.22 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6250 | -| time_elapsed | 43141 | -| total_timesteps | 800000 | -| train/ | | -| approx_kl | 0.034966365 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 0.0942 | -| explained_variance | -0.0796 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 62490 | -| policy_gradient_loss | -0.0153 | -| std | 0.22 | -| value_loss | 0.00013 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6251 | -| time_elapsed | 43145 | -| total_timesteps | 800128 | -| train/ | | -| approx_kl | 0.005931938 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.0938 | -| explained_variance | 0.00661 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 62500 | -| policy_gradient_loss | 0.00114 | -| std | 0.22 | -| value_loss | 0.00019 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6252 | -| time_elapsed | 43153 | -| total_timesteps | 800256 | -| train/ | | -| approx_kl | 0.010225823 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.0923 | -| explained_variance | -0.000986 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 62510 | -| policy_gradient_loss | -0.00418 | -| std | 0.221 | -| value_loss | 0.0069 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6253 | -| time_elapsed | 43157 | -| total_timesteps | 800384 | -| train/ | | -| approx_kl | 0.0064422954 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.0915 | -| explained_variance | 0.000144 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 62520 | -| policy_gradient_loss | -0.002 | -| std | 0.221 | -| value_loss | 0.00195 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6254 | -| time_elapsed | 43160 | -| total_timesteps | 800512 | -| train/ | | -| approx_kl | 0.011785222 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 0.0908 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 62530 | -| policy_gradient_loss | -0.00273 | -| std | 0.221 | -| value_loss | 0.000189 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6255 | -| time_elapsed | 43163 | -| total_timesteps | 800640 | -| train/ | | -| approx_kl | 0.023938335 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.0894 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 62540 | -| policy_gradient_loss | -0.0122 | -| std | 0.221 | -| value_loss | 6.88e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6256 | -| time_elapsed | 43167 | -| total_timesteps | 800768 | -| train/ | | -| approx_kl | 0.016686922 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.0884 | -| explained_variance | 0.00393 | -| learning_rate | 0.0003 | -| loss | 0.0647 | -| n_updates | 62550 | -| policy_gradient_loss | -0.00915 | -| std | 0.222 | -| value_loss | 0.204 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.638 | -| time/ | | -| fps | 18 | -| iterations | 6257 | -| time_elapsed | 43170 | -| total_timesteps | 800896 | -| train/ | | -| approx_kl | 0.016354643 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.0877 | -| explained_variance | -0.00186 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 62560 | -| policy_gradient_loss | -0.00742 | -| std | 0.222 | -| value_loss | 0.0128 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6258 | -| time_elapsed | 43173 | -| total_timesteps | 801024 | -| train/ | | -| approx_kl | 0.026300259 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.087 | -| explained_variance | -0.00368 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 62570 | -| policy_gradient_loss | -0.0103 | -| std | 0.222 | -| value_loss | 0.00633 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6259 | -| time_elapsed | 43181 | -| total_timesteps | 801152 | -| train/ | | -| approx_kl | 0.013944444 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.0872 | -| explained_variance | -0.000115 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 62580 | -| policy_gradient_loss | -0.00519 | -| std | 0.222 | -| value_loss | 0.178 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6260 | -| time_elapsed | 43183 | -| total_timesteps | 801280 | -| train/ | | -| approx_kl | 0.0020196838 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 0.0875 | -| explained_variance | -0.00564 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 62590 | -| policy_gradient_loss | -9.05e-05 | -| std | 0.221 | -| value_loss | 0.358 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6261 | -| time_elapsed | 43186 | -| total_timesteps | 801408 | -| train/ | | -| approx_kl | 0.017191842 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.0893 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | -0.000571 | -| n_updates | 62600 | -| policy_gradient_loss | -0.00849 | -| std | 0.221 | -| value_loss | 0.0176 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6262 | -| time_elapsed | 43188 | -| total_timesteps | 801536 | -| train/ | | -| approx_kl | 0.02489237 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 0.0902 | -| explained_variance | -0.00574 | -| learning_rate | 0.0003 | -| loss | 0.0618 | -| n_updates | 62610 | -| policy_gradient_loss | -0.0124 | -| std | 0.221 | -| value_loss | 0.194 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6263 | -| time_elapsed | 43193 | -| total_timesteps | 801664 | -| train/ | | -| approx_kl | 0.0022319471 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0911 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | 0.00529 | -| n_updates | 62620 | -| policy_gradient_loss | -3.4e-05 | -| std | 0.221 | -| value_loss | 0.0143 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6264 | -| time_elapsed | 43196 | -| total_timesteps | 801792 | -| train/ | | -| approx_kl | 0.010360988 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.0925 | -| explained_variance | -0.00552 | -| learning_rate | 0.0003 | -| loss | 0.035 | -| n_updates | 62630 | -| policy_gradient_loss | -0.00142 | -| std | 0.221 | -| value_loss | 0.0881 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.715 | -| time/ | | -| fps | 18 | -| iterations | 6265 | -| time_elapsed | 43199 | -| total_timesteps | 801920 | -| train/ | | -| approx_kl | 0.009543483 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 0.0926 | -| explained_variance | -0.00623 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 62640 | -| policy_gradient_loss | -0.00108 | -| std | 0.221 | -| value_loss | 0.499 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6266 | -| time_elapsed | 43202 | -| total_timesteps | 802048 | -| train/ | | -| approx_kl | 0.015314753 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.0925 | -| explained_variance | -0.00748 | -| learning_rate | 0.0003 | -| loss | 0.229 | -| n_updates | 62650 | -| policy_gradient_loss | -0.00419 | -| std | 0.221 | -| value_loss | 0.462 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6267 | -| time_elapsed | 43208 | -| total_timesteps | 802176 | -| train/ | | -| approx_kl | 0.0155969225 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.0928 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 62660 | -| policy_gradient_loss | -0.0062 | -| std | 0.221 | -| value_loss | 0.349 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6268 | -| time_elapsed | 43213 | -| total_timesteps | 802304 | -| train/ | | -| approx_kl | 0.011122064 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.0929 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 62670 | -| policy_gradient_loss | -0.003 | -| std | 0.22 | -| value_loss | 0.104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6269 | -| time_elapsed | 43216 | -| total_timesteps | 802432 | -| train/ | | -| approx_kl | 0.019311491 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 0.0935 | -| explained_variance | -0.0098 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 62680 | -| policy_gradient_loss | -0.00421 | -| std | 0.22 | -| value_loss | 0.0703 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6270 | -| time_elapsed | 43218 | -| total_timesteps | 802560 | -| train/ | | -| approx_kl | 0.0019501131 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.0949 | -| explained_variance | 0.000476 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 62690 | -| policy_gradient_loss | -0.000154 | -| std | 0.22 | -| value_loss | 0.03 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6271 | -| time_elapsed | 43221 | -| total_timesteps | 802688 | -| train/ | | -| approx_kl | 0.012097536 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.098 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 62700 | -| policy_gradient_loss | -0.000233 | -| std | 0.219 | -| value_loss | 0.227 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6272 | -| time_elapsed | 43225 | -| total_timesteps | 802816 | -| train/ | | -| approx_kl | 0.011370057 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.0995 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 62710 | -| policy_gradient_loss | -0.00216 | -| std | 0.219 | -| value_loss | 0.288 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 18 | -| iterations | 6273 | -| time_elapsed | 43227 | -| total_timesteps | 802944 | -| train/ | | -| approx_kl | 0.0029440615 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.1 | -| explained_variance | 0.00822 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 62720 | -| policy_gradient_loss | -0.000197 | -| std | 0.219 | -| value_loss | 0.0774 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6274 | -| time_elapsed | 43230 | -| total_timesteps | 803072 | -| train/ | | -| approx_kl | 0.021693137 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.102 | -| explained_variance | 0.00134 | -| learning_rate | 0.0003 | -| loss | -0.000988 | -| n_updates | 62730 | -| policy_gradient_loss | -0.00642 | -| std | 0.218 | -| value_loss | 0.0695 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6275 | -| time_elapsed | 43235 | -| total_timesteps | 803200 | -| train/ | | -| approx_kl | 0.007023845 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.103 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 62740 | -| policy_gradient_loss | -0.00155 | -| std | 0.218 | -| value_loss | 0.409 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6276 | -| time_elapsed | 43238 | -| total_timesteps | 803328 | -| train/ | | -| approx_kl | 0.0010698307 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.103 | -| explained_variance | -0.00769 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 62750 | -| policy_gradient_loss | 1.84e-05 | -| std | 0.218 | -| value_loss | 0.0544 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6277 | -| time_elapsed | 43242 | -| total_timesteps | 803456 | -| train/ | | -| approx_kl | 0.0058643627 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | -0.00637 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 62760 | -| policy_gradient_loss | -0.0013 | -| std | 0.218 | -| value_loss | 0.027 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6278 | -| time_elapsed | 43247 | -| total_timesteps | 803584 | -| train/ | | -| approx_kl | 0.0116493935 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.105 | -| explained_variance | -0.00545 | -| learning_rate | 0.0003 | -| loss | 0.00571 | -| n_updates | 62770 | -| policy_gradient_loss | -0.000999 | -| std | 0.218 | -| value_loss | 0.0122 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6279 | -| time_elapsed | 43251 | -| total_timesteps | 803712 | -| train/ | | -| approx_kl | 0.018149592 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.105 | -| explained_variance | -0.00539 | -| learning_rate | 0.0003 | -| loss | 0.00833 | -| n_updates | 62780 | -| policy_gradient_loss | -0.0131 | -| std | 0.218 | -| value_loss | 0.0579 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6280 | -| time_elapsed | 43255 | -| total_timesteps | 803840 | -| train/ | | -| approx_kl | 1.1177268e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | 0.000261 | -| learning_rate | 0.0003 | -| loss | 0.000795 | -| n_updates | 62790 | -| policy_gradient_loss | -0.000237 | -| std | 0.217 | -| value_loss | 0.0289 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.2 | -| time/ | | -| fps | 18 | -| iterations | 6281 | -| time_elapsed | 43257 | -| total_timesteps | 803968 | -| train/ | | -| approx_kl | 0.0014612651 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.109 | -| explained_variance | -0.0017 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 62800 | -| policy_gradient_loss | -0.000493 | -| std | 0.217 | -| value_loss | 0.0109 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6282 | -| time_elapsed | 43261 | -| total_timesteps | 804096 | -| train/ | | -| approx_kl | 0.021265963 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.107 | -| explained_variance | -0.00221 | -| learning_rate | 0.0003 | -| loss | 0.00394 | -| n_updates | 62810 | -| policy_gradient_loss | -0.00253 | -| std | 0.218 | -| value_loss | 0.0127 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6283 | -| time_elapsed | 43269 | -| total_timesteps | 804224 | -| train/ | | -| approx_kl | 0.006772835 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | 0.000893 | -| learning_rate | 0.0003 | -| loss | 0.0466 | -| n_updates | 62820 | -| policy_gradient_loss | -0.00046 | -| std | 0.218 | -| value_loss | 0.0959 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6284 | -| time_elapsed | 43272 | -| total_timesteps | 804352 | -| train/ | | -| approx_kl | 0.0029547047 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | -0.00437 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 62830 | -| policy_gradient_loss | -0.00289 | -| std | 0.218 | -| value_loss | 0.00925 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6285 | -| time_elapsed | 43275 | -| total_timesteps | 804480 | -| train/ | | -| approx_kl | 0.011582012 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | -0.00933 | -| learning_rate | 0.0003 | -| loss | 8.8e-05 | -| n_updates | 62840 | -| policy_gradient_loss | -0.00104 | -| std | 0.218 | -| value_loss | 0.00502 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6286 | -| time_elapsed | 43278 | -| total_timesteps | 804608 | -| train/ | | -| approx_kl | 0.024348754 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.00298 | -| n_updates | 62850 | -| policy_gradient_loss | -0.00188 | -| std | 0.218 | -| value_loss | 0.00301 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6287 | -| time_elapsed | 43283 | -| total_timesteps | 804736 | -| train/ | | -| approx_kl | 0.0039122077 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.00205 | -| n_updates | 62860 | -| policy_gradient_loss | -0.000584 | -| std | 0.218 | -| value_loss | 0.00348 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6288 | -| time_elapsed | 43286 | -| total_timesteps | 804864 | -| train/ | | -| approx_kl | 0.009890706 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 62870 | -| policy_gradient_loss | -0.00126 | -| std | 0.218 | -| value_loss | 0.00151 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 18 | -| iterations | 6289 | -| time_elapsed | 43288 | -| total_timesteps | 804992 | -| train/ | | -| approx_kl | 0.015368776 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 62880 | -| policy_gradient_loss | -0.00347 | -| std | 0.218 | -| value_loss | 0.000647 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6290 | -| time_elapsed | 43290 | -| total_timesteps | 805120 | -| train/ | | -| approx_kl | 0.03220911 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 62890 | -| policy_gradient_loss | -0.0079 | -| std | 0.218 | -| value_loss | 0.000398 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6291 | -| time_elapsed | 43299 | -| total_timesteps | 805248 | -| train/ | | -| approx_kl | 0.0097730905 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.105 | -| explained_variance | 0.135 | -| learning_rate | 0.0003 | -| loss | 0.00972 | -| n_updates | 62900 | -| policy_gradient_loss | -0.00442 | -| std | 0.218 | -| value_loss | 0.0361 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6292 | -| time_elapsed | 43302 | -| total_timesteps | 805376 | -| train/ | | -| approx_kl | 0.014653035 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.105 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 62910 | -| policy_gradient_loss | -0.00287 | -| std | 0.218 | -| value_loss | 0.00365 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6293 | -| time_elapsed | 43306 | -| total_timesteps | 805504 | -| train/ | | -| approx_kl | 0.007265105 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.105 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.000218 | -| n_updates | 62920 | -| policy_gradient_loss | -0.000133 | -| std | 0.218 | -| value_loss | 0.00105 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6294 | -| time_elapsed | 43310 | -| total_timesteps | 805632 | -| train/ | | -| approx_kl | 0.019920334 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 62930 | -| policy_gradient_loss | -0.00314 | -| std | 0.218 | -| value_loss | 0.000854 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6295 | -| time_elapsed | 43313 | -| total_timesteps | 805760 | -| train/ | | -| approx_kl | 0.005230771 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.107 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 62940 | -| policy_gradient_loss | -0.000865 | -| std | 0.217 | -| value_loss | 0.00028 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.31 | -| time/ | | -| fps | 18 | -| iterations | 6296 | -| time_elapsed | 43316 | -| total_timesteps | 805888 | -| train/ | | -| approx_kl | 0.016909689 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.108 | -| explained_variance | -0.0557 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 62950 | -| policy_gradient_loss | -0.00309 | -| std | 0.217 | -| value_loss | 0.000434 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6297 | -| time_elapsed | 43321 | -| total_timesteps | 806016 | -| train/ | | -| approx_kl | 0.011778624 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 0.109 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 62960 | -| policy_gradient_loss | -0.000203 | -| std | 0.217 | -| value_loss | 0.000143 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6298 | -| time_elapsed | 43329 | -| total_timesteps | 806144 | -| train/ | | -| approx_kl | 0.022926282 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.109 | -| explained_variance | 0.288 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 62970 | -| policy_gradient_loss | -0.000182 | -| std | 0.217 | -| value_loss | 0.0213 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6299 | -| time_elapsed | 43332 | -| total_timesteps | 806272 | -| train/ | | -| approx_kl | 0.00845824 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.108 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | 0.00317 | -| n_updates | 62980 | -| policy_gradient_loss | -7.16e-05 | -| std | 0.217 | -| value_loss | 0.00459 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6300 | -| time_elapsed | 43335 | -| total_timesteps | 806400 | -| train/ | | -| approx_kl | 0.013463268 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 0.106 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.00856 | -| n_updates | 62990 | -| policy_gradient_loss | -0.00284 | -| std | 0.218 | -| value_loss | 0.0492 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6301 | -| time_elapsed | 43339 | -| total_timesteps | 806528 | -| train/ | | -| approx_kl | 0.019904416 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | 0.00428 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 63000 | -| policy_gradient_loss | -0.00138 | -| std | 0.218 | -| value_loss | 0.00467 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6302 | -| time_elapsed | 43343 | -| total_timesteps | 806656 | -| train/ | | -| approx_kl | 0.023698425 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 63010 | -| policy_gradient_loss | -0.0081 | -| std | 0.218 | -| value_loss | 0.0116 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6303 | -| time_elapsed | 43346 | -| total_timesteps | 806784 | -| train/ | | -| approx_kl | 0.013484169 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.104 | -| explained_variance | 0.0018 | -| learning_rate | 0.0003 | -| loss | -0.000104 | -| n_updates | 63020 | -| policy_gradient_loss | -0.00124 | -| std | 0.218 | -| value_loss | 0.00577 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.32 | -| time/ | | -| fps | 18 | -| iterations | 6304 | -| time_elapsed | 43350 | -| total_timesteps | 806912 | -| train/ | | -| approx_kl | 0.007897476 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.105 | -| explained_variance | -0.00676 | -| learning_rate | 0.0003 | -| loss | 0.000721 | -| n_updates | 63030 | -| policy_gradient_loss | -0.000371 | -| std | 0.217 | -| value_loss | 0.0028 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6305 | -| time_elapsed | 43353 | -| total_timesteps | 807040 | -| train/ | | -| approx_kl | 0.019010786 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.109 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.000965 | -| n_updates | 63040 | -| policy_gradient_loss | -0.00209 | -| std | 0.217 | -| value_loss | 0.00183 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6306 | -| time_elapsed | 43360 | -| total_timesteps | 807168 | -| train/ | | -| approx_kl | 0.021788003 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.112 | -| explained_variance | 0.112 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 63050 | -| policy_gradient_loss | -0.0118 | -| std | 0.216 | -| value_loss | 0.00965 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6307 | -| time_elapsed | 43364 | -| total_timesteps | 807296 | -| train/ | | -| approx_kl | 0.012151451 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.114 | -| explained_variance | 0.0899 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 63060 | -| policy_gradient_loss | -0.00248 | -| std | 0.216 | -| value_loss | 0.000624 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6308 | -| time_elapsed | 43367 | -| total_timesteps | 807424 | -| train/ | | -| approx_kl | 0.019784587 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.114 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 63070 | -| policy_gradient_loss | -0.00807 | -| std | 0.216 | -| value_loss | 0.000375 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6309 | -| time_elapsed | 43370 | -| total_timesteps | 807552 | -| train/ | | -| approx_kl | 0.025981031 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.115 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 63080 | -| policy_gradient_loss | -0.012 | -| std | 0.216 | -| value_loss | 0.000227 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6310 | -| time_elapsed | 43373 | -| total_timesteps | 807680 | -| train/ | | -| approx_kl | 0.016684378 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.115 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 63090 | -| policy_gradient_loss | -0.00145 | -| std | 0.216 | -| value_loss | 0.000124 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6311 | -| time_elapsed | 43377 | -| total_timesteps | 807808 | -| train/ | | -| approx_kl | 0.007061589 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.116 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 63100 | -| policy_gradient_loss | -0.00173 | -| std | 0.216 | -| value_loss | 7.2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.37 | -| time/ | | -| fps | 18 | -| iterations | 6312 | -| time_elapsed | 43379 | -| total_timesteps | 807936 | -| train/ | | -| approx_kl | 0.009253997 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.115 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 63110 | -| policy_gradient_loss | -0.00295 | -| std | 0.216 | -| value_loss | 4.32e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6313 | -| time_elapsed | 43382 | -| total_timesteps | 808064 | -| train/ | | -| approx_kl | 0.0113168135 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.114 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 63120 | -| policy_gradient_loss | -0.00294 | -| std | 0.216 | -| value_loss | 2.71e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6314 | -| time_elapsed | 43387 | -| total_timesteps | 808192 | -| train/ | | -| approx_kl | 0.0001816377 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.115 | -| explained_variance | 0.136 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 63130 | -| policy_gradient_loss | -0.00013 | -| std | 0.215 | -| value_loss | 0.0447 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6315 | -| time_elapsed | 43389 | -| total_timesteps | 808320 | -| train/ | | -| approx_kl | 0.027675342 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 0.119 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 63140 | -| policy_gradient_loss | -0.0128 | -| std | 0.215 | -| value_loss | 0.00174 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6316 | -| time_elapsed | 43392 | -| total_timesteps | 808448 | -| train/ | | -| approx_kl | 0.013623729 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.121 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 63150 | -| policy_gradient_loss | -0.0161 | -| std | 0.214 | -| value_loss | 0.000278 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6317 | -| time_elapsed | 43395 | -| total_timesteps | 808576 | -| train/ | | -| approx_kl | 0.008465087 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.121 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | -0.00578 | -| n_updates | 63160 | -| policy_gradient_loss | -0.00372 | -| std | 0.214 | -| value_loss | 0.000143 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6318 | -| time_elapsed | 43397 | -| total_timesteps | 808704 | -| train/ | | -| approx_kl | 0.014094964 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.122 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 63170 | -| policy_gradient_loss | -0.00389 | -| std | 0.214 | -| value_loss | 0.000101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6319 | -| time_elapsed | 43400 | -| total_timesteps | 808832 | -| train/ | | -| approx_kl | 0.015719205 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.123 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 63180 | -| policy_gradient_loss | -0.00176 | -| std | 0.214 | -| value_loss | 6.32e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.36 | -| time/ | | -| fps | 18 | -| iterations | 6320 | -| time_elapsed | 43402 | -| total_timesteps | 808960 | -| train/ | | -| approx_kl | 0.019491527 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.124 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | -0.000509 | -| n_updates | 63190 | -| policy_gradient_loss | -0.00156 | -| std | 0.214 | -| value_loss | 4.05e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6321 | -| time_elapsed | 43406 | -| total_timesteps | 809088 | -| train/ | | -| approx_kl | 0.016188089 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.125 | -| explained_variance | -0.0795 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 63200 | -| policy_gradient_loss | -0.00306 | -| std | 0.213 | -| value_loss | 2.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6322 | -| time_elapsed | 43414 | -| total_timesteps | 809216 | -| train/ | | -| approx_kl | 0.016877294 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.126 | -| explained_variance | 0.229 | -| learning_rate | 0.0003 | -| loss | 0.00971 | -| n_updates | 63210 | -| policy_gradient_loss | -0.00158 | -| std | 0.213 | -| value_loss | 0.0233 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6323 | -| time_elapsed | 43418 | -| total_timesteps | 809344 | -| train/ | | -| approx_kl | 0.026903007 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.127 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | -0.0255 | -| n_updates | 63220 | -| policy_gradient_loss | -0.0138 | -| std | 0.213 | -| value_loss | 0.00206 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6324 | -| time_elapsed | 43421 | -| total_timesteps | 809472 | -| train/ | | -| approx_kl | 0.00012161024 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 0.129 | -| explained_variance | 0.00958 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 63230 | -| policy_gradient_loss | -0.000465 | -| std | 0.212 | -| value_loss | 0.000277 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6325 | -| time_elapsed | 43425 | -| total_timesteps | 809600 | -| train/ | | -| approx_kl | 0.00021982146 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.136 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.000399 | -| n_updates | 63240 | -| policy_gradient_loss | -0.000274 | -| std | 0.21 | -| value_loss | 0.000268 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6326 | -| time_elapsed | 43429 | -| total_timesteps | 809728 | -| train/ | | -| approx_kl | 0.019479848 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 0.141 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 63250 | -| policy_gradient_loss | -0.00341 | -| std | 0.21 | -| value_loss | 0.000229 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6327 | -| time_elapsed | 43433 | -| total_timesteps | 809856 | -| train/ | | -| approx_kl | 0.012407794 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.144 | -| explained_variance | -0.00584 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 63260 | -| policy_gradient_loss | 2.41e-05 | -| std | 0.209 | -| value_loss | 9.31e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.38 | -| time/ | | -| fps | 18 | -| iterations | 6328 | -| time_elapsed | 43437 | -| total_timesteps | 809984 | -| train/ | | -| approx_kl | 0.020133965 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.146 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 63270 | -| policy_gradient_loss | -0.00239 | -| std | 0.209 | -| value_loss | 5.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6329 | -| time_elapsed | 43442 | -| total_timesteps | 810112 | -| train/ | | -| approx_kl | 0.022432502 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.148 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | -0.00442 | -| n_updates | 63280 | -| policy_gradient_loss | -0.00405 | -| std | 0.208 | -| value_loss | 2.44e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6330 | -| time_elapsed | 43449 | -| total_timesteps | 810240 | -| train/ | | -| approx_kl | 0.02089363 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 0.15 | -| explained_variance | 0.229 | -| learning_rate | 0.0003 | -| loss | 0.0074 | -| n_updates | 63290 | -| policy_gradient_loss | -0.00643 | -| std | 0.208 | -| value_loss | 0.0345 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6331 | -| time_elapsed | 43452 | -| total_timesteps | 810368 | -| train/ | | -| approx_kl | 0.012053439 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.152 | -| explained_variance | -0.00229 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 63300 | -| policy_gradient_loss | -0.00814 | -| std | 0.208 | -| value_loss | 0.000389 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6332 | -| time_elapsed | 43456 | -| total_timesteps | 810496 | -| train/ | | -| approx_kl | 0.012976326 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.153 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 63310 | -| policy_gradient_loss | -0.00275 | -| std | 0.207 | -| value_loss | 7.77e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6333 | -| time_elapsed | 43460 | -| total_timesteps | 810624 | -| train/ | | -| approx_kl | 0.018732168 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.155 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 63320 | -| policy_gradient_loss | -0.00452 | -| std | 0.207 | -| value_loss | 2.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6334 | -| time_elapsed | 43462 | -| total_timesteps | 810752 | -| train/ | | -| approx_kl | 0.016453397 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.156 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 63330 | -| policy_gradient_loss | -0.00137 | -| std | 0.207 | -| value_loss | 1.13e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.39 | -| time/ | | -| fps | 18 | -| iterations | 6335 | -| time_elapsed | 43465 | -| total_timesteps | 810880 | -| train/ | | -| approx_kl | 0.012043269 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.158 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 63340 | -| policy_gradient_loss | -0.00231 | -| std | 0.207 | -| value_loss | 8.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6336 | -| time_elapsed | 43468 | -| total_timesteps | 811008 | -| train/ | | -| approx_kl | 0.023731776 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.159 | -| explained_variance | -0.0908 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 63350 | -| policy_gradient_loss | -0.00595 | -| std | 0.206 | -| value_loss | 3.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6337 | -| time_elapsed | 43479 | -| total_timesteps | 811136 | -| train/ | | -| approx_kl | 0.018454295 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.16 | -| explained_variance | 0.433 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 63360 | -| policy_gradient_loss | -0.000897 | -| std | 0.206 | -| value_loss | 0.0109 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6338 | -| time_elapsed | 43482 | -| total_timesteps | 811264 | -| train/ | | -| approx_kl | 0.021857012 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | 0.0956 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 63370 | -| policy_gradient_loss | -0.00906 | -| std | 0.206 | -| value_loss | 0.000121 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6339 | -| time_elapsed | 43485 | -| total_timesteps | 811392 | -| train/ | | -| approx_kl | 0.01649202 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.162 | -| explained_variance | -0.629 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 63380 | -| policy_gradient_loss | -0.00459 | -| std | 0.206 | -| value_loss | 1.63e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6340 | -| time_elapsed | 43488 | -| total_timesteps | 811520 | -| train/ | | -| approx_kl | 0.0125204045 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | -0.358 | -| learning_rate | 0.0003 | -| loss | -0.00926 | -| n_updates | 63390 | -| policy_gradient_loss | -0.00582 | -| std | 0.206 | -| value_loss | 5.02e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6341 | -| time_elapsed | 43490 | -| total_timesteps | 811648 | -| train/ | | -| approx_kl | 0.0077724922 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | -0.27 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 63400 | -| policy_gradient_loss | -0.00282 | -| std | 0.206 | -| value_loss | 2.91e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6342 | -| time_elapsed | 43493 | -| total_timesteps | 811776 | -| train/ | | -| approx_kl | 0.014561497 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 63410 | -| policy_gradient_loss | -0.00359 | -| std | 0.206 | -| value_loss | 9.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.4 | -| time/ | | -| fps | 18 | -| iterations | 6343 | -| time_elapsed | 43495 | -| total_timesteps | 811904 | -| train/ | | -| approx_kl | 0.0036948444 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.159 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.000239 | -| n_updates | 63420 | -| policy_gradient_loss | 0.000108 | -| std | 0.207 | -| value_loss | 1.43e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6344 | -| time_elapsed | 43498 | -| total_timesteps | 812032 | -| train/ | | -| approx_kl | 0.0002098172 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.157 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -6.25e-05 | -| n_updates | 63430 | -| policy_gradient_loss | 9.79e-05 | -| std | 0.207 | -| value_loss | 3.64e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6345 | -| time_elapsed | 43505 | -| total_timesteps | 812160 | -| train/ | | -| approx_kl | 0.012443065 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.159 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.000787 | -| n_updates | 63440 | -| policy_gradient_loss | -0.000727 | -| std | 0.206 | -| value_loss | 0.000285 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6346 | -| time_elapsed | 43509 | -| total_timesteps | 812288 | -| train/ | | -| approx_kl | 0.009485228 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 0.16 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | -0.00016 | -| n_updates | 63450 | -| policy_gradient_loss | 0.000728 | -| std | 0.206 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6347 | -| time_elapsed | 43513 | -| total_timesteps | 812416 | -| train/ | | -| approx_kl | 0.007916281 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | 0.00083 | -| n_updates | 63460 | -| policy_gradient_loss | 0.00274 | -| std | 0.206 | -| value_loss | 1.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6348 | -| time_elapsed | 43516 | -| total_timesteps | 812544 | -| train/ | | -| approx_kl | 0.012809385 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | -0.37 | -| learning_rate | 0.0003 | -| loss | -0.0084 | -| n_updates | 63470 | -| policy_gradient_loss | -0.00266 | -| std | 0.206 | -| value_loss | 2.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6349 | -| time_elapsed | 43519 | -| total_timesteps | 812672 | -| train/ | | -| approx_kl | 0.013646388 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.161 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 63480 | -| policy_gradient_loss | -0.00506 | -| std | 0.206 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6350 | -| time_elapsed | 43523 | -| total_timesteps | 812800 | -| train/ | | -| approx_kl | 0.026523314 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.16 | -| explained_variance | -0.0916 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 63490 | -| policy_gradient_loss | -0.0171 | -| std | 0.206 | -| value_loss | 8.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6351 | -| time_elapsed | 43527 | -| total_timesteps | 812928 | -| train/ | | -| approx_kl | 0.021335654 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.16 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | -0.00767 | -| n_updates | 63500 | -| policy_gradient_loss | -0.00814 | -| std | 0.206 | -| value_loss | 4.81e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6352 | -| time_elapsed | 43530 | -| total_timesteps | 813056 | -| train/ | | -| approx_kl | 0.009414082 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.16 | -| explained_variance | -0.0854 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 63510 | -| policy_gradient_loss | -0.00166 | -| std | 0.206 | -| value_loss | 3.22e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6353 | -| time_elapsed | 43535 | -| total_timesteps | 813184 | -| train/ | | -| approx_kl | 0.0038387394 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.162 | -| explained_variance | 0.533 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 63520 | -| policy_gradient_loss | -0.00034 | -| std | 0.205 | -| value_loss | 0.00679 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6354 | -| time_elapsed | 43539 | -| total_timesteps | 813312 | -| train/ | | -| approx_kl | 0.014816566 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.164 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 63530 | -| policy_gradient_loss | -0.00195 | -| std | 0.205 | -| value_loss | 0.000155 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6355 | -| time_elapsed | 43542 | -| total_timesteps | 813440 | -| train/ | | -| approx_kl | 0.060936097 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.164 | -| explained_variance | -52.9 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 63540 | -| policy_gradient_loss | -0.00556 | -| std | 0.205 | -| value_loss | 1.82e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6356 | -| time_elapsed | 43544 | -| total_timesteps | 813568 | -| train/ | | -| approx_kl | 0.03708234 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 0.164 | -| explained_variance | -42.7 | -| learning_rate | 0.0003 | -| loss | -0.00774 | -| n_updates | 63550 | -| policy_gradient_loss | -0.00657 | -| std | 0.206 | -| value_loss | 6.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6357 | -| time_elapsed | 43547 | -| total_timesteps | 813696 | -| train/ | | -| approx_kl | 0.011830112 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.163 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 63560 | -| policy_gradient_loss | 0.000564 | -| std | 0.206 | -| value_loss | 1.86e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6358 | -| time_elapsed | 43550 | -| total_timesteps | 813824 | -| train/ | | -| approx_kl | 0.0064293467 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.163 | -| explained_variance | -0.0824 | -| learning_rate | 0.0003 | -| loss | -0.000766 | -| n_updates | 63570 | -| policy_gradient_loss | -0.000544 | -| std | 0.206 | -| value_loss | 2.31e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6359 | -| time_elapsed | 43554 | -| total_timesteps | 813952 | -| train/ | | -| approx_kl | 0.02869725 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.163 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 63580 | -| policy_gradient_loss | -0.0104 | -| std | 0.205 | -| value_loss | 3.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6360 | -| time_elapsed | 43557 | -| total_timesteps | 814080 | -| train/ | | -| approx_kl | 0.011629852 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 0.164 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 63590 | -| policy_gradient_loss | -0.00787 | -| std | 0.205 | -| value_loss | 6.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6361 | -| time_elapsed | 43563 | -| total_timesteps | 814208 | -| train/ | | -| approx_kl | 0.020733757 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.164 | -| explained_variance | 0.52 | -| learning_rate | 0.0003 | -| loss | 0.0035 | -| n_updates | 63600 | -| policy_gradient_loss | -0.00191 | -| std | 0.205 | -| value_loss | 0.0107 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6362 | -| time_elapsed | 43567 | -| total_timesteps | 814336 | -| train/ | | -| approx_kl | 0.016551754 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.166 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 63610 | -| policy_gradient_loss | -0.00314 | -| std | 0.205 | -| value_loss | 2.79e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6363 | -| time_elapsed | 43571 | -| total_timesteps | 814464 | -| train/ | | -| approx_kl | 0.020513678 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.167 | -| explained_variance | -0.702 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 63620 | -| policy_gradient_loss | -0.0035 | -| std | 0.205 | -| value_loss | 1.31e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6364 | -| time_elapsed | 43573 | -| total_timesteps | 814592 | -| train/ | | -| approx_kl | 0.02770828 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 0.168 | -| explained_variance | -0.55 | -| learning_rate | 0.0003 | -| loss | 0.00304 | -| n_updates | 63630 | -| policy_gradient_loss | -0.000525 | -| std | 0.205 | -| value_loss | 5.19e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6365 | -| time_elapsed | 43577 | -| total_timesteps | 814720 | -| train/ | | -| approx_kl | 0.0093369745 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.168 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | -0.000752 | -| n_updates | 63640 | -| policy_gradient_loss | -0.000717 | -| std | 0.204 | -| value_loss | 1.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6366 | -| time_elapsed | 43580 | -| total_timesteps | 814848 | -| train/ | | -| approx_kl | 0.009827627 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 63650 | -| policy_gradient_loss | -6.38e-05 | -| std | 0.204 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.41 | -| time/ | | -| fps | 18 | -| iterations | 6367 | -| time_elapsed | 43583 | -| total_timesteps | 814976 | -| train/ | | -| approx_kl | 0.011765098 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 0.172 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00712 | -| n_updates | 63660 | -| policy_gradient_loss | -0.00551 | -| std | 0.203 | -| value_loss | 6.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6368 | -| time_elapsed | 43587 | -| total_timesteps | 815104 | -| train/ | | -| approx_kl | 0.011399096 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.173 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 63670 | -| policy_gradient_loss | -0.00161 | -| std | 0.203 | -| value_loss | 2.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6369 | -| time_elapsed | 43595 | -| total_timesteps | 815232 | -| train/ | | -| approx_kl | 0.012789355 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.173 | -| explained_variance | 0.435 | -| learning_rate | 0.0003 | -| loss | 0.00838 | -| n_updates | 63680 | -| policy_gradient_loss | -0.00142 | -| std | 0.204 | -| value_loss | 0.0208 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6370 | -| time_elapsed | 43598 | -| total_timesteps | 815360 | -| train/ | | -| approx_kl | 0.017310359 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.173 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 63690 | -| policy_gradient_loss | -0.00403 | -| std | 0.204 | -| value_loss | 6.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6371 | -| time_elapsed | 43601 | -| total_timesteps | 815488 | -| train/ | | -| approx_kl | 0.020179749 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.173 | -| explained_variance | -0.938 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 63700 | -| policy_gradient_loss | -0.0133 | -| std | 0.204 | -| value_loss | 3.72e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6372 | -| time_elapsed | 43604 | -| total_timesteps | 815616 | -| train/ | | -| approx_kl | 0.0036142156 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 0.172 | -| explained_variance | -0.374 | -| learning_rate | 0.0003 | -| loss | -0.000246 | -| n_updates | 63710 | -| policy_gradient_loss | -5.75e-05 | -| std | 0.204 | -| value_loss | 1.81e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6373 | -| time_elapsed | 43608 | -| total_timesteps | 815744 | -| train/ | | -| approx_kl | 0.015624877 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 63720 | -| policy_gradient_loss | -0.00174 | -| std | 0.204 | -| value_loss | 1.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6374 | -| time_elapsed | 43612 | -| total_timesteps | 815872 | -| train/ | | -| approx_kl | 0.014740447 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.000591 | -| n_updates | 63730 | -| policy_gradient_loss | -0.00159 | -| std | 0.204 | -| value_loss | 9.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6375 | -| time_elapsed | 43616 | -| total_timesteps | 816000 | -| train/ | | -| approx_kl | 0.01482157 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.171 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 63740 | -| policy_gradient_loss | -0.00282 | -| std | 0.204 | -| value_loss | 4.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6376 | -| time_elapsed | 43620 | -| total_timesteps | 816128 | -| train/ | | -| approx_kl | 0.014040299 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.171 | -| explained_variance | 0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 63750 | -| policy_gradient_loss | -0.00261 | -| std | 0.204 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6377 | -| time_elapsed | 43626 | -| total_timesteps | 816256 | -| train/ | | -| approx_kl | 0.014650159 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.171 | -| explained_variance | 0.557 | -| learning_rate | 0.0003 | -| loss | 0.00519 | -| n_updates | 63760 | -| policy_gradient_loss | -0.0015 | -| std | 0.204 | -| value_loss | 0.0119 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6378 | -| time_elapsed | 43631 | -| total_timesteps | 816384 | -| train/ | | -| approx_kl | 0.018412666 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 63770 | -| policy_gradient_loss | -0.00555 | -| std | 0.204 | -| value_loss | 6.34e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6379 | -| time_elapsed | 43634 | -| total_timesteps | 816512 | -| train/ | | -| approx_kl | 0.012664776 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.336 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 63780 | -| policy_gradient_loss | -0.00818 | -| std | 0.204 | -| value_loss | 1.45e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6380 | -| time_elapsed | 43638 | -| total_timesteps | 816640 | -| train/ | | -| approx_kl | 0.0097725075 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 63790 | -| policy_gradient_loss | -0.0015 | -| std | 0.204 | -| value_loss | 2.01e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6381 | -| time_elapsed | 43641 | -| total_timesteps | 816768 | -| train/ | | -| approx_kl | 0.01040536 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.17 | -| explained_variance | -0.639 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 63800 | -| policy_gradient_loss | -3.49e-05 | -| std | 0.204 | -| value_loss | 7.27e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6382 | -| time_elapsed | 43646 | -| total_timesteps | 816896 | -| train/ | | -| approx_kl | 0.0127909 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.169 | -| explained_variance | -0.515 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 63810 | -| policy_gradient_loss | -0.00207 | -| std | 0.204 | -| value_loss | 1.76e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6383 | -| time_elapsed | 43650 | -| total_timesteps | 817024 | -| train/ | | -| approx_kl | 0.011418754 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.169 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 63820 | -| policy_gradient_loss | -0.000185 | -| std | 0.204 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6384 | -| time_elapsed | 43657 | -| total_timesteps | 817152 | -| train/ | | -| approx_kl | 0.016292084 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.169 | -| explained_variance | 0.605 | -| learning_rate | 0.0003 | -| loss | 0.00463 | -| n_updates | 63830 | -| policy_gradient_loss | -0.000705 | -| std | 0.204 | -| value_loss | 0.00962 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6385 | -| time_elapsed | 43661 | -| total_timesteps | 817280 | -| train/ | | -| approx_kl | 0.0178881 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.169 | -| explained_variance | 0.178 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 63840 | -| policy_gradient_loss | -0.00862 | -| std | 0.204 | -| value_loss | 4.59e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6386 | -| time_elapsed | 43665 | -| total_timesteps | 817408 | -| train/ | | -| approx_kl | 0.0014469572 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.171 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 63850 | -| policy_gradient_loss | -0.000473 | -| std | 0.203 | -| value_loss | 4.33e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6387 | -| time_elapsed | 43669 | -| total_timesteps | 817536 | -| train/ | | -| approx_kl | 0.004765712 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.177 | -| explained_variance | -0.268 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 63860 | -| policy_gradient_loss | -0.00924 | -| std | 0.202 | -| value_loss | 3.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6388 | -| time_elapsed | 43674 | -| total_timesteps | 817664 | -| train/ | | -| approx_kl | 0.026253937 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 0.181 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 63870 | -| policy_gradient_loss | -0.014 | -| std | 0.202 | -| value_loss | 3.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6389 | -| time_elapsed | 43679 | -| total_timesteps | 817792 | -| train/ | | -| approx_kl | 0.009562949 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.182 | -| explained_variance | -0.33 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 63880 | -| policy_gradient_loss | -0.00067 | -| std | 0.202 | -| value_loss | 9.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6390 | -| time_elapsed | 43683 | -| total_timesteps | 817920 | -| train/ | | -| approx_kl | 0.003596384 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.182 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -0.000714 | -| n_updates | 63890 | -| policy_gradient_loss | 0.00126 | -| std | 0.202 | -| value_loss | 1.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6391 | -| time_elapsed | 43687 | -| total_timesteps | 818048 | -| train/ | | -| approx_kl | 0.019862834 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.182 | -| explained_variance | -0.397 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 63900 | -| policy_gradient_loss | -0.0132 | -| std | 0.202 | -| value_loss | 2.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6392 | -| time_elapsed | 43693 | -| total_timesteps | 818176 | -| train/ | | -| approx_kl | 0.018647213 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.183 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 63910 | -| policy_gradient_loss | -0.00198 | -| std | 0.201 | -| value_loss | 0.000461 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6393 | -| time_elapsed | 43695 | -| total_timesteps | 818304 | -| train/ | | -| approx_kl | 0.014848996 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.184 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 63920 | -| policy_gradient_loss | -0.00175 | -| std | 0.201 | -| value_loss | 1.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6394 | -| time_elapsed | 43698 | -| total_timesteps | 818432 | -| train/ | | -| approx_kl | 0.032508828 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.185 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 63930 | -| policy_gradient_loss | -0.00972 | -| std | 0.201 | -| value_loss | 1.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6395 | -| time_elapsed | 43701 | -| total_timesteps | 818560 | -| train/ | | -| approx_kl | 0.007502813 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.186 | -| explained_variance | -2.55 | -| learning_rate | 0.0003 | -| loss | -0.00489 | -| n_updates | 63940 | -| policy_gradient_loss | -0.0027 | -| std | 0.201 | -| value_loss | 2.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6396 | -| time_elapsed | 43705 | -| total_timesteps | 818688 | -| train/ | | -| approx_kl | 0.00954541 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.187 | -| explained_variance | -0.445 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 63950 | -| policy_gradient_loss | 0.000116 | -| std | 0.201 | -| value_loss | 7.34e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6397 | -| time_elapsed | 43708 | -| total_timesteps | 818816 | -| train/ | | -| approx_kl | 0.011536652 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 0.189 | -| explained_variance | -0.0872 | -| learning_rate | 0.0003 | -| loss | 2.4e-05 | -| n_updates | 63960 | -| policy_gradient_loss | -0.000542 | -| std | 0.2 | -| value_loss | 8.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6398 | -| time_elapsed | 43712 | -| total_timesteps | 818944 | -| train/ | | -| approx_kl | 0.010383552 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.19 | -| explained_variance | -0.477 | -| learning_rate | 0.0003 | -| loss | -0.000956 | -| n_updates | 63970 | -| policy_gradient_loss | -0.00135 | -| std | 0.2 | -| value_loss | 2.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6399 | -| time_elapsed | 43715 | -| total_timesteps | 819072 | -| train/ | | -| approx_kl | 0.028461007 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.19 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 63980 | -| policy_gradient_loss | -0.00713 | -| std | 0.2 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6400 | -| time_elapsed | 43720 | -| total_timesteps | 819200 | -| train/ | | -| approx_kl | 0.008731727 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.19 | -| explained_variance | 0.698 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 63990 | -| policy_gradient_loss | -0.00304 | -| std | 0.2 | -| value_loss | 0.00566 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6401 | -| time_elapsed | 43724 | -| total_timesteps | 819328 | -| train/ | | -| approx_kl | 0.008942584 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.191 | -| explained_variance | -0.493 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 64000 | -| policy_gradient_loss | -0.00146 | -| std | 0.2 | -| value_loss | 1.41e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6402 | -| time_elapsed | 43727 | -| total_timesteps | 819456 | -| train/ | | -| approx_kl | 0.020384436 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.192 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 64010 | -| policy_gradient_loss | 0.00103 | -| std | 0.2 | -| value_loss | 1.4e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6403 | -| time_elapsed | 43730 | -| total_timesteps | 819584 | -| train/ | | -| approx_kl | 0.024292331 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.193 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 64020 | -| policy_gradient_loss | -0.00383 | -| std | 0.2 | -| value_loss | 1.88e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6404 | -| time_elapsed | 43734 | -| total_timesteps | 819712 | -| train/ | | -| approx_kl | 0.007425226 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.192 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 64030 | -| policy_gradient_loss | -0.000707 | -| std | 0.2 | -| value_loss | 1.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6405 | -| time_elapsed | 43738 | -| total_timesteps | 819840 | -| train/ | | -| approx_kl | 0.014862416 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.19 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | -0.000649 | -| n_updates | 64040 | -| policy_gradient_loss | -0.00133 | -| std | 0.2 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6406 | -| time_elapsed | 43741 | -| total_timesteps | 819968 | -| train/ | | -| approx_kl | 0.024114516 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 0.191 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 64050 | -| policy_gradient_loss | -0.00726 | -| std | 0.2 | -| value_loss | 6.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6407 | -| time_elapsed | 43744 | -| total_timesteps | 820096 | -| train/ | | -| approx_kl | 0.006810175 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.191 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 64060 | -| policy_gradient_loss | -0.00534 | -| std | 0.2 | -| value_loss | 2.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6408 | -| time_elapsed | 43752 | -| total_timesteps | 820224 | -| train/ | | -| approx_kl | 0.084015206 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 0.19 | -| explained_variance | -0.698 | -| learning_rate | 0.0003 | -| loss | -0.00343 | -| n_updates | 64070 | -| policy_gradient_loss | -0.00545 | -| std | 0.2 | -| value_loss | 0.00146 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6409 | -| time_elapsed | 43756 | -| total_timesteps | 820352 | -| train/ | | -| approx_kl | 0.025271595 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.189 | -| explained_variance | -24.6 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 64080 | -| policy_gradient_loss | -0.00443 | -| std | 0.2 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6410 | -| time_elapsed | 43759 | -| total_timesteps | 820480 | -| train/ | | -| approx_kl | 0.055355437 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.189 | -| explained_variance | -51.6 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 64090 | -| policy_gradient_loss | -0.0105 | -| std | 0.2 | -| value_loss | 1.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6411 | -| time_elapsed | 43763 | -| total_timesteps | 820608 | -| train/ | | -| approx_kl | 0.01935844 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.19 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 64100 | -| policy_gradient_loss | -0.00365 | -| std | 0.2 | -| value_loss | 6.54e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6412 | -| time_elapsed | 43766 | -| total_timesteps | 820736 | -| train/ | | -| approx_kl | 0.010819006 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.191 | -| explained_variance | -0.989 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 64110 | -| policy_gradient_loss | 0.000142 | -| std | 0.2 | -| value_loss | 5.28e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6413 | -| time_elapsed | 43768 | -| total_timesteps | 820864 | -| train/ | | -| approx_kl | 0.016687095 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.192 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 64120 | -| policy_gradient_loss | -0.00164 | -| std | 0.2 | -| value_loss | 1.62e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6414 | -| time_elapsed | 43773 | -| total_timesteps | 820992 | -| train/ | | -| approx_kl | 0.013703689 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.193 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00922 | -| n_updates | 64130 | -| policy_gradient_loss | -0.00376 | -| std | 0.199 | -| value_loss | 7.42e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6415 | -| time_elapsed | 43777 | -| total_timesteps | 821120 | -| train/ | | -| approx_kl | 0.0050481535 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.194 | -| explained_variance | -0.00487 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 64140 | -| policy_gradient_loss | -0.0024 | -| std | 0.199 | -| value_loss | 6.8e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6416 | -| time_elapsed | 43786 | -| total_timesteps | 821248 | -| train/ | | -| approx_kl | 0.017431984 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.195 | -| explained_variance | 0.626 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 64150 | -| policy_gradient_loss | -0.00134 | -| std | 0.199 | -| value_loss | 0.0108 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6417 | -| time_elapsed | 43791 | -| total_timesteps | 821376 | -| train/ | | -| approx_kl | 0.0078042387 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.196 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 64160 | -| policy_gradient_loss | -0.0081 | -| std | 0.199 | -| value_loss | 0.000121 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6418 | -| time_elapsed | 43795 | -| total_timesteps | 821504 | -| train/ | | -| approx_kl | 0.01341008 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 0.197 | -| explained_variance | -0.458 | -| learning_rate | 0.0003 | -| loss | 0.000123 | -| n_updates | 64170 | -| policy_gradient_loss | -0.000471 | -| std | 0.199 | -| value_loss | 1.61e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6419 | -| time_elapsed | 43798 | -| total_timesteps | 821632 | -| train/ | | -| approx_kl | 0.010785552 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.198 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | -0.00561 | -| n_updates | 64180 | -| policy_gradient_loss | -0.00408 | -| std | 0.199 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6420 | -| time_elapsed | 43801 | -| total_timesteps | 821760 | -| train/ | | -| approx_kl | 0.027619524 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 0.198 | -| explained_variance | -0.629 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 64190 | -| policy_gradient_loss | -0.0106 | -| std | 0.198 | -| value_loss | 3.78e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.42 | -| time/ | | -| fps | 18 | -| iterations | 6421 | -| time_elapsed | 43806 | -| total_timesteps | 821888 | -| train/ | | -| approx_kl | 0.0004712399 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.2 | -| explained_variance | -0.47 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 64200 | -| policy_gradient_loss | -0.00043 | -| std | 0.198 | -| value_loss | 2.2e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6422 | -| time_elapsed | 43809 | -| total_timesteps | 822016 | -| train/ | | -| approx_kl | 0.01829731 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.205 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 64210 | -| policy_gradient_loss | -0.00345 | -| std | 0.197 | -| value_loss | 9.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6423 | -| time_elapsed | 43818 | -| total_timesteps | 822144 | -| train/ | | -| approx_kl | 0.021914229 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 0.208 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 64220 | -| policy_gradient_loss | -0.00322 | -| std | 0.196 | -| value_loss | 0.000148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6424 | -| time_elapsed | 43821 | -| total_timesteps | 822272 | -| train/ | | -| approx_kl | 0.014909664 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.209 | -| explained_variance | 0.383 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 64230 | -| policy_gradient_loss | -0.00394 | -| std | 0.196 | -| value_loss | 4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6425 | -| time_elapsed | 43824 | -| total_timesteps | 822400 | -| train/ | | -| approx_kl | 0.011653315 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 0.21 | -| explained_variance | -0.597 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 64240 | -| policy_gradient_loss | -0.00208 | -| std | 0.196 | -| value_loss | 5.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6426 | -| time_elapsed | 43828 | -| total_timesteps | 822528 | -| train/ | | -| approx_kl | 0.015438989 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.21 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 64250 | -| policy_gradient_loss | -0.00269 | -| std | 0.196 | -| value_loss | 8.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6427 | -| time_elapsed | 43831 | -| total_timesteps | 822656 | -| train/ | | -| approx_kl | 0.009177048 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.21 | -| explained_variance | -0.897 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 64260 | -| policy_gradient_loss | -0.00226 | -| std | 0.196 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6428 | -| time_elapsed | 43834 | -| total_timesteps | 822784 | -| train/ | | -| approx_kl | 0.012556882 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.21 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 64270 | -| policy_gradient_loss | 4.46e-06 | -| std | 0.196 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6429 | -| time_elapsed | 43838 | -| total_timesteps | 822912 | -| train/ | | -| approx_kl | 0.006003543 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.211 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 64280 | -| policy_gradient_loss | -0.00179 | -| std | 0.196 | -| value_loss | 1.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6430 | -| time_elapsed | 43842 | -| total_timesteps | 823040 | -| train/ | | -| approx_kl | 0.028352406 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.211 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 64290 | -| policy_gradient_loss | -0.00687 | -| std | 0.196 | -| value_loss | 1.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6431 | -| time_elapsed | 43849 | -| total_timesteps | 823168 | -| train/ | | -| approx_kl | 0.017443176 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.211 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 64300 | -| policy_gradient_loss | -0.0067 | -| std | 0.196 | -| value_loss | 0.00397 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6432 | -| time_elapsed | 43853 | -| total_timesteps | 823296 | -| train/ | | -| approx_kl | 0.026721638 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.212 | -| explained_variance | -0.581 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 64310 | -| policy_gradient_loss | -0.00513 | -| std | 0.196 | -| value_loss | 8.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6433 | -| time_elapsed | 43857 | -| total_timesteps | 823424 | -| train/ | | -| approx_kl | 0.034630623 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.213 | -| explained_variance | -2.44 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 64320 | -| policy_gradient_loss | -0.00536 | -| std | 0.196 | -| value_loss | 1.96e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6434 | -| time_elapsed | 43861 | -| total_timesteps | 823552 | -| train/ | | -| approx_kl | 0.01368198 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.213 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.000232 | -| n_updates | 64330 | -| policy_gradient_loss | -0.000888 | -| std | 0.195 | -| value_loss | 1.96e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6435 | -| time_elapsed | 43865 | -| total_timesteps | 823680 | -| train/ | | -| approx_kl | 0.0049298326 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.214 | -| explained_variance | -0.571 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 64340 | -| policy_gradient_loss | -0.0139 | -| std | 0.195 | -| value_loss | 1.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6436 | -| time_elapsed | 43869 | -| total_timesteps | 823808 | -| train/ | | -| approx_kl | 0.013637582 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.216 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 64350 | -| policy_gradient_loss | -0.00124 | -| std | 0.195 | -| value_loss | 2.6e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 18 | -| iterations | 6437 | -| time_elapsed | 43871 | -| total_timesteps | 823936 | -| train/ | | -| approx_kl | 0.010983311 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.217 | -| explained_variance | -0.564 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 64360 | -| policy_gradient_loss | 0.00166 | -| std | 0.195 | -| value_loss | 5.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6438 | -| time_elapsed | 43874 | -| total_timesteps | 824064 | -| train/ | | -| approx_kl | 0.020191196 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.218 | -| explained_variance | -0.597 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 64370 | -| policy_gradient_loss | -0.00648 | -| std | 0.195 | -| value_loss | 2.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6439 | -| time_elapsed | 43880 | -| total_timesteps | 824192 | -| train/ | | -| approx_kl | 0.015814563 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.218 | -| explained_variance | 0.236 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 64380 | -| policy_gradient_loss | -0.00032 | -| std | 0.194 | -| value_loss | 0.0744 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6440 | -| time_elapsed | 43885 | -| total_timesteps | 824320 | -| train/ | | -| approx_kl | 0.0021096803 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 0.221 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 64390 | -| policy_gradient_loss | -0.000878 | -| std | 0.193 | -| value_loss | 0.000897 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6441 | -| time_elapsed | 43888 | -| total_timesteps | 824448 | -| train/ | | -| approx_kl | 0.00046246173 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.227 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.000253 | -| n_updates | 64400 | -| policy_gradient_loss | -0.000117 | -| std | 0.192 | -| value_loss | 0.000701 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6442 | -| time_elapsed | 43891 | -| total_timesteps | 824576 | -| train/ | | -| approx_kl | 0.016201442 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.231 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 64410 | -| policy_gradient_loss | -0.00963 | -| std | 0.192 | -| value_loss | 0.00138 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6443 | -| time_elapsed | 43894 | -| total_timesteps | 824704 | -| train/ | | -| approx_kl | 0.020596212 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.232 | -| explained_variance | -0.323 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 64420 | -| policy_gradient_loss | -0.00427 | -| std | 0.192 | -| value_loss | 0.000449 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6444 | -| time_elapsed | 43897 | -| total_timesteps | 824832 | -| train/ | | -| approx_kl | 0.025897304 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 64430 | -| policy_gradient_loss | -0.00827 | -| std | 0.192 | -| value_loss | 0.000938 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.44 | -| time/ | | -| fps | 18 | -| iterations | 6445 | -| time_elapsed | 43900 | -| total_timesteps | 824960 | -| train/ | | -| approx_kl | 0.0077490057 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 64440 | -| policy_gradient_loss | -0.000306 | -| std | 0.192 | -| value_loss | 0.00014 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6446 | -| time_elapsed | 43903 | -| total_timesteps | 825088 | -| train/ | | -| approx_kl | 0.029731613 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 0.234 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 64450 | -| policy_gradient_loss | -0.00882 | -| std | 0.192 | -| value_loss | 0.000245 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6447 | -| time_elapsed | 43910 | -| total_timesteps | 825216 | -| train/ | | -| approx_kl | 0.019245407 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.234 | -| explained_variance | 0.516 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 64460 | -| policy_gradient_loss | -0.00872 | -| std | 0.192 | -| value_loss | 0.0172 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6448 | -| time_elapsed | 43913 | -| total_timesteps | 825344 | -| train/ | | -| approx_kl | 0.019419141 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -8.5e-05 | -| learning_rate | 0.0003 | -| loss | 0.000286 | -| n_updates | 64470 | -| policy_gradient_loss | -0.00196 | -| std | 0.192 | -| value_loss | 0.000141 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6449 | -| time_elapsed | 43917 | -| total_timesteps | 825472 | -| train/ | | -| approx_kl | 0.01883612 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.397 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 64480 | -| policy_gradient_loss | -0.00528 | -| std | 0.192 | -| value_loss | 6.16e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6450 | -| time_elapsed | 43921 | -| total_timesteps | 825600 | -| train/ | | -| approx_kl | 0.008579646 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.468 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 64490 | -| policy_gradient_loss | -0.00043 | -| std | 0.192 | -| value_loss | 4.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6451 | -| time_elapsed | 43925 | -| total_timesteps | 825728 | -| train/ | | -| approx_kl | 0.029138446 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.517 | -| learning_rate | 0.0003 | -| loss | -0.00773 | -| n_updates | 64500 | -| policy_gradient_loss | -0.00816 | -| std | 0.192 | -| value_loss | 1.95e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6452 | -| time_elapsed | 43927 | -| total_timesteps | 825856 | -| train/ | | -| approx_kl | 0.017699478 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.49 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 64510 | -| policy_gradient_loss | -0.0075 | -| std | 0.192 | -| value_loss | 5.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6453 | -| time_elapsed | 43929 | -| total_timesteps | 825984 | -| train/ | | -| approx_kl | 0.0062333574 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | -0.000983 | -| n_updates | 64520 | -| policy_gradient_loss | -0.000483 | -| std | 0.192 | -| value_loss | 3.6e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6454 | -| time_elapsed | 43932 | -| total_timesteps | 826112 | -| train/ | | -| approx_kl | 0.0035941084 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | 0.233 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.000233 | -| n_updates | 64530 | -| policy_gradient_loss | 0.000165 | -| std | 0.192 | -| value_loss | 4.06e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6455 | -| time_elapsed | 43940 | -| total_timesteps | 826240 | -| train/ | | -| approx_kl | 0.0070293397 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.23 | -| explained_variance | 0.49 | -| learning_rate | 0.0003 | -| loss | -0.000161 | -| n_updates | 64540 | -| policy_gradient_loss | 0.000123 | -| std | 0.192 | -| value_loss | 0.000932 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6456 | -| time_elapsed | 43943 | -| total_timesteps | 826368 | -| train/ | | -| approx_kl | 0.013987824 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | -0.787 | -| learning_rate | 0.0003 | -| loss | 0.00537 | -| n_updates | 64550 | -| policy_gradient_loss | 0.00516 | -| std | 0.192 | -| value_loss | 7.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6457 | -| time_elapsed | 43947 | -| total_timesteps | 826496 | -| train/ | | -| approx_kl | 0.025742363 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | 0.0253 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 64560 | -| policy_gradient_loss | -0.00465 | -| std | 0.192 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6458 | -| time_elapsed | 43949 | -| total_timesteps | 826624 | -| train/ | | -| approx_kl | 0.012141915 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.00243 | -| n_updates | 64570 | -| policy_gradient_loss | 0.000235 | -| std | 0.192 | -| value_loss | 5.15e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6459 | -| time_elapsed | 43954 | -| total_timesteps | 826752 | -| train/ | | -| approx_kl | 0.0012515299 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | 0.00295 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 64580 | -| policy_gradient_loss | -0.000555 | -| std | 0.192 | -| value_loss | 7.39e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.46 | -| time/ | | -| fps | 18 | -| iterations | 6460 | -| time_elapsed | 43958 | -| total_timesteps | 826880 | -| train/ | | -| approx_kl | 0.0031619417 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.000988 | -| n_updates | 64590 | -| policy_gradient_loss | 0.000424 | -| std | 0.192 | -| value_loss | 1.21e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6461 | -| time_elapsed | 43962 | -| total_timesteps | 827008 | -| train/ | | -| approx_kl | 0.026928127 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | -0.379 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 64600 | -| policy_gradient_loss | -0.00907 | -| std | 0.192 | -| value_loss | 3.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6462 | -| time_elapsed | 43971 | -| total_timesteps | 827136 | -| train/ | | -| approx_kl | 0.060577154 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.00803 | -| n_updates | 64610 | -| policy_gradient_loss | -0.00631 | -| std | 0.192 | -| value_loss | 9.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6463 | -| time_elapsed | 43974 | -| total_timesteps | 827264 | -| train/ | | -| approx_kl | 0.012141939 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.229 | -| explained_variance | -0.00362 | -| learning_rate | 0.0003 | -| loss | 0.0955 | -| n_updates | 64620 | -| policy_gradient_loss | -0.000631 | -| std | 0.192 | -| value_loss | 0.206 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6464 | -| time_elapsed | 43977 | -| total_timesteps | 827392 | -| train/ | | -| approx_kl | 0.0163249 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.23 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 64630 | -| policy_gradient_loss | -0.000559 | -| std | 0.192 | -| value_loss | 0.0787 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6465 | -| time_elapsed | 43979 | -| total_timesteps | 827520 | -| train/ | | -| approx_kl | 0.012603112 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.231 | -| explained_variance | 0.00418 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 64640 | -| policy_gradient_loss | -0.00157 | -| std | 0.192 | -| value_loss | 0.013 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6466 | -| time_elapsed | 43983 | -| total_timesteps | 827648 | -| train/ | | -| approx_kl | 0.02463926 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.231 | -| explained_variance | 0.00239 | -| learning_rate | 0.0003 | -| loss | 0.000426 | -| n_updates | 64650 | -| policy_gradient_loss | -0.00236 | -| std | 0.192 | -| value_loss | 0.00532 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6467 | -| time_elapsed | 43986 | -| total_timesteps | 827776 | -| train/ | | -| approx_kl | 0.008582089 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 0.231 | -| explained_variance | -0.00173 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 64660 | -| policy_gradient_loss | -0.00233 | -| std | 0.192 | -| value_loss | 0.00323 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.45 | -| time/ | | -| fps | 18 | -| iterations | 6468 | -| time_elapsed | 43989 | -| total_timesteps | 827904 | -| train/ | | -| approx_kl | 0.0055854884 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 0.232 | -| explained_variance | 0.00341 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 64670 | -| policy_gradient_loss | -7.48e-05 | -| std | 0.192 | -| value_loss | 0.00291 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6469 | -| time_elapsed | 43993 | -| total_timesteps | 828032 | -| train/ | | -| approx_kl | 0.016589137 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.232 | -| explained_variance | -0.00899 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 64680 | -| policy_gradient_loss | -0.00792 | -| std | 0.192 | -| value_loss | 0.00308 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6470 | -| time_elapsed | 44000 | -| total_timesteps | 828160 | -| train/ | | -| approx_kl | 0.00090310955 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.234 | -| explained_variance | 0.0878 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 64690 | -| policy_gradient_loss | -0.000334 | -| std | 0.191 | -| value_loss | 0.0223 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6471 | -| time_elapsed | 44004 | -| total_timesteps | 828288 | -| train/ | | -| approx_kl | 0.010653713 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.238 | -| explained_variance | 0.000824 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 64700 | -| policy_gradient_loss | -0.00176 | -| std | 0.19 | -| value_loss | 0.00111 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6472 | -| time_elapsed | 44008 | -| total_timesteps | 828416 | -| train/ | | -| approx_kl | 0.031393904 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 0.24 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 64710 | -| policy_gradient_loss | -0.00748 | -| std | 0.19 | -| value_loss | 0.000607 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6473 | -| time_elapsed | 44011 | -| total_timesteps | 828544 | -| train/ | | -| approx_kl | 0.008677887 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 0.24 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 64720 | -| policy_gradient_loss | -0.00134 | -| std | 0.19 | -| value_loss | 0.000347 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6474 | -| time_elapsed | 44014 | -| total_timesteps | 828672 | -| train/ | | -| approx_kl | 0.028529594 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.24 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00737 | -| n_updates | 64730 | -| policy_gradient_loss | -0.00767 | -| std | 0.19 | -| value_loss | 0.000249 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6475 | -| time_elapsed | 44016 | -| total_timesteps | 828800 | -| train/ | | -| approx_kl | 0.00051407935 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.241 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.000353 | -| n_updates | 64740 | -| policy_gradient_loss | -0.000324 | -| std | 0.19 | -| value_loss | 0.000262 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6476 | -| time_elapsed | 44020 | -| total_timesteps | 828928 | -| train/ | | -| approx_kl | 0.011253262 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.243 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 64750 | -| policy_gradient_loss | -0.00134 | -| std | 0.189 | -| value_loss | 0.000514 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6477 | -| time_elapsed | 44023 | -| total_timesteps | 829056 | -| train/ | | -| approx_kl | 0.021261562 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.245 | -| explained_variance | 0.00183 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 64760 | -| policy_gradient_loss | -0.00728 | -| std | 0.189 | -| value_loss | 9.73e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6478 | -| time_elapsed | 44029 | -| total_timesteps | 829184 | -| train/ | | -| approx_kl | 0.0066379677 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.246 | -| explained_variance | 0.255 | -| learning_rate | 0.0003 | -| loss | 0.00303 | -| n_updates | 64770 | -| policy_gradient_loss | -0.00244 | -| std | 0.189 | -| value_loss | 0.0166 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6479 | -| time_elapsed | 44033 | -| total_timesteps | 829312 | -| train/ | | -| approx_kl | 0.004651728 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.246 | -| explained_variance | -0.00139 | -| learning_rate | 0.0003 | -| loss | -0.000647 | -| n_updates | 64780 | -| policy_gradient_loss | 0.00348 | -| std | 0.189 | -| value_loss | 8.88e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6480 | -| time_elapsed | 44036 | -| total_timesteps | 829440 | -| train/ | | -| approx_kl | 0.011535863 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 0.245 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 64790 | -| policy_gradient_loss | 7.45e-05 | -| std | 0.19 | -| value_loss | 4.37e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6481 | -| time_elapsed | 44039 | -| total_timesteps | 829568 | -| train/ | | -| approx_kl | 0.01625066 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 0.244 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 64800 | -| policy_gradient_loss | -0.0113 | -| std | 0.19 | -| value_loss | 2.98e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6482 | -| time_elapsed | 44042 | -| total_timesteps | 829696 | -| train/ | | -| approx_kl | 0.017002728 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.244 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 64810 | -| policy_gradient_loss | -0.000927 | -| std | 0.19 | -| value_loss | 1.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6483 | -| time_elapsed | 44046 | -| total_timesteps | 829824 | -| train/ | | -| approx_kl | 0.005788083 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.244 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.000991 | -| n_updates | 64820 | -| policy_gradient_loss | -0.0001 | -| std | 0.19 | -| value_loss | 1.41e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.51 | -| time/ | | -| fps | 18 | -| iterations | 6484 | -| time_elapsed | 44049 | -| total_timesteps | 829952 | -| train/ | | -| approx_kl | 0.0002508713 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.244 | -| explained_variance | -0.0992 | -| learning_rate | 0.0003 | -| loss | -0.000217 | -| n_updates | 64830 | -| policy_gradient_loss | 5.33e-05 | -| std | 0.189 | -| value_loss | 3.36e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6485 | -| time_elapsed | 44052 | -| total_timesteps | 830080 | -| train/ | | -| approx_kl | 0.011366706 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 64840 | -| policy_gradient_loss | -0.00167 | -| std | 0.189 | -| value_loss | 8.9e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6486 | -| time_elapsed | 44058 | -| total_timesteps | 830208 | -| train/ | | -| approx_kl | 0.0127308555 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.249 | -| explained_variance | 0.11 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 64850 | -| policy_gradient_loss | -0.0051 | -| std | 0.189 | -| value_loss | 0.0621 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6487 | -| time_elapsed | 44060 | -| total_timesteps | 830336 | -| train/ | | -| approx_kl | 0.0059376964 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.249 | -| explained_variance | 0.00459 | -| learning_rate | 0.0003 | -| loss | 0.0861 | -| n_updates | 64860 | -| policy_gradient_loss | 0.000617 | -| std | 0.189 | -| value_loss | 0.231 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6488 | -| time_elapsed | 44064 | -| total_timesteps | 830464 | -| train/ | | -| approx_kl | 0.011348234 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.249 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.0083 | -| n_updates | 64870 | -| policy_gradient_loss | -0.00039 | -| std | 0.189 | -| value_loss | 0.0171 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6489 | -| time_elapsed | 44067 | -| total_timesteps | 830592 | -| train/ | | -| approx_kl | 0.014259907 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.248 | -| explained_variance | 0.00494 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 64880 | -| policy_gradient_loss | -0.00126 | -| std | 0.189 | -| value_loss | 0.004 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6490 | -| time_elapsed | 44070 | -| total_timesteps | 830720 | -| train/ | | -| approx_kl | 0.013038391 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.248 | -| explained_variance | -0.00263 | -| learning_rate | 0.0003 | -| loss | 0.000246 | -| n_updates | 64890 | -| policy_gradient_loss | -0.000987 | -| std | 0.189 | -| value_loss | 0.00207 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6491 | -| time_elapsed | 44073 | -| total_timesteps | 830848 | -| train/ | | -| approx_kl | 0.007151699 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | -0.00637 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 64900 | -| policy_gradient_loss | -0.000764 | -| std | 0.189 | -| value_loss | 0.0013 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.52 | -| time/ | | -| fps | 18 | -| iterations | 6492 | -| time_elapsed | 44076 | -| total_timesteps | 830976 | -| train/ | | -| approx_kl | 0.0015332112 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.246 | -| explained_variance | -0.00981 | -| learning_rate | 0.0003 | -| loss | 0.000197 | -| n_updates | 64910 | -| policy_gradient_loss | -0.000194 | -| std | 0.189 | -| value_loss | 0.000886 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6493 | -| time_elapsed | 44080 | -| total_timesteps | 831104 | -| train/ | | -| approx_kl | 0.012659382 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 64920 | -| policy_gradient_loss | -0.00272 | -| std | 0.189 | -| value_loss | 0.00104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6494 | -| time_elapsed | 44087 | -| total_timesteps | 831232 | -| train/ | | -| approx_kl | 0.030025994 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | 0.026 | -| learning_rate | 0.0003 | -| loss | 0.0959 | -| n_updates | 64930 | -| policy_gradient_loss | -0.00584 | -| std | 0.189 | -| value_loss | 0.226 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6495 | -| time_elapsed | 44091 | -| total_timesteps | 831360 | -| train/ | | -| approx_kl | 0.018892175 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | 0.00705 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 64940 | -| policy_gradient_loss | -0.00137 | -| std | 0.189 | -| value_loss | 0.00342 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6496 | -| time_elapsed | 44094 | -| total_timesteps | 831488 | -| train/ | | -| approx_kl | 0.014428118 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | -0.00962 | -| learning_rate | 0.0003 | -| loss | 0.000714 | -| n_updates | 64950 | -| policy_gradient_loss | -0.0011 | -| std | 0.189 | -| value_loss | 0.00457 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6497 | -| time_elapsed | 44098 | -| total_timesteps | 831616 | -| train/ | | -| approx_kl | 0.020451115 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.248 | -| explained_variance | 8.03e-05 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 64960 | -| policy_gradient_loss | -0.00432 | -| std | 0.189 | -| value_loss | 0.0033 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6498 | -| time_elapsed | 44101 | -| total_timesteps | 831744 | -| train/ | | -| approx_kl | 0.017596643 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | -0.00221 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 64970 | -| policy_gradient_loss | -0.00314 | -| std | 0.189 | -| value_loss | 0.00203 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.56 | -| time/ | | -| fps | 18 | -| iterations | 6499 | -| time_elapsed | 44104 | -| total_timesteps | 831872 | -| train/ | | -| approx_kl | 0.008572724 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.246 | -| explained_variance | 0.00166 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 64980 | -| policy_gradient_loss | -0.00354 | -| std | 0.189 | -| value_loss | 0.00483 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6500 | -| time_elapsed | 44107 | -| total_timesteps | 832000 | -| train/ | | -| approx_kl | 0.015432449 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.244 | -| explained_variance | 0.00274 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 64990 | -| policy_gradient_loss | -0.000835 | -| std | 0.19 | -| value_loss | 0.0875 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6501 | -| time_elapsed | 44109 | -| total_timesteps | 832128 | -| train/ | | -| approx_kl | 0.01499936 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.243 | -| explained_variance | 0.00249 | -| learning_rate | 0.0003 | -| loss | 0.271 | -| n_updates | 65000 | -| policy_gradient_loss | -0.00167 | -| std | 0.19 | -| value_loss | 0.733 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6502 | -| time_elapsed | 44118 | -| total_timesteps | 832256 | -| train/ | | -| approx_kl | 0.003941211 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.243 | -| explained_variance | 0.0187 | -| learning_rate | 0.0003 | -| loss | 0.00815 | -| n_updates | 65010 | -| policy_gradient_loss | -0.000902 | -| std | 0.19 | -| value_loss | 0.0146 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6503 | -| time_elapsed | 44121 | -| total_timesteps | 832384 | -| train/ | | -| approx_kl | 0.01358577 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.244 | -| explained_variance | 0.00388 | -| learning_rate | 0.0003 | -| loss | -0.00578 | -| n_updates | 65020 | -| policy_gradient_loss | -0.00583 | -| std | 0.19 | -| value_loss | 0.00645 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6504 | -| time_elapsed | 44125 | -| total_timesteps | 832512 | -| train/ | | -| approx_kl | 0.012044514 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.245 | -| explained_variance | 0.000606 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 65030 | -| policy_gradient_loss | -0.00161 | -| std | 0.189 | -| value_loss | 0.393 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6505 | -| time_elapsed | 44127 | -| total_timesteps | 832640 | -| train/ | | -| approx_kl | 0.023343112 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.245 | -| explained_variance | -0.000799 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 65040 | -| policy_gradient_loss | -0.00139 | -| std | 0.189 | -| value_loss | 0.0872 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6506 | -| time_elapsed | 44129 | -| total_timesteps | 832768 | -| train/ | | -| approx_kl | 0.02589882 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.246 | -| explained_variance | -0.000701 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 65050 | -| policy_gradient_loss | -0.00945 | -| std | 0.189 | -| value_loss | 0.0682 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.7 | -| time/ | | -| fps | 18 | -| iterations | 6507 | -| time_elapsed | 44131 | -| total_timesteps | 832896 | -| train/ | | -| approx_kl | 0.018826239 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | 0.00085 | -| learning_rate | 0.0003 | -| loss | 0.00729 | -| n_updates | 65060 | -| policy_gradient_loss | 0.000406 | -| std | 0.189 | -| value_loss | 0.0184 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6508 | -| time_elapsed | 44135 | -| total_timesteps | 833024 | -| train/ | | -| approx_kl | 0.016883196 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.247 | -| explained_variance | -0.00197 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 65070 | -| policy_gradient_loss | -0.00547 | -| std | 0.189 | -| value_loss | 0.0129 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6509 | -| time_elapsed | 44143 | -| total_timesteps | 833152 | -| train/ | | -| approx_kl | 0.0008785948 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.248 | -| explained_variance | 0.000912 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 65080 | -| policy_gradient_loss | -5.7e-06 | -| std | 0.189 | -| value_loss | 0.0719 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6510 | -| time_elapsed | 44146 | -| total_timesteps | 833280 | -| train/ | | -| approx_kl | 0.004370253 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.25 | -| explained_variance | 0.000373 | -| learning_rate | 0.0003 | -| loss | 1.03 | -| n_updates | 65090 | -| policy_gradient_loss | -0.000383 | -| std | 0.188 | -| value_loss | 2.34 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6511 | -| time_elapsed | 44149 | -| total_timesteps | 833408 | -| train/ | | -| approx_kl | 0.011192315 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.251 | -| explained_variance | -0.00341 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 65100 | -| policy_gradient_loss | -0.00397 | -| std | 0.188 | -| value_loss | 0.0821 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6512 | -| time_elapsed | 44153 | -| total_timesteps | 833536 | -| train/ | | -| approx_kl | 0.037596487 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.252 | -| explained_variance | -0.00603 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 65110 | -| policy_gradient_loss | -0.0103 | -| std | 0.188 | -| value_loss | 0.0639 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6513 | -| time_elapsed | 44155 | -| total_timesteps | 833664 | -| train/ | | -| approx_kl | 0.017720554 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.252 | -| explained_variance | -0.00253 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 65120 | -| policy_gradient_loss | -0.00402 | -| std | 0.188 | -| value_loss | 0.0188 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6514 | -| time_elapsed | 44158 | -| total_timesteps | 833792 | -| train/ | | -| approx_kl | 0.0064884555 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 0.253 | -| explained_variance | -0.00229 | -| learning_rate | 0.0003 | -| loss | 0.00867 | -| n_updates | 65130 | -| policy_gradient_loss | -0.00107 | -| std | 0.188 | -| value_loss | 0.0217 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.82 | -| time/ | | -| fps | 18 | -| iterations | 6515 | -| time_elapsed | 44161 | -| total_timesteps | 833920 | -| train/ | | -| approx_kl | 0.015385338 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 0.254 | -| explained_variance | -0.000535 | -| learning_rate | 0.0003 | -| loss | 0.00556 | -| n_updates | 65140 | -| policy_gradient_loss | -0.00285 | -| std | 0.188 | -| value_loss | 0.0281 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6516 | -| time_elapsed | 44164 | -| total_timesteps | 834048 | -| train/ | | -| approx_kl | 0.012543201 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.255 | -| explained_variance | -0.00249 | -| learning_rate | 0.0003 | -| loss | 0.000809 | -| n_updates | 65150 | -| policy_gradient_loss | -0.00113 | -| std | 0.187 | -| value_loss | 0.00765 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6517 | -| time_elapsed | 44169 | -| total_timesteps | 834176 | -| train/ | | -| approx_kl | 0.004742871 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.256 | -| explained_variance | 0.000904 | -| learning_rate | 0.0003 | -| loss | 0.0571 | -| n_updates | 65160 | -| policy_gradient_loss | -0.000288 | -| std | 0.187 | -| value_loss | 0.128 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6518 | -| time_elapsed | 44172 | -| total_timesteps | 834304 | -| train/ | | -| approx_kl | 8.199038e-05 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | 0.256 | -| explained_variance | -0.000767 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 65170 | -| policy_gradient_loss | 7.94e-05 | -| std | 0.187 | -| value_loss | 0.00768 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6519 | -| time_elapsed | 44175 | -| total_timesteps | 834432 | -| train/ | | -| approx_kl | 0.026570363 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.256 | -| explained_variance | -0.000378 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 65180 | -| policy_gradient_loss | -0.00943 | -| std | 0.187 | -| value_loss | 0.0571 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6520 | -| time_elapsed | 44178 | -| total_timesteps | 834560 | -| train/ | | -| approx_kl | 0.0052811955 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.257 | -| explained_variance | 7.14e-05 | -| learning_rate | 0.0003 | -| loss | 0.916 | -| n_updates | 65190 | -| policy_gradient_loss | -0.000968 | -| std | 0.187 | -| value_loss | 1.99 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6521 | -| time_elapsed | 44181 | -| total_timesteps | 834688 | -| train/ | | -| approx_kl | 0.0009681792 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.258 | -| explained_variance | 0.00017 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 65200 | -| policy_gradient_loss | 4.61e-05 | -| std | 0.187 | -| value_loss | 0.0335 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6522 | -| time_elapsed | 44184 | -| total_timesteps | 834816 | -| train/ | | -| approx_kl | 0.015854498 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 0.259 | -| explained_variance | -0.000341 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 65210 | -| policy_gradient_loss | -0.00993 | -| std | 0.187 | -| value_loss | 0.0176 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 18 | -| iterations | 6523 | -| time_elapsed | 44187 | -| total_timesteps | 834944 | -| train/ | | -| approx_kl | 0.024321184 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.259 | -| explained_variance | -0.000641 | -| learning_rate | 0.0003 | -| loss | -0.000384 | -| n_updates | 65220 | -| policy_gradient_loss | -0.00494 | -| std | 0.187 | -| value_loss | 0.0188 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6524 | -| time_elapsed | 44190 | -| total_timesteps | 835072 | -| train/ | | -| approx_kl | 0.02159977 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 0.26 | -| explained_variance | -0.000557 | -| learning_rate | 0.0003 | -| loss | 0.00459 | -| n_updates | 65230 | -| policy_gradient_loss | -0.00313 | -| std | 0.187 | -| value_loss | 0.0177 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6525 | -| time_elapsed | 44197 | -| total_timesteps | 835200 | -| train/ | | -| approx_kl | 0.01645189 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.259 | -| explained_variance | 0.00387 | -| learning_rate | 0.0003 | -| loss | 0.0787 | -| n_updates | 65240 | -| policy_gradient_loss | -0.000727 | -| std | 0.187 | -| value_loss | 0.153 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6526 | -| time_elapsed | 44200 | -| total_timesteps | 835328 | -| train/ | | -| approx_kl | 0.012946616 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.259 | -| explained_variance | 0.001 | -| learning_rate | 0.0003 | -| loss | 0.00607 | -| n_updates | 65250 | -| policy_gradient_loss | -0.00319 | -| std | 0.187 | -| value_loss | 0.0207 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6527 | -| time_elapsed | 44204 | -| total_timesteps | 835456 | -| train/ | | -| approx_kl | 0.012814665 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.259 | -| explained_variance | -0.00114 | -| learning_rate | 0.0003 | -| loss | 0.000871 | -| n_updates | 65260 | -| policy_gradient_loss | -0.00128 | -| std | 0.187 | -| value_loss | 0.0125 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6528 | -| time_elapsed | 44206 | -| total_timesteps | 835584 | -| train/ | | -| approx_kl | 0.012943212 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 0.261 | -| explained_variance | -0.00376 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 65270 | -| policy_gradient_loss | 0.00422 | -| std | 0.186 | -| value_loss | 0.00728 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6529 | -| time_elapsed | 44210 | -| total_timesteps | 835712 | -| train/ | | -| approx_kl | 0.037464865 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 0.261 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 65280 | -| policy_gradient_loss | -0.0176 | -| std | 0.186 | -| value_loss | 0.00591 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6530 | -| time_elapsed | 44214 | -| total_timesteps | 835840 | -| train/ | | -| approx_kl | 0.0075665726 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.262 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | 0.000821 | -| n_updates | 65290 | -| policy_gradient_loss | 0.000103 | -| std | 0.186 | -| value_loss | 0.00357 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.17 | -| time/ | | -| fps | 18 | -| iterations | 6531 | -| time_elapsed | 44216 | -| total_timesteps | 835968 | -| train/ | | -| approx_kl | 0.00069806445 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.264 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.000313 | -| n_updates | 65300 | -| policy_gradient_loss | -7.5e-05 | -| std | 0.185 | -| value_loss | 0.00203 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6532 | -| time_elapsed | 44219 | -| total_timesteps | 836096 | -| train/ | | -| approx_kl | 0.015592776 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.269 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.0084 | -| n_updates | 65310 | -| policy_gradient_loss | -0.00857 | -| std | 0.185 | -| value_loss | 0.00787 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6533 | -| time_elapsed | 44226 | -| total_timesteps | 836224 | -| train/ | | -| approx_kl | 0.000986136 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.272 | -| explained_variance | 0.0903 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 65320 | -| policy_gradient_loss | -0.00182 | -| std | 0.184 | -| value_loss | 0.0353 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6534 | -| time_elapsed | 44230 | -| total_timesteps | 836352 | -| train/ | | -| approx_kl | 0.0025240919 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.273 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 65330 | -| policy_gradient_loss | -0.000621 | -| std | 0.184 | -| value_loss | 0.00113 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6535 | -| time_elapsed | 44234 | -| total_timesteps | 836480 | -| train/ | | -| approx_kl | 0.008124255 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.271 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 65340 | -| policy_gradient_loss | 0.00127 | -| std | 0.185 | -| value_loss | 0.00209 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6536 | -| time_elapsed | 44238 | -| total_timesteps | 836608 | -| train/ | | -| approx_kl | 0.0017466964 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.269 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 65350 | -| policy_gradient_loss | -0.000688 | -| std | 0.185 | -| value_loss | 0.000453 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6537 | -| time_elapsed | 44241 | -| total_timesteps | 836736 | -| train/ | | -| approx_kl | 0.026470777 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.267 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 65360 | -| policy_gradient_loss | -0.00563 | -| std | 0.185 | -| value_loss | 0.000433 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6538 | -| time_elapsed | 44244 | -| total_timesteps | 836864 | -| train/ | | -| approx_kl | 0.0025721746 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 0.267 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 65370 | -| policy_gradient_loss | -0.00267 | -| std | 0.185 | -| value_loss | 0.000108 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6539 | -| time_elapsed | 44247 | -| total_timesteps | 836992 | -| train/ | | -| approx_kl | 0.011117794 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.268 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 65380 | -| policy_gradient_loss | -0.00334 | -| std | 0.185 | -| value_loss | 0.000158 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6540 | -| time_elapsed | 44251 | -| total_timesteps | 837120 | -| train/ | | -| approx_kl | 0.046318255 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 0.269 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 65390 | -| policy_gradient_loss | -0.0178 | -| std | 0.185 | -| value_loss | 4.38e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6541 | -| time_elapsed | 44262 | -| total_timesteps | 837248 | -| train/ | | -| approx_kl | 0.0017333799 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.269 | -| explained_variance | 0.138 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 65400 | -| policy_gradient_loss | -0.00112 | -| std | 0.185 | -| value_loss | 0.0839 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6542 | -| time_elapsed | 44265 | -| total_timesteps | 837376 | -| train/ | | -| approx_kl | 0.018261664 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.27 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 65410 | -| policy_gradient_loss | -0.014 | -| std | 0.185 | -| value_loss | 0.0016 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6543 | -| time_elapsed | 44269 | -| total_timesteps | 837504 | -| train/ | | -| approx_kl | 0.009588457 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.271 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 65420 | -| policy_gradient_loss | -0.0012 | -| std | 0.184 | -| value_loss | 0.000608 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6544 | -| time_elapsed | 44273 | -| total_timesteps | 837632 | -| train/ | | -| approx_kl | 0.000615343 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 0.272 | -| explained_variance | -0.0977 | -| learning_rate | 0.0003 | -| loss | 0.000115 | -| n_updates | 65430 | -| policy_gradient_loss | 0.000122 | -| std | 0.184 | -| value_loss | 0.000871 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6545 | -| time_elapsed | 44276 | -| total_timesteps | 837760 | -| train/ | | -| approx_kl | 0.016230904 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 0.274 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.001 | -| n_updates | 65440 | -| policy_gradient_loss | 5.41e-05 | -| std | 0.184 | -| value_loss | 0.00204 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.19 | -| time/ | | -| fps | 18 | -| iterations | 6546 | -| time_elapsed | 44280 | -| total_timesteps | 837888 | -| train/ | | -| approx_kl | 0.032327928 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 0.276 | -| explained_variance | -0.000238 | -| learning_rate | 0.0003 | -| loss | 0.000516 | -| n_updates | 65450 | -| policy_gradient_loss | -0.00311 | -| std | 0.184 | -| value_loss | 0.000319 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6547 | -| time_elapsed | 44282 | -| total_timesteps | 838016 | -| train/ | | -| approx_kl | 0.008117756 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.276 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 65460 | -| policy_gradient_loss | -0.00258 | -| std | 0.184 | -| value_loss | 0.000118 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6548 | -| time_elapsed | 44292 | -| total_timesteps | 838144 | -| train/ | | -| approx_kl | 0.0027721715 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.277 | -| explained_variance | 0.588 | -| learning_rate | 0.0003 | -| loss | -0.000508 | -| n_updates | 65470 | -| policy_gradient_loss | 0.000922 | -| std | 0.183 | -| value_loss | 0.00269 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6549 | -| time_elapsed | 44295 | -| total_timesteps | 838272 | -| train/ | | -| approx_kl | 0.0014238697 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.28 | -| explained_variance | 0.182 | -| learning_rate | 0.0003 | -| loss | -0.000917 | -| n_updates | 65480 | -| policy_gradient_loss | -3.16e-05 | -| std | 0.182 | -| value_loss | 7.35e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6550 | -| time_elapsed | 44298 | -| total_timesteps | 838400 | -| train/ | | -| approx_kl | 0.00066048745 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | -0.0958 | -| learning_rate | 0.0003 | -| loss | -0.000391 | -| n_updates | 65490 | -| policy_gradient_loss | 0.000196 | -| std | 0.182 | -| value_loss | 2.7e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6551 | -| time_elapsed | 44301 | -| total_timesteps | 838528 | -| train/ | | -| approx_kl | 0.012588587 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 65500 | -| policy_gradient_loss | -0.00506 | -| std | 0.182 | -| value_loss | 2.03e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6552 | -| time_elapsed | 44304 | -| total_timesteps | 838656 | -| train/ | | -| approx_kl | 0.01987202 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 65510 | -| policy_gradient_loss | -0.00843 | -| std | 0.182 | -| value_loss | 8.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6553 | -| time_elapsed | 44306 | -| total_timesteps | 838784 | -| train/ | | -| approx_kl | 0.031649895 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.284 | -| explained_variance | -0.0864 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 65520 | -| policy_gradient_loss | -0.0099 | -| std | 0.182 | -| value_loss | 6.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.21 | -| time/ | | -| fps | 18 | -| iterations | 6554 | -| time_elapsed | 44309 | -| total_timesteps | 838912 | -| train/ | | -| approx_kl | 0.014031429 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.284 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000444 | -| n_updates | 65530 | -| policy_gradient_loss | -0.00174 | -| std | 0.182 | -| value_loss | 3.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6555 | -| time_elapsed | 44312 | -| total_timesteps | 839040 | -| train/ | | -| approx_kl | 0.02359844 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.284 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 65540 | -| policy_gradient_loss | -0.00541 | -| std | 0.182 | -| value_loss | 2.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6556 | -| time_elapsed | 44318 | -| total_timesteps | 839168 | -| train/ | | -| approx_kl | 0.018035011 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.284 | -| explained_variance | 0.233 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 65550 | -| policy_gradient_loss | -0.00885 | -| std | 0.182 | -| value_loss | 0.0447 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6557 | -| time_elapsed | 44323 | -| total_timesteps | 839296 | -| train/ | | -| approx_kl | 0.02626066 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.284 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 65560 | -| policy_gradient_loss | -0.00787 | -| std | 0.182 | -| value_loss | 0.105 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6558 | -| time_elapsed | 44326 | -| total_timesteps | 839424 | -| train/ | | -| approx_kl | 0.005778552 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.00415 | -| n_updates | 65570 | -| policy_gradient_loss | -0.00255 | -| std | 0.182 | -| value_loss | 0.0133 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6559 | -| time_elapsed | 44330 | -| total_timesteps | 839552 | -| train/ | | -| approx_kl | 0.012902999 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | 0.00518 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 65580 | -| policy_gradient_loss | -0.00496 | -| std | 0.182 | -| value_loss | 0.326 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6560 | -| time_elapsed | 44333 | -| total_timesteps | 839680 | -| train/ | | -| approx_kl | 0.010592202 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | -0.00131 | -| learning_rate | 0.0003 | -| loss | 0.0576 | -| n_updates | 65590 | -| policy_gradient_loss | -0.00504 | -| std | 0.182 | -| value_loss | 0.134 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6561 | -| time_elapsed | 44335 | -| total_timesteps | 839808 | -| train/ | | -| approx_kl | 0.0016093869 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | 0.00382 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 65600 | -| policy_gradient_loss | -0.00038 | -| std | 0.182 | -| value_loss | 0.0173 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.22 | -| time/ | | -| fps | 18 | -| iterations | 6562 | -| time_elapsed | 44338 | -| total_timesteps | 839936 | -| train/ | | -| approx_kl | 0.0007643951 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.282 | -| explained_variance | 0.00143 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 65610 | -| policy_gradient_loss | 0.000365 | -| std | 0.183 | -| value_loss | 0.0546 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6563 | -| time_elapsed | 44342 | -| total_timesteps | 840064 | -| train/ | | -| approx_kl | 0.0003851992 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.283 | -| explained_variance | 0.00041 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 65620 | -| policy_gradient_loss | -0.000934 | -| std | 0.182 | -| value_loss | 0.0551 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6564 | -| time_elapsed | 44347 | -| total_timesteps | 840192 | -| train/ | | -| approx_kl | 0.0002546711 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.29 | -| explained_variance | 0.00156 | -| learning_rate | 0.0003 | -| loss | 0.0554 | -| n_updates | 65630 | -| policy_gradient_loss | -0.000476 | -| std | 0.18 | -| value_loss | 0.116 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6565 | -| time_elapsed | 44349 | -| total_timesteps | 840320 | -| train/ | | -| approx_kl | 0.013299691 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.297 | -| explained_variance | 0.00186 | -| learning_rate | 0.0003 | -| loss | 0.00446 | -| n_updates | 65640 | -| policy_gradient_loss | -0.000761 | -| std | 0.18 | -| value_loss | 0.00945 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6566 | -| time_elapsed | 44353 | -| total_timesteps | 840448 | -| train/ | | -| approx_kl | 0.020130653 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.299 | -| explained_variance | 0.00027 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 65650 | -| policy_gradient_loss | -0.000889 | -| std | 0.179 | -| value_loss | 0.114 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6567 | -| time_elapsed | 44356 | -| total_timesteps | 840576 | -| train/ | | -| approx_kl | 0.00741293 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 0.301 | -| explained_variance | 0.000375 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 65660 | -| policy_gradient_loss | -0.00276 | -| std | 0.179 | -| value_loss | 0.0433 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6568 | -| time_elapsed | 44359 | -| total_timesteps | 840704 | -| train/ | | -| approx_kl | 0.01089913 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.301 | -| explained_variance | 0.00131 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 65670 | -| policy_gradient_loss | -0.00129 | -| std | 0.179 | -| value_loss | 0.00636 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6569 | -| time_elapsed | 44361 | -| total_timesteps | 840832 | -| train/ | | -| approx_kl | 0.040323414 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 0.302 | -| explained_variance | 0.000153 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 65680 | -| policy_gradient_loss | -0.0163 | -| std | 0.179 | -| value_loss | 0.0206 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.4 | -| time/ | | -| fps | 18 | -| iterations | 6570 | -| time_elapsed | 44363 | -| total_timesteps | 840960 | -| train/ | | -| approx_kl | 0.025743028 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.302 | -| explained_variance | -0.000132 | -| learning_rate | 0.0003 | -| loss | -0.00927 | -| n_updates | 65690 | -| policy_gradient_loss | -0.0141 | -| std | 0.179 | -| value_loss | 0.0195 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6571 | -| time_elapsed | 44366 | -| total_timesteps | 841088 | -| train/ | | -| approx_kl | 0.003512911 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.303 | -| explained_variance | -0.000274 | -| learning_rate | 0.0003 | -| loss | 0.00393 | -| n_updates | 65700 | -| policy_gradient_loss | -0.000346 | -| std | 0.178 | -| value_loss | 0.0162 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6572 | -| time_elapsed | 44372 | -| total_timesteps | 841216 | -| train/ | | -| approx_kl | 0.016712887 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | 0.00284 | -| learning_rate | 0.0003 | -| loss | 0.0506 | -| n_updates | 65710 | -| policy_gradient_loss | -0.00341 | -| std | 0.178 | -| value_loss | 0.11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6573 | -| time_elapsed | 44376 | -| total_timesteps | 841344 | -| train/ | | -| approx_kl | 0.015141316 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | -0.000717 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 65720 | -| policy_gradient_loss | -0.00104 | -| std | 0.178 | -| value_loss | 0.0132 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6574 | -| time_elapsed | 44379 | -| total_timesteps | 841472 | -| train/ | | -| approx_kl | 0.0135040935 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 0.309 | -| explained_variance | -0.0011 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 65730 | -| policy_gradient_loss | -0.00124 | -| std | 0.178 | -| value_loss | 0.0111 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6575 | -| time_elapsed | 44382 | -| total_timesteps | 841600 | -| train/ | | -| approx_kl | 0.0008696453 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.309 | -| explained_variance | -0.00136 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 65740 | -| policy_gradient_loss | -5.28e-05 | -| std | 0.178 | -| value_loss | 0.00795 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6576 | -| time_elapsed | 44385 | -| total_timesteps | 841728 | -| train/ | | -| approx_kl | 0.01677964 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | -0.00393 | -| learning_rate | 0.0003 | -| loss | 0.000477 | -| n_updates | 65750 | -| policy_gradient_loss | -0.00154 | -| std | 0.178 | -| value_loss | 0.00552 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6577 | -| time_elapsed | 44387 | -| total_timesteps | 841856 | -| train/ | | -| approx_kl | 0.004192364 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | -0.00477 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 65760 | -| policy_gradient_loss | -0.00151 | -| std | 0.178 | -| value_loss | 0.00486 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.48 | -| time/ | | -| fps | 18 | -| iterations | 6578 | -| time_elapsed | 44390 | -| total_timesteps | 841984 | -| train/ | | -| approx_kl | 0.0049705016 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.305 | -| explained_variance | -0.00571 | -| learning_rate | 0.0003 | -| loss | 0.00053 | -| n_updates | 65770 | -| policy_gradient_loss | -7.83e-06 | -| std | 0.178 | -| value_loss | 0.00268 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6579 | -| time_elapsed | 44392 | -| total_timesteps | 842112 | -| train/ | | -| approx_kl | 0.008287197 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.304 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 65780 | -| policy_gradient_loss | -0.00111 | -| std | 0.179 | -| value_loss | 0.00156 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6580 | -| time_elapsed | 44402 | -| total_timesteps | 842240 | -| train/ | | -| approx_kl | 0.015797244 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.304 | -| explained_variance | 0.0212 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 65790 | -| policy_gradient_loss | -0.000361 | -| std | 0.178 | -| value_loss | 0.251 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6581 | -| time_elapsed | 44406 | -| total_timesteps | 842368 | -| train/ | | -| approx_kl | 0.02129457 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.305 | -| explained_variance | 0.0079 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 65800 | -| policy_gradient_loss | -0.00448 | -| std | 0.178 | -| value_loss | 0.00834 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6582 | -| time_elapsed | 44410 | -| total_timesteps | 842496 | -| train/ | | -| approx_kl | 0.013815921 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | -0.00492 | -| learning_rate | 0.0003 | -| loss | 0.000668 | -| n_updates | 65810 | -| policy_gradient_loss | -0.00186 | -| std | 0.178 | -| value_loss | 0.00531 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6583 | -| time_elapsed | 44414 | -| total_timesteps | 842624 | -| train/ | | -| approx_kl | 0.028464798 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | 9.69e-05 | -| learning_rate | 0.0003 | -| loss | 0.00636 | -| n_updates | 65820 | -| policy_gradient_loss | 0.000665 | -| std | 0.178 | -| value_loss | 0.0052 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6584 | -| time_elapsed | 44418 | -| total_timesteps | 842752 | -| train/ | | -| approx_kl | 0.0077703246 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | -0.00169 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 65830 | -| policy_gradient_loss | -0.00397 | -| std | 0.178 | -| value_loss | 0.00484 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.49 | -| time/ | | -| fps | 18 | -| iterations | 6585 | -| time_elapsed | 44421 | -| total_timesteps | 842880 | -| train/ | | -| approx_kl | 0.017204745 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | -0.0042 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 65840 | -| policy_gradient_loss | -0.00223 | -| std | 0.178 | -| value_loss | 0.00298 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6586 | -| time_elapsed | 44424 | -| total_timesteps | 843008 | -| train/ | | -| approx_kl | 0.004158312 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | 0.000552 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 65850 | -| policy_gradient_loss | -0.000876 | -| std | 0.178 | -| value_loss | 0.00226 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6587 | -| time_elapsed | 44434 | -| total_timesteps | 843136 | -| train/ | | -| approx_kl | 0.021005206 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | 0.0933 | -| learning_rate | 0.0003 | -| loss | 0.00312 | -| n_updates | 65860 | -| policy_gradient_loss | -0.00526 | -| std | 0.178 | -| value_loss | 0.0248 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6588 | -| time_elapsed | 44437 | -| total_timesteps | 843264 | -| train/ | | -| approx_kl | 0.007511906 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.305 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 65870 | -| policy_gradient_loss | -0.00471 | -| std | 0.178 | -| value_loss | 0.0175 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6589 | -| time_elapsed | 44441 | -| total_timesteps | 843392 | -| train/ | | -| approx_kl | 0.013314001 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.304 | -| explained_variance | -0.00783 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 65880 | -| policy_gradient_loss | -0.001 | -| std | 0.179 | -| value_loss | 0.00182 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6590 | -| time_elapsed | 44444 | -| total_timesteps | 843520 | -| train/ | | -| approx_kl | 0.0061877584 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.303 | -| explained_variance | -0.00995 | -| learning_rate | 0.0003 | -| loss | -0.00945 | -| n_updates | 65890 | -| policy_gradient_loss | -0.00678 | -| std | 0.179 | -| value_loss | 0.000967 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6591 | -| time_elapsed | 44447 | -| total_timesteps | 843648 | -| train/ | | -| approx_kl | 0.009426236 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.304 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.00216 | -| n_updates | 65900 | -| policy_gradient_loss | 0.000158 | -| std | 0.178 | -| value_loss | 0.000538 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6592 | -| time_elapsed | 44450 | -| total_timesteps | 843776 | -| train/ | | -| approx_kl | 0.008908095 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | -0.00606 | -| n_updates | 65910 | -| policy_gradient_loss | -0.0039 | -| std | 0.178 | -| value_loss | 0.000317 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 18 | -| iterations | 6593 | -| time_elapsed | 44453 | -| total_timesteps | 843904 | -| train/ | | -| approx_kl | 0.023773402 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.309 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 65920 | -| policy_gradient_loss | -0.00509 | -| std | 0.178 | -| value_loss | 0.000272 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6594 | -| time_elapsed | 44455 | -| total_timesteps | 844032 | -| train/ | | -| approx_kl | 0.005391586 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.31 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 65930 | -| policy_gradient_loss | -0.000677 | -| std | 0.177 | -| value_loss | 0.000176 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6595 | -| time_elapsed | 44463 | -| total_timesteps | 844160 | -| train/ | | -| approx_kl | 0.017310249 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.312 | -| explained_variance | 0.209 | -| learning_rate | 0.0003 | -| loss | 0.00831 | -| n_updates | 65940 | -| policy_gradient_loss | -0.00174 | -| std | 0.177 | -| value_loss | 0.021 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6596 | -| time_elapsed | 44467 | -| total_timesteps | 844288 | -| train/ | | -| approx_kl | 0.0023437692 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | -0.00203 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 65950 | -| policy_gradient_loss | -0.000455 | -| std | 0.177 | -| value_loss | 0.000141 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6597 | -| time_elapsed | 44471 | -| total_timesteps | 844416 | -| train/ | | -| approx_kl | 0.0016318755 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | -0.00658 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 65960 | -| policy_gradient_loss | -0.000441 | -| std | 0.177 | -| value_loss | 8.6e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6598 | -| time_elapsed | 44474 | -| total_timesteps | 844544 | -| train/ | | -| approx_kl | 0.0050405758 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 65970 | -| policy_gradient_loss | -0.004 | -| std | 0.177 | -| value_loss | 6.85e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6599 | -| time_elapsed | 44478 | -| total_timesteps | 844672 | -| train/ | | -| approx_kl | 0.0034413207 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 65980 | -| policy_gradient_loss | -0.00142 | -| std | 0.177 | -| value_loss | 4.15e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6600 | -| time_elapsed | 44482 | -| total_timesteps | 844800 | -| train/ | | -| approx_kl | 0.005641838 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 65990 | -| policy_gradient_loss | -6.97e-05 | -| std | 0.177 | -| value_loss | 2.59e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6601 | -| time_elapsed | 44486 | -| total_timesteps | 844928 | -| train/ | | -| approx_kl | 0.014925342 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 66000 | -| policy_gradient_loss | -0.000233 | -| std | 0.177 | -| value_loss | 1.73e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6602 | -| time_elapsed | 44489 | -| total_timesteps | 845056 | -| train/ | | -| approx_kl | 0.0021393918 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 0.312 | -| explained_variance | -0.0935 | -| learning_rate | 0.0003 | -| loss | -0.000549 | -| n_updates | 66010 | -| policy_gradient_loss | -0.000228 | -| std | 0.177 | -| value_loss | 1.83e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6603 | -| time_elapsed | 44495 | -| total_timesteps | 845184 | -| train/ | | -| approx_kl | 0.0052969395 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.309 | -| explained_variance | 0.296 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 66020 | -| policy_gradient_loss | -0.00353 | -| std | 0.178 | -| value_loss | 0.0168 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6604 | -| time_elapsed | 44499 | -| total_timesteps | 845312 | -| train/ | | -| approx_kl | 0.00716336 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 66030 | -| policy_gradient_loss | -0.00497 | -| std | 0.178 | -| value_loss | 0.000427 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6605 | -| time_elapsed | 44503 | -| total_timesteps | 845440 | -| train/ | | -| approx_kl | 0.002591528 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.305 | -| explained_variance | 0.00507 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 66040 | -| policy_gradient_loss | -0.00271 | -| std | 0.178 | -| value_loss | 6.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 18 | -| iterations | 6606 | -| time_elapsed | 44507 | -| total_timesteps | 845568 | -| train/ | | -| approx_kl | 0.020625012 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.306 | -| explained_variance | -0.0993 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 66050 | -| policy_gradient_loss | -0.0117 | -| std | 0.178 | -| value_loss | 8.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6607 | -| time_elapsed | 44509 | -| total_timesteps | 845696 | -| train/ | | -| approx_kl | 0.053709798 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.0305 | -| n_updates | 66060 | -| policy_gradient_loss | -0.0261 | -| std | 0.178 | -| value_loss | 3.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6608 | -| time_elapsed | 44512 | -| total_timesteps | 845824 | -| train/ | | -| approx_kl | 0.009674069 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.307 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 66070 | -| policy_gradient_loss | -0.00245 | -| std | 0.178 | -| value_loss | 2.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6609 | -| time_elapsed | 44516 | -| total_timesteps | 845952 | -| train/ | | -| approx_kl | 0.012429613 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.308 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 66080 | -| policy_gradient_loss | -0.0018 | -| std | 0.178 | -| value_loss | 1.33e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6610 | -| time_elapsed | 44518 | -| total_timesteps | 846080 | -| train/ | | -| approx_kl | 0.016966755 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.308 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 66090 | -| policy_gradient_loss | -0.00227 | -| std | 0.178 | -| value_loss | 9.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6611 | -| time_elapsed | 44526 | -| total_timesteps | 846208 | -| train/ | | -| approx_kl | 0.010166274 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.309 | -| explained_variance | 0.381 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 66100 | -| policy_gradient_loss | -0.00184 | -| std | 0.177 | -| value_loss | 0.0113 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6612 | -| time_elapsed | 44530 | -| total_timesteps | 846336 | -| train/ | | -| approx_kl | 0.012101922 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.311 | -| explained_variance | 0.00853 | -| learning_rate | 0.0003 | -| loss | 0.00085 | -| n_updates | 66110 | -| policy_gradient_loss | 0.00103 | -| std | 0.177 | -| value_loss | 3.61e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6613 | -| time_elapsed | 44533 | -| total_timesteps | 846464 | -| train/ | | -| approx_kl | 0.026886243 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.312 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 66120 | -| policy_gradient_loss | -0.00742 | -| std | 0.177 | -| value_loss | 1.79e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6614 | -| time_elapsed | 44537 | -| total_timesteps | 846592 | -| train/ | | -| approx_kl | 0.013039414 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.312 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.000977 | -| n_updates | 66130 | -| policy_gradient_loss | 0.00322 | -| std | 0.177 | -| value_loss | 1.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6615 | -| time_elapsed | 44540 | -| total_timesteps | 846720 | -| train/ | | -| approx_kl | 0.015253088 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.311 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 66140 | -| policy_gradient_loss | -0.00125 | -| std | 0.177 | -| value_loss | 5.66e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6616 | -| time_elapsed | 44543 | -| total_timesteps | 846848 | -| train/ | | -| approx_kl | 0.02067247 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.311 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.000789 | -| n_updates | 66150 | -| policy_gradient_loss | -0.00189 | -| std | 0.177 | -| value_loss | 3.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6617 | -| time_elapsed | 44546 | -| total_timesteps | 846976 | -| train/ | | -| approx_kl | 0.011109022 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.311 | -| explained_variance | -0.0715 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 66160 | -| policy_gradient_loss | 0.000374 | -| std | 0.177 | -| value_loss | 2.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6618 | -| time_elapsed | 44549 | -| total_timesteps | 847104 | -| train/ | | -| approx_kl | 0.024248287 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 0.311 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 66170 | -| policy_gradient_loss | -0.0118 | -| std | 0.177 | -| value_loss | 1.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6619 | -| time_elapsed | 44557 | -| total_timesteps | 847232 | -| train/ | | -| approx_kl | 0.011929639 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.311 | -| explained_variance | 0.673 | -| learning_rate | 0.0003 | -| loss | -9.65e-05 | -| n_updates | 66180 | -| policy_gradient_loss | -0.000609 | -| std | 0.177 | -| value_loss | 0.00215 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6620 | -| time_elapsed | 44561 | -| total_timesteps | 847360 | -| train/ | | -| approx_kl | 0.016943011 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.313 | -| explained_variance | 0.00911 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 66190 | -| policy_gradient_loss | -0.00861 | -| std | 0.177 | -| value_loss | 9.53e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6621 | -| time_elapsed | 44564 | -| total_timesteps | 847488 | -| train/ | | -| approx_kl | 0.01858177 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.314 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | 0.0017 | -| n_updates | 66200 | -| policy_gradient_loss | -0.000741 | -| std | 0.176 | -| value_loss | 2.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6622 | -| time_elapsed | 44567 | -| total_timesteps | 847616 | -| train/ | | -| approx_kl | 0.015877895 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.316 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | -0.000332 | -| n_updates | 66210 | -| policy_gradient_loss | -0.000885 | -| std | 0.176 | -| value_loss | 1.39e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6623 | -| time_elapsed | 44571 | -| total_timesteps | 847744 | -| train/ | | -| approx_kl | 0.00037466083 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.319 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.00088 | -| n_updates | 66220 | -| policy_gradient_loss | -0.00034 | -| std | 0.175 | -| value_loss | 8.12e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6624 | -| time_elapsed | 44574 | -| total_timesteps | 847872 | -| train/ | | -| approx_kl | 0.0208244 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.325 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 66230 | -| policy_gradient_loss | -0.00442 | -| std | 0.175 | -| value_loss | 2.57e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6625 | -| time_elapsed | 44576 | -| total_timesteps | 848000 | -| train/ | | -| approx_kl | 0.0040604617 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 0.327 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 66240 | -| policy_gradient_loss | -2.38e-05 | -| std | 0.174 | -| value_loss | 8.04e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6626 | -| time_elapsed | 44580 | -| total_timesteps | 848128 | -| train/ | | -| approx_kl | 0.02000518 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.328 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 66250 | -| policy_gradient_loss | -0.00267 | -| std | 0.174 | -| value_loss | 1.69e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6627 | -| time_elapsed | 44587 | -| total_timesteps | 848256 | -| train/ | | -| approx_kl | 0.022338804 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.327 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 66260 | -| policy_gradient_loss | -0.000924 | -| std | 0.174 | -| value_loss | 8.28e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6628 | -| time_elapsed | 44591 | -| total_timesteps | 848384 | -| train/ | | -| approx_kl | 0.01660414 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.328 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 66270 | -| policy_gradient_loss | -0.00341 | -| std | 0.174 | -| value_loss | 7.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6629 | -| time_elapsed | 44595 | -| total_timesteps | 848512 | -| train/ | | -| approx_kl | 0.010831866 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.328 | -| explained_variance | -0.0958 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 66280 | -| policy_gradient_loss | -0.00453 | -| std | 0.174 | -| value_loss | 1.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6630 | -| time_elapsed | 44598 | -| total_timesteps | 848640 | -| train/ | | -| approx_kl | 0.019658554 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 0.329 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | 0.000882 | -| n_updates | 66290 | -| policy_gradient_loss | -0.000184 | -| std | 0.174 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6631 | -| time_elapsed | 44602 | -| total_timesteps | 848768 | -| train/ | | -| approx_kl | 0.009811098 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.329 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 66300 | -| policy_gradient_loss | 0.000602 | -| std | 0.174 | -| value_loss | 9.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6632 | -| time_elapsed | 44605 | -| total_timesteps | 848896 | -| train/ | | -| approx_kl | 0.015971797 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 0.329 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 66310 | -| policy_gradient_loss | -0.00157 | -| std | 0.174 | -| value_loss | 2.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6633 | -| time_elapsed | 44608 | -| total_timesteps | 849024 | -| train/ | | -| approx_kl | 0.01456842 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.329 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 66320 | -| policy_gradient_loss | -0.00989 | -| std | 0.174 | -| value_loss | 1.7e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6634 | -| time_elapsed | 44615 | -| total_timesteps | 849152 | -| train/ | | -| approx_kl | 0.015579861 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.33 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 66330 | -| policy_gradient_loss | -0.0146 | -| std | 0.174 | -| value_loss | 0.000129 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6635 | -| time_elapsed | 44619 | -| total_timesteps | 849280 | -| train/ | | -| approx_kl | 8.496456e-06 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.33 | -| explained_variance | 0.55 | -| learning_rate | 0.0003 | -| loss | -2.35e-05 | -| n_updates | 66340 | -| policy_gradient_loss | 0.000166 | -| std | 0.174 | -| value_loss | 4.85e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6636 | -| time_elapsed | 44623 | -| total_timesteps | 849408 | -| train/ | | -| approx_kl | 0.008243354 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.331 | -| explained_variance | -11.7 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 66350 | -| policy_gradient_loss | -0.00111 | -| std | 0.174 | -| value_loss | 3.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6637 | -| time_elapsed | 44627 | -| total_timesteps | 849536 | -| train/ | | -| approx_kl | 0.021184145 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.333 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 66360 | -| policy_gradient_loss | -0.00238 | -| std | 0.173 | -| value_loss | 6.33e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6638 | -| time_elapsed | 44630 | -| total_timesteps | 849664 | -| train/ | | -| approx_kl | 0.022766013 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 0.333 | -| explained_variance | -0.917 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 66370 | -| policy_gradient_loss | -0.00897 | -| std | 0.173 | -| value_loss | 4.72e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6639 | -| time_elapsed | 44634 | -| total_timesteps | 849792 | -| train/ | | -| approx_kl | 0.023695346 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.333 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 66380 | -| policy_gradient_loss | -0.00214 | -| std | 0.173 | -| value_loss | 1.36e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6640 | -| time_elapsed | 44637 | -| total_timesteps | 849920 | -| train/ | | -| approx_kl | 0.021164326 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.333 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 66390 | -| policy_gradient_loss | 0.000836 | -| std | 0.174 | -| value_loss | 1.13e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6641 | -| time_elapsed | 44641 | -| total_timesteps | 850048 | -| train/ | | -| approx_kl | 0.00041213492 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.333 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 66400 | -| policy_gradient_loss | 0.000543 | -| std | 0.174 | -| value_loss | 1.2e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6642 | -| time_elapsed | 44648 | -| total_timesteps | 850176 | -| train/ | | -| approx_kl | 0.017611999 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.333 | -| explained_variance | 0.674 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 66410 | -| policy_gradient_loss | -0.0012 | -| std | 0.173 | -| value_loss | 0.00224 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6643 | -| time_elapsed | 44651 | -| total_timesteps | 850304 | -| train/ | | -| approx_kl | 0.0004814067 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.334 | -| explained_variance | 0.00604 | -| learning_rate | 0.0003 | -| loss | -0.000374 | -| n_updates | 66420 | -| policy_gradient_loss | -7.76e-05 | -| std | 0.173 | -| value_loss | 2.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6644 | -| time_elapsed | 44654 | -| total_timesteps | 850432 | -| train/ | | -| approx_kl | 0.0010129418 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.336 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 66430 | -| policy_gradient_loss | -0.0029 | -| std | 0.173 | -| value_loss | 5.48e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6645 | -| time_elapsed | 44657 | -| total_timesteps | 850560 | -| train/ | | -| approx_kl | 0.0039649615 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.337 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 66440 | -| policy_gradient_loss | -0.00161 | -| std | 0.173 | -| value_loss | 1.26e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6646 | -| time_elapsed | 44661 | -| total_timesteps | 850688 | -| train/ | | -| approx_kl | 0.02037609 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.339 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 66450 | -| policy_gradient_loss | -0.0036 | -| std | 0.172 | -| value_loss | 1.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6647 | -| time_elapsed | 44665 | -| total_timesteps | 850816 | -| train/ | | -| approx_kl | 0.027377266 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 0.339 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 66460 | -| policy_gradient_loss | -0.00272 | -| std | 0.172 | -| value_loss | 3.61e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6648 | -| time_elapsed | 44668 | -| total_timesteps | 850944 | -| train/ | | -| approx_kl | 0.02321125 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.34 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.00802 | -| n_updates | 66470 | -| policy_gradient_loss | -0.00488 | -| std | 0.172 | -| value_loss | 1.67e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6649 | -| time_elapsed | 44671 | -| total_timesteps | 851072 | -| train/ | | -| approx_kl | 0.025236504 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.34 | -| explained_variance | -0.0868 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 66480 | -| policy_gradient_loss | -0.0154 | -| std | 0.172 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6650 | -| time_elapsed | 44677 | -| total_timesteps | 851200 | -| train/ | | -| approx_kl | 0.008346878 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 0.342 | -| explained_variance | 0.511 | -| learning_rate | 0.0003 | -| loss | 0.00243 | -| n_updates | 66490 | -| policy_gradient_loss | -0.000618 | -| std | 0.172 | -| value_loss | 0.00707 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6651 | -| time_elapsed | 44679 | -| total_timesteps | 851328 | -| train/ | | -| approx_kl | 0.012903115 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.344 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 66500 | -| policy_gradient_loss | -0.00125 | -| std | 0.171 | -| value_loss | 4.92e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6652 | -| time_elapsed | 44683 | -| total_timesteps | 851456 | -| train/ | | -| approx_kl | 0.0045503085 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.346 | -| explained_variance | -7.89 | -| learning_rate | 0.0003 | -| loss | -0.00569 | -| n_updates | 66510 | -| policy_gradient_loss | -0.00371 | -| std | 0.171 | -| value_loss | 4.5e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6653 | -| time_elapsed | 44686 | -| total_timesteps | 851584 | -| train/ | | -| approx_kl | 0.014269069 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.347 | -| explained_variance | -0.658 | -| learning_rate | 0.0003 | -| loss | -0.000841 | -| n_updates | 66520 | -| policy_gradient_loss | -0.000949 | -| std | 0.171 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6654 | -| time_elapsed | 44688 | -| total_timesteps | 851712 | -| train/ | | -| approx_kl | 0.016805436 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 0.347 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.000113 | -| n_updates | 66530 | -| policy_gradient_loss | -0.00148 | -| std | 0.171 | -| value_loss | 2.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6655 | -| time_elapsed | 44692 | -| total_timesteps | 851840 | -| train/ | | -| approx_kl | 0.00457872 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.345 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 66540 | -| policy_gradient_loss | -0.00287 | -| std | 0.171 | -| value_loss | 8.12e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.5 | -| time/ | | -| fps | 19 | -| iterations | 6656 | -| time_elapsed | 44696 | -| total_timesteps | 851968 | -| train/ | | -| approx_kl | 0.025094012 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.344 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 66550 | -| policy_gradient_loss | -0.00538 | -| std | 0.172 | -| value_loss | 5.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6657 | -| time_elapsed | 44699 | -| total_timesteps | 852096 | -| train/ | | -| approx_kl | 0.011392679 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.344 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | -0.006 | -| n_updates | 66560 | -| policy_gradient_loss | -0.00416 | -| std | 0.172 | -| value_loss | 2.38e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6658 | -| time_elapsed | 44706 | -| total_timesteps | 852224 | -| train/ | | -| approx_kl | 0.09855116 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 0.343 | -| explained_variance | 0.481 | -| learning_rate | 0.0003 | -| loss | 0.000386 | -| n_updates | 66570 | -| policy_gradient_loss | -0.00616 | -| std | 0.172 | -| value_loss | 0.00989 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6659 | -| time_elapsed | 44709 | -| total_timesteps | 852352 | -| train/ | | -| approx_kl | 0.005593008 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.344 | -| explained_variance | 0.0058 | -| learning_rate | 0.0003 | -| loss | 0.00034 | -| n_updates | 66580 | -| policy_gradient_loss | 0.00111 | -| std | 0.171 | -| value_loss | 1.79e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6660 | -| time_elapsed | 44713 | -| total_timesteps | 852480 | -| train/ | | -| approx_kl | 0.014525997 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.345 | -| explained_variance | -1.52 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 66590 | -| policy_gradient_loss | -0.0121 | -| std | 0.171 | -| value_loss | 5.83e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6661 | -| time_elapsed | 44716 | -| total_timesteps | 852608 | -| train/ | | -| approx_kl | 0.019190578 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 0.345 | -| explained_variance | -0.68 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 66600 | -| policy_gradient_loss | -0.00918 | -| std | 0.171 | -| value_loss | 3.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6662 | -| time_elapsed | 44719 | -| total_timesteps | 852736 | -| train/ | | -| approx_kl | 0.015009258 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.345 | -| explained_variance | -0.378 | -| learning_rate | 0.0003 | -| loss | 0.000659 | -| n_updates | 66610 | -| policy_gradient_loss | -0.000476 | -| std | 0.171 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6663 | -| time_elapsed | 44723 | -| total_timesteps | 852864 | -| train/ | | -| approx_kl | 0.0051487363 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.348 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | -0.000823 | -| n_updates | 66620 | -| policy_gradient_loss | -0.000346 | -| std | 0.17 | -| value_loss | 1.1e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6664 | -| time_elapsed | 44727 | -| total_timesteps | 852992 | -| train/ | | -| approx_kl | 3.3585355e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.353 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.000881 | -| n_updates | 66630 | -| policy_gradient_loss | -0.000365 | -| std | 0.169 | -| value_loss | 4.31e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6665 | -| time_elapsed | 44730 | -| total_timesteps | 853120 | -| train/ | | -| approx_kl | 0.001683576 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 0.36 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 66640 | -| policy_gradient_loss | -0.00232 | -| std | 0.168 | -| value_loss | 9.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6666 | -| time_elapsed | 44739 | -| total_timesteps | 853248 | -| train/ | | -| approx_kl | 0.041669674 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 0.364 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 66650 | -| policy_gradient_loss | -0.00918 | -| std | 0.168 | -| value_loss | 0.000383 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6667 | -| time_elapsed | 44743 | -| total_timesteps | 853376 | -| train/ | | -| approx_kl | 0.0027771913 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.367 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 66660 | -| policy_gradient_loss | -0.00267 | -| std | 0.167 | -| value_loss | 3.39e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6668 | -| time_elapsed | 44747 | -| total_timesteps | 853504 | -| train/ | | -| approx_kl | 0.0017139432 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | -0.000455 | -| n_updates | 66670 | -| policy_gradient_loss | 0.000188 | -| std | 0.167 | -| value_loss | 1.21e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6669 | -| time_elapsed | 44749 | -| total_timesteps | 853632 | -| train/ | | -| approx_kl | 0.01052271 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.368 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.000428 | -| n_updates | 66680 | -| policy_gradient_loss | 9.1e-05 | -| std | 0.167 | -| value_loss | 9.67e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6670 | -| time_elapsed | 44752 | -| total_timesteps | 853760 | -| train/ | | -| approx_kl | 0.032368563 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.936 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 66690 | -| policy_gradient_loss | -0.0062 | -| std | 0.167 | -| value_loss | 2.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6671 | -| time_elapsed | 44754 | -| total_timesteps | 853888 | -| train/ | | -| approx_kl | 0.012519648 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.000891 | -| n_updates | 66700 | -| policy_gradient_loss | -0.00117 | -| std | 0.167 | -| value_loss | 1.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6672 | -| time_elapsed | 44758 | -| total_timesteps | 854016 | -| train/ | | -| approx_kl | 0.022628816 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 66710 | -| policy_gradient_loss | -0.00783 | -| std | 0.167 | -| value_loss | 3.49e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6673 | -| time_elapsed | 44765 | -| total_timesteps | 854144 | -| train/ | | -| approx_kl | 0.0015908736 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | 0.476 | -| learning_rate | 0.0003 | -| loss | 0.00384 | -| n_updates | 66720 | -| policy_gradient_loss | -0.0012 | -| std | 0.167 | -| value_loss | 0.0111 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6674 | -| time_elapsed | 44769 | -| total_timesteps | 854272 | -| train/ | | -| approx_kl | 0.030667892 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | 0.21 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 66730 | -| policy_gradient_loss | -0.00909 | -| std | 0.167 | -| value_loss | 1.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6675 | -| time_elapsed | 44772 | -| total_timesteps | 854400 | -| train/ | | -| approx_kl | 0.048710596 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -8.71 | -| learning_rate | 0.0003 | -| loss | -0.0277 | -| n_updates | 66740 | -| policy_gradient_loss | -0.0209 | -| std | 0.167 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6676 | -| time_elapsed | 44775 | -| total_timesteps | 854528 | -| train/ | | -| approx_kl | 0.036494166 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -2.6 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 66750 | -| policy_gradient_loss | -0.0077 | -| std | 0.167 | -| value_loss | 2.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6677 | -| time_elapsed | 44778 | -| total_timesteps | 854656 | -| train/ | | -| approx_kl | 0.015722133 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 66760 | -| policy_gradient_loss | -0.00242 | -| std | 0.167 | -| value_loss | 8.62e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6678 | -| time_elapsed | 44783 | -| total_timesteps | 854784 | -| train/ | | -| approx_kl | 0.0023370814 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.444 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 66770 | -| policy_gradient_loss | -0.000684 | -| std | 0.167 | -| value_loss | 9.17e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.51 | -| time/ | | -| fps | 19 | -| iterations | 6679 | -| time_elapsed | 44787 | -| total_timesteps | 854912 | -| train/ | | -| approx_kl | 0.0034486433 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | -0.447 | -| learning_rate | 0.0003 | -| loss | -0.000428 | -| n_updates | 66780 | -| policy_gradient_loss | -0.000247 | -| std | 0.167 | -| value_loss | 2.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6680 | -| time_elapsed | 44792 | -| total_timesteps | 855040 | -| train/ | | -| approx_kl | 0.026157498 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | -0.00979 | -| n_updates | 66790 | -| policy_gradient_loss | -0.00897 | -| std | 0.167 | -| value_loss | 9.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6681 | -| time_elapsed | 44800 | -| total_timesteps | 855168 | -| train/ | | -| approx_kl | 0.039716583 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | 0.537 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 66800 | -| policy_gradient_loss | -0.00307 | -| std | 0.167 | -| value_loss | 0.00873 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6682 | -| time_elapsed | 44803 | -| total_timesteps | 855296 | -| train/ | | -| approx_kl | 0.020464275 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.0899 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 66810 | -| policy_gradient_loss | -0.00504 | -| std | 0.167 | -| value_loss | 7.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6683 | -| time_elapsed | 44805 | -| total_timesteps | 855424 | -| train/ | | -| approx_kl | 0.027750375 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 66820 | -| policy_gradient_loss | -0.00539 | -| std | 0.167 | -| value_loss | 8.76e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6684 | -| time_elapsed | 44809 | -| total_timesteps | 855552 | -| train/ | | -| approx_kl | 0.0053567854 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.465 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 66830 | -| policy_gradient_loss | -0.000276 | -| std | 0.167 | -| value_loss | 4.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6685 | -| time_elapsed | 44812 | -| total_timesteps | 855680 | -| train/ | | -| approx_kl | 0.017234003 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00642 | -| n_updates | 66840 | -| policy_gradient_loss | -0.00145 | -| std | 0.167 | -| value_loss | 2.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6686 | -| time_elapsed | 44816 | -| total_timesteps | 855808 | -| train/ | | -| approx_kl | 0.013587777 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 66850 | -| policy_gradient_loss | -0.00157 | -| std | 0.167 | -| value_loss | 1.55e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6687 | -| time_elapsed | 44820 | -| total_timesteps | 855936 | -| train/ | | -| approx_kl | 0.0133159775 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.373 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 66860 | -| policy_gradient_loss | -0.00443 | -| std | 0.167 | -| value_loss | 1.18e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6688 | -| time_elapsed | 44824 | -| total_timesteps | 856064 | -| train/ | | -| approx_kl | 0.008535188 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.374 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 66870 | -| policy_gradient_loss | 0.000582 | -| std | 0.167 | -| value_loss | 1.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6689 | -| time_elapsed | 44830 | -| total_timesteps | 856192 | -| train/ | | -| approx_kl | 0.00301161 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.374 | -| explained_variance | 0.567 | -| learning_rate | 0.0003 | -| loss | 0.00177 | -| n_updates | 66880 | -| policy_gradient_loss | -0.0008 | -| std | 0.166 | -| value_loss | 0.00692 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6690 | -| time_elapsed | 44834 | -| total_timesteps | 856320 | -| train/ | | -| approx_kl | 0.04903492 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 0.375 | -| explained_variance | -2.26 | -| learning_rate | 0.0003 | -| loss | -7.56e-05 | -| n_updates | 66890 | -| policy_gradient_loss | -0.00206 | -| std | 0.166 | -| value_loss | 7.89e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6691 | -| time_elapsed | 44839 | -| total_timesteps | 856448 | -| train/ | | -| approx_kl | 0.026289143 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 0.375 | -| explained_variance | -52.7 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 66900 | -| policy_gradient_loss | -0.0143 | -| std | 0.166 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6692 | -| time_elapsed | 44842 | -| total_timesteps | 856576 | -| train/ | | -| approx_kl | 0.0027636224 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.374 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | -0.00091 | -| n_updates | 66910 | -| policy_gradient_loss | -0.000446 | -| std | 0.167 | -| value_loss | 1.61e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6693 | -| time_elapsed | 44844 | -| total_timesteps | 856704 | -| train/ | | -| approx_kl | 0.03094176 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 66920 | -| policy_gradient_loss | -0.00688 | -| std | 0.167 | -| value_loss | 8.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6694 | -| time_elapsed | 44847 | -| total_timesteps | 856832 | -| train/ | | -| approx_kl | 0.024919996 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00557 | -| n_updates | 66930 | -| policy_gradient_loss | -0.00458 | -| std | 0.167 | -| value_loss | 1.12e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.52 | -| time/ | | -| fps | 19 | -| iterations | 6695 | -| time_elapsed | 44851 | -| total_timesteps | 856960 | -| train/ | | -| approx_kl | 0.00925247 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.458 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 66940 | -| policy_gradient_loss | -0.000949 | -| std | 0.167 | -| value_loss | 7.01e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6696 | -| time_elapsed | 44855 | -| total_timesteps | 857088 | -| train/ | | -| approx_kl | 0.012248348 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 66950 | -| policy_gradient_loss | -0.000311 | -| std | 0.167 | -| value_loss | 3.77e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6697 | -| time_elapsed | 44862 | -| total_timesteps | 857216 | -| train/ | | -| approx_kl | 0.042637512 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | 0.00176 | -| n_updates | 66960 | -| policy_gradient_loss | -0.000311 | -| std | 0.167 | -| value_loss | 0.000232 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6698 | -| time_elapsed | 44866 | -| total_timesteps | 857344 | -| train/ | | -| approx_kl | 0.026094534 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -0.962 | -| learning_rate | 0.0003 | -| loss | 7.97e-05 | -| n_updates | 66970 | -| policy_gradient_loss | -0.00106 | -| std | 0.167 | -| value_loss | 1.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6699 | -| time_elapsed | 44869 | -| total_timesteps | 857472 | -| train/ | | -| approx_kl | 0.010629203 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.571 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 66980 | -| policy_gradient_loss | -0.00189 | -| std | 0.167 | -| value_loss | 7.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6700 | -| time_elapsed | 44873 | -| total_timesteps | 857600 | -| train/ | | -| approx_kl | 0.020217553 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 66990 | -| policy_gradient_loss | -0.00119 | -| std | 0.167 | -| value_loss | 3.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6701 | -| time_elapsed | 44876 | -| total_timesteps | 857728 | -| train/ | | -| approx_kl | 0.036056373 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 67000 | -| policy_gradient_loss | -0.0135 | -| std | 0.167 | -| value_loss | 9.62e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6702 | -| time_elapsed | 44880 | -| total_timesteps | 857856 | -| train/ | | -| approx_kl | 0.010679597 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 67010 | -| policy_gradient_loss | -0.00211 | -| std | 0.167 | -| value_loss | 1.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6703 | -| time_elapsed | 44883 | -| total_timesteps | 857984 | -| train/ | | -| approx_kl | 0.004112017 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | -0.000892 | -| n_updates | 67020 | -| policy_gradient_loss | 0.00288 | -| std | 0.167 | -| value_loss | 1.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6704 | -| time_elapsed | 44887 | -| total_timesteps | 858112 | -| train/ | | -| approx_kl | 0.011071062 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 67030 | -| policy_gradient_loss | 0.000867 | -| std | 0.167 | -| value_loss | 2.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6705 | -| time_elapsed | 44896 | -| total_timesteps | 858240 | -| train/ | | -| approx_kl | 0.006401059 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 67040 | -| policy_gradient_loss | 0.000231 | -| std | 0.167 | -| value_loss | 0.000165 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6706 | -| time_elapsed | 44900 | -| total_timesteps | 858368 | -| train/ | | -| approx_kl | 0.019221798 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.373 | -| explained_variance | -0.296 | -| learning_rate | 0.0003 | -| loss | -0.00944 | -| n_updates | 67050 | -| policy_gradient_loss | -0.00825 | -| std | 0.166 | -| value_loss | 8.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6707 | -| time_elapsed | 44903 | -| total_timesteps | 858496 | -| train/ | | -| approx_kl | 0.005220752 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.374 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.00498 | -| n_updates | 67060 | -| policy_gradient_loss | -0.00305 | -| std | 0.166 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6708 | -| time_elapsed | 44907 | -| total_timesteps | 858624 | -| train/ | | -| approx_kl | 0.023886437 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 0.375 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | -0.00048 | -| n_updates | 67070 | -| policy_gradient_loss | -0.000113 | -| std | 0.166 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6709 | -| time_elapsed | 44911 | -| total_timesteps | 858752 | -| train/ | | -| approx_kl | 0.017110363 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.374 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 67080 | -| policy_gradient_loss | -0.00146 | -| std | 0.166 | -| value_loss | 6.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6710 | -| time_elapsed | 44914 | -| total_timesteps | 858880 | -| train/ | | -| approx_kl | 0.010089109 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.374 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | -0.00083 | -| n_updates | 67090 | -| policy_gradient_loss | -0.000609 | -| std | 0.167 | -| value_loss | 3.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6711 | -| time_elapsed | 44917 | -| total_timesteps | 859008 | -| train/ | | -| approx_kl | 0.019692758 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 0.373 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | 0.001 | -| n_updates | 67100 | -| policy_gradient_loss | -0.000686 | -| std | 0.167 | -| value_loss | 1.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6712 | -| time_elapsed | 44925 | -| total_timesteps | 859136 | -| train/ | | -| approx_kl | 0.043617316 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.373 | -| explained_variance | 0.776 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 67110 | -| policy_gradient_loss | -0.00297 | -| std | 0.167 | -| value_loss | 0.00145 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6713 | -| time_elapsed | 44928 | -| total_timesteps | 859264 | -| train/ | | -| approx_kl | 0.032738727 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 0.373 | -| explained_variance | -4.21 | -| learning_rate | 0.0003 | -| loss | -0.00431 | -| n_updates | 67120 | -| policy_gradient_loss | -0.00505 | -| std | 0.167 | -| value_loss | 1.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6714 | -| time_elapsed | 44932 | -| total_timesteps | 859392 | -| train/ | | -| approx_kl | 0.020745857 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.373 | -| explained_variance | -6.5 | -| learning_rate | 0.0003 | -| loss | 0.000576 | -| n_updates | 67130 | -| policy_gradient_loss | -0.000676 | -| std | 0.167 | -| value_loss | 2.19e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6715 | -| time_elapsed | 44935 | -| total_timesteps | 859520 | -| train/ | | -| approx_kl | 0.02416988 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.372 | -| learning_rate | 0.0003 | -| loss | 0.00309 | -| n_updates | 67140 | -| policy_gradient_loss | 0.000211 | -| std | 0.167 | -| value_loss | 1.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6716 | -| time_elapsed | 44937 | -| total_timesteps | 859648 | -| train/ | | -| approx_kl | 0.012692188 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.369 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.000925 | -| n_updates | 67150 | -| policy_gradient_loss | -0.000209 | -| std | 0.167 | -| value_loss | 3.86e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6717 | -| time_elapsed | 44940 | -| total_timesteps | 859776 | -| train/ | | -| approx_kl | 0.01934905 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | -0.00408 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 67160 | -| policy_gradient_loss | -0.00152 | -| std | 0.167 | -| value_loss | 4.96e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6718 | -| time_elapsed | 44943 | -| total_timesteps | 859904 | -| train/ | | -| approx_kl | 0.0013580755 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.37 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 67170 | -| policy_gradient_loss | -0.000222 | -| std | 0.167 | -| value_loss | 4.03e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6719 | -| time_elapsed | 44946 | -| total_timesteps | 860032 | -| train/ | | -| approx_kl | 0.009492952 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 67180 | -| policy_gradient_loss | -0.00352 | -| std | 0.167 | -| value_loss | 5.98e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6720 | -| time_elapsed | 44954 | -| total_timesteps | 860160 | -| train/ | | -| approx_kl | 0.03019204 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 67190 | -| policy_gradient_loss | -0.00641 | -| std | 0.167 | -| value_loss | 0.000429 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6721 | -| time_elapsed | 44957 | -| total_timesteps | 860288 | -| train/ | | -| approx_kl | 0.010985873 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 0.371 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 67200 | -| policy_gradient_loss | -0.000322 | -| std | 0.167 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6722 | -| time_elapsed | 44961 | -| total_timesteps | 860416 | -| train/ | | -| approx_kl | 0.009816364 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.372 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 67210 | -| policy_gradient_loss | -0.000154 | -| std | 0.167 | -| value_loss | 3.15e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6723 | -| time_elapsed | 44965 | -| total_timesteps | 860544 | -| train/ | | -| approx_kl | 0.0061484165 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.375 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | -0.000964 | -| n_updates | 67220 | -| policy_gradient_loss | 0.000393 | -| std | 0.166 | -| value_loss | 1.94e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6724 | -| time_elapsed | 44969 | -| total_timesteps | 860672 | -| train/ | | -| approx_kl | 0.008730145 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 0.376 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 67230 | -| policy_gradient_loss | 0.0003 | -| std | 0.166 | -| value_loss | 3.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6725 | -| time_elapsed | 44971 | -| total_timesteps | 860800 | -| train/ | | -| approx_kl | 0.000601653 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.377 | -| explained_variance | -0.523 | -| learning_rate | 0.0003 | -| loss | -0.000924 | -| n_updates | 67240 | -| policy_gradient_loss | 0.000405 | -| std | 0.166 | -| value_loss | 2.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6726 | -| time_elapsed | 44974 | -| total_timesteps | 860928 | -| train/ | | -| approx_kl | 0.000743628 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.382 | -| explained_variance | -0.0811 | -| learning_rate | 0.0003 | -| loss | -0.000817 | -| n_updates | 67250 | -| policy_gradient_loss | 0.000232 | -| std | 0.165 | -| value_loss | 1.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6727 | -| time_elapsed | 44977 | -| total_timesteps | 861056 | -| train/ | | -| approx_kl | 0.042964492 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 0.386 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 67260 | -| policy_gradient_loss | -0.0103 | -| std | 0.164 | -| value_loss | 3.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6728 | -| time_elapsed | 44982 | -| total_timesteps | 861184 | -| train/ | | -| approx_kl | 0.039110903 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.388 | -| explained_variance | 0.764 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 67270 | -| policy_gradient_loss | -0.00246 | -| std | 0.164 | -| value_loss | 0.00147 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6729 | -| time_elapsed | 44985 | -| total_timesteps | 861312 | -| train/ | | -| approx_kl | 0.005411381 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.389 | -| explained_variance | -3.9 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 67280 | -| policy_gradient_loss | -0.000955 | -| std | 0.164 | -| value_loss | 6.62e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6730 | -| time_elapsed | 44988 | -| total_timesteps | 861440 | -| train/ | | -| approx_kl | 0.0031855325 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 0.388 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | -0.000487 | -| n_updates | 67290 | -| policy_gradient_loss | -0.000125 | -| std | 0.164 | -| value_loss | 2.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6731 | -| time_elapsed | 44991 | -| total_timesteps | 861568 | -| train/ | | -| approx_kl | 0.019592836 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -0.00675 | -| n_updates | 67300 | -| policy_gradient_loss | -0.0057 | -| std | 0.163 | -| value_loss | 1.83e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6732 | -| time_elapsed | 44995 | -| total_timesteps | 861696 | -| train/ | | -| approx_kl | 0.010719899 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.395 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.00186 | -| n_updates | 67310 | -| policy_gradient_loss | 0.00204 | -| std | 0.163 | -| value_loss | 2.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6733 | -| time_elapsed | 44998 | -| total_timesteps | 861824 | -| train/ | | -| approx_kl | 0.027238807 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 0.395 | -| explained_variance | -0.365 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 67320 | -| policy_gradient_loss | -0.00319 | -| std | 0.163 | -| value_loss | 5.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6734 | -| time_elapsed | 45001 | -| total_timesteps | 861952 | -| train/ | | -| approx_kl | 0.013636621 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.395 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.000362 | -| n_updates | 67330 | -| policy_gradient_loss | -0.000872 | -| std | 0.163 | -| value_loss | 3.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6735 | -| time_elapsed | 45005 | -| total_timesteps | 862080 | -| train/ | | -| approx_kl | 0.021864861 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.394 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 67340 | -| policy_gradient_loss | -0.00178 | -| std | 0.163 | -| value_loss | 1.78e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6736 | -| time_elapsed | 45011 | -| total_timesteps | 862208 | -| train/ | | -| approx_kl | 0.024216129 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.394 | -| explained_variance | 0.874 | -| learning_rate | 0.0003 | -| loss | -0.00412 | -| n_updates | 67350 | -| policy_gradient_loss | -0.00343 | -| std | 0.163 | -| value_loss | 0.00025 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6737 | -| time_elapsed | 45014 | -| total_timesteps | 862336 | -| train/ | | -| approx_kl | 0.02517343 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.393 | -| explained_variance | -0.0618 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 67360 | -| policy_gradient_loss | -0.00457 | -| std | 0.163 | -| value_loss | 1.77e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6738 | -| time_elapsed | 45018 | -| total_timesteps | 862464 | -| train/ | | -| approx_kl | 0.0048037996 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 67370 | -| policy_gradient_loss | -0.0015 | -| std | 0.163 | -| value_loss | 2.28e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6739 | -| time_elapsed | 45021 | -| total_timesteps | 862592 | -| train/ | | -| approx_kl | 0.0033365414 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -0.706 | -| learning_rate | 0.0003 | -| loss | -0.000632 | -| n_updates | 67380 | -| policy_gradient_loss | -0.000245 | -| std | 0.164 | -| value_loss | 8.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6740 | -| time_elapsed | 45024 | -| total_timesteps | 862720 | -| train/ | | -| approx_kl | 0.020852294 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.389 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.00646 | -| n_updates | 67390 | -| policy_gradient_loss | 0.000992 | -| std | 0.164 | -| value_loss | 9.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6741 | -| time_elapsed | 45028 | -| total_timesteps | 862848 | -| train/ | | -| approx_kl | 0.015799139 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.387 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 67400 | -| policy_gradient_loss | -0.00325 | -| std | 0.164 | -| value_loss | 3.09e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6742 | -| time_elapsed | 45031 | -| total_timesteps | 862976 | -| train/ | | -| approx_kl | 0.0001607975 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.388 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | -0.000748 | -| n_updates | 67410 | -| policy_gradient_loss | -0.000232 | -| std | 0.164 | -| value_loss | 1.52e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6743 | -| time_elapsed | 45034 | -| total_timesteps | 863104 | -| train/ | | -| approx_kl | 0.047659494 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 0.394 | -| explained_variance | -0.00973 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 67420 | -| policy_gradient_loss | -0.00866 | -| std | 0.163 | -| value_loss | 8.59e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6744 | -| time_elapsed | 45043 | -| total_timesteps | 863232 | -| train/ | | -| approx_kl | 0.066428356 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.396 | -| explained_variance | 0.547 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 67430 | -| policy_gradient_loss | -0.00876 | -| std | 0.163 | -| value_loss | 0.007 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6745 | -| time_elapsed | 45047 | -| total_timesteps | 863360 | -| train/ | | -| approx_kl | 0.023997698 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.397 | -| explained_variance | -24.9 | -| learning_rate | 0.0003 | -| loss | 0.00011 | -| n_updates | 67440 | -| policy_gradient_loss | -0.00111 | -| std | 0.163 | -| value_loss | 2.85e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6746 | -| time_elapsed | 45051 | -| total_timesteps | 863488 | -| train/ | | -| approx_kl | 0.03928844 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 0.397 | -| explained_variance | -44.9 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 67450 | -| policy_gradient_loss | -0.0103 | -| std | 0.163 | -| value_loss | 2.28e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6747 | -| time_elapsed | 45054 | -| total_timesteps | 863616 | -| train/ | | -| approx_kl | 0.029381378 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.396 | -| explained_variance | -9.99 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 67460 | -| policy_gradient_loss | -0.00492 | -| std | 0.163 | -| value_loss | 2.53e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6748 | -| time_elapsed | 45058 | -| total_timesteps | 863744 | -| train/ | | -| approx_kl | 0.012520779 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.395 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 67470 | -| policy_gradient_loss | -0.0018 | -| std | 0.163 | -| value_loss | 8.17e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.53 | -| time/ | | -| fps | 19 | -| iterations | 6749 | -| time_elapsed | 45061 | -| total_timesteps | 863872 | -| train/ | | -| approx_kl | 0.021187527 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.394 | -| explained_variance | 0.00244 | -| learning_rate | 0.0003 | -| loss | 0.00184 | -| n_updates | 67480 | -| policy_gradient_loss | -0.000911 | -| std | 0.163 | -| value_loss | 3.59e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6750 | -| time_elapsed | 45065 | -| total_timesteps | 864000 | -| train/ | | -| approx_kl | 0.030931428 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.394 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 67490 | -| policy_gradient_loss | -0.00602 | -| std | 0.163 | -| value_loss | 3.34e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6751 | -| time_elapsed | 45067 | -| total_timesteps | 864128 | -| train/ | | -| approx_kl | 0.006755157 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.393 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 67500 | -| policy_gradient_loss | -0.00246 | -| std | 0.163 | -| value_loss | 7.29e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6752 | -| time_elapsed | 45075 | -| total_timesteps | 864256 | -| train/ | | -| approx_kl | 0.009006701 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.393 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 67510 | -| policy_gradient_loss | 0.00272 | -| std | 0.163 | -| value_loss | 0.000222 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6753 | -| time_elapsed | 45079 | -| total_timesteps | 864384 | -| train/ | | -| approx_kl | 0.024304304 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | -6.69e-05 | -| n_updates | 67520 | -| policy_gradient_loss | 0.00071 | -| std | 0.163 | -| value_loss | 4.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6754 | -| time_elapsed | 45084 | -| total_timesteps | 864512 | -| train/ | | -| approx_kl | 0.01785048 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -0.794 | -| learning_rate | 0.0003 | -| loss | -0.00047 | -| n_updates | 67530 | -| policy_gradient_loss | -0.000921 | -| std | 0.163 | -| value_loss | 2.08e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6755 | -| time_elapsed | 45088 | -| total_timesteps | 864640 | -| train/ | | -| approx_kl | 0.030278176 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 0.393 | -| explained_variance | -0.355 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 67540 | -| policy_gradient_loss | -0.0041 | -| std | 0.163 | -| value_loss | 1.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6756 | -| time_elapsed | 45092 | -| total_timesteps | 864768 | -| train/ | | -| approx_kl | 0.013627918 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.393 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 67550 | -| policy_gradient_loss | -0.0114 | -| std | 0.163 | -| value_loss | 5.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6757 | -| time_elapsed | 45095 | -| total_timesteps | 864896 | -| train/ | | -| approx_kl | 0.0008635917 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.000115 | -| n_updates | 67560 | -| policy_gradient_loss | 3.26e-05 | -| std | 0.164 | -| value_loss | 7.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6758 | -| time_elapsed | 45099 | -| total_timesteps | 865024 | -| train/ | | -| approx_kl | 0.008861573 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.391 | -| explained_variance | -0.00167 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 67570 | -| policy_gradient_loss | -0.00784 | -| std | 0.164 | -| value_loss | 2.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6759 | -| time_elapsed | 45106 | -| total_timesteps | 865152 | -| train/ | | -| approx_kl | 0.02417763 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 0.391 | -| explained_variance | 0.648 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 67580 | -| policy_gradient_loss | -0.0144 | -| std | 0.164 | -| value_loss | 0.00427 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6760 | -| time_elapsed | 45110 | -| total_timesteps | 865280 | -| train/ | | -| approx_kl | 0.013785175 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.39 | -| explained_variance | -68 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 67590 | -| policy_gradient_loss | 0.000588 | -| std | 0.164 | -| value_loss | 2.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6761 | -| time_elapsed | 45114 | -| total_timesteps | 865408 | -| train/ | | -| approx_kl | 0.006936234 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.389 | -| explained_variance | -95.4 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 67600 | -| policy_gradient_loss | -0.000527 | -| std | 0.164 | -| value_loss | 9.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6762 | -| time_elapsed | 45118 | -| total_timesteps | 865536 | -| train/ | | -| approx_kl | 0.006614472 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.385 | -| explained_variance | -84.9 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 67610 | -| policy_gradient_loss | -0.000338 | -| std | 0.165 | -| value_loss | 1.33e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6763 | -| time_elapsed | 45122 | -| total_timesteps | 865664 | -| train/ | | -| approx_kl | 0.006266718 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.382 | -| explained_variance | -47.5 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 67620 | -| policy_gradient_loss | -0.000714 | -| std | 0.165 | -| value_loss | 2.84e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6764 | -| time_elapsed | 45126 | -| total_timesteps | 865792 | -| train/ | | -| approx_kl | 0.01650866 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.382 | -| explained_variance | -68.1 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 67630 | -| policy_gradient_loss | -0.000591 | -| std | 0.165 | -| value_loss | 1.38e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.54 | -| time/ | | -| fps | 19 | -| iterations | 6765 | -| time_elapsed | 45129 | -| total_timesteps | 865920 | -| train/ | | -| approx_kl | 0.0009090444 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.383 | -| explained_variance | -56.4 | -| learning_rate | 0.0003 | -| loss | -0.000345 | -| n_updates | 67640 | -| policy_gradient_loss | -0.000135 | -| std | 0.165 | -| value_loss | 1.46e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6766 | -| time_elapsed | 45132 | -| total_timesteps | 866048 | -| train/ | | -| approx_kl | 0.029200733 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 0.385 | -| explained_variance | -9.04 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 67650 | -| policy_gradient_loss | -0.00438 | -| std | 0.165 | -| value_loss | 1.29e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6767 | -| time_elapsed | 45139 | -| total_timesteps | 866176 | -| train/ | | -| approx_kl | 0.016367279 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.387 | -| explained_variance | 0.535 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 67660 | -| policy_gradient_loss | -0.00077 | -| std | 0.164 | -| value_loss | 0.00956 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6768 | -| time_elapsed | 45144 | -| total_timesteps | 866304 | -| train/ | | -| approx_kl | 0.015996762 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.389 | -| explained_variance | -89.7 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 67670 | -| policy_gradient_loss | -0.00265 | -| std | 0.164 | -| value_loss | 1.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6769 | -| time_elapsed | 45147 | -| total_timesteps | 866432 | -| train/ | | -| approx_kl | 0.009013312 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 0.391 | -| explained_variance | -68.6 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 67680 | -| policy_gradient_loss | -0.00196 | -| std | 0.164 | -| value_loss | 7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6770 | -| time_elapsed | 45151 | -| total_timesteps | 866560 | -| train/ | | -| approx_kl | 0.022077512 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.391 | -| explained_variance | -22.6 | -| learning_rate | 0.0003 | -| loss | 0.000734 | -| n_updates | 67690 | -| policy_gradient_loss | -0.000534 | -| std | 0.164 | -| value_loss | 7.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6771 | -| time_elapsed | 45153 | -| total_timesteps | 866688 | -| train/ | | -| approx_kl | 0.006919457 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 0.391 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 67700 | -| policy_gradient_loss | 0.000362 | -| std | 0.164 | -| value_loss | 1.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6772 | -| time_elapsed | 45157 | -| total_timesteps | 866816 | -| train/ | | -| approx_kl | 0.005530563 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | 0.391 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.000441 | -| n_updates | 67710 | -| policy_gradient_loss | -0.000132 | -| std | 0.164 | -| value_loss | 1.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.55 | -| time/ | | -| fps | 19 | -| iterations | 6773 | -| time_elapsed | 45160 | -| total_timesteps | 866944 | -| train/ | | -| approx_kl | 0.020318646 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 0.392 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.0076 | -| n_updates | 67720 | -| policy_gradient_loss | -0.00564 | -| std | 0.163 | -| value_loss | 5.07e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6774 | -| time_elapsed | 45163 | -| total_timesteps | 867072 | -| train/ | | -| approx_kl | 3.4574885e-05 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 0.395 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 67730 | -| policy_gradient_loss | -0.000614 | -| std | 0.162 | -| value_loss | 3.63e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6775 | -| time_elapsed | 45169 | -| total_timesteps | 867200 | -| train/ | | -| approx_kl | 0.003157591 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.402 | -| explained_variance | 0.579 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 67740 | -| policy_gradient_loss | -0.000371 | -| std | 0.161 | -| value_loss | 0.00759 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6776 | -| time_elapsed | 45173 | -| total_timesteps | 867328 | -| train/ | | -| approx_kl | 0.053559907 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 0.407 | -| explained_variance | -56.4 | -| learning_rate | 0.0003 | -| loss | -0.00577 | -| n_updates | 67750 | -| policy_gradient_loss | -0.00487 | -| std | 0.161 | -| value_loss | 1.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6777 | -| time_elapsed | 45176 | -| total_timesteps | 867456 | -| train/ | | -| approx_kl | 0.020494157 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 0.409 | -| explained_variance | -50.6 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 67760 | -| policy_gradient_loss | -0.00489 | -| std | 0.161 | -| value_loss | 5.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6778 | -| time_elapsed | 45179 | -| total_timesteps | 867584 | -| train/ | | -| approx_kl | 0.026579436 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.409 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 67770 | -| policy_gradient_loss | -0.00402 | -| std | 0.161 | -| value_loss | 6.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6779 | -| time_elapsed | 45181 | -| total_timesteps | 867712 | -| train/ | | -| approx_kl | 0.019466478 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.409 | -| explained_variance | -2.07 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 67780 | -| policy_gradient_loss | -0.00187 | -| std | 0.161 | -| value_loss | 1.13e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6780 | -| time_elapsed | 45186 | -| total_timesteps | 867840 | -| train/ | | -| approx_kl | 0.0046373303 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.41 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 67790 | -| policy_gradient_loss | -0.000948 | -| std | 0.161 | -| value_loss | 3.54e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.57 | -| time/ | | -| fps | 19 | -| iterations | 6781 | -| time_elapsed | 45189 | -| total_timesteps | 867968 | -| train/ | | -| approx_kl | 0.00093788235 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.411 | -| explained_variance | 0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 67800 | -| policy_gradient_loss | -0.00218 | -| std | 0.16 | -| value_loss | 4.07e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6782 | -| time_elapsed | 45192 | -| total_timesteps | 868096 | -| train/ | | -| approx_kl | 0.005675311 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.412 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 67810 | -| policy_gradient_loss | -0.00181 | -| std | 0.16 | -| value_loss | 2.14e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6783 | -| time_elapsed | 45199 | -| total_timesteps | 868224 | -| train/ | | -| approx_kl | 0.028871845 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | 0.558 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 67820 | -| policy_gradient_loss | -0.00772 | -| std | 0.16 | -| value_loss | 0.00795 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6784 | -| time_elapsed | 45203 | -| total_timesteps | 868352 | -| train/ | | -| approx_kl | 0.024064098 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.415 | -| explained_variance | -1.49 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 67830 | -| policy_gradient_loss | -0.00304 | -| std | 0.16 | -| value_loss | 3.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6785 | -| time_elapsed | 45206 | -| total_timesteps | 868480 | -| train/ | | -| approx_kl | 0.012359627 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.416 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 67840 | -| policy_gradient_loss | -0.00016 | -| std | 0.16 | -| value_loss | 4.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6786 | -| time_elapsed | 45209 | -| total_timesteps | 868608 | -| train/ | | -| approx_kl | 0.01261393 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.416 | -| explained_variance | 0.00597 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 67850 | -| policy_gradient_loss | -0.00486 | -| std | 0.16 | -| value_loss | 5.45e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6787 | -| time_elapsed | 45211 | -| total_timesteps | 868736 | -| train/ | | -| approx_kl | 0.044928417 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 0.415 | -| explained_variance | -0.28 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 67860 | -| policy_gradient_loss | -0.0183 | -| std | 0.16 | -| value_loss | 2.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6788 | -| time_elapsed | 45214 | -| total_timesteps | 868864 | -| train/ | | -| approx_kl | 0.006835186 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | -0.69 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 67870 | -| policy_gradient_loss | -0.0011 | -| std | 0.16 | -| value_loss | 2.95e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.58 | -| time/ | | -| fps | 19 | -| iterations | 6789 | -| time_elapsed | 45217 | -| total_timesteps | 868992 | -| train/ | | -| approx_kl | 0.015392922 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 67880 | -| policy_gradient_loss | -0.00902 | -| std | 0.16 | -| value_loss | 5.76e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6790 | -| time_elapsed | 45221 | -| total_timesteps | 869120 | -| train/ | | -| approx_kl | 0.01174612 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | -0.392 | -| learning_rate | 0.0003 | -| loss | -0.00079 | -| n_updates | 67890 | -| policy_gradient_loss | -0.000608 | -| std | 0.16 | -| value_loss | 1.52e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6791 | -| time_elapsed | 45230 | -| total_timesteps | 869248 | -| train/ | | -| approx_kl | 0.038615365 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.413 | -| explained_variance | 0.62 | -| learning_rate | 0.0003 | -| loss | 0.00338 | -| n_updates | 67900 | -| policy_gradient_loss | -0.000802 | -| std | 0.16 | -| value_loss | 0.00548 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6792 | -| time_elapsed | 45234 | -| total_timesteps | 869376 | -| train/ | | -| approx_kl | 0.02863276 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | -3.93 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 67910 | -| policy_gradient_loss | -0.00253 | -| std | 0.16 | -| value_loss | 2.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6793 | -| time_elapsed | 45237 | -| total_timesteps | 869504 | -| train/ | | -| approx_kl | 0.004272783 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | -0.813 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 67920 | -| policy_gradient_loss | -0.00116 | -| std | 0.16 | -| value_loss | 5.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6794 | -| time_elapsed | 45241 | -| total_timesteps | 869632 | -| train/ | | -| approx_kl | 0.020639952 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.414 | -| explained_variance | -0.0702 | -| learning_rate | 0.0003 | -| loss | -0.000736 | -| n_updates | 67930 | -| policy_gradient_loss | -0.00262 | -| std | 0.16 | -| value_loss | 4.34e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6795 | -| time_elapsed | 45244 | -| total_timesteps | 869760 | -| train/ | | -| approx_kl | 0.0007138201 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 0.416 | -| explained_variance | -0.622 | -| learning_rate | 0.0003 | -| loss | -0.000571 | -| n_updates | 67940 | -| policy_gradient_loss | -0.000325 | -| std | 0.159 | -| value_loss | 1.18e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.59 | -| time/ | | -| fps | 19 | -| iterations | 6796 | -| time_elapsed | 45248 | -| total_timesteps | 869888 | -| train/ | | -| approx_kl | 0.039970912 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 0.419 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 67950 | -| policy_gradient_loss | -0.00689 | -| std | 0.159 | -| value_loss | 6.82e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6797 | -| time_elapsed | 45252 | -| total_timesteps | 870016 | -| train/ | | -| approx_kl | 0.02429156 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 0.42 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | -0.00592 | -| n_updates | 67960 | -| policy_gradient_loss | -0.0071 | -| std | 0.159 | -| value_loss | 6.97e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6798 | -| time_elapsed | 45261 | -| total_timesteps | 870144 | -| train/ | | -| approx_kl | 0.047182616 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 0.421 | -| explained_variance | 0.748 | -| learning_rate | 0.0003 | -| loss | -0.00704 | -| n_updates | 67970 | -| policy_gradient_loss | -0.00662 | -| std | 0.159 | -| value_loss | 0.00236 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6799 | -| time_elapsed | 45265 | -| total_timesteps | 870272 | -| train/ | | -| approx_kl | 0.014340099 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 0.422 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 67980 | -| policy_gradient_loss | -0.00551 | -| std | 0.159 | -| value_loss | 4.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6800 | -| time_elapsed | 45268 | -| total_timesteps | 870400 | -| train/ | | -| approx_kl | 0.012630187 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.423 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 67990 | -| policy_gradient_loss | -0.00165 | -| std | 0.158 | -| value_loss | 1.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6801 | -| time_elapsed | 45272 | -| total_timesteps | 870528 | -| train/ | | -| approx_kl | 0.006204218 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.424 | -| explained_variance | -0.577 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 68000 | -| policy_gradient_loss | -0.000621 | -| std | 0.158 | -| value_loss | 9.96e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6802 | -| time_elapsed | 45276 | -| total_timesteps | 870656 | -| train/ | | -| approx_kl | 0.0012970977 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.424 | -| explained_variance | -0.574 | -| learning_rate | 0.0003 | -| loss | -0.000374 | -| n_updates | 68010 | -| policy_gradient_loss | 5.98e-05 | -| std | 0.158 | -| value_loss | 3.45e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6803 | -| time_elapsed | 45279 | -| total_timesteps | 870784 | -| train/ | | -| approx_kl | 0.013271274 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.423 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 68020 | -| policy_gradient_loss | -0.00194 | -| std | 0.158 | -| value_loss | 5.75e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.61 | -| time/ | | -| fps | 19 | -| iterations | 6804 | -| time_elapsed | 45282 | -| total_timesteps | 870912 | -| train/ | | -| approx_kl | 0.0010722904 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.423 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | -0.000308 | -| n_updates | 68030 | -| policy_gradient_loss | -0.000164 | -| std | 0.158 | -| value_loss | 2.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6805 | -| time_elapsed | 45286 | -| total_timesteps | 871040 | -| train/ | | -| approx_kl | 0.010911504 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.424 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 68040 | -| policy_gradient_loss | -0.000961 | -| std | 0.158 | -| value_loss | 1.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6806 | -| time_elapsed | 45293 | -| total_timesteps | 871168 | -| train/ | | -| approx_kl | 0.047200076 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 0.425 | -| explained_variance | 0.756 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 68050 | -| policy_gradient_loss | -0.0091 | -| std | 0.158 | -| value_loss | 0.00267 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6807 | -| time_elapsed | 45296 | -| total_timesteps | 871296 | -| train/ | | -| approx_kl | 0.012474885 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.426 | -| explained_variance | -0.848 | -| learning_rate | 0.0003 | -| loss | 0.00115 | -| n_updates | 68060 | -| policy_gradient_loss | 0.00417 | -| std | 0.158 | -| value_loss | 1.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6808 | -| time_elapsed | 45299 | -| total_timesteps | 871424 | -| train/ | | -| approx_kl | 0.010680386 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.426 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.000703 | -| n_updates | 68070 | -| policy_gradient_loss | -3.78e-05 | -| std | 0.158 | -| value_loss | 3.79e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6809 | -| time_elapsed | 45302 | -| total_timesteps | 871552 | -| train/ | | -| approx_kl | 0.0015514502 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | 0.426 | -| explained_variance | 0.0076 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 68080 | -| policy_gradient_loss | -0.000985 | -| std | 0.158 | -| value_loss | 3.25e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6810 | -| time_elapsed | 45307 | -| total_timesteps | 871680 | -| train/ | | -| approx_kl | 0.009329449 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | 0.0159 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 68090 | -| policy_gradient_loss | -0.000998 | -| std | 0.158 | -| value_loss | 3.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6811 | -| time_elapsed | 45311 | -| total_timesteps | 871808 | -| train/ | | -| approx_kl | 0.007629035 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | -0.233 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 68100 | -| policy_gradient_loss | 0.000108 | -| std | 0.158 | -| value_loss | 1.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.62 | -| time/ | | -| fps | 19 | -| iterations | 6812 | -| time_elapsed | 45315 | -| total_timesteps | 871936 | -| train/ | | -| approx_kl | 0.005107491 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 68110 | -| policy_gradient_loss | -0.00101 | -| std | 0.158 | -| value_loss | 2.19e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6813 | -| time_elapsed | 45317 | -| total_timesteps | 872064 | -| train/ | | -| approx_kl | 0.008669474 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | -0.00616 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 68120 | -| policy_gradient_loss | -0.00242 | -| std | 0.158 | -| value_loss | 6.07e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6814 | -| time_elapsed | 45323 | -| total_timesteps | 872192 | -| train/ | | -| approx_kl | 0.05562332 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | 0.782 | -| learning_rate | 0.0003 | -| loss | 0.00272 | -| n_updates | 68130 | -| policy_gradient_loss | -0.000414 | -| std | 0.158 | -| value_loss | 0.00144 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6815 | -| time_elapsed | 45327 | -| total_timesteps | 872320 | -| train/ | | -| approx_kl | 0.035830546 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 68140 | -| policy_gradient_loss | -0.016 | -| std | 0.158 | -| value_loss | 3.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6816 | -| time_elapsed | 45331 | -| total_timesteps | 872448 | -| train/ | | -| approx_kl | 0.006887137 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 68150 | -| policy_gradient_loss | -0.0025 | -| std | 0.158 | -| value_loss | 3.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6817 | -| time_elapsed | 45335 | -| total_timesteps | 872576 | -| train/ | | -| approx_kl | 0.019722125 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | -0.689 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 68160 | -| policy_gradient_loss | -0.00131 | -| std | 0.158 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6818 | -| time_elapsed | 45338 | -| total_timesteps | 872704 | -| train/ | | -| approx_kl | 0.032702908 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.427 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 68170 | -| policy_gradient_loss | -0.0102 | -| std | 0.158 | -| value_loss | 1.34e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6819 | -| time_elapsed | 45341 | -| total_timesteps | 872832 | -| train/ | | -| approx_kl | 0.0013693026 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.427 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 68180 | -| policy_gradient_loss | -0.0014 | -| std | 0.158 | -| value_loss | 5.99e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6820 | -| time_elapsed | 45345 | -| total_timesteps | 872960 | -| train/ | | -| approx_kl | 0.02454335 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 68190 | -| policy_gradient_loss | -0.00999 | -| std | 0.158 | -| value_loss | 2.69e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6821 | -| time_elapsed | 45349 | -| total_timesteps | 873088 | -| train/ | | -| approx_kl | 0.0283472 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 68200 | -| policy_gradient_loss | -0.0103 | -| std | 0.158 | -| value_loss | 1.42e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6822 | -| time_elapsed | 45355 | -| total_timesteps | 873216 | -| train/ | | -| approx_kl | 0.048293807 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 68210 | -| policy_gradient_loss | -0.0023 | -| std | 0.158 | -| value_loss | 0.00239 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6823 | -| time_elapsed | 45358 | -| total_timesteps | 873344 | -| train/ | | -| approx_kl | 0.010364017 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 68220 | -| policy_gradient_loss | 0.0047 | -| std | 0.158 | -| value_loss | 5.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6824 | -| time_elapsed | 45362 | -| total_timesteps | 873472 | -| train/ | | -| approx_kl | 0.015300475 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | -0.603 | -| learning_rate | 0.0003 | -| loss | 0.00234 | -| n_updates | 68230 | -| policy_gradient_loss | 0.000109 | -| std | 0.158 | -| value_loss | 4.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6825 | -| time_elapsed | 45366 | -| total_timesteps | 873600 | -| train/ | | -| approx_kl | 0.017408581 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 0.428 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 68240 | -| policy_gradient_loss | -0.00225 | -| std | 0.158 | -| value_loss | 7.34e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6826 | -| time_elapsed | 45369 | -| total_timesteps | 873728 | -| train/ | | -| approx_kl | 0.00050514285 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | 0.429 | -| explained_variance | -0.0932 | -| learning_rate | 0.0003 | -| loss | -0.000254 | -| n_updates | 68250 | -| policy_gradient_loss | -0.000104 | -| std | 0.157 | -| value_loss | 1.3e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6827 | -| time_elapsed | 45373 | -| total_timesteps | 873856 | -| train/ | | -| approx_kl | 0.008017499 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.431 | -| explained_variance | -0.0816 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 68260 | -| policy_gradient_loss | -0.00237 | -| std | 0.157 | -| value_loss | 1.12e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.63 | -| time/ | | -| fps | 19 | -| iterations | 6828 | -| time_elapsed | 45378 | -| total_timesteps | 873984 | -| train/ | | -| approx_kl | 0.0021039955 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 0.432 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 68270 | -| policy_gradient_loss | -0.000777 | -| std | 0.157 | -| value_loss | 1.12e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6829 | -| time_elapsed | 45381 | -| total_timesteps | 874112 | -| train/ | | -| approx_kl | 0.006192712 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 0.431 | -| explained_variance | -0.00464 | -| learning_rate | 0.0003 | -| loss | -8.94e-05 | -| n_updates | 68280 | -| policy_gradient_loss | -0.00015 | -| std | 0.157 | -| value_loss | 9.32e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6830 | -| time_elapsed | 45390 | -| total_timesteps | 874240 | -| train/ | | -| approx_kl | 0.03246206 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.431 | -| explained_variance | 0.722 | -| learning_rate | 0.0003 | -| loss | 0.000192 | -| n_updates | 68290 | -| policy_gradient_loss | -0.00114 | -| std | 0.157 | -| value_loss | 0.00388 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6831 | -| time_elapsed | 45394 | -| total_timesteps | 874368 | -| train/ | | -| approx_kl | 0.04132396 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 0.433 | -| explained_variance | -21.4 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 68300 | -| policy_gradient_loss | -0.005 | -| std | 0.157 | -| value_loss | 3.35e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6832 | -| time_elapsed | 45398 | -| total_timesteps | 874496 | -| train/ | | -| approx_kl | 0.0016066171 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.434 | -| explained_variance | -29.2 | -| learning_rate | 0.0003 | -| loss | -0.00623 | -| n_updates | 68310 | -| policy_gradient_loss | -0.00433 | -| std | 0.157 | -| value_loss | 1.37e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6833 | -| time_elapsed | 45401 | -| total_timesteps | 874624 | -| train/ | | -| approx_kl | 0.07034692 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.435 | -| explained_variance | -6.31 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 68320 | -| policy_gradient_loss | -0.00877 | -| std | 0.157 | -| value_loss | 3.66e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6834 | -| time_elapsed | 45405 | -| total_timesteps | 874752 | -| train/ | | -| approx_kl | 0.0017539817 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.435 | -| explained_variance | -0.38 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 68330 | -| policy_gradient_loss | -0.00174 | -| std | 0.157 | -| value_loss | 3.73e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.64 | -| time/ | | -| fps | 19 | -| iterations | 6835 | -| time_elapsed | 45408 | -| total_timesteps | 874880 | -| train/ | | -| approx_kl | 0.016823748 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.434 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00516 | -| n_updates | 68340 | -| policy_gradient_loss | -0.00461 | -| std | 0.157 | -| value_loss | 1.53e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6836 | -| time_elapsed | 45411 | -| total_timesteps | 875008 | -| train/ | | -| approx_kl | 0.03198658 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 0.434 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 68350 | -| policy_gradient_loss | -0.00232 | -| std | 0.157 | -| value_loss | 8.36e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6837 | -| time_elapsed | 45421 | -| total_timesteps | 875136 | -| train/ | | -| approx_kl | 0.032074213 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.433 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.00377 | -| n_updates | 68360 | -| policy_gradient_loss | -0.00329 | -| std | 0.157 | -| value_loss | 0.00107 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6838 | -| time_elapsed | 45425 | -| total_timesteps | 875264 | -| train/ | | -| approx_kl | 0.02275502 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.434 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 68370 | -| policy_gradient_loss | -0.00653 | -| std | 0.157 | -| value_loss | 7.61e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6839 | -| time_elapsed | 45429 | -| total_timesteps | 875392 | -| train/ | | -| approx_kl | 0.0021305508 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.435 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 68380 | -| policy_gradient_loss | -0.0008 | -| std | 0.156 | -| value_loss | 2.71e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6840 | -| time_elapsed | 45431 | -| total_timesteps | 875520 | -| train/ | | -| approx_kl | 0.0013803681 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 0.439 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | -0.000694 | -| n_updates | 68390 | -| policy_gradient_loss | -0.000421 | -| std | 0.156 | -| value_loss | 1.29e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6841 | -| time_elapsed | 45434 | -| total_timesteps | 875648 | -| train/ | | -| approx_kl | 0.009160484 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | -0.378 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 68400 | -| policy_gradient_loss | -0.00472 | -| std | 0.155 | -| value_loss | 3.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6842 | -| time_elapsed | 45437 | -| total_timesteps | 875776 | -| train/ | | -| approx_kl | 0.016779471 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 0.443 | -| explained_variance | 0.00786 | -| learning_rate | 0.0003 | -| loss | 0.000276 | -| n_updates | 68410 | -| policy_gradient_loss | 0.00113 | -| std | 0.155 | -| value_loss | 4.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6843 | -| time_elapsed | 45440 | -| total_timesteps | 875904 | -| train/ | | -| approx_kl | 0.02324459 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -0.767 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 68420 | -| policy_gradient_loss | -0.00181 | -| std | 0.155 | -| value_loss | 6.33e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6844 | -| time_elapsed | 45443 | -| total_timesteps | 876032 | -| train/ | | -| approx_kl | 0.007724451 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -0.502 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 68430 | -| policy_gradient_loss | -0.00472 | -| std | 0.155 | -| value_loss | 1.73e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6845 | -| time_elapsed | 45450 | -| total_timesteps | 876160 | -| train/ | | -| approx_kl | 0.021554112 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -0.487 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 68440 | -| policy_gradient_loss | -0.00447 | -| std | 0.155 | -| value_loss | 0.00169 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6846 | -| time_elapsed | 45454 | -| total_timesteps | 876288 | -| train/ | | -| approx_kl | 0.00031056255 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.443 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | -6.92e-05 | -| n_updates | 68450 | -| policy_gradient_loss | 0.000421 | -| std | 0.155 | -| value_loss | 8.72e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6847 | -| time_elapsed | 45457 | -| total_timesteps | 876416 | -| train/ | | -| approx_kl | 0.017859884 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 0.443 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | -0.000159 | -| n_updates | 68460 | -| policy_gradient_loss | -0.000332 | -| std | 0.155 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6848 | -| time_elapsed | 45461 | -| total_timesteps | 876544 | -| train/ | | -| approx_kl | 0.007457049 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.443 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 68470 | -| policy_gradient_loss | 0.000479 | -| std | 0.155 | -| value_loss | 9.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6849 | -| time_elapsed | 45465 | -| total_timesteps | 876672 | -| train/ | | -| approx_kl | 0.03311836 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | 0.0167 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 68480 | -| policy_gradient_loss | -0.0115 | -| std | 0.155 | -| value_loss | 9.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6850 | -| time_elapsed | 45467 | -| total_timesteps | 876800 | -| train/ | | -| approx_kl | 0.050992902 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -0.43 | -| learning_rate | 0.0003 | -| loss | -0.00796 | -| n_updates | 68490 | -| policy_gradient_loss | -0.0109 | -| std | 0.155 | -| value_loss | 2.94e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6851 | -| time_elapsed | 45472 | -| total_timesteps | 876928 | -| train/ | | -| approx_kl | 0.0031245695 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 0.445 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 68500 | -| policy_gradient_loss | 0.000641 | -| std | 0.155 | -| value_loss | 4.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6852 | -| time_elapsed | 45474 | -| total_timesteps | 877056 | -| train/ | | -| approx_kl | 0.010917929 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 68510 | -| policy_gradient_loss | -0.000907 | -| std | 0.155 | -| value_loss | 7.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6853 | -| time_elapsed | 45479 | -| total_timesteps | 877184 | -| train/ | | -| approx_kl | 0.047558535 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 0.448 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 68520 | -| policy_gradient_loss | -0.00528 | -| std | 0.155 | -| value_loss | 0.00143 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6854 | -| time_elapsed | 45482 | -| total_timesteps | 877312 | -| train/ | | -| approx_kl | 0.0010219906 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.449 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | -0.00052 | -| n_updates | 68530 | -| policy_gradient_loss | -0.000249 | -| std | 0.154 | -| value_loss | 5.96e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6855 | -| time_elapsed | 45485 | -| total_timesteps | 877440 | -| train/ | | -| approx_kl | 0.02843843 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 0.452 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 68540 | -| policy_gradient_loss | -0.00344 | -| std | 0.154 | -| value_loss | 4.77e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6856 | -| time_elapsed | 45488 | -| total_timesteps | 877568 | -| train/ | | -| approx_kl | 0.0024403953 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 0.453 | -| explained_variance | -0.0813 | -| learning_rate | 0.0003 | -| loss | -0.000304 | -| n_updates | 68550 | -| policy_gradient_loss | -8.86e-05 | -| std | 0.154 | -| value_loss | 4.14e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6857 | -| time_elapsed | 45492 | -| total_timesteps | 877696 | -| train/ | | -| approx_kl | 0.004759265 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.452 | -| explained_variance | -0.461 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 68560 | -| policy_gradient_loss | -0.00604 | -| std | 0.154 | -| value_loss | 9.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6858 | -| time_elapsed | 45496 | -| total_timesteps | 877824 | -| train/ | | -| approx_kl | 0.020013414 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 0.451 | -| explained_variance | 0.0156 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 68570 | -| policy_gradient_loss | -0.00474 | -| std | 0.154 | -| value_loss | 2.94e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6859 | -| time_elapsed | 45500 | -| total_timesteps | 877952 | -| train/ | | -| approx_kl | 0.02732819 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.451 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | 0.00228 | -| n_updates | 68580 | -| policy_gradient_loss | -0.00191 | -| std | 0.154 | -| value_loss | 6.23e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6860 | -| time_elapsed | 45504 | -| total_timesteps | 878080 | -| train/ | | -| approx_kl | 0.02819917 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.451 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 68590 | -| policy_gradient_loss | -0.0105 | -| std | 0.154 | -| value_loss | 2.16e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6861 | -| time_elapsed | 45512 | -| total_timesteps | 878208 | -| train/ | | -| approx_kl | 0.0005954262 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.45 | -| explained_variance | 0.692 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 68600 | -| policy_gradient_loss | -0.00792 | -| std | 0.154 | -| value_loss | 0.00656 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6862 | -| time_elapsed | 45517 | -| total_timesteps | 878336 | -| train/ | | -| approx_kl | 0.0029694433 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.448 | -| explained_variance | 0.00228 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 68610 | -| policy_gradient_loss | 0.00134 | -| std | 0.155 | -| value_loss | 5.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6863 | -| time_elapsed | 45519 | -| total_timesteps | 878464 | -| train/ | | -| approx_kl | 0.003994883 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | -4.6 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 68620 | -| policy_gradient_loss | -0.00114 | -| std | 0.155 | -| value_loss | 4.2e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6864 | -| time_elapsed | 45522 | -| total_timesteps | 878592 | -| train/ | | -| approx_kl | 0.0014428985 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -0.448 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 68630 | -| policy_gradient_loss | 0.000253 | -| std | 0.155 | -| value_loss | 5.89e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6865 | -| time_elapsed | 45525 | -| total_timesteps | 878720 | -| train/ | | -| approx_kl | 0.0017621242 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 0.443 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.000814 | -| n_updates | 68640 | -| policy_gradient_loss | -0.000308 | -| std | 0.156 | -| value_loss | 1.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6866 | -| time_elapsed | 45529 | -| total_timesteps | 878848 | -| train/ | | -| approx_kl | 0.036746662 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 68650 | -| policy_gradient_loss | -0.00531 | -| std | 0.156 | -| value_loss | 9.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6867 | -| time_elapsed | 45532 | -| total_timesteps | 878976 | -| train/ | | -| approx_kl | 0.018463887 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.436 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 68660 | -| policy_gradient_loss | -0.0136 | -| std | 0.156 | -| value_loss | 9.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6868 | -| time_elapsed | 45535 | -| total_timesteps | 879104 | -| train/ | | -| approx_kl | 0.004672586 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 0.436 | -| explained_variance | -0.403 | -| learning_rate | 0.0003 | -| loss | -0.000269 | -| n_updates | 68670 | -| policy_gradient_loss | -0.00013 | -| std | 0.156 | -| value_loss | 2.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6869 | -| time_elapsed | 45545 | -| total_timesteps | 879232 | -| train/ | | -| approx_kl | 0.019731766 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | 0.914 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 68680 | -| policy_gradient_loss | -0.0076 | -| std | 0.156 | -| value_loss | 0.000379 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6870 | -| time_elapsed | 45548 | -| total_timesteps | 879360 | -| train/ | | -| approx_kl | 0.017655462 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.439 | -| explained_variance | -0.786 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 68690 | -| policy_gradient_loss | -0.00543 | -| std | 0.156 | -| value_loss | 6.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6871 | -| time_elapsed | 45551 | -| total_timesteps | 879488 | -| train/ | | -| approx_kl | 0.025936395 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -10.7 | -| learning_rate | 0.0003 | -| loss | -0.00737 | -| n_updates | 68700 | -| policy_gradient_loss | -0.00663 | -| std | 0.156 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6872 | -| time_elapsed | 45554 | -| total_timesteps | 879616 | -| train/ | | -| approx_kl | 0.036263242 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -2.79 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 68710 | -| policy_gradient_loss | -0.00476 | -| std | 0.156 | -| value_loss | 2.81e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6873 | -| time_elapsed | 45558 | -| total_timesteps | 879744 | -| train/ | | -| approx_kl | 0.007120544 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -0.97 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 68720 | -| policy_gradient_loss | 7.25e-05 | -| std | 0.156 | -| value_loss | 8.59e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6874 | -| time_elapsed | 45560 | -| total_timesteps | 879872 | -| train/ | | -| approx_kl | 0.031818878 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 0.437 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 68730 | -| policy_gradient_loss | -0.0111 | -| std | 0.156 | -| value_loss | 3.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6875 | -| time_elapsed | 45563 | -| total_timesteps | 880000 | -| train/ | | -| approx_kl | 0.026389018 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.436 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 68740 | -| policy_gradient_loss | -0.00721 | -| std | 0.156 | -| value_loss | 2e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6876 | -| time_elapsed | 45566 | -| total_timesteps | 880128 | -| train/ | | -| approx_kl | 0.0051061213 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.436 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 68750 | -| policy_gradient_loss | -0.00276 | -| std | 0.156 | -| value_loss | 1.05e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6877 | -| time_elapsed | 45574 | -| total_timesteps | 880256 | -| train/ | | -| approx_kl | 0.054998204 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 0.436 | -| explained_variance | -1.97 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 68760 | -| policy_gradient_loss | -0.0156 | -| std | 0.156 | -| value_loss | 0.00191 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6878 | -| time_elapsed | 45576 | -| total_timesteps | 880384 | -| train/ | | -| approx_kl | 0.02073797 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.437 | -| explained_variance | -0.258 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 68770 | -| policy_gradient_loss | -0.00471 | -| std | 0.156 | -| value_loss | 3.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6879 | -| time_elapsed | 45580 | -| total_timesteps | 880512 | -| train/ | | -| approx_kl | 0.013515161 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.437 | -| explained_variance | -3.55 | -| learning_rate | 0.0003 | -| loss | -8.55e-05 | -| n_updates | 68780 | -| policy_gradient_loss | -0.000239 | -| std | 0.156 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6880 | -| time_elapsed | 45583 | -| total_timesteps | 880640 | -| train/ | | -| approx_kl | 0.032867104 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.000555 | -| n_updates | 68790 | -| policy_gradient_loss | -0.003 | -| std | 0.156 | -| value_loss | 7.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6881 | -| time_elapsed | 45587 | -| total_timesteps | 880768 | -| train/ | | -| approx_kl | 0.033301465 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 68800 | -| policy_gradient_loss | -0.00688 | -| std | 0.156 | -| value_loss | 1.05e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.69 | -| time/ | | -| fps | 19 | -| iterations | 6882 | -| time_elapsed | 45590 | -| total_timesteps | 880896 | -| train/ | | -| approx_kl | 0.0033333274 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.437 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 68810 | -| policy_gradient_loss | 0.000774 | -| std | 0.156 | -| value_loss | 2.32e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6883 | -| time_elapsed | 45594 | -| total_timesteps | 881024 | -| train/ | | -| approx_kl | 0.017156404 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.435 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.00288 | -| n_updates | 68820 | -| policy_gradient_loss | -0.000455 | -| std | 0.157 | -| value_loss | 7.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6884 | -| time_elapsed | 45600 | -| total_timesteps | 881152 | -| train/ | | -| approx_kl | 0.01093315 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.434 | -| explained_variance | 0.712 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 68830 | -| policy_gradient_loss | -0.000129 | -| std | 0.157 | -| value_loss | 0.0056 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6885 | -| time_elapsed | 45603 | -| total_timesteps | 881280 | -| train/ | | -| approx_kl | 0.031023033 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.433 | -| explained_variance | 0.0422 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 68840 | -| policy_gradient_loss | -0.00986 | -| std | 0.157 | -| value_loss | 1.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6886 | -| time_elapsed | 45606 | -| total_timesteps | 881408 | -| train/ | | -| approx_kl | 0.0034956755 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.433 | -| explained_variance | -1.95 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 68850 | -| policy_gradient_loss | -0.000193 | -| std | 0.157 | -| value_loss | 1.37e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6887 | -| time_elapsed | 45610 | -| total_timesteps | 881536 | -| train/ | | -| approx_kl | 0.0006201719 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.435 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 68860 | -| policy_gradient_loss | -0.00177 | -| std | 0.156 | -| value_loss | 2.81e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6888 | -| time_elapsed | 45614 | -| total_timesteps | 881664 | -| train/ | | -| approx_kl | 0.00856195 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 0.44 | -| explained_variance | -0.00262 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 68870 | -| policy_gradient_loss | -0.00216 | -| std | 0.156 | -| value_loss | 8.31e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6889 | -| time_elapsed | 45618 | -| total_timesteps | 881792 | -| train/ | | -| approx_kl | 0.0013659075 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.441 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | -0.000726 | -| n_updates | 68880 | -| policy_gradient_loss | -0.000122 | -| std | 0.156 | -| value_loss | 5.69e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6890 | -| time_elapsed | 45621 | -| total_timesteps | 881920 | -| train/ | | -| approx_kl | 0.0061218743 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.439 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.000814 | -| n_updates | 68890 | -| policy_gradient_loss | 0.000163 | -| std | 0.156 | -| value_loss | 5.36e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6891 | -| time_elapsed | 45625 | -| total_timesteps | 882048 | -| train/ | | -| approx_kl | 0.007558741 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -0.000153 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 68900 | -| policy_gradient_loss | 0.00142 | -| std | 0.156 | -| value_loss | 4.3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6892 | -| time_elapsed | 45631 | -| total_timesteps | 882176 | -| train/ | | -| approx_kl | 0.01770284 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 68910 | -| policy_gradient_loss | -0.00336 | -| std | 0.156 | -| value_loss | 0.000144 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6893 | -| time_elapsed | 45635 | -| total_timesteps | 882304 | -| train/ | | -| approx_kl | 0.052055467 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -90.3 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 68920 | -| policy_gradient_loss | -0.00526 | -| std | 0.156 | -| value_loss | 3.81e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6894 | -| time_elapsed | 45638 | -| total_timesteps | 882432 | -| train/ | | -| approx_kl | 0.01886918 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 0.438 | -| explained_variance | -9.18 | -| learning_rate | 0.0003 | -| loss | -4.73e-05 | -| n_updates | 68930 | -| policy_gradient_loss | -0.000944 | -| std | 0.156 | -| value_loss | 5.83e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6895 | -| time_elapsed | 45641 | -| total_timesteps | 882560 | -| train/ | | -| approx_kl | 0.003639795 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.439 | -| explained_variance | -0.496 | -| learning_rate | 0.0003 | -| loss | -0.00543 | -| n_updates | 68940 | -| policy_gradient_loss | -0.00414 | -| std | 0.156 | -| value_loss | 2.83e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6896 | -| time_elapsed | 45644 | -| total_timesteps | 882688 | -| train/ | | -| approx_kl | 0.017670516 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.44 | -| explained_variance | 0.0196 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 68950 | -| policy_gradient_loss | -0.00715 | -| std | 0.156 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6897 | -| time_elapsed | 45646 | -| total_timesteps | 882816 | -| train/ | | -| approx_kl | 0.034006704 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 0.441 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 68960 | -| policy_gradient_loss | -0.00794 | -| std | 0.156 | -| value_loss | 3.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.66 | -| time/ | | -| fps | 19 | -| iterations | 6898 | -| time_elapsed | 45650 | -| total_timesteps | 882944 | -| train/ | | -| approx_kl | 0.009164185 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.441 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 68970 | -| policy_gradient_loss | -0.00075 | -| std | 0.156 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6899 | -| time_elapsed | 45654 | -| total_timesteps | 883072 | -| train/ | | -| approx_kl | 0.016183116 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.0006 | -| n_updates | 68980 | -| policy_gradient_loss | -0.00112 | -| std | 0.156 | -| value_loss | 5.98e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6900 | -| time_elapsed | 45660 | -| total_timesteps | 883200 | -| train/ | | -| approx_kl | 0.027388059 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | 0.666 | -| learning_rate | 0.0003 | -| loss | 0.00195 | -| n_updates | 68990 | -| policy_gradient_loss | -0.00201 | -| std | 0.155 | -| value_loss | 0.00849 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6901 | -| time_elapsed | 45664 | -| total_timesteps | 883328 | -| train/ | | -| approx_kl | 0.011101466 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | -17.1 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 69000 | -| policy_gradient_loss | -0.000167 | -| std | 0.155 | -| value_loss | 1.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6902 | -| time_elapsed | 45667 | -| total_timesteps | 883456 | -| train/ | | -| approx_kl | 0.021176709 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | -61.7 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 69010 | -| policy_gradient_loss | -0.0016 | -| std | 0.155 | -| value_loss | 3.47e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6903 | -| time_elapsed | 45670 | -| total_timesteps | 883584 | -| train/ | | -| approx_kl | 0.007540081 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | 0.00379 | -| learning_rate | 0.0003 | -| loss | -0.00683 | -| n_updates | 69020 | -| policy_gradient_loss | -0.00359 | -| std | 0.155 | -| value_loss | 1.45e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6904 | -| time_elapsed | 45674 | -| total_timesteps | 883712 | -| train/ | | -| approx_kl | 0.018955937 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.443 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 69030 | -| policy_gradient_loss | -0.00184 | -| std | 0.155 | -| value_loss | 2.57e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6905 | -| time_elapsed | 45679 | -| total_timesteps | 883840 | -| train/ | | -| approx_kl | 0.0032876646 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | 0.0174 | -| learning_rate | 0.0003 | -| loss | -0.000777 | -| n_updates | 69040 | -| policy_gradient_loss | 0.000973 | -| std | 0.155 | -| value_loss | 1.1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.67 | -| time/ | | -| fps | 19 | -| iterations | 6906 | -| time_elapsed | 45683 | -| total_timesteps | 883968 | -| train/ | | -| approx_kl | 0.007971956 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.445 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.00029 | -| n_updates | 69050 | -| policy_gradient_loss | 0.00401 | -| std | 0.155 | -| value_loss | 4.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6907 | -| time_elapsed | 45687 | -| total_timesteps | 884096 | -| train/ | | -| approx_kl | 0.017865786 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 69060 | -| policy_gradient_loss | -0.000651 | -| std | 0.155 | -| value_loss | 1.23e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6908 | -| time_elapsed | 45696 | -| total_timesteps | 884224 | -| train/ | | -| approx_kl | 0.00043003354 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | 0.486 | -| learning_rate | 0.0003 | -| loss | -7.29e-05 | -| n_updates | 69070 | -| policy_gradient_loss | -0.000147 | -| std | 0.156 | -| value_loss | 0.000931 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6909 | -| time_elapsed | 45700 | -| total_timesteps | 884352 | -| train/ | | -| approx_kl | 0.0027289 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.44 | -| explained_variance | -73.5 | -| learning_rate | 0.0003 | -| loss | -0.000438 | -| n_updates | 69080 | -| policy_gradient_loss | -0.000178 | -| std | 0.156 | -| value_loss | 7.28e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6910 | -| time_elapsed | 45704 | -| total_timesteps | 884480 | -| train/ | | -| approx_kl | 0.030088859 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.442 | -| explained_variance | -79.8 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 69090 | -| policy_gradient_loss | 0.00142 | -| std | 0.155 | -| value_loss | 4.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6911 | -| time_elapsed | 45708 | -| total_timesteps | 884608 | -| train/ | | -| approx_kl | 0.011391673 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -8.96 | -| learning_rate | 0.0003 | -| loss | -0.00759 | -| n_updates | 69100 | -| policy_gradient_loss | -0.00471 | -| std | 0.155 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6912 | -| time_elapsed | 45712 | -| total_timesteps | 884736 | -| train/ | | -| approx_kl | 0.02068726 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.444 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 69110 | -| policy_gradient_loss | -0.00177 | -| std | 0.155 | -| value_loss | 2.67e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6913 | -| time_elapsed | 45716 | -| total_timesteps | 884864 | -| train/ | | -| approx_kl | 0.0063616 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.445 | -| explained_variance | 0.00873 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 69120 | -| policy_gradient_loss | -0.00052 | -| std | 0.155 | -| value_loss | 2.75e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6914 | -| time_elapsed | 45719 | -| total_timesteps | 884992 | -| train/ | | -| approx_kl | 0.01977002 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.445 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 69130 | -| policy_gradient_loss | -0.0102 | -| std | 0.155 | -| value_loss | 1.69e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6915 | -| time_elapsed | 45723 | -| total_timesteps | 885120 | -| train/ | | -| approx_kl | 0.004457452 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.445 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 69140 | -| policy_gradient_loss | -0.00538 | -| std | 0.155 | -| value_loss | 9.33e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6916 | -| time_elapsed | 45733 | -| total_timesteps | 885248 | -| train/ | | -| approx_kl | 0.0031674658 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.447 | -| explained_variance | 0.708 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 69150 | -| policy_gradient_loss | -0.000346 | -| std | 0.154 | -| value_loss | 0.00525 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6917 | -| time_elapsed | 45738 | -| total_timesteps | 885376 | -| train/ | | -| approx_kl | 0.0033378112 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.452 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 69160 | -| policy_gradient_loss | -0.00238 | -| std | 0.154 | -| value_loss | 5.92e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6918 | -| time_elapsed | 45741 | -| total_timesteps | 885504 | -| train/ | | -| approx_kl | 0.05363241 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 0.455 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 69170 | -| policy_gradient_loss | -0.00926 | -| std | 0.153 | -| value_loss | 8.28e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6919 | -| time_elapsed | 45744 | -| total_timesteps | 885632 | -| train/ | | -| approx_kl | 0.0101762675 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.456 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 69180 | -| policy_gradient_loss | -0.00358 | -| std | 0.153 | -| value_loss | 5.86e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6920 | -| time_elapsed | 45748 | -| total_timesteps | 885760 | -| train/ | | -| approx_kl | 0.010831945 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 69190 | -| policy_gradient_loss | 0.000144 | -| std | 0.153 | -| value_loss | 6.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.68 | -| time/ | | -| fps | 19 | -| iterations | 6921 | -| time_elapsed | 45751 | -| total_timesteps | 885888 | -| train/ | | -| approx_kl | 0.0027135531 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 69200 | -| policy_gradient_loss | 0.000188 | -| std | 0.153 | -| value_loss | 4.03e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6922 | -| time_elapsed | 45755 | -| total_timesteps | 886016 | -| train/ | | -| approx_kl | 0.007818121 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 0.456 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 69210 | -| policy_gradient_loss | 0.00105 | -| std | 0.153 | -| value_loss | 2.49e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6923 | -| time_elapsed | 45764 | -| total_timesteps | 886144 | -| train/ | | -| approx_kl | 0.02436785 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.456 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 69220 | -| policy_gradient_loss | -0.00347 | -| std | 0.153 | -| value_loss | 0.000799 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6924 | -| time_elapsed | 45768 | -| total_timesteps | 886272 | -| train/ | | -| approx_kl | 0.017242454 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 0.456 | -| explained_variance | 0.185 | -| learning_rate | 0.0003 | -| loss | -0.00761 | -| n_updates | 69230 | -| policy_gradient_loss | -0.0034 | -| std | 0.153 | -| value_loss | 2.5e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6925 | -| time_elapsed | 45773 | -| total_timesteps | 886400 | -| train/ | | -| approx_kl | 0.005215603 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 69240 | -| policy_gradient_loss | -0.00113 | -| std | 0.153 | -| value_loss | 1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6926 | -| time_elapsed | 45776 | -| total_timesteps | 886528 | -| train/ | | -| approx_kl | 0.0018396904 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.677 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 69250 | -| policy_gradient_loss | -0.00428 | -| std | 0.153 | -| value_loss | 4.65e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6927 | -| time_elapsed | 45779 | -| total_timesteps | 886656 | -| train/ | | -| approx_kl | 0.005183545 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00781 | -| n_updates | 69260 | -| policy_gradient_loss | -0.00437 | -| std | 0.153 | -| value_loss | 8.35e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6928 | -| time_elapsed | 45782 | -| total_timesteps | 886784 | -| train/ | | -| approx_kl | 0.0122054145 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.469 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 69270 | -| policy_gradient_loss | -0.000172 | -| std | 0.153 | -| value_loss | 4.44e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.7 | -| time/ | | -| fps | 19 | -| iterations | 6929 | -| time_elapsed | 45785 | -| total_timesteps | 886912 | -| train/ | | -| approx_kl | 0.028679252 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 69280 | -| policy_gradient_loss | -0.00552 | -| std | 0.153 | -| value_loss | 5.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6930 | -| time_elapsed | 45788 | -| total_timesteps | 887040 | -| train/ | | -| approx_kl | 0.019820813 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -0.603 | -| learning_rate | 0.0003 | -| loss | 1.98e-05 | -| n_updates | 69290 | -| policy_gradient_loss | -0.0007 | -| std | 0.153 | -| value_loss | 3.29e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6931 | -| time_elapsed | 45795 | -| total_timesteps | 887168 | -| train/ | | -| approx_kl | 0.0024775388 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | 0.843 | -| learning_rate | 0.0003 | -| loss | 0.000532 | -| n_updates | 69300 | -| policy_gradient_loss | -0.000284 | -| std | 0.153 | -| value_loss | 0.00283 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6932 | -| time_elapsed | 45800 | -| total_timesteps | 887296 | -| train/ | | -| approx_kl | 0.0321519 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.458 | -| explained_variance | -25.1 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 69310 | -| policy_gradient_loss | -0.00183 | -| std | 0.153 | -| value_loss | 6.96e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6933 | -| time_elapsed | 45804 | -| total_timesteps | 887424 | -| train/ | | -| approx_kl | 0.04335251 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 0.458 | -| explained_variance | -23.3 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 69320 | -| policy_gradient_loss | -0.00578 | -| std | 0.153 | -| value_loss | 2.89e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6934 | -| time_elapsed | 45808 | -| total_timesteps | 887552 | -| train/ | | -| approx_kl | 0.033186454 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.457 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 69330 | -| policy_gradient_loss | -0.00224 | -| std | 0.153 | -| value_loss | 7.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6935 | -| time_elapsed | 45811 | -| total_timesteps | 887680 | -| train/ | | -| approx_kl | 0.00912036 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.456 | -| explained_variance | 0.00296 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 69340 | -| policy_gradient_loss | -0.00344 | -| std | 0.153 | -| value_loss | 7.67e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6936 | -| time_elapsed | 45815 | -| total_timesteps | 887808 | -| train/ | | -| approx_kl | 0.023202106 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.455 | -| explained_variance | 0.02 | -| learning_rate | 0.0003 | -| loss | 0.00154 | -| n_updates | 69350 | -| policy_gradient_loss | -0.00167 | -| std | 0.154 | -| value_loss | 1.21e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.71 | -| time/ | | -| fps | 19 | -| iterations | 6937 | -| time_elapsed | 45819 | -| total_timesteps | 887936 | -| train/ | | -| approx_kl | 0.00014966493 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.455 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.000151 | -| n_updates | 69360 | -| policy_gradient_loss | 0.000191 | -| std | 0.154 | -| value_loss | 1.42e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6938 | -| time_elapsed | 45824 | -| total_timesteps | 888064 | -| train/ | | -| approx_kl | 0.008921186 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 0.454 | -| explained_variance | -0.472 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 69370 | -| policy_gradient_loss | -0.00215 | -| std | 0.154 | -| value_loss | 3.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6939 | -| time_elapsed | 45831 | -| total_timesteps | 888192 | -| train/ | | -| approx_kl | 0.021098046 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.453 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 69380 | -| policy_gradient_loss | -0.00254 | -| std | 0.154 | -| value_loss | 0.00279 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6940 | -| time_elapsed | 45835 | -| total_timesteps | 888320 | -| train/ | | -| approx_kl | 0.013578521 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.453 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.000968 | -| n_updates | 69390 | -| policy_gradient_loss | -0.00131 | -| std | 0.154 | -| value_loss | 3.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6941 | -| time_elapsed | 45837 | -| total_timesteps | 888448 | -| train/ | | -| approx_kl | 0.042035043 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 0.452 | -| explained_variance | -14.9 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 69400 | -| policy_gradient_loss | -0.0113 | -| std | 0.154 | -| value_loss | 1.75e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6942 | -| time_elapsed | 45841 | -| total_timesteps | 888576 | -| train/ | | -| approx_kl | 0.0064842007 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.451 | -| explained_variance | -2.26 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 69410 | -| policy_gradient_loss | 0.000127 | -| std | 0.155 | -| value_loss | 3.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6943 | -| time_elapsed | 45845 | -| total_timesteps | 888704 | -| train/ | | -| approx_kl | 0.023791144 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | -0.0955 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 69420 | -| policy_gradient_loss | -0.00345 | -| std | 0.155 | -| value_loss | 5.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6944 | -| time_elapsed | 45848 | -| total_timesteps | 888832 | -| train/ | | -| approx_kl | 0.01873365 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.445 | -| explained_variance | -0.823 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 69430 | -| policy_gradient_loss | -0.000159 | -| std | 0.155 | -| value_loss | 1.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6945 | -| time_elapsed | 45852 | -| total_timesteps | 888960 | -| train/ | | -| approx_kl | 0.01183656 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | 0.0243 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 69440 | -| policy_gradient_loss | -0.00915 | -| std | 0.155 | -| value_loss | 2.9e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6946 | -| time_elapsed | 45855 | -| total_timesteps | 889088 | -| train/ | | -| approx_kl | 0.0138198435 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.447 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 69450 | -| policy_gradient_loss | -0.00175 | -| std | 0.155 | -| value_loss | 1.87e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6947 | -| time_elapsed | 45861 | -| total_timesteps | 889216 | -| train/ | | -| approx_kl | 0.022933394 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.447 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 69460 | -| policy_gradient_loss | -0.00449 | -| std | 0.155 | -| value_loss | 0.000236 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6948 | -| time_elapsed | 45865 | -| total_timesteps | 889344 | -| train/ | | -| approx_kl | 0.035493918 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 69470 | -| policy_gradient_loss | -0.0131 | -| std | 0.155 | -| value_loss | 3.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6949 | -| time_elapsed | 45868 | -| total_timesteps | 889472 | -| train/ | | -| approx_kl | 0.020155674 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.446 | -| explained_variance | -9.34 | -| learning_rate | 0.0003 | -| loss | 0.00383 | -| n_updates | 69480 | -| policy_gradient_loss | 0.000695 | -| std | 0.155 | -| value_loss | 1.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6950 | -| time_elapsed | 45873 | -| total_timesteps | 889600 | -| train/ | | -| approx_kl | 0.009270169 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.448 | -| explained_variance | 0.00482 | -| learning_rate | 0.0003 | -| loss | 0.000463 | -| n_updates | 69490 | -| policy_gradient_loss | 0.000106 | -| std | 0.155 | -| value_loss | 1.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6951 | -| time_elapsed | 45877 | -| total_timesteps | 889728 | -| train/ | | -| approx_kl | 0.011545593 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.449 | -| explained_variance | 0.0186 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 69500 | -| policy_gradient_loss | 0.0001 | -| std | 0.154 | -| value_loss | 1.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6952 | -| time_elapsed | 45880 | -| total_timesteps | 889856 | -| train/ | | -| approx_kl | 0.02442589 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.45 | -| explained_variance | 0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00648 | -| n_updates | 69510 | -| policy_gradient_loss | -0.00585 | -| std | 0.154 | -| value_loss | 1.4e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 6953 | -| time_elapsed | 45884 | -| total_timesteps | 889984 | -| train/ | | -| approx_kl | 0.00049407966 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.45 | -| explained_variance | 0.0221 | -| learning_rate | 0.0003 | -| loss | -0.000667 | -| n_updates | 69520 | -| policy_gradient_loss | -0.000803 | -| std | 0.154 | -| value_loss | 8.55e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6954 | -| time_elapsed | 45888 | -| total_timesteps | 890112 | -| train/ | | -| approx_kl | 0.014326086 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.451 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 69530 | -| policy_gradient_loss | 0.00095 | -| std | 0.154 | -| value_loss | 1.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6955 | -| time_elapsed | 45898 | -| total_timesteps | 890240 | -| train/ | | -| approx_kl | 0.011539321 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 0.452 | -| explained_variance | 0.669 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 69540 | -| policy_gradient_loss | -0.00118 | -| std | 0.154 | -| value_loss | 0.00107 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6956 | -| time_elapsed | 45902 | -| total_timesteps | 890368 | -| train/ | | -| approx_kl | 0.020147258 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.451 | -| explained_variance | -33.9 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 69550 | -| policy_gradient_loss | -0.000665 | -| std | 0.154 | -| value_loss | 9.89e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6957 | -| time_elapsed | 45907 | -| total_timesteps | 890496 | -| train/ | | -| approx_kl | 0.0002479339 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.452 | -| explained_variance | -27.6 | -| learning_rate | 0.0003 | -| loss | -0.00034 | -| n_updates | 69560 | -| policy_gradient_loss | -2.17e-06 | -| std | 0.154 | -| value_loss | 3.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6958 | -| time_elapsed | 45910 | -| total_timesteps | 890624 | -| train/ | | -| approx_kl | 0.007568524 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.455 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 69570 | -| policy_gradient_loss | -0.00254 | -| std | 0.153 | -| value_loss | 4.01e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6959 | -| time_elapsed | 45914 | -| total_timesteps | 890752 | -| train/ | | -| approx_kl | 0.0148894265 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.456 | -| explained_variance | -0.541 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 69580 | -| policy_gradient_loss | -7.6e-05 | -| std | 0.153 | -| value_loss | 2.52e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.73 | -| time/ | | -| fps | 19 | -| iterations | 6960 | -| time_elapsed | 45918 | -| total_timesteps | 890880 | -| train/ | | -| approx_kl | 0.012197635 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.459 | -| explained_variance | -0.63 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 69590 | -| policy_gradient_loss | 0.000283 | -| std | 0.153 | -| value_loss | 6.63e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6961 | -| time_elapsed | 45922 | -| total_timesteps | 891008 | -| train/ | | -| approx_kl | 0.021149274 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.461 | -| explained_variance | -0.576 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 69600 | -| policy_gradient_loss | -0.00498 | -| std | 0.152 | -| value_loss | 6.39e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6962 | -| time_elapsed | 45930 | -| total_timesteps | 891136 | -| train/ | | -| approx_kl | 0.020870544 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.462 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 69610 | -| policy_gradient_loss | -0.0113 | -| std | 0.152 | -| value_loss | 0.00015 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6963 | -| time_elapsed | 45934 | -| total_timesteps | 891264 | -| train/ | | -| approx_kl | 0.026046792 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.463 | -| explained_variance | 0.691 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 69620 | -| policy_gradient_loss | -0.00304 | -| std | 0.152 | -| value_loss | 2.13e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6964 | -| time_elapsed | 45937 | -| total_timesteps | 891392 | -| train/ | | -| approx_kl | 0.02114093 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 0.463 | -| explained_variance | -5.42 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 69630 | -| policy_gradient_loss | -0.00122 | -| std | 0.152 | -| value_loss | 2.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6965 | -| time_elapsed | 45940 | -| total_timesteps | 891520 | -| train/ | | -| approx_kl | 0.008257079 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.463 | -| explained_variance | 0.0237 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 69640 | -| policy_gradient_loss | 0.000717 | -| std | 0.152 | -| value_loss | 6.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6966 | -| time_elapsed | 45944 | -| total_timesteps | 891648 | -| train/ | | -| approx_kl | 0.022358729 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.463 | -| explained_variance | -0.422 | -| learning_rate | 0.0003 | -| loss | 0.00537 | -| n_updates | 69650 | -| policy_gradient_loss | 0.000452 | -| std | 0.152 | -| value_loss | 2.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6967 | -| time_elapsed | 45948 | -| total_timesteps | 891776 | -| train/ | | -| approx_kl | 0.027381167 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.465 | -| explained_variance | -0.00365 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 69660 | -| policy_gradient_loss | -0.00727 | -| std | 0.152 | -| value_loss | 5.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6968 | -| time_elapsed | 45950 | -| total_timesteps | 891904 | -| train/ | | -| approx_kl | 0.013039507 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 0.465 | -| explained_variance | -0.792 | -| learning_rate | 0.0003 | -| loss | -0.00753 | -| n_updates | 69670 | -| policy_gradient_loss | -0.00437 | -| std | 0.152 | -| value_loss | 1.39e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6969 | -| time_elapsed | 45953 | -| total_timesteps | 892032 | -| train/ | | -| approx_kl | 3.719749e-05 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 0.466 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -2.07e-05 | -| n_updates | 69680 | -| policy_gradient_loss | 0.000164 | -| std | 0.152 | -| value_loss | 4.01e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6970 | -| time_elapsed | 45959 | -| total_timesteps | 892160 | -| train/ | | -| approx_kl | 0.010600881 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.468 | -| explained_variance | 0.949 | -| learning_rate | 0.0003 | -| loss | -0.000779 | -| n_updates | 69690 | -| policy_gradient_loss | 0.000326 | -| std | 0.151 | -| value_loss | 0.000415 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6971 | -| time_elapsed | 45963 | -| total_timesteps | 892288 | -| train/ | | -| approx_kl | 0.00570781 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.47 | -| explained_variance | -5.1 | -| learning_rate | 0.0003 | -| loss | 0.000624 | -| n_updates | 69700 | -| policy_gradient_loss | 0.000108 | -| std | 0.151 | -| value_loss | 4.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6972 | -| time_elapsed | 45967 | -| total_timesteps | 892416 | -| train/ | | -| approx_kl | 0.012818107 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.473 | -| explained_variance | -31.6 | -| learning_rate | 0.0003 | -| loss | 0.000355 | -| n_updates | 69710 | -| policy_gradient_loss | -0.000452 | -| std | 0.151 | -| value_loss | 1.41e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6973 | -| time_elapsed | 45971 | -| total_timesteps | 892544 | -| train/ | | -| approx_kl | 0.0155333 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.00015 | -| n_updates | 69720 | -| policy_gradient_loss | -0.00121 | -| std | 0.151 | -| value_loss | 4.62e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6974 | -| time_elapsed | 45974 | -| total_timesteps | 892672 | -| train/ | | -| approx_kl | 0.019962275 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 69730 | -| policy_gradient_loss | 0.00173 | -| std | 0.151 | -| value_loss | 1.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6975 | -| time_elapsed | 45978 | -| total_timesteps | 892800 | -| train/ | | -| approx_kl | 0.016033595 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.475 | -| explained_variance | -0.996 | -| learning_rate | 0.0003 | -| loss | 0.00801 | -| n_updates | 69740 | -| policy_gradient_loss | 0.00108 | -| std | 0.151 | -| value_loss | 1.99e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.74 | -| time/ | | -| fps | 19 | -| iterations | 6976 | -| time_elapsed | 45981 | -| total_timesteps | 892928 | -| train/ | | -| approx_kl | 0.028028969 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.475 | -| explained_variance | 0.0165 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 69750 | -| policy_gradient_loss | -0.00877 | -| std | 0.151 | -| value_loss | 2.67e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6977 | -| time_elapsed | 45984 | -| total_timesteps | 893056 | -| train/ | | -| approx_kl | 0.0050046407 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 69760 | -| policy_gradient_loss | -0.00179 | -| std | 0.151 | -| value_loss | 7.34e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6978 | -| time_elapsed | 45991 | -| total_timesteps | 893184 | -| train/ | | -| approx_kl | 0.02467546 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.472 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 69770 | -| policy_gradient_loss | -0.0157 | -| std | 0.151 | -| value_loss | 0.000887 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6979 | -| time_elapsed | 45995 | -| total_timesteps | 893312 | -| train/ | | -| approx_kl | 0.02652832 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.471 | -| explained_variance | -26.3 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 69780 | -| policy_gradient_loss | -0.000609 | -| std | 0.151 | -| value_loss | 1.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6980 | -| time_elapsed | 45999 | -| total_timesteps | 893440 | -| train/ | | -| approx_kl | 0.035718605 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.47 | -| explained_variance | -37.6 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 69790 | -| policy_gradient_loss | 0.000778 | -| std | 0.151 | -| value_loss | 9.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6981 | -| time_elapsed | 46002 | -| total_timesteps | 893568 | -| train/ | | -| approx_kl | 0.015412221 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.471 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | 0.000732 | -| n_updates | 69800 | -| policy_gradient_loss | -0.000148 | -| std | 0.151 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6982 | -| time_elapsed | 46006 | -| total_timesteps | 893696 | -| train/ | | -| approx_kl | 0.010597089 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.472 | -| explained_variance | -3.31 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 69810 | -| policy_gradient_loss | -0.000854 | -| std | 0.151 | -| value_loss | 3.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6983 | -| time_elapsed | 46010 | -| total_timesteps | 893824 | -| train/ | | -| approx_kl | 0.013840374 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | -0.00886 | -| n_updates | 69820 | -| policy_gradient_loss | -0.00518 | -| std | 0.151 | -| value_loss | 3.18e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.75 | -| time/ | | -| fps | 19 | -| iterations | 6984 | -| time_elapsed | 46014 | -| total_timesteps | 893952 | -| train/ | | -| approx_kl | 0.002476676 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | -0.00515 | -| n_updates | 69830 | -| policy_gradient_loss | -0.00374 | -| std | 0.15 | -| value_loss | 2.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6985 | -| time_elapsed | 46017 | -| total_timesteps | 894080 | -| train/ | | -| approx_kl | 0.0046487437 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.475 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 69840 | -| policy_gradient_loss | -0.00216 | -| std | 0.15 | -| value_loss | 6.34e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6986 | -| time_elapsed | 46023 | -| total_timesteps | 894208 | -| train/ | | -| approx_kl | 0.004869482 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.476 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | -0.000476 | -| n_updates | 69850 | -| policy_gradient_loss | 0.000644 | -| std | 0.15 | -| value_loss | 0.000334 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6987 | -| time_elapsed | 46028 | -| total_timesteps | 894336 | -| train/ | | -| approx_kl | 0.007873834 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.476 | -| explained_variance | -0.874 | -| learning_rate | 0.0003 | -| loss | -0.00574 | -| n_updates | 69860 | -| policy_gradient_loss | -0.00331 | -| std | 0.15 | -| value_loss | 6.95e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6988 | -| time_elapsed | 46031 | -| total_timesteps | 894464 | -| train/ | | -| approx_kl | 0.026676852 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.476 | -| explained_variance | -25.4 | -| learning_rate | 0.0003 | -| loss | -0.00824 | -| n_updates | 69870 | -| policy_gradient_loss | -0.00196 | -| std | 0.15 | -| value_loss | 4.1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6989 | -| time_elapsed | 46035 | -| total_timesteps | 894592 | -| train/ | | -| approx_kl | 0.0036395495 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.475 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 69880 | -| policy_gradient_loss | 0.000481 | -| std | 0.151 | -| value_loss | 6.21e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6990 | -| time_elapsed | 46038 | -| total_timesteps | 894720 | -| train/ | | -| approx_kl | 0.010597622 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.473 | -| explained_variance | -0.309 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 69890 | -| policy_gradient_loss | -0.00883 | -| std | 0.151 | -| value_loss | 9.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6991 | -| time_elapsed | 46042 | -| total_timesteps | 894848 | -| train/ | | -| approx_kl | 0.008725656 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.473 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 69900 | -| policy_gradient_loss | 0.000434 | -| std | 0.151 | -| value_loss | 2.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.76 | -| time/ | | -| fps | 19 | -| iterations | 6992 | -| time_elapsed | 46045 | -| total_timesteps | 894976 | -| train/ | | -| approx_kl | 0.008915683 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -6.63 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 69910 | -| policy_gradient_loss | -0.0116 | -| std | 0.151 | -| value_loss | 4.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6993 | -| time_elapsed | 46049 | -| total_timesteps | 895104 | -| train/ | | -| approx_kl | 0.018421438 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | 0.0182 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 69920 | -| policy_gradient_loss | -0.00282 | -| std | 0.151 | -| value_loss | 2.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6994 | -| time_elapsed | 46058 | -| total_timesteps | 895232 | -| train/ | | -| approx_kl | 0.018802956 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.473 | -| explained_variance | 0.562 | -| learning_rate | 0.0003 | -| loss | 0.00318 | -| n_updates | 69930 | -| policy_gradient_loss | 0.000452 | -| std | 0.151 | -| value_loss | 0.000889 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6995 | -| time_elapsed | 46062 | -| total_timesteps | 895360 | -| train/ | | -| approx_kl | 0.030331625 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -65.1 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 69940 | -| policy_gradient_loss | -0.00383 | -| std | 0.151 | -| value_loss | 3.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6996 | -| time_elapsed | 46066 | -| total_timesteps | 895488 | -| train/ | | -| approx_kl | 0.022264909 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.474 | -| explained_variance | -51.8 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 69950 | -| policy_gradient_loss | -0.00492 | -| std | 0.15 | -| value_loss | 9.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6997 | -| time_elapsed | 46068 | -| total_timesteps | 895616 | -| train/ | | -| approx_kl | 0.016762018 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.476 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 69960 | -| policy_gradient_loss | -0.0018 | -| std | 0.15 | -| value_loss | 8.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6998 | -| time_elapsed | 46071 | -| total_timesteps | 895744 | -| train/ | | -| approx_kl | 0.029560674 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.477 | -| explained_variance | -0.792 | -| learning_rate | 0.0003 | -| loss | -0.000775 | -| n_updates | 69970 | -| policy_gradient_loss | -0.00172 | -| std | 0.15 | -| value_loss | 1.87e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 6999 | -| time_elapsed | 46074 | -| total_timesteps | 895872 | -| train/ | | -| approx_kl | 0.03647261 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.479 | -| explained_variance | 0.0179 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 69980 | -| policy_gradient_loss | -0.00928 | -| std | 0.15 | -| value_loss | 5.84e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7000 | -| time_elapsed | 46077 | -| total_timesteps | 896000 | -| train/ | | -| approx_kl | 0.016957287 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.48 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 69990 | -| policy_gradient_loss | 0.000605 | -| std | 0.15 | -| value_loss | 4.21e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7001 | -| time_elapsed | 46080 | -| total_timesteps | 896128 | -| train/ | | -| approx_kl | 0.03518377 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 0.481 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 70000 | -| policy_gradient_loss | -0.00369 | -| std | 0.15 | -| value_loss | 3.14e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7002 | -| time_elapsed | 46088 | -| total_timesteps | 896256 | -| train/ | | -| approx_kl | 0.0370535 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.481 | -| explained_variance | 0.369 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 70010 | -| policy_gradient_loss | -0.00612 | -| std | 0.15 | -| value_loss | 0.00105 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7003 | -| time_elapsed | 46091 | -| total_timesteps | 896384 | -| train/ | | -| approx_kl | 0.0010417262 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 0.481 | -| explained_variance | -80.5 | -| learning_rate | 0.0003 | -| loss | -0.000217 | -| n_updates | 70020 | -| policy_gradient_loss | -0.000165 | -| std | 0.15 | -| value_loss | 1.89e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7004 | -| time_elapsed | 46096 | -| total_timesteps | 896512 | -| train/ | | -| approx_kl | 0.015486084 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.481 | -| explained_variance | -81.7 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 70030 | -| policy_gradient_loss | -0.0119 | -| std | 0.15 | -| value_loss | 1.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7005 | -| time_elapsed | 46099 | -| total_timesteps | 896640 | -| train/ | | -| approx_kl | 0.03388566 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 0.482 | -| explained_variance | -80.5 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 70040 | -| policy_gradient_loss | -0.0109 | -| std | 0.149 | -| value_loss | 5.08e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7006 | -| time_elapsed | 46102 | -| total_timesteps | 896768 | -| train/ | | -| approx_kl | 0.0045381957 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 0.483 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.00742 | -| n_updates | 70050 | -| policy_gradient_loss | -0.00524 | -| std | 0.149 | -| value_loss | 8.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7007 | -| time_elapsed | 46106 | -| total_timesteps | 896896 | -| train/ | | -| approx_kl | 0.011649922 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.483 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.000484 | -| n_updates | 70060 | -| policy_gradient_loss | -0.000723 | -| std | 0.149 | -| value_loss | 1.52e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7008 | -| time_elapsed | 46110 | -| total_timesteps | 897024 | -| train/ | | -| approx_kl | 0.0067336657 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.484 | -| explained_variance | -4.1 | -| learning_rate | 0.0003 | -| loss | -0.000587 | -| n_updates | 70070 | -| policy_gradient_loss | -0.000293 | -| std | 0.149 | -| value_loss | 9.78e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7009 | -| time_elapsed | 46118 | -| total_timesteps | 897152 | -| train/ | | -| approx_kl | 0.010461529 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.486 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 70080 | -| policy_gradient_loss | 0.00108 | -| std | 0.149 | -| value_loss | 0.00384 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7010 | -| time_elapsed | 46121 | -| total_timesteps | 897280 | -| train/ | | -| approx_kl | 0.020495959 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.486 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 70090 | -| policy_gradient_loss | -0.00181 | -| std | 0.149 | -| value_loss | 0.000183 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7011 | -| time_elapsed | 46125 | -| total_timesteps | 897408 | -| train/ | | -| approx_kl | 0.005809356 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | 0.000624 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 70100 | -| policy_gradient_loss | 0.000583 | -| std | 0.149 | -| value_loss | 0.000217 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7012 | -| time_elapsed | 46127 | -| total_timesteps | 897536 | -| train/ | | -| approx_kl | 0.005473261 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 70110 | -| policy_gradient_loss | 0.0014 | -| std | 0.149 | -| value_loss | 0.000119 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7013 | -| time_elapsed | 46130 | -| total_timesteps | 897664 | -| train/ | | -| approx_kl | 0.0012365547 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 70120 | -| policy_gradient_loss | 0.000912 | -| std | 0.149 | -| value_loss | 0.000141 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7014 | -| time_elapsed | 46133 | -| total_timesteps | 897792 | -| train/ | | -| approx_kl | 0.014919425 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 70130 | -| policy_gradient_loss | -0.00225 | -| std | 0.149 | -| value_loss | 1.87e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.77 | -| time/ | | -| fps | 19 | -| iterations | 7015 | -| time_elapsed | 46135 | -| total_timesteps | 897920 | -| train/ | | -| approx_kl | 0.011174375 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 70140 | -| policy_gradient_loss | -0.00438 | -| std | 0.149 | -| value_loss | 7.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7016 | -| time_elapsed | 46139 | -| total_timesteps | 898048 | -| train/ | | -| approx_kl | 0.041269407 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | -0.026 | -| n_updates | 70150 | -| policy_gradient_loss | -0.0138 | -| std | 0.149 | -| value_loss | 6.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7017 | -| time_elapsed | 46147 | -| total_timesteps | 898176 | -| train/ | | -| approx_kl | 0.036264997 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.00894 | -| n_updates | 70160 | -| policy_gradient_loss | -0.00636 | -| std | 0.149 | -| value_loss | 0.00255 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7018 | -| time_elapsed | 46149 | -| total_timesteps | 898304 | -| train/ | | -| approx_kl | 0.021372728 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 70170 | -| policy_gradient_loss | -0.000899 | -| std | 0.149 | -| value_loss | 4.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7019 | -| time_elapsed | 46153 | -| total_timesteps | 898432 | -| train/ | | -| approx_kl | 0.012653251 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 70180 | -| policy_gradient_loss | -0.00306 | -| std | 0.149 | -| value_loss | 3.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7020 | -| time_elapsed | 46157 | -| total_timesteps | 898560 | -| train/ | | -| approx_kl | 0.008971097 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 70190 | -| policy_gradient_loss | -0.00217 | -| std | 0.148 | -| value_loss | 3.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7021 | -| time_elapsed | 46160 | -| total_timesteps | 898688 | -| train/ | | -| approx_kl | 0.015854692 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.489 | -| explained_variance | -0.417 | -| learning_rate | 0.0003 | -| loss | -0.00759 | -| n_updates | 70200 | -| policy_gradient_loss | -0.00265 | -| std | 0.148 | -| value_loss | 1.37e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7022 | -| time_elapsed | 46163 | -| total_timesteps | 898816 | -| train/ | | -| approx_kl | 0.02281515 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.489 | -| explained_variance | -0.233 | -| learning_rate | 0.0003 | -| loss | 0.00303 | -| n_updates | 70210 | -| policy_gradient_loss | -0.000536 | -| std | 0.148 | -| value_loss | 4.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.78 | -| time/ | | -| fps | 19 | -| iterations | 7023 | -| time_elapsed | 46165 | -| total_timesteps | 898944 | -| train/ | | -| approx_kl | 0.011061907 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.49 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | -0.00905 | -| n_updates | 70220 | -| policy_gradient_loss | -0.00593 | -| std | 0.148 | -| value_loss | 5.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7024 | -| time_elapsed | 46169 | -| total_timesteps | 899072 | -| train/ | | -| approx_kl | 0.009035792 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.49 | -| explained_variance | -0.27 | -| learning_rate | 0.0003 | -| loss | -0.00269 | -| n_updates | 70230 | -| policy_gradient_loss | -0.000375 | -| std | 0.148 | -| value_loss | 2.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7025 | -| time_elapsed | 46174 | -| total_timesteps | 899200 | -| train/ | | -| approx_kl | 0.08355059 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 0.49 | -| explained_variance | 0.607 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 70240 | -| policy_gradient_loss | -0.0067 | -| std | 0.148 | -| value_loss | 0.000861 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7026 | -| time_elapsed | 46177 | -| total_timesteps | 899328 | -| train/ | | -| approx_kl | 0.034540743 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.49 | -| explained_variance | -16.8 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 70250 | -| policy_gradient_loss | -0.0026 | -| std | 0.148 | -| value_loss | 4.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7027 | -| time_elapsed | 46180 | -| total_timesteps | 899456 | -| train/ | | -| approx_kl | 0.024900554 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.489 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | 0.000202 | -| n_updates | 70260 | -| policy_gradient_loss | -0.00176 | -| std | 0.149 | -| value_loss | 3.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7028 | -| time_elapsed | 46184 | -| total_timesteps | 899584 | -| train/ | | -| approx_kl | 0.003129234 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.000119 | -| n_updates | 70270 | -| policy_gradient_loss | -6.32e-05 | -| std | 0.148 | -| value_loss | 6.49e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7029 | -| time_elapsed | 46186 | -| total_timesteps | 899712 | -| train/ | | -| approx_kl | 0.01347765 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.489 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 70280 | -| policy_gradient_loss | -0.00307 | -| std | 0.148 | -| value_loss | 6.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7030 | -| time_elapsed | 46190 | -| total_timesteps | 899840 | -| train/ | | -| approx_kl | 0.032666836 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.49 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 70290 | -| policy_gradient_loss | -0.00196 | -| std | 0.148 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7031 | -| time_elapsed | 46194 | -| total_timesteps | 899968 | -| train/ | | -| approx_kl | 0.011828784 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.49 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 70300 | -| policy_gradient_loss | -0.00224 | -| std | 0.148 | -| value_loss | 4.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7032 | -| time_elapsed | 46198 | -| total_timesteps | 900096 | -| train/ | | -| approx_kl | 0.015037756 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.489 | -| explained_variance | -0.545 | -| learning_rate | 0.0003 | -| loss | 0.000463 | -| n_updates | 70310 | -| policy_gradient_loss | 0.00222 | -| std | 0.148 | -| value_loss | 1.53e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7033 | -| time_elapsed | 46205 | -| total_timesteps | 900224 | -| train/ | | -| approx_kl | 0.0033742744 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | 0.732 | -| learning_rate | 0.0003 | -| loss | -0.000492 | -| n_updates | 70320 | -| policy_gradient_loss | -0.000751 | -| std | 0.149 | -| value_loss | 0.00616 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7034 | -| time_elapsed | 46209 | -| total_timesteps | 900352 | -| train/ | | -| approx_kl | 0.007498708 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.00638 | -| learning_rate | 0.0003 | -| loss | -0.000752 | -| n_updates | 70330 | -| policy_gradient_loss | 0.00246 | -| std | 0.149 | -| value_loss | 1.41e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7035 | -| time_elapsed | 46213 | -| total_timesteps | 900480 | -| train/ | | -| approx_kl | 0.015263189 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 70340 | -| policy_gradient_loss | -0.00479 | -| std | 0.149 | -| value_loss | 2.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7036 | -| time_elapsed | 46216 | -| total_timesteps | 900608 | -| train/ | | -| approx_kl | 0.028767236 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 70350 | -| policy_gradient_loss | -0.015 | -| std | 0.148 | -| value_loss | 7.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7037 | -| time_elapsed | 46220 | -| total_timesteps | 900736 | -| train/ | | -| approx_kl | 0.012183191 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.635 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 70360 | -| policy_gradient_loss | -0.00961 | -| std | 0.148 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7038 | -| time_elapsed | 46224 | -| total_timesteps | 900864 | -| train/ | | -| approx_kl | 0.02154101 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 70370 | -| policy_gradient_loss | -0.0116 | -| std | 0.149 | -| value_loss | 1.9e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.79 | -| time/ | | -| fps | 19 | -| iterations | 7039 | -| time_elapsed | 46228 | -| total_timesteps | 900992 | -| train/ | | -| approx_kl | 0.0015948298 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 70380 | -| policy_gradient_loss | -0.000334 | -| std | 0.149 | -| value_loss | 1.6e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7040 | -| time_elapsed | 46232 | -| total_timesteps | 901120 | -| train/ | | -| approx_kl | 0.012435045 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | 0.0172 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 70390 | -| policy_gradient_loss | 0.000568 | -| std | 0.149 | -| value_loss | 7.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7041 | -| time_elapsed | 46242 | -| total_timesteps | 901248 | -| train/ | | -| approx_kl | 0.055350177 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | -2.72 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 70400 | -| policy_gradient_loss | -0.0159 | -| std | 0.149 | -| value_loss | 0.00264 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7042 | -| time_elapsed | 46246 | -| total_timesteps | 901376 | -| train/ | | -| approx_kl | 0.023535816 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | -0.309 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 70410 | -| policy_gradient_loss | -0.00515 | -| std | 0.149 | -| value_loss | 4.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7043 | -| time_elapsed | 46250 | -| total_timesteps | 901504 | -| train/ | | -| approx_kl | 0.004398405 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 70420 | -| policy_gradient_loss | -0.00249 | -| std | 0.149 | -| value_loss | 7.86e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7044 | -| time_elapsed | 46254 | -| total_timesteps | 901632 | -| train/ | | -| approx_kl | 0.0053033894 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | -0.725 | -| learning_rate | 0.0003 | -| loss | 0.00028 | -| n_updates | 70430 | -| policy_gradient_loss | -3.33e-05 | -| std | 0.149 | -| value_loss | 2.86e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7045 | -| time_elapsed | 46257 | -| total_timesteps | 901760 | -| train/ | | -| approx_kl | 0.030543514 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | -0.00243 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 70440 | -| policy_gradient_loss | -0.00993 | -| std | 0.149 | -| value_loss | 8.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.72 | -| time/ | | -| fps | 19 | -| iterations | 7046 | -| time_elapsed | 46261 | -| total_timesteps | 901888 | -| train/ | | -| approx_kl | 0.0074730106 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.00453 | -| n_updates | 70450 | -| policy_gradient_loss | -0.00231 | -| std | 0.149 | -| value_loss | 2.02e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7047 | -| time_elapsed | 46264 | -| total_timesteps | 902016 | -| train/ | | -| approx_kl | 0.048057683 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 70460 | -| policy_gradient_loss | -0.0148 | -| std | 0.148 | -| value_loss | 6.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7048 | -| time_elapsed | 46272 | -| total_timesteps | 902144 | -| train/ | | -| approx_kl | 0.023508905 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.488 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 70470 | -| policy_gradient_loss | -0.00128 | -| std | 0.149 | -| value_loss | 0.000602 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7049 | -| time_elapsed | 46276 | -| total_timesteps | 902272 | -| train/ | | -| approx_kl | 0.00085661793 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.487 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 70480 | -| policy_gradient_loss | -0.00128 | -| std | 0.149 | -| value_loss | 7.01e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7050 | -| time_elapsed | 46280 | -| total_timesteps | 902400 | -| train/ | | -| approx_kl | 0.0003803228 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.489 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.000847 | -| n_updates | 70490 | -| policy_gradient_loss | -0.000342 | -| std | 0.148 | -| value_loss | 4.4e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7051 | -| time_elapsed | 46284 | -| total_timesteps | 902528 | -| train/ | | -| approx_kl | 0.001176321 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.495 | -| explained_variance | -0.438 | -| learning_rate | 0.0003 | -| loss | -2.32e-05 | -| n_updates | 70500 | -| policy_gradient_loss | -5.44e-05 | -| std | 0.147 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7052 | -| time_elapsed | 46288 | -| total_timesteps | 902656 | -| train/ | | -| approx_kl | 0.010271749 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.498 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | 0.000524 | -| n_updates | 70510 | -| policy_gradient_loss | 0.000604 | -| std | 0.147 | -| value_loss | 1.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7053 | -| time_elapsed | 46290 | -| total_timesteps | 902784 | -| train/ | | -| approx_kl | 0.011959529 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.499 | -| explained_variance | -0.00169 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 70520 | -| policy_gradient_loss | 0.00158 | -| std | 0.147 | -| value_loss | 8.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.47 | -| time/ | | -| fps | 19 | -| iterations | 7054 | -| time_elapsed | 46293 | -| total_timesteps | 902912 | -| train/ | | -| approx_kl | 0.021403242 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.499 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 70530 | -| policy_gradient_loss | -0.00233 | -| std | 0.147 | -| value_loss | 4.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7055 | -| time_elapsed | 46295 | -| total_timesteps | 903040 | -| train/ | | -| approx_kl | 0.005523212 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.499 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 70540 | -| policy_gradient_loss | -0.00108 | -| std | 0.147 | -| value_loss | 2.83e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7056 | -| time_elapsed | 46301 | -| total_timesteps | 903168 | -| train/ | | -| approx_kl | 0.0009028902 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.5 | -| explained_variance | 0.624 | -| learning_rate | 0.0003 | -| loss | 0.00466 | -| n_updates | 70550 | -| policy_gradient_loss | 0.00058 | -| std | 0.147 | -| value_loss | 0.0133 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7057 | -| time_elapsed | 46305 | -| total_timesteps | 903296 | -| train/ | | -| approx_kl | 0.004135535 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.5 | -| explained_variance | 0.245 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 70560 | -| policy_gradient_loss | -0.000914 | -| std | 0.147 | -| value_loss | 0.00126 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7058 | -| time_elapsed | 46308 | -| total_timesteps | 903424 | -| train/ | | -| approx_kl | 0.034145243 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -3.26 | -| learning_rate | 0.0003 | -| loss | -0.00602 | -| n_updates | 70570 | -| policy_gradient_loss | -0.00533 | -| std | 0.147 | -| value_loss | 0.00634 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7059 | -| time_elapsed | 46311 | -| total_timesteps | 903552 | -| train/ | | -| approx_kl | 0.01756462 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | 0.00594 | -| n_updates | 70580 | -| policy_gradient_loss | 0.00164 | -| std | 0.147 | -| value_loss | 0.00122 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7060 | -| time_elapsed | 46314 | -| total_timesteps | 903680 | -| train/ | | -| approx_kl | 0.0080000935 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -39.9 | -| learning_rate | 0.0003 | -| loss | -7.84e-05 | -| n_updates | 70590 | -| policy_gradient_loss | -5.95e-05 | -| std | 0.147 | -| value_loss | 4.24e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7061 | -| time_elapsed | 46317 | -| total_timesteps | 903808 | -| train/ | | -| approx_kl | 0.024524886 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 70600 | -| policy_gradient_loss | -0.00558 | -| std | 0.147 | -| value_loss | 7.93e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.23 | -| time/ | | -| fps | 19 | -| iterations | 7062 | -| time_elapsed | 46322 | -| total_timesteps | 903936 | -| train/ | | -| approx_kl | 0.003630282 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 0.5 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | 0.000283 | -| n_updates | 70610 | -| policy_gradient_loss | -6.33e-05 | -| std | 0.147 | -| value_loss | 2.79e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7063 | -| time_elapsed | 46325 | -| total_timesteps | 904064 | -| train/ | | -| approx_kl | 0.032166425 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.497 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 70620 | -| policy_gradient_loss | -0.00598 | -| std | 0.147 | -| value_loss | 2.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7064 | -| time_elapsed | 46331 | -| total_timesteps | 904192 | -| train/ | | -| approx_kl | 0.023879567 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.496 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 70630 | -| policy_gradient_loss | -0.0154 | -| std | 0.147 | -| value_loss | 0.00654 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7065 | -| time_elapsed | 46334 | -| total_timesteps | 904320 | -| train/ | | -| approx_kl | 0.0037922487 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.497 | -| explained_variance | 0.0481 | -| learning_rate | 0.0003 | -| loss | -0.000425 | -| n_updates | 70640 | -| policy_gradient_loss | -0.000202 | -| std | 0.147 | -| value_loss | 6.87e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7066 | -| time_elapsed | 46336 | -| total_timesteps | 904448 | -| train/ | | -| approx_kl | 0.029538115 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 0.5 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 70650 | -| policy_gradient_loss | -0.00344 | -| std | 0.147 | -| value_loss | 7.57e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7067 | -| time_elapsed | 46340 | -| total_timesteps | 904576 | -| train/ | | -| approx_kl | 0.00055131456 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -41.8 | -| learning_rate | 0.0003 | -| loss | -0.000467 | -| n_updates | 70660 | -| policy_gradient_loss | -0.000144 | -| std | 0.147 | -| value_loss | 2.69e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7068 | -| time_elapsed | 46343 | -| total_timesteps | 904704 | -| train/ | | -| approx_kl | 0.006325044 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 0.496 | -| explained_variance | -5.11 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 70670 | -| policy_gradient_loss | -0.000281 | -| std | 0.148 | -| value_loss | 9.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7069 | -| time_elapsed | 46347 | -| total_timesteps | 904832 | -| train/ | | -| approx_kl | 0.01637958 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.494 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 70680 | -| policy_gradient_loss | -0.00139 | -| std | 0.148 | -| value_loss | 7.8e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.15 | -| time/ | | -| fps | 19 | -| iterations | 7070 | -| time_elapsed | 46351 | -| total_timesteps | 904960 | -| train/ | | -| approx_kl | 0.008077843 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.493 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 70690 | -| policy_gradient_loss | -0.00133 | -| std | 0.148 | -| value_loss | 2.32e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7071 | -| time_elapsed | 46355 | -| total_timesteps | 905088 | -| train/ | | -| approx_kl | 0.00034443708 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.496 | -| explained_variance | -0.0542 | -| learning_rate | 0.0003 | -| loss | -0.000878 | -| n_updates | 70700 | -| policy_gradient_loss | -0.000276 | -| std | 0.147 | -| value_loss | 1.05e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7072 | -| time_elapsed | 46362 | -| total_timesteps | 905216 | -| train/ | | -| approx_kl | 0.015568692 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.502 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 70710 | -| policy_gradient_loss | -0.00771 | -| std | 0.146 | -| value_loss | 0.000931 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7073 | -| time_elapsed | 46366 | -| total_timesteps | 905344 | -| train/ | | -| approx_kl | 0.0014502723 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.503 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.000687 | -| n_updates | 70720 | -| policy_gradient_loss | -0.00036 | -| std | 0.146 | -| value_loss | 2.39e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7074 | -| time_elapsed | 46370 | -| total_timesteps | 905472 | -| train/ | | -| approx_kl | 0.027800739 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.502 | -| explained_variance | -45.5 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 70730 | -| policy_gradient_loss | -0.00522 | -| std | 0.147 | -| value_loss | 6.78e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7075 | -| time_elapsed | 46374 | -| total_timesteps | 905600 | -| train/ | | -| approx_kl | 0.021888776 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -0.631 | -| learning_rate | 0.0003 | -| loss | 0.00633 | -| n_updates | 70740 | -| policy_gradient_loss | 0.000576 | -| std | 0.147 | -| value_loss | 5.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7076 | -| time_elapsed | 46377 | -| total_timesteps | 905728 | -| train/ | | -| approx_kl | 0.0073646572 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | -0.642 | -| learning_rate | 0.0003 | -| loss | -0.000155 | -| n_updates | 70750 | -| policy_gradient_loss | 0.000916 | -| std | 0.146 | -| value_loss | 3.91e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7077 | -| time_elapsed | 46381 | -| total_timesteps | 905856 | -| train/ | | -| approx_kl | 0.0068803863 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.503 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 70760 | -| policy_gradient_loss | 0.000622 | -| std | 0.146 | -| value_loss | 5.47e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.14 | -| time/ | | -| fps | 19 | -| iterations | 7078 | -| time_elapsed | 46384 | -| total_timesteps | 905984 | -| train/ | | -| approx_kl | 0.00944942 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.503 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 70770 | -| policy_gradient_loss | -0.00157 | -| std | 0.146 | -| value_loss | 3.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7079 | -| time_elapsed | 46387 | -| total_timesteps | 906112 | -| train/ | | -| approx_kl | 0.019056907 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.503 | -| explained_variance | 0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 70780 | -| policy_gradient_loss | -0.0021 | -| std | 0.146 | -| value_loss | 3.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7080 | -| time_elapsed | 46395 | -| total_timesteps | 906240 | -| train/ | | -| approx_kl | 0.004893742 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.503 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 70790 | -| policy_gradient_loss | -0.00105 | -| std | 0.147 | -| value_loss | 0.000199 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7081 | -| time_elapsed | 46399 | -| total_timesteps | 906368 | -| train/ | | -| approx_kl | 0.020693552 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.501 | -| explained_variance | 0.000469 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 70800 | -| policy_gradient_loss | -0.0089 | -| std | 0.147 | -| value_loss | 4.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7082 | -| time_elapsed | 46401 | -| total_timesteps | 906496 | -| train/ | | -| approx_kl | 0.009898121 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 0.5 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 70810 | -| policy_gradient_loss | -0.00406 | -| std | 0.147 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7083 | -| time_elapsed | 46405 | -| total_timesteps | 906624 | -| train/ | | -| approx_kl | 0.019193534 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.5 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 70820 | -| policy_gradient_loss | -0.00175 | -| std | 0.147 | -| value_loss | 1.16e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7084 | -| time_elapsed | 46408 | -| total_timesteps | 906752 | -| train/ | | -| approx_kl | 0.0020235516 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.502 | -| explained_variance | 0.00476 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 70830 | -| policy_gradient_loss | -0.00039 | -| std | 0.146 | -| value_loss | 1.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.13 | -| time/ | | -| fps | 19 | -| iterations | 7085 | -| time_elapsed | 46413 | -| total_timesteps | 906880 | -| train/ | | -| approx_kl | 0.0030486146 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 0.504 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 70840 | -| policy_gradient_loss | -0.00535 | -| std | 0.146 | -| value_loss | 1.02e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7086 | -| time_elapsed | 46416 | -| total_timesteps | 907008 | -| train/ | | -| approx_kl | 0.017650465 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.504 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 70850 | -| policy_gradient_loss | -0.00893 | -| std | 0.146 | -| value_loss | 3.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7087 | -| time_elapsed | 46424 | -| total_timesteps | 907136 | -| train/ | | -| approx_kl | 0.018333703 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.505 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | -0.000943 | -| n_updates | 70860 | -| policy_gradient_loss | -0.00197 | -| std | 0.146 | -| value_loss | 0.00219 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7088 | -| time_elapsed | 46427 | -| total_timesteps | 907264 | -| train/ | | -| approx_kl | 0.0157289 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 0.507 | -| explained_variance | 0.529 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 70870 | -| policy_gradient_loss | -0.00823 | -| std | 0.146 | -| value_loss | 0.000188 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7089 | -| time_elapsed | 46430 | -| total_timesteps | 907392 | -| train/ | | -| approx_kl | 0.021133369 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.507 | -| explained_variance | -11.6 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 70880 | -| policy_gradient_loss | -0.0061 | -| std | 0.146 | -| value_loss | 5.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7090 | -| time_elapsed | 46433 | -| total_timesteps | 907520 | -| train/ | | -| approx_kl | 0.009249117 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 0.507 | -| explained_variance | -5.47 | -| learning_rate | 0.0003 | -| loss | -0.000994 | -| n_updates | 70890 | -| policy_gradient_loss | -0.000304 | -| std | 0.146 | -| value_loss | 1.7e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7091 | -| time_elapsed | 46436 | -| total_timesteps | 907648 | -| train/ | | -| approx_kl | 0.0020880918 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.506 | -| explained_variance | -0.527 | -| learning_rate | 0.0003 | -| loss | -0.00581 | -| n_updates | 70900 | -| policy_gradient_loss | -0.00423 | -| std | 0.146 | -| value_loss | 1.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7092 | -| time_elapsed | 46439 | -| total_timesteps | 907776 | -| train/ | | -| approx_kl | 0.017162079 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.506 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00398 | -| n_updates | 70910 | -| policy_gradient_loss | 0.000539 | -| std | 0.146 | -| value_loss | 5.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7093 | -| time_elapsed | 46442 | -| total_timesteps | 907904 | -| train/ | | -| approx_kl | 0.030883841 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.507 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.00295 | -| n_updates | 70920 | -| policy_gradient_loss | -0.00187 | -| std | 0.146 | -| value_loss | 4.59e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7094 | -| time_elapsed | 46446 | -| total_timesteps | 908032 | -| train/ | | -| approx_kl | 0.0023323935 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.508 | -| explained_variance | -0.319 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 70930 | -| policy_gradient_loss | 1.84e-05 | -| std | 0.146 | -| value_loss | 2.47e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7095 | -| time_elapsed | 46453 | -| total_timesteps | 908160 | -| train/ | | -| approx_kl | 0.023520024 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 0.508 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 70940 | -| policy_gradient_loss | -0.00365 | -| std | 0.146 | -| value_loss | 0.00393 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7096 | -| time_elapsed | 46458 | -| total_timesteps | 908288 | -| train/ | | -| approx_kl | 0.0055289646 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.509 | -| explained_variance | 0.403 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 70950 | -| policy_gradient_loss | -0.0017 | -| std | 0.145 | -| value_loss | 3.82e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7097 | -| time_elapsed | 46462 | -| total_timesteps | 908416 | -| train/ | | -| approx_kl | 0.05847139 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.511 | -| explained_variance | -8.71 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 70960 | -| policy_gradient_loss | -0.00815 | -| std | 0.145 | -| value_loss | 1.58e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7098 | -| time_elapsed | 46464 | -| total_timesteps | 908544 | -| train/ | | -| approx_kl | 0.008500138 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.513 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 70970 | -| policy_gradient_loss | 0.000655 | -| std | 0.145 | -| value_loss | 2.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7099 | -| time_elapsed | 46467 | -| total_timesteps | 908672 | -| train/ | | -| approx_kl | 0.02018023 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.515 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.00626 | -| n_updates | 70980 | -| policy_gradient_loss | 0.00121 | -| std | 0.145 | -| value_loss | 2.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7100 | -| time_elapsed | 46468 | -| total_timesteps | 908800 | -| train/ | | -| approx_kl | 0.012863617 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.516 | -| explained_variance | 0.0252 | -| learning_rate | 0.0003 | -| loss | -0.00767 | -| n_updates | 70990 | -| policy_gradient_loss | -0.00488 | -| std | 0.144 | -| value_loss | 9.71e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7101 | -| time_elapsed | 46471 | -| total_timesteps | 908928 | -| train/ | | -| approx_kl | 0.0103115905 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.517 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 71000 | -| policy_gradient_loss | 0.000908 | -| std | 0.144 | -| value_loss | 1.11e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7102 | -| time_elapsed | 46474 | -| total_timesteps | 909056 | -| train/ | | -| approx_kl | 0.008578682 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00081 | -| n_updates | 71010 | -| policy_gradient_loss | -0.000221 | -| std | 0.144 | -| value_loss | 8.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7103 | -| time_elapsed | 46480 | -| total_timesteps | 909184 | -| train/ | | -| approx_kl | 0.04558707 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 71020 | -| policy_gradient_loss | -0.00688 | -| std | 0.144 | -| value_loss | 0.000735 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7104 | -| time_elapsed | 46485 | -| total_timesteps | 909312 | -| train/ | | -| approx_kl | 0.049272176 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -54.5 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 71030 | -| policy_gradient_loss | -0.00457 | -| std | 0.144 | -| value_loss | 3.86e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7105 | -| time_elapsed | 46488 | -| total_timesteps | 909440 | -| train/ | | -| approx_kl | 0.01865841 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 71040 | -| policy_gradient_loss | -0.00096 | -| std | 0.144 | -| value_loss | 5.43e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7106 | -| time_elapsed | 46491 | -| total_timesteps | 909568 | -| train/ | | -| approx_kl | 0.0047350586 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.00092 | -| n_updates | 71050 | -| policy_gradient_loss | 0.00277 | -| std | 0.144 | -| value_loss | 5.65e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7107 | -| time_elapsed | 46494 | -| total_timesteps | 909696 | -| train/ | | -| approx_kl | 0.02213459 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -2.39 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 71060 | -| policy_gradient_loss | -0.00284 | -| std | 0.144 | -| value_loss | 7.58e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7108 | -| time_elapsed | 46496 | -| total_timesteps | 909824 | -| train/ | | -| approx_kl | 0.018776257 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -3.65 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 71070 | -| policy_gradient_loss | -0.00125 | -| std | 0.144 | -| value_loss | 4.77e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.09 | -| time/ | | -| fps | 19 | -| iterations | 7109 | -| time_elapsed | 46499 | -| total_timesteps | 909952 | -| train/ | | -| approx_kl | 0.0227913 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -1.58 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 71080 | -| policy_gradient_loss | -0.0165 | -| std | 0.144 | -| value_loss | 0.000139 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7110 | -| time_elapsed | 46501 | -| total_timesteps | 910080 | -| train/ | | -| approx_kl | 0.05002178 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -2.37 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 71090 | -| policy_gradient_loss | -0.0135 | -| std | 0.144 | -| value_loss | 0.00023 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7111 | -| time_elapsed | 46506 | -| total_timesteps | 910208 | -| train/ | | -| approx_kl | 0.005170448 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | 0.456 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 71100 | -| policy_gradient_loss | -0.0033 | -| std | 0.144 | -| value_loss | 0.00665 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7112 | -| time_elapsed | 46511 | -| total_timesteps | 910336 | -| train/ | | -| approx_kl | 0.029217467 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.517 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | 0.00914 | -| n_updates | 71110 | -| policy_gradient_loss | 0.000621 | -| std | 0.144 | -| value_loss | 0.000125 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7113 | -| time_elapsed | 46515 | -| total_timesteps | 910464 | -| train/ | | -| approx_kl | 0.011698913 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | 0.00464 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 71120 | -| policy_gradient_loss | -0.000536 | -| std | 0.144 | -| value_loss | 9.6e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7114 | -| time_elapsed | 46518 | -| total_timesteps | 910592 | -| train/ | | -| approx_kl | 0.019316882 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -0.821 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 71130 | -| policy_gradient_loss | -0.00329 | -| std | 0.144 | -| value_loss | 2.3e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7115 | -| time_elapsed | 46522 | -| total_timesteps | 910720 | -| train/ | | -| approx_kl | 0.00047327252 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.52 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | -0.000633 | -| n_updates | 71140 | -| policy_gradient_loss | 0.000164 | -| std | 0.144 | -| value_loss | 1.01e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7116 | -| time_elapsed | 46527 | -| total_timesteps | 910848 | -| train/ | | -| approx_kl | 0.023414318 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.523 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00087 | -| n_updates | 71150 | -| policy_gradient_loss | -0.00269 | -| std | 0.143 | -| value_loss | 9.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.08 | -| time/ | | -| fps | 19 | -| iterations | 7117 | -| time_elapsed | 46531 | -| total_timesteps | 910976 | -| train/ | | -| approx_kl | 0.009907233 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.524 | -| explained_variance | 0.0252 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 71160 | -| policy_gradient_loss | -0.000923 | -| std | 0.143 | -| value_loss | 5.83e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7118 | -| time_elapsed | 46535 | -| total_timesteps | 911104 | -| train/ | | -| approx_kl | 0.026689293 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.00332 | -| n_updates | 71170 | -| policy_gradient_loss | -0.00183 | -| std | 0.143 | -| value_loss | 4.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7119 | -| time_elapsed | 46544 | -| total_timesteps | 911232 | -| train/ | | -| approx_kl | 0.045732982 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 71180 | -| policy_gradient_loss | -0.00635 | -| std | 0.143 | -| value_loss | 0.000905 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7120 | -| time_elapsed | 46548 | -| total_timesteps | 911360 | -| train/ | | -| approx_kl | 0.027179202 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.526 | -| explained_variance | -0.511 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 71190 | -| policy_gradient_loss | -0.0114 | -| std | 0.143 | -| value_loss | 5.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7121 | -| time_elapsed | 46551 | -| total_timesteps | 911488 | -| train/ | | -| approx_kl | 0.004793337 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.527 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00039 | -| n_updates | 71200 | -| policy_gradient_loss | 0.00278 | -| std | 0.143 | -| value_loss | 1.61e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7122 | -| time_elapsed | 46555 | -| total_timesteps | 911616 | -| train/ | | -| approx_kl | 0.02845883 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 0.528 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 71210 | -| policy_gradient_loss | -0.00508 | -| std | 0.143 | -| value_loss | 1.57e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7123 | -| time_elapsed | 46559 | -| total_timesteps | 911744 | -| train/ | | -| approx_kl | 0.031483393 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.528 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 71220 | -| policy_gradient_loss | -0.00467 | -| std | 0.143 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7124 | -| time_elapsed | 46562 | -| total_timesteps | 911872 | -| train/ | | -| approx_kl | 0.030267352 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 0.528 | -| explained_variance | -0.404 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 71230 | -| policy_gradient_loss | -0.0148 | -| std | 0.143 | -| value_loss | 3.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7125 | -| time_elapsed | 46565 | -| total_timesteps | 912000 | -| train/ | | -| approx_kl | 0.013794301 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.529 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.000939 | -| n_updates | 71240 | -| policy_gradient_loss | -0.00019 | -| std | 0.142 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7126 | -| time_elapsed | 46569 | -| total_timesteps | 912128 | -| train/ | | -| approx_kl | 0.0035113925 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.53 | -| explained_variance | 0.00135 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 71250 | -| policy_gradient_loss | -0.00171 | -| std | 0.142 | -| value_loss | 1.22e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7127 | -| time_elapsed | 46577 | -| total_timesteps | 912256 | -| train/ | | -| approx_kl | 0.041178327 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.53 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 71260 | -| policy_gradient_loss | -0.0105 | -| std | 0.142 | -| value_loss | 0.00136 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7128 | -| time_elapsed | 46580 | -| total_timesteps | 912384 | -| train/ | | -| approx_kl | 0.0022074333 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.53 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 71270 | -| policy_gradient_loss | -0.00215 | -| std | 0.142 | -| value_loss | 1.29e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7129 | -| time_elapsed | 46582 | -| total_timesteps | 912512 | -| train/ | | -| approx_kl | 0.021880403 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.531 | -| explained_variance | -14 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 71280 | -| policy_gradient_loss | -0.00183 | -| std | 0.142 | -| value_loss | 2.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7130 | -| time_elapsed | 46585 | -| total_timesteps | 912640 | -| train/ | | -| approx_kl | 0.005731307 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.53 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 71290 | -| policy_gradient_loss | 0.00187 | -| std | 0.143 | -| value_loss | 1.78e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7131 | -| time_elapsed | 46589 | -| total_timesteps | 912768 | -| train/ | | -| approx_kl | 0.00082783774 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.526 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 71300 | -| policy_gradient_loss | -0.00193 | -| std | 0.143 | -| value_loss | 3.61e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7132 | -| time_elapsed | 46593 | -| total_timesteps | 912896 | -| train/ | | -| approx_kl | 0.009051049 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.526 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0003 | -| n_updates | 71310 | -| policy_gradient_loss | 9.49e-05 | -| std | 0.143 | -| value_loss | 7.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7133 | -| time_elapsed | 46597 | -| total_timesteps | 913024 | -| train/ | | -| approx_kl | 0.03313209 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | -0.621 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 71320 | -| policy_gradient_loss | -0.0047 | -| std | 0.143 | -| value_loss | 1.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7134 | -| time_elapsed | 46607 | -| total_timesteps | 913152 | -| train/ | | -| approx_kl | 0.019623531 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | 0.781 | -| learning_rate | 0.0003 | -| loss | 0.00156 | -| n_updates | 71330 | -| policy_gradient_loss | -0.00139 | -| std | 0.143 | -| value_loss | 0.00485 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7135 | -| time_elapsed | 46609 | -| total_timesteps | 913280 | -| train/ | | -| approx_kl | 0.00041122362 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 0.526 | -| explained_variance | 0.324 | -| learning_rate | 0.0003 | -| loss | -0.00034 | -| n_updates | 71340 | -| policy_gradient_loss | -0.000131 | -| std | 0.143 | -| value_loss | 1.23e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7136 | -| time_elapsed | 46612 | -| total_timesteps | 913408 | -| train/ | | -| approx_kl | 0.012780979 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.527 | -| explained_variance | -4.03 | -| learning_rate | 0.0003 | -| loss | -0.00489 | -| n_updates | 71350 | -| policy_gradient_loss | -0.00333 | -| std | 0.143 | -| value_loss | 1.02e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7137 | -| time_elapsed | 46615 | -| total_timesteps | 913536 | -| train/ | | -| approx_kl | 0.01420213 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.527 | -| explained_variance | -0.489 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 71360 | -| policy_gradient_loss | -0.007 | -| std | 0.143 | -| value_loss | 1.27e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7138 | -| time_elapsed | 46619 | -| total_timesteps | 913664 | -| train/ | | -| approx_kl | 0.008443767 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.526 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 71370 | -| policy_gradient_loss | -0.000334 | -| std | 0.143 | -| value_loss | 6.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7139 | -| time_elapsed | 46624 | -| total_timesteps | 913792 | -| train/ | | -| approx_kl | 0.010982626 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 71380 | -| policy_gradient_loss | -0.0024 | -| std | 0.143 | -| value_loss | 8.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7140 | -| time_elapsed | 46627 | -| total_timesteps | 913920 | -| train/ | | -| approx_kl | 0.0014040852 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 0.524 | -| explained_variance | -9.16 | -| learning_rate | 0.0003 | -| loss | -0.000963 | -| n_updates | 71390 | -| policy_gradient_loss | -0.000835 | -| std | 0.143 | -| value_loss | 2.35e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7141 | -| time_elapsed | 46631 | -| total_timesteps | 914048 | -| train/ | | -| approx_kl | 0.02848662 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.524 | -| explained_variance | -9.52 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 71400 | -| policy_gradient_loss | -0.00223 | -| std | 0.143 | -| value_loss | 1.5e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7142 | -| time_elapsed | 46635 | -| total_timesteps | 914176 | -| train/ | | -| approx_kl | 0.00841153 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.524 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 71410 | -| policy_gradient_loss | 0.00509 | -| std | 0.143 | -| value_loss | 0.00278 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7143 | -| time_elapsed | 46639 | -| total_timesteps | 914304 | -| train/ | | -| approx_kl | 0.019394431 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | 0.0059 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 71420 | -| policy_gradient_loss | -0.0024 | -| std | 0.143 | -| value_loss | 1.21e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7144 | -| time_elapsed | 46642 | -| total_timesteps | 914432 | -| train/ | | -| approx_kl | 0.013838565 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.525 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 71430 | -| policy_gradient_loss | -0.00376 | -| std | 0.143 | -| value_loss | 6.93e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7145 | -| time_elapsed | 46646 | -| total_timesteps | 914560 | -| train/ | | -| approx_kl | 0.015222678 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 0.523 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | 0.00301 | -| n_updates | 71440 | -| policy_gradient_loss | 0.000423 | -| std | 0.143 | -| value_loss | 8.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7146 | -| time_elapsed | 46650 | -| total_timesteps | 914688 | -| train/ | | -| approx_kl | 0.010697873 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.523 | -| explained_variance | -0.00616 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 71450 | -| policy_gradient_loss | -0.00373 | -| std | 0.143 | -| value_loss | 1.48e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7147 | -| time_elapsed | 46654 | -| total_timesteps | 914816 | -| train/ | | -| approx_kl | 0.01585291 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.522 | -| explained_variance | 0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0041 | -| n_updates | 71460 | -| policy_gradient_loss | 0.000832 | -| std | 0.144 | -| value_loss | 1.08e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7148 | -| time_elapsed | 46657 | -| total_timesteps | 914944 | -| train/ | | -| approx_kl | 0.03289156 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 0.521 | -| explained_variance | -0.751 | -| learning_rate | 0.0003 | -| loss | -0.00489 | -| n_updates | 71470 | -| policy_gradient_loss | -0.00512 | -| std | 0.144 | -| value_loss | 3.05e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7149 | -| time_elapsed | 46659 | -| total_timesteps | 915072 | -| train/ | | -| approx_kl | 0.01659828 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.52 | -| explained_variance | -0.00574 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 71480 | -| policy_gradient_loss | -0.00562 | -| std | 0.144 | -| value_loss | 3.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7150 | -| time_elapsed | 46666 | -| total_timesteps | 915200 | -| train/ | | -| approx_kl | 0.039109357 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -3.29 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 71490 | -| policy_gradient_loss | -0.00989 | -| std | 0.144 | -| value_loss | 0.00454 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7151 | -| time_elapsed | 46669 | -| total_timesteps | 915328 | -| train/ | | -| approx_kl | 0.031506874 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 71500 | -| policy_gradient_loss | -0.00671 | -| std | 0.144 | -| value_loss | 4.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7152 | -| time_elapsed | 46674 | -| total_timesteps | 915456 | -| train/ | | -| approx_kl | 0.027240802 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.517 | -| explained_variance | -69.5 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 71510 | -| policy_gradient_loss | -0.0114 | -| std | 0.144 | -| value_loss | 8.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7153 | -| time_elapsed | 46677 | -| total_timesteps | 915584 | -| train/ | | -| approx_kl | 0.032935537 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.516 | -| explained_variance | -66.7 | -| learning_rate | 0.0003 | -| loss | -0.0298 | -| n_updates | 71520 | -| policy_gradient_loss | -0.0122 | -| std | 0.144 | -| value_loss | 6.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7154 | -| time_elapsed | 46681 | -| total_timesteps | 915712 | -| train/ | | -| approx_kl | 0.033520795 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.516 | -| explained_variance | -70.9 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 71530 | -| policy_gradient_loss | -0.00756 | -| std | 0.144 | -| value_loss | 8.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7155 | -| time_elapsed | 46685 | -| total_timesteps | 915840 | -| train/ | | -| approx_kl | 0.014180094 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.516 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 71540 | -| policy_gradient_loss | -0.00153 | -| std | 0.144 | -| value_loss | 9.02e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.07 | -| time/ | | -| fps | 19 | -| iterations | 7156 | -| time_elapsed | 46688 | -| total_timesteps | 915968 | -| train/ | | -| approx_kl | 0.0027272054 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.517 | -| explained_variance | -8.57 | -| learning_rate | 0.0003 | -| loss | -0.000832 | -| n_updates | 71550 | -| policy_gradient_loss | 0.000463 | -| std | 0.144 | -| value_loss | 8.74e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7157 | -| time_elapsed | 46691 | -| total_timesteps | 916096 | -| train/ | | -| approx_kl | 0.047327477 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.518 | -| explained_variance | -5.34 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 71560 | -| policy_gradient_loss | -0.00916 | -| std | 0.144 | -| value_loss | 6.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7158 | -| time_elapsed | 46698 | -| total_timesteps | 916224 | -| train/ | | -| approx_kl | 0.04370086 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -0.838 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 71570 | -| policy_gradient_loss | -0.014 | -| std | 0.144 | -| value_loss | 0.00177 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7159 | -| time_elapsed | 46701 | -| total_timesteps | 916352 | -| train/ | | -| approx_kl | 0.0011755824 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | -0.000617 | -| n_updates | 71580 | -| policy_gradient_loss | -0.000423 | -| std | 0.144 | -| value_loss | 0.000333 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7160 | -| time_elapsed | 46705 | -| total_timesteps | 916480 | -| train/ | | -| approx_kl | 0.006861124 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.000924 | -| n_updates | 71590 | -| policy_gradient_loss | 0.00221 | -| std | 0.144 | -| value_loss | 0.000107 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7161 | -| time_elapsed | 46708 | -| total_timesteps | 916608 | -| train/ | | -| approx_kl | 0.015104694 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.519 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 71600 | -| policy_gradient_loss | -0.00286 | -| std | 0.144 | -| value_loss | 4.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7162 | -| time_elapsed | 46712 | -| total_timesteps | 916736 | -| train/ | | -| approx_kl | 0.00812903 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 0.52 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.000492 | -| n_updates | 71610 | -| policy_gradient_loss | 0.00126 | -| std | 0.144 | -| value_loss | 5.45e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7163 | -| time_elapsed | 46716 | -| total_timesteps | 916864 | -| train/ | | -| approx_kl | 0.002215826 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.522 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 71620 | -| policy_gradient_loss | 0.00158 | -| std | 0.144 | -| value_loss | 2.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7164 | -| time_elapsed | 46720 | -| total_timesteps | 916992 | -| train/ | | -| approx_kl | 0.012905551 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.521 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.00698 | -| n_updates | 71630 | -| policy_gradient_loss | 0.00199 | -| std | 0.144 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7165 | -| time_elapsed | 46724 | -| total_timesteps | 917120 | -| train/ | | -| approx_kl | 0.011256969 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.521 | -| explained_variance | 0.0186 | -| learning_rate | 0.0003 | -| loss | 0.000529 | -| n_updates | 71640 | -| policy_gradient_loss | 0.000386 | -| std | 0.144 | -| value_loss | 2.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7166 | -| time_elapsed | 46734 | -| total_timesteps | 917248 | -| train/ | | -| approx_kl | 0.025944548 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.521 | -| explained_variance | 0.455 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 71650 | -| policy_gradient_loss | -0.0109 | -| std | 0.144 | -| value_loss | 0.00201 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7167 | -| time_elapsed | 46738 | -| total_timesteps | 917376 | -| train/ | | -| approx_kl | 0.015706573 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.522 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 71660 | -| policy_gradient_loss | -0.00398 | -| std | 0.144 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7168 | -| time_elapsed | 46742 | -| total_timesteps | 917504 | -| train/ | | -| approx_kl | 0.032897968 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.522 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 71670 | -| policy_gradient_loss | -0.00474 | -| std | 0.144 | -| value_loss | 3.67e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7169 | -| time_elapsed | 46746 | -| total_timesteps | 917632 | -| train/ | | -| approx_kl | 0.0013300083 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 0.523 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.000619 | -| n_updates | 71680 | -| policy_gradient_loss | -0.000376 | -| std | 0.143 | -| value_loss | 6.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7170 | -| time_elapsed | 46750 | -| total_timesteps | 917760 | -| train/ | | -| approx_kl | 0.012070008 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.526 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.000235 | -| n_updates | 71690 | -| policy_gradient_loss | -0.000109 | -| std | 0.143 | -| value_loss | 3.09e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7171 | -| time_elapsed | 46753 | -| total_timesteps | 917888 | -| train/ | | -| approx_kl | 0.0127341915 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 0.528 | -| explained_variance | -0.00161 | -| learning_rate | 0.0003 | -| loss | -0.0266 | -| n_updates | 71700 | -| policy_gradient_loss | -0.0198 | -| std | 0.143 | -| value_loss | 3.61e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7172 | -| time_elapsed | 46756 | -| total_timesteps | 918016 | -| train/ | | -| approx_kl | 0.0032535703 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.528 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00498 | -| n_updates | 71710 | -| policy_gradient_loss | -0.00131 | -| std | 0.143 | -| value_loss | 1.1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7173 | -| time_elapsed | 46763 | -| total_timesteps | 918144 | -| train/ | | -| approx_kl | 0.037932295 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 0.529 | -| explained_variance | 0.0169 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 71720 | -| policy_gradient_loss | -0.0105 | -| std | 0.143 | -| value_loss | 0.00105 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7174 | -| time_elapsed | 46767 | -| total_timesteps | 918272 | -| train/ | | -| approx_kl | 0.0017039105 | -| clip_fraction | 0.00547 | -| clip_range | 0.2 | -| entropy_loss | 0.53 | -| explained_variance | 0.00317 | -| learning_rate | 0.0003 | -| loss | -0.000551 | -| n_updates | 71730 | -| policy_gradient_loss | -0.000264 | -| std | 0.142 | -| value_loss | 1.56e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7175 | -| time_elapsed | 46769 | -| total_timesteps | 918400 | -| train/ | | -| approx_kl | 0.012990081 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.534 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 71740 | -| policy_gradient_loss | 0.000717 | -| std | 0.142 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7176 | -| time_elapsed | 46771 | -| total_timesteps | 918528 | -| train/ | | -| approx_kl | 0.028163247 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.536 | -| explained_variance | -0.0753 | -| learning_rate | 0.0003 | -| loss | 4.8e-05 | -| n_updates | 71750 | -| policy_gradient_loss | -0.00239 | -| std | 0.141 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7177 | -| time_elapsed | 46774 | -| total_timesteps | 918656 | -| train/ | | -| approx_kl | 0.004242988 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.538 | -| explained_variance | -0.493 | -| learning_rate | 0.0003 | -| loss | -0.000959 | -| n_updates | 71760 | -| policy_gradient_loss | 9.59e-05 | -| std | 0.141 | -| value_loss | 6.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7178 | -| time_elapsed | 46776 | -| total_timesteps | 918784 | -| train/ | | -| approx_kl | 0.018278329 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.538 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 71770 | -| policy_gradient_loss | -0.00202 | -| std | 0.141 | -| value_loss | 1.75e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7179 | -| time_elapsed | 46779 | -| total_timesteps | 918912 | -| train/ | | -| approx_kl | 0.0012744409 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.538 | -| explained_variance | 0.00653 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 71780 | -| policy_gradient_loss | 0.000669 | -| std | 0.141 | -| value_loss | 4.35e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7180 | -| time_elapsed | 46781 | -| total_timesteps | 919040 | -| train/ | | -| approx_kl | 0.009356512 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.538 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 71790 | -| policy_gradient_loss | 0.000618 | -| std | 0.141 | -| value_loss | 3.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7181 | -| time_elapsed | 46789 | -| total_timesteps | 919168 | -| train/ | | -| approx_kl | 0.020186037 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.539 | -| explained_variance | 0.378 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 71800 | -| policy_gradient_loss | -0.00119 | -| std | 0.141 | -| value_loss | 0.0298 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7182 | -| time_elapsed | 46793 | -| total_timesteps | 919296 | -| train/ | | -| approx_kl | 0.017632365 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 0.54 | -| explained_variance | -0.521 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 71810 | -| policy_gradient_loss | -0.00234 | -| std | 0.141 | -| value_loss | 8.52e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7183 | -| time_elapsed | 46797 | -| total_timesteps | 919424 | -| train/ | | -| approx_kl | 0.0329394 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.54 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 71820 | -| policy_gradient_loss | -0.00852 | -| std | 0.141 | -| value_loss | 0.000105 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7184 | -| time_elapsed | 46801 | -| total_timesteps | 919552 | -| train/ | | -| approx_kl | 0.0019349433 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.54 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 71830 | -| policy_gradient_loss | -0.00121 | -| std | 0.141 | -| value_loss | 2.96e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7185 | -| time_elapsed | 46805 | -| total_timesteps | 919680 | -| train/ | | -| approx_kl | 0.01695317 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.541 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.000388 | -| n_updates | 71840 | -| policy_gradient_loss | -0.00071 | -| std | 0.141 | -| value_loss | 1.76e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7186 | -| time_elapsed | 46808 | -| total_timesteps | 919808 | -| train/ | | -| approx_kl | 0.018653871 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.541 | -| explained_variance | 0.00316 | -| learning_rate | 0.0003 | -| loss | -0.000885 | -| n_updates | 71850 | -| policy_gradient_loss | -0.00224 | -| std | 0.141 | -| value_loss | 2.69e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7187 | -| time_elapsed | 46811 | -| total_timesteps | 919936 | -| train/ | | -| approx_kl | 0.042552672 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 0.541 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 71860 | -| policy_gradient_loss | -0.0118 | -| std | 0.141 | -| value_loss | 1.05e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7188 | -| time_elapsed | 46815 | -| total_timesteps | 920064 | -| train/ | | -| approx_kl | 0.02588746 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.542 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 71870 | -| policy_gradient_loss | -0.00555 | -| std | 0.141 | -| value_loss | 6.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7189 | -| time_elapsed | 46821 | -| total_timesteps | 920192 | -| train/ | | -| approx_kl | 0.06449701 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 0.543 | -| explained_variance | -0.449 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 71880 | -| policy_gradient_loss | -0.0157 | -| std | 0.141 | -| value_loss | 0.00167 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7190 | -| time_elapsed | 46824 | -| total_timesteps | 920320 | -| train/ | | -| approx_kl | 0.011265397 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.543 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | -0.000702 | -| n_updates | 71890 | -| policy_gradient_loss | -0.000542 | -| std | 0.14 | -| value_loss | 6.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7191 | -| time_elapsed | 46827 | -| total_timesteps | 920448 | -| train/ | | -| approx_kl | 0.0048654843 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.545 | -| explained_variance | -0.727 | -| learning_rate | 0.0003 | -| loss | -0.000963 | -| n_updates | 71900 | -| policy_gradient_loss | -0.000415 | -| std | 0.14 | -| value_loss | 2.31e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7192 | -| time_elapsed | 46830 | -| total_timesteps | 920576 | -| train/ | | -| approx_kl | 0.028338948 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.546 | -| explained_variance | 0.00254 | -| learning_rate | 0.0003 | -| loss | 0.00791 | -| n_updates | 71910 | -| policy_gradient_loss | -2.45e-07 | -| std | 0.14 | -| value_loss | 2.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7193 | -| time_elapsed | 46834 | -| total_timesteps | 920704 | -| train/ | | -| approx_kl | 0.006246564 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 0.547 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 71920 | -| policy_gradient_loss | -0.0127 | -| std | 0.14 | -| value_loss | 3.01e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7194 | -| time_elapsed | 46837 | -| total_timesteps | 920832 | -| train/ | | -| approx_kl | 0.00021600304 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 0.548 | -| explained_variance | -0.0692 | -| learning_rate | 0.0003 | -| loss | -9.74e-05 | -| n_updates | 71930 | -| policy_gradient_loss | 7.25e-05 | -| std | 0.14 | -| value_loss | 5.43e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7195 | -| time_elapsed | 46841 | -| total_timesteps | 920960 | -| train/ | | -| approx_kl | 0.046746556 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 0.551 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | -0.00983 | -| n_updates | 71940 | -| policy_gradient_loss | -0.0109 | -| std | 0.139 | -| value_loss | 4.99e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7196 | -| time_elapsed | 46845 | -| total_timesteps | 921088 | -| train/ | | -| approx_kl | 0.0026491997 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.554 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | -0.000785 | -| n_updates | 71950 | -| policy_gradient_loss | -0.00036 | -| std | 0.139 | -| value_loss | 1.97e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7197 | -| time_elapsed | 46852 | -| total_timesteps | 921216 | -| train/ | | -| approx_kl | 0.009819291 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.558 | -| explained_variance | 0.105 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 71960 | -| policy_gradient_loss | -0.00585 | -| std | 0.138 | -| value_loss | 0.0601 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7198 | -| time_elapsed | 46856 | -| total_timesteps | 921344 | -| train/ | | -| approx_kl | 0.0063452516 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.56 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 71970 | -| policy_gradient_loss | 0.00171 | -| std | 0.138 | -| value_loss | 0.00132 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7199 | -| time_elapsed | 46860 | -| total_timesteps | 921472 | -| train/ | | -| approx_kl | 0.021060377 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 0.561 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.00428 | -| n_updates | 71980 | -| policy_gradient_loss | 0.0035 | -| std | 0.138 | -| value_loss | 0.00219 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7200 | -| time_elapsed | 46864 | -| total_timesteps | 921600 | -| train/ | | -| approx_kl | 0.014904426 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 0.562 | -| explained_variance | -0.436 | -| learning_rate | 0.0003 | -| loss | -0.000345 | -| n_updates | 71990 | -| policy_gradient_loss | 0.00156 | -| std | 0.138 | -| value_loss | 0.000894 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7201 | -| time_elapsed | 46867 | -| total_timesteps | 921728 | -| train/ | | -| approx_kl | 0.01976213 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.563 | -| explained_variance | -0.389 | -| learning_rate | 0.0003 | -| loss | 0.000835 | -| n_updates | 72000 | -| policy_gradient_loss | -0.000439 | -| std | 0.138 | -| value_loss | 0.000119 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7202 | -| time_elapsed | 46871 | -| total_timesteps | 921856 | -| train/ | | -| approx_kl | 0.008558426 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.563 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 72010 | -| policy_gradient_loss | -0.000737 | -| std | 0.138 | -| value_loss | 4.9e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7203 | -| time_elapsed | 46874 | -| total_timesteps | 921984 | -| train/ | | -| approx_kl | 0.008479709 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 0.563 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00726 | -| n_updates | 72020 | -| policy_gradient_loss | -0.00403 | -| std | 0.138 | -| value_loss | 8.87e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7204 | -| time_elapsed | 46876 | -| total_timesteps | 922112 | -| train/ | | -| approx_kl | 0.034916967 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 0.564 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 72030 | -| policy_gradient_loss | -0.0101 | -| std | 0.138 | -| value_loss | 9.45e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7205 | -| time_elapsed | 46887 | -| total_timesteps | 922240 | -| train/ | | -| approx_kl | 0.031986963 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.565 | -| explained_variance | -0.634 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 72040 | -| policy_gradient_loss | -0.0143 | -| std | 0.138 | -| value_loss | 0.0013 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7206 | -| time_elapsed | 46891 | -| total_timesteps | 922368 | -| train/ | | -| approx_kl | 6.0169492e-05 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.565 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 72050 | -| policy_gradient_loss | 0.000345 | -| std | 0.137 | -| value_loss | 2.41e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7207 | -| time_elapsed | 46894 | -| total_timesteps | 922496 | -| train/ | | -| approx_kl | 0.009702903 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.566 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 72060 | -| policy_gradient_loss | -0.00323 | -| std | 0.137 | -| value_loss | 5.49e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7208 | -| time_elapsed | 46897 | -| total_timesteps | 922624 | -| train/ | | -| approx_kl | 0.0187293 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 0.567 | -| explained_variance | -1.53 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 72070 | -| policy_gradient_loss | -0.000354 | -| std | 0.137 | -| value_loss | 6.55e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7209 | -| time_elapsed | 46900 | -| total_timesteps | 922752 | -| train/ | | -| approx_kl | 0.0018019937 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.568 | -| explained_variance | 0.00427 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 72080 | -| policy_gradient_loss | -0.00104 | -| std | 0.137 | -| value_loss | 4.75e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.06 | -| time/ | | -| fps | 19 | -| iterations | 7210 | -| time_elapsed | 46903 | -| total_timesteps | 922880 | -| train/ | | -| approx_kl | 0.0016968297 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 0.569 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | -3.14e-05 | -| n_updates | 72090 | -| policy_gradient_loss | -2.16e-05 | -| std | 0.137 | -| value_loss | 2.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7211 | -| time_elapsed | 46906 | -| total_timesteps | 923008 | -| train/ | | -| approx_kl | 0.011128774 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.569 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 72100 | -| policy_gradient_loss | -0.00149 | -| std | 0.137 | -| value_loss | 2.57e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7212 | -| time_elapsed | 46915 | -| total_timesteps | 923136 | -| train/ | | -| approx_kl | 0.1131702 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 0.57 | -| explained_variance | 0.594 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 72110 | -| policy_gradient_loss | -0.0147 | -| std | 0.137 | -| value_loss | 0.00059 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7213 | -| time_elapsed | 46919 | -| total_timesteps | 923264 | -| train/ | | -| approx_kl | 0.0025633038 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.57 | -| explained_variance | 0.535 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 72120 | -| policy_gradient_loss | -0.00253 | -| std | 0.137 | -| value_loss | 1.57e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7214 | -| time_elapsed | 46922 | -| total_timesteps | 923392 | -| train/ | | -| approx_kl | 0.0283643 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 0.57 | -| explained_variance | -21.3 | -| learning_rate | 0.0003 | -| loss | -0.00946 | -| n_updates | 72130 | -| policy_gradient_loss | -0.00739 | -| std | 0.137 | -| value_loss | 2.67e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7215 | -| time_elapsed | 46926 | -| total_timesteps | 923520 | -| train/ | | -| approx_kl | 0.07104776 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 0.571 | -| explained_variance | -0.405 | -| learning_rate | 0.0003 | -| loss | -0.0305 | -| n_updates | 72140 | -| policy_gradient_loss | -0.0262 | -| std | 0.137 | -| value_loss | 1.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7216 | -| time_elapsed | 46930 | -| total_timesteps | 923648 | -| train/ | | -| approx_kl | 0.005564082 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.571 | -| explained_variance | -0.933 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 72150 | -| policy_gradient_loss | -0.00847 | -| std | 0.137 | -| value_loss | 1.71e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7217 | -| time_elapsed | 46934 | -| total_timesteps | 923776 | -| train/ | | -| approx_kl | 0.009458502 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.57 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 72160 | -| policy_gradient_loss | -0.000853 | -| std | 0.137 | -| value_loss | 2.85e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.05 | -| time/ | | -| fps | 19 | -| iterations | 7218 | -| time_elapsed | 46938 | -| total_timesteps | 923904 | -| train/ | | -| approx_kl | 0.003852786 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.569 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | -0.000642 | -| n_updates | 72170 | -| policy_gradient_loss | 0.00109 | -| std | 0.137 | -| value_loss | 6.18e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7219 | -| time_elapsed | 46942 | -| total_timesteps | 924032 | -| train/ | | -| approx_kl | 0.0015070084 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.568 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 72180 | -| policy_gradient_loss | -0.000422 | -| std | 0.137 | -| value_loss | 1.62e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7220 | -| time_elapsed | 46949 | -| total_timesteps | 924160 | -| train/ | | -| approx_kl | 0.018308476 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 0.567 | -| explained_variance | 0.33 | -| learning_rate | 0.0003 | -| loss | 0.000991 | -| n_updates | 72190 | -| policy_gradient_loss | -0.014 | -| std | 0.137 | -| value_loss | 0.026 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7221 | -| time_elapsed | 46953 | -| total_timesteps | 924288 | -| train/ | | -| approx_kl | 0.002687302 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.568 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 72200 | -| policy_gradient_loss | -0.000475 | -| std | 0.137 | -| value_loss | 0.000538 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7222 | -| time_elapsed | 46956 | -| total_timesteps | 924416 | -| train/ | | -| approx_kl | 0.023312649 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.569 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 72210 | -| policy_gradient_loss | -0.00483 | -| std | 0.137 | -| value_loss | 7.21e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7223 | -| time_elapsed | 46960 | -| total_timesteps | 924544 | -| train/ | | -| approx_kl | 0.0019363342 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.57 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 72220 | -| policy_gradient_loss | 0.000262 | -| std | 0.137 | -| value_loss | 0.000117 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7224 | -| time_elapsed | 46963 | -| total_timesteps | 924672 | -| train/ | | -| approx_kl | 0.0109617505 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.57 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 72230 | -| policy_gradient_loss | -0.003 | -| std | 0.137 | -| value_loss | 0.000237 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7225 | -| time_elapsed | 46967 | -| total_timesteps | 924800 | -| train/ | | -| approx_kl | 0.014471834 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.571 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | 0.00073 | -| n_updates | 72240 | -| policy_gradient_loss | 2.35e-05 | -| std | 0.137 | -| value_loss | 6.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7226 | -| time_elapsed | 46970 | -| total_timesteps | 924928 | -| train/ | | -| approx_kl | 0.024685431 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | 0.013 | -| learning_rate | 0.0003 | -| loss | 0.00702 | -| n_updates | 72250 | -| policy_gradient_loss | 0.00191 | -| std | 0.137 | -| value_loss | 8.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7227 | -| time_elapsed | 46973 | -| total_timesteps | 925056 | -| train/ | | -| approx_kl | 0.022127148 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.00986 | -| n_updates | 72260 | -| policy_gradient_loss | -0.00678 | -| std | 0.136 | -| value_loss | 1.5e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7228 | -| time_elapsed | 46978 | -| total_timesteps | 925184 | -| train/ | | -| approx_kl | 0.07923141 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 72270 | -| policy_gradient_loss | -0.0127 | -| std | 0.136 | -| value_loss | 0.00093 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7229 | -| time_elapsed | 46982 | -| total_timesteps | 925312 | -| train/ | | -| approx_kl | 0.023455236 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.0866 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 72280 | -| policy_gradient_loss | -0.00406 | -| std | 0.136 | -| value_loss | 4.96e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7230 | -| time_elapsed | 46984 | -| total_timesteps | 925440 | -| train/ | | -| approx_kl | 0.016910423 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.691 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 72290 | -| policy_gradient_loss | -0.00541 | -| std | 0.136 | -| value_loss | 8.95e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7231 | -| time_elapsed | 46987 | -| total_timesteps | 925568 | -| train/ | | -| approx_kl | 0.0052980217 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 0.574 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | -8.69e-05 | -| n_updates | 72300 | -| policy_gradient_loss | -5.58e-05 | -| std | 0.136 | -| value_loss | 3.1e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7232 | -| time_elapsed | 46991 | -| total_timesteps | 925696 | -| train/ | | -| approx_kl | 0.014745681 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.576 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 72310 | -| policy_gradient_loss | -0.0014 | -| std | 0.136 | -| value_loss | 4.55e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7233 | -| time_elapsed | 46995 | -| total_timesteps | 925824 | -| train/ | | -| approx_kl | 0.0050547314 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.577 | -| explained_variance | -0.0801 | -| learning_rate | 0.0003 | -| loss | -0.000663 | -| n_updates | 72320 | -| policy_gradient_loss | -0.000224 | -| std | 0.136 | -| value_loss | 1.68e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.04 | -| time/ | | -| fps | 19 | -| iterations | 7234 | -| time_elapsed | 46998 | -| total_timesteps | 925952 | -| train/ | | -| approx_kl | 0.009138455 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 0.58 | -| explained_variance | -0.000892 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 72330 | -| policy_gradient_loss | -0.0032 | -| std | 0.135 | -| value_loss | 3.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7235 | -| time_elapsed | 47000 | -| total_timesteps | 926080 | -| train/ | | -| approx_kl | 0.0057124663 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.582 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 72340 | -| policy_gradient_loss | -0.000501 | -| std | 0.135 | -| value_loss | 6.78e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7236 | -| time_elapsed | 47007 | -| total_timesteps | 926208 | -| train/ | | -| approx_kl | 0.019752517 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.583 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 72350 | -| policy_gradient_loss | -0.00122 | -| std | 0.135 | -| value_loss | 0.00106 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7237 | -| time_elapsed | 47010 | -| total_timesteps | 926336 | -| train/ | | -| approx_kl | 0.014162265 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 0.582 | -| explained_variance | -3.97 | -| learning_rate | 0.0003 | -| loss | 0.00555 | -| n_updates | 72360 | -| policy_gradient_loss | 0.000976 | -| std | 0.135 | -| value_loss | 1.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7238 | -| time_elapsed | 47013 | -| total_timesteps | 926464 | -| train/ | | -| approx_kl | 0.015230436 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -0.703 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 72370 | -| policy_gradient_loss | -0.00843 | -| std | 0.136 | -| value_loss | 3.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7239 | -| time_elapsed | 47017 | -| total_timesteps | 926592 | -| train/ | | -| approx_kl | 0.031435024 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 0.578 | -| explained_variance | 0.00369 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 72380 | -| policy_gradient_loss | -0.00305 | -| std | 0.136 | -| value_loss | 5.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7240 | -| time_elapsed | 47020 | -| total_timesteps | 926720 | -| train/ | | -| approx_kl | 0.010468914 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.578 | -| explained_variance | 0.000492 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 72390 | -| policy_gradient_loss | -0.00849 | -| std | 0.136 | -| value_loss | 1.74e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7241 | -| time_elapsed | 47024 | -| total_timesteps | 926848 | -| train/ | | -| approx_kl | 0.0015811571 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.578 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | -0.000731 | -| n_updates | 72400 | -| policy_gradient_loss | 0.00274 | -| std | 0.136 | -| value_loss | 2.92e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.02 | -| time/ | | -| fps | 19 | -| iterations | 7242 | -| time_elapsed | 47027 | -| total_timesteps | 926976 | -| train/ | | -| approx_kl | 0.012834514 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 0.578 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 72410 | -| policy_gradient_loss | -7.35e-05 | -| std | 0.136 | -| value_loss | 2.52e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7243 | -| time_elapsed | 47030 | -| total_timesteps | 927104 | -| train/ | | -| approx_kl | 0.0005953917 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.577 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 72420 | -| policy_gradient_loss | -0.000984 | -| std | 0.136 | -| value_loss | 3.44e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7244 | -| time_elapsed | 47038 | -| total_timesteps | 927232 | -| train/ | | -| approx_kl | 0.011885403 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | 0.283 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 72430 | -| policy_gradient_loss | -0.0101 | -| std | 0.136 | -| value_loss | 0.000702 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7245 | -| time_elapsed | 47041 | -| total_timesteps | 927360 | -| train/ | | -| approx_kl | 0.007472036 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -8.72 | -| learning_rate | 0.0003 | -| loss | -0.00998 | -| n_updates | 72440 | -| policy_gradient_loss | -0.00588 | -| std | 0.136 | -| value_loss | 7.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7246 | -| time_elapsed | 47044 | -| total_timesteps | 927488 | -| train/ | | -| approx_kl | 0.01468877 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -4.35 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 72450 | -| policy_gradient_loss | -0.00215 | -| std | 0.136 | -| value_loss | 3.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7247 | -| time_elapsed | 47048 | -| total_timesteps | 927616 | -| train/ | | -| approx_kl | 0.01118825 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -0.712 | -| learning_rate | 0.0003 | -| loss | -0.00894 | -| n_updates | 72460 | -| policy_gradient_loss | -0.00578 | -| std | 0.136 | -| value_loss | 9.78e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7248 | -| time_elapsed | 47051 | -| total_timesteps | 927744 | -| train/ | | -| approx_kl | 0.0029083532 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 72470 | -| policy_gradient_loss | -0.000581 | -| std | 0.136 | -| value_loss | 2.87e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 2.03 | -| time/ | | -| fps | 19 | -| iterations | 7249 | -| time_elapsed | 47054 | -| total_timesteps | 927872 | -| train/ | | -| approx_kl | 0.04716829 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 72480 | -| policy_gradient_loss | -0.0212 | -| std | 0.136 | -| value_loss | 7.64e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7250 | -| time_elapsed | 47057 | -| total_timesteps | 928000 | -| train/ | | -| approx_kl | 0.0003625471 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.578 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | -0.000483 | -| n_updates | 72490 | -| policy_gradient_loss | -0.000113 | -| std | 0.136 | -| value_loss | 7.22e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7251 | -| time_elapsed | 47060 | -| total_timesteps | 928128 | -| train/ | | -| approx_kl | 0.011209864 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.577 | -| explained_variance | 7.99e-05 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 72500 | -| policy_gradient_loss | -0.00177 | -| std | 0.136 | -| value_loss | 2.52e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7252 | -| time_elapsed | 47068 | -| total_timesteps | 928256 | -| train/ | | -| approx_kl | 0.0038099582 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.577 | -| explained_variance | 0.259 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 72510 | -| policy_gradient_loss | 0.000551 | -| std | 0.136 | -| value_loss | 0.0214 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7253 | -| time_elapsed | 47072 | -| total_timesteps | 928384 | -| train/ | | -| approx_kl | 0.011844744 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.578 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 72520 | -| policy_gradient_loss | 8.02e-05 | -| std | 0.136 | -| value_loss | 0.00263 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7254 | -| time_elapsed | 47075 | -| total_timesteps | 928512 | -| train/ | | -| approx_kl | 0.0014162096 | -| clip_fraction | 0.0109 | -| clip_range | 0.2 | -| entropy_loss | 0.577 | -| explained_variance | 0.0159 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 72530 | -| policy_gradient_loss | -0.00209 | -| std | 0.136 | -| value_loss | 0.00101 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7255 | -| time_elapsed | 47079 | -| total_timesteps | 928640 | -| train/ | | -| approx_kl | 0.0036447495 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 72540 | -| policy_gradient_loss | -0.0113 | -| std | 0.137 | -| value_loss | 0.000151 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7256 | -| time_elapsed | 47081 | -| total_timesteps | 928768 | -| train/ | | -| approx_kl | 0.004693484 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 72550 | -| policy_gradient_loss | -0.00108 | -| std | 0.137 | -| value_loss | 0.000332 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.96 | -| time/ | | -| fps | 19 | -| iterations | 7257 | -| time_elapsed | 47084 | -| total_timesteps | 928896 | -| train/ | | -| approx_kl | 0.025079101 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.00961 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 72560 | -| policy_gradient_loss | 0.000806 | -| std | 0.136 | -| value_loss | 6.98e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7258 | -| time_elapsed | 47088 | -| total_timesteps | 929024 | -| train/ | | -| approx_kl | 0.0007362496 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.574 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.000341 | -| n_updates | 72570 | -| policy_gradient_loss | 0.000648 | -| std | 0.136 | -| value_loss | 0.000182 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7259 | -| time_elapsed | 47096 | -| total_timesteps | 929152 | -| train/ | | -| approx_kl | 0.02076059 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 0.576 | -| explained_variance | 0.578 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 72580 | -| policy_gradient_loss | -0.0143 | -| std | 0.136 | -| value_loss | 0.00484 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7260 | -| time_elapsed | 47100 | -| total_timesteps | 929280 | -| train/ | | -| approx_kl | 0.0043025343 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.576 | -| explained_variance | 0.00321 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 72590 | -| policy_gradient_loss | -0.00246 | -| std | 0.136 | -| value_loss | 0.00262 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7261 | -| time_elapsed | 47103 | -| total_timesteps | 929408 | -| train/ | | -| approx_kl | 9.110849e-05 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 0.575 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00046 | -| n_updates | 72600 | -| policy_gradient_loss | -0.000152 | -| std | 0.136 | -| value_loss | 0.000572 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7262 | -| time_elapsed | 47107 | -| total_timesteps | 929536 | -| train/ | | -| approx_kl | 0.0007470497 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.405 | -| learning_rate | 0.0003 | -| loss | -0.000283 | -| n_updates | 72610 | -| policy_gradient_loss | -0.000104 | -| std | 0.137 | -| value_loss | 6.24e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7263 | -| time_elapsed | 47111 | -| total_timesteps | 929664 | -| train/ | | -| approx_kl | 0.009727592 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.569 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 72620 | -| policy_gradient_loss | -0.00238 | -| std | 0.137 | -| value_loss | 0.000154 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7264 | -| time_elapsed | 47115 | -| total_timesteps | 929792 | -| train/ | | -| approx_kl | 0.016316716 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 0.568 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 72630 | -| policy_gradient_loss | 0.000479 | -| std | 0.137 | -| value_loss | 4.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7265 | -| time_elapsed | 47118 | -| total_timesteps | 929920 | -| train/ | | -| approx_kl | 0.027918056 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.568 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 72640 | -| policy_gradient_loss | -0.00612 | -| std | 0.137 | -| value_loss | 1.55e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7266 | -| time_elapsed | 47121 | -| total_timesteps | 930048 | -| train/ | | -| approx_kl | 0.0072989506 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.568 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 72650 | -| policy_gradient_loss | -0.00196 | -| std | 0.137 | -| value_loss | 9.22e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7267 | -| time_elapsed | 47128 | -| total_timesteps | 930176 | -| train/ | | -| approx_kl | 0.008612381 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.569 | -| explained_variance | 0.487 | -| learning_rate | 0.0003 | -| loss | 0.00493 | -| n_updates | 72660 | -| policy_gradient_loss | 0.000377 | -| std | 0.137 | -| value_loss | 0.011 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7268 | -| time_elapsed | 47132 | -| total_timesteps | 930304 | -| train/ | | -| approx_kl | 0.028265039 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 0.571 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00793 | -| n_updates | 72670 | -| policy_gradient_loss | -0.00526 | -| std | 0.137 | -| value_loss | 1.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7269 | -| time_elapsed | 47136 | -| total_timesteps | 930432 | -| train/ | | -| approx_kl | 0.02819704 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.675 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 72680 | -| policy_gradient_loss | -0.00248 | -| std | 0.137 | -| value_loss | 5.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7270 | -| time_elapsed | 47139 | -| total_timesteps | 930560 | -| train/ | | -| approx_kl | 0.023162782 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.00986 | -| n_updates | 72690 | -| policy_gradient_loss | -0.00391 | -| std | 0.136 | -| value_loss | 2.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7271 | -| time_elapsed | 47143 | -| total_timesteps | 930688 | -| train/ | | -| approx_kl | 0.033048872 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 72700 | -| policy_gradient_loss | -0.0076 | -| std | 0.136 | -| value_loss | 1.49e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7272 | -| time_elapsed | 47146 | -| total_timesteps | 930816 | -| train/ | | -| approx_kl | 0.03038105 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 72710 | -| policy_gradient_loss | -0.00977 | -| std | 0.136 | -| value_loss | 1.33e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.97 | -| time/ | | -| fps | 19 | -| iterations | 7273 | -| time_elapsed | 47150 | -| total_timesteps | 930944 | -| train/ | | -| approx_kl | 0.011407944 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | 0.000662 | -| n_updates | 72720 | -| policy_gradient_loss | -0.000141 | -| std | 0.136 | -| value_loss | 5.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7274 | -| time_elapsed | 47153 | -| total_timesteps | 931072 | -| train/ | | -| approx_kl | 0.032844633 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 0.574 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 72730 | -| policy_gradient_loss | -0.01 | -| std | 0.136 | -| value_loss | 7.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7275 | -| time_elapsed | 47158 | -| total_timesteps | 931200 | -| train/ | | -| approx_kl | 0.013107795 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.574 | -| explained_variance | 0.501 | -| learning_rate | 0.0003 | -| loss | -0.00783 | -| n_updates | 72740 | -| policy_gradient_loss | -0.00506 | -| std | 0.136 | -| value_loss | 0.000883 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7276 | -| time_elapsed | 47161 | -| total_timesteps | 931328 | -| train/ | | -| approx_kl | 0.013059497 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.00942 | -| n_updates | 72750 | -| policy_gradient_loss | -0.00621 | -| std | 0.136 | -| value_loss | 1.31e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7277 | -| time_elapsed | 47165 | -| total_timesteps | 931456 | -| train/ | | -| approx_kl | 0.013438545 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.00354 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 72760 | -| policy_gradient_loss | -0.00104 | -| std | 0.136 | -| value_loss | 2.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7278 | -| time_elapsed | 47169 | -| total_timesteps | 931584 | -| train/ | | -| approx_kl | 0.0076108715 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 72770 | -| policy_gradient_loss | -0.00062 | -| std | 0.136 | -| value_loss | 1.59e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7279 | -| time_elapsed | 47172 | -| total_timesteps | 931712 | -| train/ | | -| approx_kl | 0.02525732 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 72780 | -| policy_gradient_loss | -0.012 | -| std | 0.136 | -| value_loss | 4.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7280 | -| time_elapsed | 47176 | -| total_timesteps | 931840 | -| train/ | | -| approx_kl | 0.008313317 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 72790 | -| policy_gradient_loss | -0.00575 | -| std | 0.137 | -| value_loss | 2.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.93 | -| time/ | | -| fps | 19 | -| iterations | 7281 | -| time_elapsed | 47179 | -| total_timesteps | 931968 | -| train/ | | -| approx_kl | 0.010189983 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.295 | -| learning_rate | 0.0003 | -| loss | 0.000561 | -| n_updates | 72800 | -| policy_gradient_loss | -1.04e-05 | -| std | 0.137 | -| value_loss | 3.62e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7282 | -| time_elapsed | 47183 | -| total_timesteps | 932096 | -| train/ | | -| approx_kl | 0.0082743745 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.572 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 72810 | -| policy_gradient_loss | -0.00726 | -| std | 0.137 | -| value_loss | 1.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7283 | -| time_elapsed | 47191 | -| total_timesteps | 932224 | -| train/ | | -| approx_kl | 0.016600987 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | 0.782 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 72820 | -| policy_gradient_loss | -0.00137 | -| std | 0.136 | -| value_loss | 0.00183 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7284 | -| time_elapsed | 47195 | -| total_timesteps | 932352 | -| train/ | | -| approx_kl | 0.030349106 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.62 | -| learning_rate | 0.0003 | -| loss | 0.00345 | -| n_updates | 72830 | -| policy_gradient_loss | 0.00414 | -| std | 0.136 | -| value_loss | 2.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7285 | -| time_elapsed | 47198 | -| total_timesteps | 932480 | -| train/ | | -| approx_kl | 0.016605623 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 72840 | -| policy_gradient_loss | -0.00204 | -| std | 0.136 | -| value_loss | 9.58e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7286 | -| time_elapsed | 47201 | -| total_timesteps | 932608 | -| train/ | | -| approx_kl | 0.0016381084 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.573 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 72850 | -| policy_gradient_loss | -0.000987 | -| std | 0.136 | -| value_loss | 9.21e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7287 | -| time_elapsed | 47204 | -| total_timesteps | 932736 | -| train/ | | -| approx_kl | 0.0017215977 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.576 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 72860 | -| policy_gradient_loss | -0.000864 | -| std | 0.136 | -| value_loss | 1.47e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7288 | -| time_elapsed | 47208 | -| total_timesteps | 932864 | -| train/ | | -| approx_kl | 0.0028689145 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.579 | -| explained_variance | -0.09 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 72870 | -| policy_gradient_loss | -0.00389 | -| std | 0.135 | -| value_loss | 1.85e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.78 | -| time/ | | -| fps | 19 | -| iterations | 7289 | -| time_elapsed | 47210 | -| total_timesteps | 932992 | -| train/ | | -| approx_kl | 0.0023410744 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.582 | -| explained_variance | -0.547 | -| learning_rate | 0.0003 | -| loss | -0.000455 | -| n_updates | 72880 | -| policy_gradient_loss | -0.000205 | -| std | 0.135 | -| value_loss | 1.44e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7290 | -| time_elapsed | 47212 | -| total_timesteps | 933120 | -| train/ | | -| approx_kl | 0.018458549 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.586 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 72890 | -| policy_gradient_loss | -0.0044 | -| std | 0.134 | -| value_loss | 2.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7291 | -| time_elapsed | 47218 | -| total_timesteps | 933248 | -| train/ | | -| approx_kl | 0.012458866 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.589 | -| explained_variance | 0.156 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 72900 | -| policy_gradient_loss | -0.00842 | -| std | 0.134 | -| value_loss | 0.00818 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7292 | -| time_elapsed | 47222 | -| total_timesteps | 933376 | -| train/ | | -| approx_kl | 0.029965352 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.591 | -| explained_variance | -0.326 | -| learning_rate | 0.0003 | -| loss | -0.00638 | -| n_updates | 72910 | -| policy_gradient_loss | -0.00263 | -| std | 0.134 | -| value_loss | 0.000565 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7293 | -| time_elapsed | 47225 | -| total_timesteps | 933504 | -| train/ | | -| approx_kl | 0.00047700293 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 0.592 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.000856 | -| n_updates | 72920 | -| policy_gradient_loss | -0.000903 | -| std | 0.134 | -| value_loss | 0.000203 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7294 | -| time_elapsed | 47229 | -| total_timesteps | 933632 | -| train/ | | -| approx_kl | 0.015612198 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.592 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 72930 | -| policy_gradient_loss | -0.0036 | -| std | 0.134 | -| value_loss | 0.00022 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7295 | -| time_elapsed | 47231 | -| total_timesteps | 933760 | -| train/ | | -| approx_kl | 0.0017623669 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.592 | -| explained_variance | 0.00455 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 72940 | -| policy_gradient_loss | -0.000705 | -| std | 0.134 | -| value_loss | 4.3e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.65 | -| time/ | | -| fps | 19 | -| iterations | 7296 | -| time_elapsed | 47234 | -| total_timesteps | 933888 | -| train/ | | -| approx_kl | 0.018002491 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.592 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 72950 | -| policy_gradient_loss | 0.000445 | -| std | 0.134 | -| value_loss | 2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7297 | -| time_elapsed | 47238 | -| total_timesteps | 934016 | -| train/ | | -| approx_kl | 0.014349731 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.593 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 72960 | -| policy_gradient_loss | -0.000218 | -| std | 0.134 | -| value_loss | 7.75e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7298 | -| time_elapsed | 47247 | -| total_timesteps | 934144 | -| train/ | | -| approx_kl | 0.09955187 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.592 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 72970 | -| policy_gradient_loss | -0.0164 | -| std | 0.134 | -| value_loss | 0.000893 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7299 | -| time_elapsed | 47250 | -| total_timesteps | 934272 | -| train/ | | -| approx_kl | 0.008062273 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 0.593 | -| explained_variance | 0.546 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 72980 | -| policy_gradient_loss | -0.00333 | -| std | 0.134 | -| value_loss | 2.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7300 | -| time_elapsed | 47253 | -| total_timesteps | 934400 | -| train/ | | -| approx_kl | 0.016965326 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.593 | -| explained_variance | 0.0015 | -| learning_rate | 0.0003 | -| loss | 0.00493 | -| n_updates | 72990 | -| policy_gradient_loss | 0.00112 | -| std | 0.134 | -| value_loss | 4.86e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7301 | -| time_elapsed | 47255 | -| total_timesteps | 934528 | -| train/ | | -| approx_kl | 0.0042487253 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.593 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 73000 | -| policy_gradient_loss | 0.000115 | -| std | 0.134 | -| value_loss | 2.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7302 | -| time_elapsed | 47257 | -| total_timesteps | 934656 | -| train/ | | -| approx_kl | 0.006859221 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 0.594 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 73010 | -| policy_gradient_loss | -0.00652 | -| std | 0.134 | -| value_loss | 1.1e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7303 | -| time_elapsed | 47259 | -| total_timesteps | 934784 | -| train/ | | -| approx_kl | 0.0055609276 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.594 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | -0.00848 | -| n_updates | 73020 | -| policy_gradient_loss | -0.0064 | -| std | 0.134 | -| value_loss | 7.74e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.43 | -| time/ | | -| fps | 19 | -| iterations | 7304 | -| time_elapsed | 47260 | -| total_timesteps | 934912 | -| train/ | | -| approx_kl | 0.004850253 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.595 | -| explained_variance | -0.0825 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 73030 | -| policy_gradient_loss | -9.49e-05 | -| std | 0.133 | -| value_loss | 6.38e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7305 | -| time_elapsed | 47263 | -| total_timesteps | 935040 | -| train/ | | -| approx_kl | 0.0062265727 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 0.596 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 73040 | -| policy_gradient_loss | -0.00316 | -| std | 0.133 | -| value_loss | 3.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7306 | -| time_elapsed | 47270 | -| total_timesteps | 935168 | -| train/ | | -| approx_kl | 0.028443787 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 0.597 | -| explained_variance | 0.56 | -| learning_rate | 0.0003 | -| loss | 0.00537 | -| n_updates | 73050 | -| policy_gradient_loss | -0.00372 | -| std | 0.133 | -| value_loss | 0.00763 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7307 | -| time_elapsed | 47274 | -| total_timesteps | 935296 | -| train/ | | -| approx_kl | 0.01325948 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.597 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 73060 | -| policy_gradient_loss | -0.00383 | -| std | 0.133 | -| value_loss | 0.000442 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7308 | -| time_elapsed | 47279 | -| total_timesteps | 935424 | -| train/ | | -| approx_kl | 0.0020779497 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.597 | -| explained_variance | 0.0168 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 73070 | -| policy_gradient_loss | -0.000678 | -| std | 0.133 | -| value_loss | 2.47e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7309 | -| time_elapsed | 47282 | -| total_timesteps | 935552 | -| train/ | | -| approx_kl | 0.0015321616 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.598 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.000904 | -| n_updates | 73080 | -| policy_gradient_loss | -0.000355 | -| std | 0.133 | -| value_loss | 3.99e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7310 | -| time_elapsed | 47286 | -| total_timesteps | 935680 | -| train/ | | -| approx_kl | 0.043499775 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 0.599 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 73090 | -| policy_gradient_loss | -0.00864 | -| std | 0.133 | -| value_loss | 0.00011 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7311 | -| time_elapsed | 47288 | -| total_timesteps | 935808 | -| train/ | | -| approx_kl | 0.0015119319 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.599 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 73100 | -| policy_gradient_loss | -0.00162 | -| std | 0.133 | -| value_loss | 2.57e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.29 | -| time/ | | -| fps | 19 | -| iterations | 7312 | -| time_elapsed | 47291 | -| total_timesteps | 935936 | -| train/ | | -| approx_kl | 0.026920564 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.598 | -| explained_variance | -0.333 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 73110 | -| policy_gradient_loss | -0.0136 | -| std | 0.133 | -| value_loss | 9.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7313 | -| time_elapsed | 47295 | -| total_timesteps | 936064 | -| train/ | | -| approx_kl | 0.009589767 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.597 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 73120 | -| policy_gradient_loss | -0.00113 | -| std | 0.133 | -| value_loss | 3.93e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7314 | -| time_elapsed | 47303 | -| total_timesteps | 936192 | -| train/ | | -| approx_kl | 0.03986878 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 0.596 | -| explained_variance | 0.712 | -| learning_rate | 0.0003 | -| loss | -0.0084 | -| n_updates | 73130 | -| policy_gradient_loss | -0.00664 | -| std | 0.133 | -| value_loss | 0.000547 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7315 | -| time_elapsed | 47306 | -| total_timesteps | 936320 | -| train/ | | -| approx_kl | 0.006654853 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.596 | -| explained_variance | -0.0813 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 73140 | -| policy_gradient_loss | -0.00106 | -| std | 0.133 | -| value_loss | 2.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7316 | -| time_elapsed | 47310 | -| total_timesteps | 936448 | -| train/ | | -| approx_kl | 0.009417323 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.595 | -| explained_variance | -0.000928 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 73150 | -| policy_gradient_loss | -0.00142 | -| std | 0.134 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7317 | -| time_elapsed | 47313 | -| total_timesteps | 936576 | -| train/ | | -| approx_kl | 0.0008795634 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.595 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 73160 | -| policy_gradient_loss | -0.000783 | -| std | 0.133 | -| value_loss | 5.95e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7318 | -| time_elapsed | 47317 | -| total_timesteps | 936704 | -| train/ | | -| approx_kl | 0.023388807 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.597 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.00513 | -| n_updates | 73170 | -| policy_gradient_loss | 0.00117 | -| std | 0.133 | -| value_loss | 9.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7319 | -| time_elapsed | 47320 | -| total_timesteps | 936832 | -| train/ | | -| approx_kl | 0.015496818 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.598 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 73180 | -| policy_gradient_loss | 0.000525 | -| std | 0.133 | -| value_loss | 1.97e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.28 | -| time/ | | -| fps | 19 | -| iterations | 7320 | -| time_elapsed | 47324 | -| total_timesteps | 936960 | -| train/ | | -| approx_kl | 0.0044404557 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.601 | -| explained_variance | 0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00624 | -| n_updates | 73190 | -| policy_gradient_loss | -0.00448 | -| std | 0.133 | -| value_loss | 2.68e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7321 | -| time_elapsed | 47328 | -| total_timesteps | 937088 | -| train/ | | -| approx_kl | 0.009867553 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.603 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.000278 | -| n_updates | 73200 | -| policy_gradient_loss | 0.000445 | -| std | 0.132 | -| value_loss | 1.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7322 | -| time_elapsed | 47334 | -| total_timesteps | 937216 | -| train/ | | -| approx_kl | 0.018606927 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.604 | -| explained_variance | 0.583 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 73210 | -| policy_gradient_loss | -0.0107 | -| std | 0.132 | -| value_loss | 0.00441 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7323 | -| time_elapsed | 47338 | -| total_timesteps | 937344 | -| train/ | | -| approx_kl | 0.0037050294 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.605 | -| explained_variance | -0.841 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 73220 | -| policy_gradient_loss | -0.0104 | -| std | 0.132 | -| value_loss | 0.000122 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7324 | -| time_elapsed | 47340 | -| total_timesteps | 937472 | -| train/ | | -| approx_kl | 0.009728026 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.606 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | -0.00405 | -| n_updates | 73230 | -| policy_gradient_loss | -0.00221 | -| std | 0.132 | -| value_loss | 3.13e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7325 | -| time_elapsed | 47343 | -| total_timesteps | 937600 | -| train/ | | -| approx_kl | 0.016092172 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.606 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 73240 | -| policy_gradient_loss | 0.00149 | -| std | 0.132 | -| value_loss | 1.45e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7326 | -| time_elapsed | 47346 | -| total_timesteps | 937728 | -| train/ | | -| approx_kl | 0.0037882556 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.607 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 73250 | -| policy_gradient_loss | 0.00178 | -| std | 0.132 | -| value_loss | 1.18e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7327 | -| time_elapsed | 47350 | -| total_timesteps | 937856 | -| train/ | | -| approx_kl | 0.0007430017 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 0.607 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 73260 | -| policy_gradient_loss | -0.00194 | -| std | 0.132 | -| value_loss | 4.38e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.27 | -| time/ | | -| fps | 19 | -| iterations | 7328 | -| time_elapsed | 47354 | -| total_timesteps | 937984 | -| train/ | | -| approx_kl | 0.0012080297 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.607 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 73270 | -| policy_gradient_loss | 0.000123 | -| std | 0.132 | -| value_loss | 1.48e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7329 | -| time_elapsed | 47356 | -| total_timesteps | 938112 | -| train/ | | -| approx_kl | 0.023320243 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.608 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 73280 | -| policy_gradient_loss | -0.00604 | -| std | 0.132 | -| value_loss | 2.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7330 | -| time_elapsed | 47365 | -| total_timesteps | 938240 | -| train/ | | -| approx_kl | 0.012551966 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.61 | -| explained_variance | 0.555 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 73290 | -| policy_gradient_loss | -0.0148 | -| std | 0.131 | -| value_loss | 0.00885 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7331 | -| time_elapsed | 47367 | -| total_timesteps | 938368 | -| train/ | | -| approx_kl | 0.0068028895 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.611 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 73300 | -| policy_gradient_loss | -0.00208 | -| std | 0.131 | -| value_loss | 1.83e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7332 | -| time_elapsed | 47371 | -| total_timesteps | 938496 | -| train/ | | -| approx_kl | 0.014997752 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.612 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 73310 | -| policy_gradient_loss | -0.0105 | -| std | 0.131 | -| value_loss | 1.26e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7333 | -| time_elapsed | 47374 | -| total_timesteps | 938624 | -| train/ | | -| approx_kl | 0.004116079 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.613 | -| explained_variance | -0.603 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 73320 | -| policy_gradient_loss | -0.000409 | -| std | 0.131 | -| value_loss | 2.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7334 | -| time_elapsed | 47377 | -| total_timesteps | 938752 | -| train/ | | -| approx_kl | 0.0068477057 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.615 | -| explained_variance | -0.0918 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 73330 | -| policy_gradient_loss | 0.00135 | -| std | 0.131 | -| value_loss | 5.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.25 | -| time/ | | -| fps | 19 | -| iterations | 7335 | -| time_elapsed | 47379 | -| total_timesteps | 938880 | -| train/ | | -| approx_kl | 0.041346367 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 0.617 | -| explained_variance | -0.416 | -| learning_rate | 0.0003 | -| loss | 0.00908 | -| n_updates | 73340 | -| policy_gradient_loss | 0.0067 | -| std | 0.13 | -| value_loss | 3.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7336 | -| time_elapsed | 47382 | -| total_timesteps | 939008 | -| train/ | | -| approx_kl | 0.0017300243 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.618 | -| explained_variance | -0.000978 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 73350 | -| policy_gradient_loss | -0.00602 | -| std | 0.13 | -| value_loss | 4.47e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7337 | -| time_elapsed | 47391 | -| total_timesteps | 939136 | -| train/ | | -| approx_kl | 0.033952948 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 0.618 | -| explained_variance | 0.769 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 73360 | -| policy_gradient_loss | -0.0194 | -| std | 0.13 | -| value_loss | 0.00126 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7338 | -| time_elapsed | 47393 | -| total_timesteps | 939264 | -| train/ | | -| approx_kl | 0.017261185 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.618 | -| explained_variance | 0.0165 | -| learning_rate | 0.0003 | -| loss | 0.00447 | -| n_updates | 73370 | -| policy_gradient_loss | -0.000707 | -| std | 0.13 | -| value_loss | 0.00658 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7339 | -| time_elapsed | 47398 | -| total_timesteps | 939392 | -| train/ | | -| approx_kl | 0.005975893 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.618 | -| explained_variance | -0.317 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 73380 | -| policy_gradient_loss | 0.00119 | -| std | 0.13 | -| value_loss | 0.000233 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7340 | -| time_elapsed | 47401 | -| total_timesteps | 939520 | -| train/ | | -| approx_kl | 0.0069038165 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 0.619 | -| explained_variance | -0.000139 | -| learning_rate | 0.0003 | -| loss | -0.00816 | -| n_updates | 73390 | -| policy_gradient_loss | -0.00401 | -| std | 0.13 | -| value_loss | 0.000107 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7341 | -| time_elapsed | 47404 | -| total_timesteps | 939648 | -| train/ | | -| approx_kl | 0.0059226216 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.619 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 73400 | -| policy_gradient_loss | 0.00141 | -| std | 0.13 | -| value_loss | 0.000117 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7342 | -| time_elapsed | 47408 | -| total_timesteps | 939776 | -| train/ | | -| approx_kl | 0.0070605697 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.62 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 73410 | -| policy_gradient_loss | 0.00289 | -| std | 0.13 | -| value_loss | 5.01e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.26 | -| time/ | | -| fps | 19 | -| iterations | 7343 | -| time_elapsed | 47411 | -| total_timesteps | 939904 | -| train/ | | -| approx_kl | 0.009803234 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 0.621 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 73420 | -| policy_gradient_loss | 0.00326 | -| std | 0.13 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7344 | -| time_elapsed | 47413 | -| total_timesteps | 940032 | -| train/ | | -| approx_kl | 0.0102155525 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.622 | -| explained_variance | -0.0839 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 73430 | -| policy_gradient_loss | -0.00184 | -| std | 0.13 | -| value_loss | 1.12e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7345 | -| time_elapsed | 47422 | -| total_timesteps | 940160 | -| train/ | | -| approx_kl | 0.0101047475 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 0.623 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 73440 | -| policy_gradient_loss | -0.00154 | -| std | 0.13 | -| value_loss | 0.00278 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7346 | -| time_elapsed | 47426 | -| total_timesteps | 940288 | -| train/ | | -| approx_kl | 0.008454774 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 0.624 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 73450 | -| policy_gradient_loss | 0.00758 | -| std | 0.13 | -| value_loss | 6.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7347 | -| time_elapsed | 47429 | -| total_timesteps | 940416 | -| train/ | | -| approx_kl | 0.010860155 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 0.625 | -| explained_variance | 0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 73460 | -| policy_gradient_loss | 0.000531 | -| std | 0.13 | -| value_loss | 7.76e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7348 | -| time_elapsed | 47432 | -| total_timesteps | 940544 | -| train/ | | -| approx_kl | 0.021738857 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.625 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 73470 | -| policy_gradient_loss | -0.00263 | -| std | 0.129 | -| value_loss | 9.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7349 | -| time_elapsed | 47435 | -| total_timesteps | 940672 | -| train/ | | -| approx_kl | 0.025011644 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.626 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 73480 | -| policy_gradient_loss | -0.0113 | -| std | 0.129 | -| value_loss | 4.59e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7350 | -| time_elapsed | 47439 | -| total_timesteps | 940800 | -| train/ | | -| approx_kl | 0.0179501 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 0.626 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 73490 | -| policy_gradient_loss | -0.00254 | -| std | 0.129 | -| value_loss | 2.94e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 19 | -| iterations | 7351 | -| time_elapsed | 47442 | -| total_timesteps | 940928 | -| train/ | | -| approx_kl | 0.0054635564 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 0.627 | -| explained_variance | -0.0975 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 73500 | -| policy_gradient_loss | -0.00478 | -| std | 0.129 | -| value_loss | 3.8e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7352 | -| time_elapsed | 47445 | -| total_timesteps | 941056 | -| train/ | | -| approx_kl | 0.020420833 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.629 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 73510 | -| policy_gradient_loss | -0.00134 | -| std | 0.129 | -| value_loss | 2.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7353 | -| time_elapsed | 47452 | -| total_timesteps | 941184 | -| train/ | | -| approx_kl | 0.028515784 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.629 | -| explained_variance | 0.57 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 73520 | -| policy_gradient_loss | -0.0162 | -| std | 0.129 | -| value_loss | 0.00974 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7354 | -| time_elapsed | 47456 | -| total_timesteps | 941312 | -| train/ | | -| approx_kl | 0.006694833 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.629 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 73530 | -| policy_gradient_loss | 0.000938 | -| std | 0.129 | -| value_loss | 0.00123 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7355 | -| time_elapsed | 47460 | -| total_timesteps | 941440 | -| train/ | | -| approx_kl | 0.0041321195 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.63 | -| explained_variance | 0.00244 | -| learning_rate | 0.0003 | -| loss | -0.000806 | -| n_updates | 73540 | -| policy_gradient_loss | 0.00174 | -| std | 0.129 | -| value_loss | 0.00285 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7356 | -| time_elapsed | 47463 | -| total_timesteps | 941568 | -| train/ | | -| approx_kl | 0.01860285 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.631 | -| explained_variance | -0.00341 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 73550 | -| policy_gradient_loss | -0.000412 | -| std | 0.129 | -| value_loss | 5.46e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7357 | -| time_elapsed | 47466 | -| total_timesteps | 941696 | -| train/ | | -| approx_kl | 0.0013425336 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 0.632 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | -0.000947 | -| n_updates | 73560 | -| policy_gradient_loss | -0.000424 | -| std | 0.128 | -| value_loss | 2.61e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7358 | -| time_elapsed | 47469 | -| total_timesteps | 941824 | -| train/ | | -| approx_kl | 0.0012314948 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.633 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 73570 | -| policy_gradient_loss | -0.000556 | -| std | 0.129 | -| value_loss | 3.49e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7359 | -| time_elapsed | 47471 | -| total_timesteps | 941952 | -| train/ | | -| approx_kl | 0.0049932855 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.631 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 73580 | -| policy_gradient_loss | -0.00109 | -| std | 0.129 | -| value_loss | 4.85e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7360 | -| time_elapsed | 47475 | -| total_timesteps | 942080 | -| train/ | | -| approx_kl | 0.01638427 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.632 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 73590 | -| policy_gradient_loss | -0.0083 | -| std | 0.129 | -| value_loss | 6.97e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7361 | -| time_elapsed | 47482 | -| total_timesteps | 942208 | -| train/ | | -| approx_kl | 0.037526727 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.633 | -| explained_variance | 0.792 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 73600 | -| policy_gradient_loss | -0.00554 | -| std | 0.128 | -| value_loss | 0.00135 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7362 | -| time_elapsed | 47485 | -| total_timesteps | 942336 | -| train/ | | -| approx_kl | 0.0040550535 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.634 | -| explained_variance | -0.000331 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 73610 | -| policy_gradient_loss | -0.00262 | -| std | 0.128 | -| value_loss | 1.99e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7363 | -| time_elapsed | 47489 | -| total_timesteps | 942464 | -| train/ | | -| approx_kl | 0.025797658 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.634 | -| explained_variance | 0.00746 | -| learning_rate | 0.0003 | -| loss | 0.00169 | -| n_updates | 73620 | -| policy_gradient_loss | -0.00171 | -| std | 0.128 | -| value_loss | 2.4e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7364 | -| time_elapsed | 47493 | -| total_timesteps | 942592 | -| train/ | | -| approx_kl | 0.0026576435 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 0.634 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 73630 | -| policy_gradient_loss | -0.00491 | -| std | 0.128 | -| value_loss | 4.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7365 | -| time_elapsed | 47496 | -| total_timesteps | 942720 | -| train/ | | -| approx_kl | 0.007148614 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.635 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 73640 | -| policy_gradient_loss | -0.00579 | -| std | 0.128 | -| value_loss | 2.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7366 | -| time_elapsed | 47499 | -| total_timesteps | 942848 | -| train/ | | -| approx_kl | 0.024107635 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.635 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 4.58e-06 | -| n_updates | 73650 | -| policy_gradient_loss | -0.000765 | -| std | 0.128 | -| value_loss | 9.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7367 | -| time_elapsed | 47503 | -| total_timesteps | 942976 | -| train/ | | -| approx_kl | 0.01697632 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.0017 | -| n_updates | 73660 | -| policy_gradient_loss | 0.000338 | -| std | 0.128 | -| value_loss | 2.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7368 | -| time_elapsed | 47508 | -| total_timesteps | 943104 | -| train/ | | -| approx_kl | 0.028134037 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.00424 | -| learning_rate | 0.0003 | -| loss | 0.00627 | -| n_updates | 73670 | -| policy_gradient_loss | 0.000542 | -| std | 0.128 | -| value_loss | 3.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7369 | -| time_elapsed | 47516 | -| total_timesteps | 943232 | -| train/ | | -| approx_kl | 0.006779511 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | 0.234 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 73680 | -| policy_gradient_loss | -0.00836 | -| std | 0.128 | -| value_loss | 0.0171 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7370 | -| time_elapsed | 47519 | -| total_timesteps | 943360 | -| train/ | | -| approx_kl | 0.00091788825 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | -0.000371 | -| n_updates | 73690 | -| policy_gradient_loss | 0.000492 | -| std | 0.128 | -| value_loss | 0.00072 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7371 | -| time_elapsed | 47522 | -| total_timesteps | 943488 | -| train/ | | -| approx_kl | 0.0039781523 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 0.639 | -| explained_variance | -0.000381 | -| learning_rate | 0.0003 | -| loss | -0.00991 | -| n_updates | 73700 | -| policy_gradient_loss | -0.00765 | -| std | 0.128 | -| value_loss | 0.00324 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7372 | -| time_elapsed | 47526 | -| total_timesteps | 943616 | -| train/ | | -| approx_kl | 0.008883433 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 0.641 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.000543 | -| n_updates | 73710 | -| policy_gradient_loss | 0.000481 | -| std | 0.127 | -| value_loss | 0.000764 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7373 | -| time_elapsed | 47529 | -| total_timesteps | 943744 | -| train/ | | -| approx_kl | 0.014313992 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.642 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 73720 | -| policy_gradient_loss | -0.00036 | -| std | 0.127 | -| value_loss | 0.000156 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7374 | -| time_elapsed | 47532 | -| total_timesteps | 943872 | -| train/ | | -| approx_kl | 0.013537731 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.641 | -| explained_variance | -0.0923 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 73730 | -| policy_gradient_loss | 0.000484 | -| std | 0.128 | -| value_loss | 6.1e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7375 | -| time_elapsed | 47536 | -| total_timesteps | 944000 | -| train/ | | -| approx_kl | 0.00083610415 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 73740 | -| policy_gradient_loss | -0.0015 | -| std | 0.128 | -| value_loss | 6.42e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7376 | -| time_elapsed | 47538 | -| total_timesteps | 944128 | -| train/ | | -| approx_kl | 0.008817658 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.634 | -| explained_variance | 0.00679 | -| learning_rate | 0.0003 | -| loss | -0.000723 | -| n_updates | 73750 | -| policy_gradient_loss | 0.000208 | -| std | 0.128 | -| value_loss | 0.000311 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7377 | -| time_elapsed | 47545 | -| total_timesteps | 944256 | -| train/ | | -| approx_kl | 0.01637035 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.633 | -| explained_variance | 0.377 | -| learning_rate | 0.0003 | -| loss | 0.003 | -| n_updates | 73760 | -| policy_gradient_loss | -0.00396 | -| std | 0.129 | -| value_loss | 0.0149 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7378 | -| time_elapsed | 47549 | -| total_timesteps | 944384 | -| train/ | | -| approx_kl | 0.008763108 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 0.632 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 73770 | -| policy_gradient_loss | -0.00708 | -| std | 0.129 | -| value_loss | 0.000332 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7379 | -| time_elapsed | 47553 | -| total_timesteps | 944512 | -| train/ | | -| approx_kl | 0.009114736 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.632 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 73780 | -| policy_gradient_loss | 0.000433 | -| std | 0.129 | -| value_loss | 0.000164 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7380 | -| time_elapsed | 47556 | -| total_timesteps | 944640 | -| train/ | | -| approx_kl | 0.005743353 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 0.632 | -| explained_variance | -0.0923 | -| learning_rate | 0.0003 | -| loss | -0.00609 | -| n_updates | 73790 | -| policy_gradient_loss | -0.00307 | -| std | 0.129 | -| value_loss | 0.00012 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7381 | -| time_elapsed | 47559 | -| total_timesteps | 944768 | -| train/ | | -| approx_kl | 0.00011083484 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.634 | -| explained_variance | -0.0843 | -| learning_rate | 0.0003 | -| loss | -0.000945 | -| n_updates | 73800 | -| policy_gradient_loss | -0.000365 | -| std | 0.128 | -| value_loss | 0.000132 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7382 | -| time_elapsed | 47562 | -| total_timesteps | 944896 | -| train/ | | -| approx_kl | 0.0069032237 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.639 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 73810 | -| policy_gradient_loss | -0.00747 | -| std | 0.127 | -| value_loss | 0.000469 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7383 | -| time_elapsed | 47565 | -| total_timesteps | 945024 | -| train/ | | -| approx_kl | 0.001406447 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 0.641 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -3.59e-06 | -| n_updates | 73820 | -| policy_gradient_loss | 0.000148 | -| std | 0.128 | -| value_loss | 0.000107 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7384 | -| time_elapsed | 47573 | -| total_timesteps | 945152 | -| train/ | | -| approx_kl | 0.01912895 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.638 | -| explained_variance | 0.278 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 73830 | -| policy_gradient_loss | -0.00542 | -| std | 0.128 | -| value_loss | 0.013 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7385 | -| time_elapsed | 47577 | -| total_timesteps | 945280 | -| train/ | | -| approx_kl | 0.018003743 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 73840 | -| policy_gradient_loss | 0.00275 | -| std | 0.128 | -| value_loss | 0.00265 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7386 | -| time_elapsed | 47579 | -| total_timesteps | 945408 | -| train/ | | -| approx_kl | 0.014582464 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 73850 | -| policy_gradient_loss | 0.000328 | -| std | 0.128 | -| value_loss | 0.00013 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7387 | -| time_elapsed | 47583 | -| total_timesteps | 945536 | -| train/ | | -| approx_kl | 0.01135763 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | -0.0716 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 73860 | -| policy_gradient_loss | -0.00406 | -| std | 0.128 | -| value_loss | 0.00027 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7388 | -| time_elapsed | 47586 | -| total_timesteps | 945664 | -| train/ | | -| approx_kl | 0.008706868 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | -0.000332 | -| n_updates | 73870 | -| policy_gradient_loss | -0.000206 | -| std | 0.128 | -| value_loss | 0.000104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7389 | -| time_elapsed | 47589 | -| total_timesteps | 945792 | -| train/ | | -| approx_kl | 0.010215192 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 73880 | -| policy_gradient_loss | -0.00162 | -| std | 0.128 | -| value_loss | 6.53e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7390 | -| time_elapsed | 47592 | -| total_timesteps | 945920 | -| train/ | | -| approx_kl | 0.023790125 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 73890 | -| policy_gradient_loss | -0.00653 | -| std | 0.128 | -| value_loss | 2.65e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7391 | -| time_elapsed | 47595 | -| total_timesteps | 946048 | -| train/ | | -| approx_kl | 0.013087693 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.0888 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 73900 | -| policy_gradient_loss | -0.00779 | -| std | 0.128 | -| value_loss | 1.62e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7392 | -| time_elapsed | 47601 | -| total_timesteps | 946176 | -| train/ | | -| approx_kl | 0.044929445 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | 0.613 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 73910 | -| policy_gradient_loss | -0.0164 | -| std | 0.128 | -| value_loss | 0.000951 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7393 | -| time_elapsed | 47605 | -| total_timesteps | 946304 | -| train/ | | -| approx_kl | 0.014012249 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | -0.00667 | -| n_updates | 73920 | -| policy_gradient_loss | -0.00271 | -| std | 0.128 | -| value_loss | 4.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7394 | -| time_elapsed | 47610 | -| total_timesteps | 946432 | -| train/ | | -| approx_kl | 0.018852806 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | 0.00941 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 73930 | -| policy_gradient_loss | -0.00183 | -| std | 0.128 | -| value_loss | 1.37e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7395 | -| time_elapsed | 47613 | -| total_timesteps | 946560 | -| train/ | | -| approx_kl | 0.03314099 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 0.636 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 73940 | -| policy_gradient_loss | -0.0163 | -| std | 0.128 | -| value_loss | 1.1e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7396 | -| time_elapsed | 47617 | -| total_timesteps | 946688 | -| train/ | | -| approx_kl | 2.8848182e-05 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 1.56e-05 | -| n_updates | 73950 | -| policy_gradient_loss | 0.0279 | -| std | 0.128 | -| value_loss | 7.55e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7397 | -| time_elapsed | 47621 | -| total_timesteps | 946816 | -| train/ | | -| approx_kl | 0.0014252118 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.637 | -| explained_variance | -0.0663 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 73960 | -| policy_gradient_loss | -0.00571 | -| std | 0.128 | -| value_loss | 1.32e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 19 | -| iterations | 7398 | -| time_elapsed | 47625 | -| total_timesteps | 946944 | -| train/ | | -| approx_kl | 0.01141142 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 0.638 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 73970 | -| policy_gradient_loss | -0.00312 | -| std | 0.128 | -| value_loss | 3.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7399 | -| time_elapsed | 47628 | -| total_timesteps | 947072 | -| train/ | | -| approx_kl | 0.006389647 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.639 | -| explained_variance | 0.00549 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 73980 | -| policy_gradient_loss | -0.00167 | -| std | 0.128 | -| value_loss | 1.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7400 | -| time_elapsed | 47634 | -| total_timesteps | 947200 | -| train/ | | -| approx_kl | 0.12164296 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 0.64 | -| explained_variance | 0.757 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 73990 | -| policy_gradient_loss | -0.005 | -| std | 0.128 | -| value_loss | 0.00224 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7401 | -| time_elapsed | 47637 | -| total_timesteps | 947328 | -| train/ | | -| approx_kl | 0.01077918 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.641 | -| explained_variance | -0.398 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 74000 | -| policy_gradient_loss | 0.000195 | -| std | 0.127 | -| value_loss | 1.54e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7402 | -| time_elapsed | 47641 | -| total_timesteps | 947456 | -| train/ | | -| approx_kl | 0.021615319 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 0.643 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 74010 | -| policy_gradient_loss | -0.00487 | -| std | 0.127 | -| value_loss | 1.38e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7403 | -| time_elapsed | 47645 | -| total_timesteps | 947584 | -| train/ | | -| approx_kl | 0.040992185 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | -0.0713 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 74020 | -| policy_gradient_loss | -0.0093 | -| std | 0.127 | -| value_loss | 3.97e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7404 | -| time_elapsed | 47649 | -| total_timesteps | 947712 | -| train/ | | -| approx_kl | 0.00034019444 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | -0.0867 | -| learning_rate | 0.0003 | -| loss | -0.000686 | -| n_updates | 74030 | -| policy_gradient_loss | 0.000463 | -| std | 0.127 | -| value_loss | 6.13e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7405 | -| time_elapsed | 47653 | -| total_timesteps | 947840 | -| train/ | | -| approx_kl | 0.03031415 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 74040 | -| policy_gradient_loss | -0.00484 | -| std | 0.127 | -| value_loss | 6.77e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 19 | -| iterations | 7406 | -| time_elapsed | 47657 | -| total_timesteps | 947968 | -| train/ | | -| approx_kl | 0.00086730113 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | -0.073 | -| learning_rate | 0.0003 | -| loss | -0.000334 | -| n_updates | 74050 | -| policy_gradient_loss | 0.00012 | -| std | 0.127 | -| value_loss | 6.78e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7407 | -| time_elapsed | 47662 | -| total_timesteps | 948096 | -| train/ | | -| approx_kl | 0.0034851027 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | -0.00065 | -| n_updates | 74060 | -| policy_gradient_loss | 0.00169 | -| std | 0.127 | -| value_loss | 5.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7408 | -| time_elapsed | 47669 | -| total_timesteps | 948224 | -| train/ | | -| approx_kl | 0.046970807 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | 0.811 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 74070 | -| policy_gradient_loss | -0.0127 | -| std | 0.127 | -| value_loss | 0.000767 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7409 | -| time_elapsed | 47673 | -| total_timesteps | 948352 | -| train/ | | -| approx_kl | 0.00044934172 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 0.644 | -| explained_variance | -0.656 | -| learning_rate | 0.0003 | -| loss | -0.000653 | -| n_updates | 74080 | -| policy_gradient_loss | -0.00062 | -| std | 0.127 | -| value_loss | 1.74e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7410 | -| time_elapsed | 47677 | -| total_timesteps | 948480 | -| train/ | | -| approx_kl | 0.00021952996 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.646 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | -0.000212 | -| n_updates | 74090 | -| policy_gradient_loss | 7.3e-05 | -| std | 0.127 | -| value_loss | 1.79e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7411 | -| time_elapsed | 47681 | -| total_timesteps | 948608 | -| train/ | | -| approx_kl | 0.009559924 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 0.647 | -| explained_variance | -0.00877 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 74100 | -| policy_gradient_loss | -0.00105 | -| std | 0.127 | -| value_loss | 5.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7412 | -| time_elapsed | 47684 | -| total_timesteps | 948736 | -| train/ | | -| approx_kl | 0.009106572 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.649 | -| explained_variance | -0.448 | -| learning_rate | 0.0003 | -| loss | 0.000622 | -| n_updates | 74110 | -| policy_gradient_loss | 0.000131 | -| std | 0.126 | -| value_loss | 6.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7413 | -| time_elapsed | 47687 | -| total_timesteps | 948864 | -| train/ | | -| approx_kl | 0.020015493 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.652 | -| explained_variance | 0.00547 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 74120 | -| policy_gradient_loss | -0.00649 | -| std | 0.126 | -| value_loss | 7.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 19 | -| iterations | 7414 | -| time_elapsed | 47691 | -| total_timesteps | 948992 | -| train/ | | -| approx_kl | 0.018426448 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 0.654 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.00479 | -| n_updates | 74130 | -| policy_gradient_loss | 0.00122 | -| std | 0.126 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7415 | -| time_elapsed | 47695 | -| total_timesteps | 949120 | -| train/ | | -| approx_kl | 0.004953914 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.656 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 74140 | -| policy_gradient_loss | 0.00163 | -| std | 0.125 | -| value_loss | 1.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7416 | -| time_elapsed | 47704 | -| total_timesteps | 949248 | -| train/ | | -| approx_kl | 0.13311452 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.657 | -| explained_variance | 0.774 | -| learning_rate | 0.0003 | -| loss | -0.0271 | -| n_updates | 74150 | -| policy_gradient_loss | -0.0222 | -| std | 0.125 | -| value_loss | 0.000614 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7417 | -| time_elapsed | 47706 | -| total_timesteps | 949376 | -| train/ | | -| approx_kl | 0.007907496 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 0.659 | -| explained_variance | -2.04 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 74160 | -| policy_gradient_loss | -0.000188 | -| std | 0.125 | -| value_loss | 1.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7418 | -| time_elapsed | 47710 | -| total_timesteps | 949504 | -| train/ | | -| approx_kl | 0.020452194 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 0.66 | -| explained_variance | -1.22 | -| learning_rate | 0.0003 | -| loss | 0.000544 | -| n_updates | 74170 | -| policy_gradient_loss | -0.000679 | -| std | 0.125 | -| value_loss | 8.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7419 | -| time_elapsed | 47712 | -| total_timesteps | 949632 | -| train/ | | -| approx_kl | 0.004180694 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.66 | -| explained_variance | -0.0836 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 74180 | -| policy_gradient_loss | -0.00433 | -| std | 0.125 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7420 | -| time_elapsed | 47715 | -| total_timesteps | 949760 | -| train/ | | -| approx_kl | 0.002352702 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 0.661 | -| explained_variance | 0.0149 | -| learning_rate | 0.0003 | -| loss | -0.00592 | -| n_updates | 74190 | -| policy_gradient_loss | -0.00526 | -| std | 0.125 | -| value_loss | 4.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 19 | -| iterations | 7421 | -| time_elapsed | 47718 | -| total_timesteps | 949888 | -| train/ | | -| approx_kl | 0.008353445 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.661 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.00633 | -| n_updates | 74200 | -| policy_gradient_loss | -0.00344 | -| std | 0.125 | -| value_loss | 7.96e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7422 | -| time_elapsed | 47721 | -| total_timesteps | 950016 | -| train/ | | -| approx_kl | 0.0019871504 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 0.661 | -| explained_variance | -0.00316 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 74210 | -| policy_gradient_loss | 0.000183 | -| std | 0.125 | -| value_loss | 3.13e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7423 | -| time_elapsed | 47730 | -| total_timesteps | 950144 | -| train/ | | -| approx_kl | 0.11916187 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 0.666 | -| explained_variance | 0.726 | -| learning_rate | 0.0003 | -| loss | -0.0277 | -| n_updates | 74220 | -| policy_gradient_loss | -0.0233 | -| std | 0.124 | -| value_loss | 0.00293 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7424 | -| time_elapsed | 47734 | -| total_timesteps | 950272 | -| train/ | | -| approx_kl | 0.009510545 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | 0.00592 | -| learning_rate | 0.0003 | -| loss | 0.000616 | -| n_updates | 74230 | -| policy_gradient_loss | 0.000929 | -| std | 0.124 | -| value_loss | 0.000166 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7425 | -| time_elapsed | 47738 | -| total_timesteps | 950400 | -| train/ | | -| approx_kl | 0.00045730034 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.00587 | -| learning_rate | 0.0003 | -| loss | 0.000449 | -| n_updates | 74240 | -| policy_gradient_loss | 0.000503 | -| std | 0.124 | -| value_loss | 0.0047 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7426 | -| time_elapsed | 47741 | -| total_timesteps | 950528 | -| train/ | | -| approx_kl | 0.0004514209 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.665 | -| explained_variance | 0.00501 | -| learning_rate | 0.0003 | -| loss | 0.0879 | -| n_updates | 74250 | -| policy_gradient_loss | 0.00052 | -| std | 0.125 | -| value_loss | 0.171 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7427 | -| time_elapsed | 47745 | -| total_timesteps | 950656 | -| train/ | | -| approx_kl | 0.0015007444 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.663 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 74260 | -| policy_gradient_loss | 0.00187 | -| std | 0.125 | -| value_loss | 0.00119 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7428 | -| time_elapsed | 47748 | -| total_timesteps | 950784 | -| train/ | | -| approx_kl | 0.0047990885 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.66 | -| explained_variance | 0.000444 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 74270 | -| policy_gradient_loss | 0.000109 | -| std | 0.125 | -| value_loss | 0.00159 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 19 | -| iterations | 7429 | -| time_elapsed | 47750 | -| total_timesteps | 950912 | -| train/ | | -| approx_kl | 0.00769164 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.66 | -| explained_variance | -0.00409 | -| learning_rate | 0.0003 | -| loss | 0.000225 | -| n_updates | 74280 | -| policy_gradient_loss | 0.00408 | -| std | 0.125 | -| value_loss | 0.00117 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7430 | -| time_elapsed | 47753 | -| total_timesteps | 951040 | -| train/ | | -| approx_kl | 0.010826753 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 0.66 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 74290 | -| policy_gradient_loss | 0.00654 | -| std | 0.125 | -| value_loss | 0.000663 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7431 | -| time_elapsed | 47760 | -| total_timesteps | 951168 | -| train/ | | -| approx_kl | 0.024717601 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 0.66 | -| explained_variance | 0.224 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 74300 | -| policy_gradient_loss | -0.0061 | -| std | 0.125 | -| value_loss | 0.0143 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7432 | -| time_elapsed | 47763 | -| total_timesteps | 951296 | -| train/ | | -| approx_kl | 0.026902325 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 0.661 | -| explained_variance | 0.0606 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 74310 | -| policy_gradient_loss | -0.00225 | -| std | 0.125 | -| value_loss | 0.000298 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7433 | -| time_elapsed | 47767 | -| total_timesteps | 951424 | -| train/ | | -| approx_kl | 0.011869242 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.662 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.000187 | -| n_updates | 74320 | -| policy_gradient_loss | 0.000759 | -| std | 0.125 | -| value_loss | 0.00035 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7434 | -| time_elapsed | 47770 | -| total_timesteps | 951552 | -| train/ | | -| approx_kl | 0.019824015 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 0.662 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 74330 | -| policy_gradient_loss | -0.0144 | -| std | 0.125 | -| value_loss | 0.000124 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7435 | -| time_elapsed | 47774 | -| total_timesteps | 951680 | -| train/ | | -| approx_kl | 1.8471386e-05 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.663 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.000208 | -| n_updates | 74340 | -| policy_gradient_loss | 0.00155 | -| std | 0.124 | -| value_loss | 0.00023 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7436 | -| time_elapsed | 47778 | -| total_timesteps | 951808 | -| train/ | | -| approx_kl | 0.0047159474 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.666 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 74350 | -| policy_gradient_loss | -0.00213 | -| std | 0.124 | -| value_loss | 0.000866 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7437 | -| time_elapsed | 47783 | -| total_timesteps | 951936 | -| train/ | | -| approx_kl | 0.02753859 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | 0.00662 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 74360 | -| policy_gradient_loss | -0.00213 | -| std | 0.124 | -| value_loss | 0.000317 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7438 | -| time_elapsed | 47787 | -| total_timesteps | 952064 | -| train/ | | -| approx_kl | 0.04367365 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 0.669 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 74370 | -| policy_gradient_loss | -0.00799 | -| std | 0.124 | -| value_loss | 2.47e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7439 | -| time_elapsed | 47792 | -| total_timesteps | 952192 | -| train/ | | -| approx_kl | 0.019663148 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.669 | -| explained_variance | 0.42 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 74380 | -| policy_gradient_loss | -0.0166 | -| std | 0.124 | -| value_loss | 0.00603 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7440 | -| time_elapsed | 47796 | -| total_timesteps | 952320 | -| train/ | | -| approx_kl | 0.011942575 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 74390 | -| policy_gradient_loss | -0.000158 | -| std | 0.124 | -| value_loss | 1.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7441 | -| time_elapsed | 47800 | -| total_timesteps | 952448 | -| train/ | | -| approx_kl | 0.019777555 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 74400 | -| policy_gradient_loss | -0.00192 | -| std | 0.124 | -| value_loss | 5.9e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7442 | -| time_elapsed | 47804 | -| total_timesteps | 952576 | -| train/ | | -| approx_kl | 0.0066382056 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0848 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 74410 | -| policy_gradient_loss | -0.0019 | -| std | 0.124 | -| value_loss | 3.15e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7443 | -| time_elapsed | 47809 | -| total_timesteps | 952704 | -| train/ | | -| approx_kl | 0.020678382 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 74420 | -| policy_gradient_loss | -0.0104 | -| std | 0.124 | -| value_loss | 2.19e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7444 | -| time_elapsed | 47812 | -| total_timesteps | 952832 | -| train/ | | -| approx_kl | 0.0065308777 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 74430 | -| policy_gradient_loss | -0.00377 | -| std | 0.124 | -| value_loss | 1.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 19 | -| iterations | 7445 | -| time_elapsed | 47816 | -| total_timesteps | 952960 | -| train/ | | -| approx_kl | 0.013098193 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 74440 | -| policy_gradient_loss | -0.00101 | -| std | 0.124 | -| value_loss | 1.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7446 | -| time_elapsed | 47820 | -| total_timesteps | 953088 | -| train/ | | -| approx_kl | 0.02064791 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 74450 | -| policy_gradient_loss | -0.00175 | -| std | 0.124 | -| value_loss | 7.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7447 | -| time_elapsed | 47827 | -| total_timesteps | 953216 | -| train/ | | -| approx_kl | 0.018951233 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | 0.74 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 74460 | -| policy_gradient_loss | -0.0151 | -| std | 0.124 | -| value_loss | 0.000747 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7448 | -| time_elapsed | 47831 | -| total_timesteps | 953344 | -| train/ | | -| approx_kl | 0.019635797 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | 0.00174 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 74470 | -| policy_gradient_loss | 0.00326 | -| std | 0.124 | -| value_loss | 2.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7449 | -| time_elapsed | 47835 | -| total_timesteps | 953472 | -| train/ | | -| approx_kl | 0.020750672 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 74480 | -| policy_gradient_loss | -0.00127 | -| std | 0.124 | -| value_loss | 7.29e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7450 | -| time_elapsed | 47839 | -| total_timesteps | 953600 | -| train/ | | -| approx_kl | 0.00030946452 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 74490 | -| policy_gradient_loss | -0.000906 | -| std | 0.124 | -| value_loss | 5e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7451 | -| time_elapsed | 47843 | -| total_timesteps | 953728 | -| train/ | | -| approx_kl | 0.0026323204 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | -0.00555 | -| n_updates | 74500 | -| policy_gradient_loss | -0.00406 | -| std | 0.124 | -| value_loss | 3.47e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7452 | -| time_elapsed | 47847 | -| total_timesteps | 953856 | -| train/ | | -| approx_kl | 0.001046218 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 74510 | -| policy_gradient_loss | -0.00187 | -| std | 0.124 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7453 | -| time_elapsed | 47851 | -| total_timesteps | 953984 | -| train/ | | -| approx_kl | 0.016153641 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 74520 | -| policy_gradient_loss | -0.00662 | -| std | 0.124 | -| value_loss | 1.2e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7454 | -| time_elapsed | 47855 | -| total_timesteps | 954112 | -| train/ | | -| approx_kl | 0.00010712398 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.666 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | -0.00012 | -| n_updates | 74530 | -| policy_gradient_loss | 0.00283 | -| std | 0.124 | -| value_loss | 3.57e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7455 | -| time_elapsed | 47864 | -| total_timesteps | 954240 | -| train/ | | -| approx_kl | 0.034040816 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | 0.673 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 74540 | -| policy_gradient_loss | -0.0168 | -| std | 0.124 | -| value_loss | 0.00132 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7456 | -| time_elapsed | 47867 | -| total_timesteps | 954368 | -| train/ | | -| approx_kl | 0.02593403 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.668 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | 0.0035 | -| n_updates | 74550 | -| policy_gradient_loss | 6.04e-05 | -| std | 0.124 | -| value_loss | 1.5e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7457 | -| time_elapsed | 47870 | -| total_timesteps | 954496 | -| train/ | | -| approx_kl | 0.0014601266 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | 0.669 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.000124 | -| n_updates | 74560 | -| policy_gradient_loss | -8.66e-05 | -| std | 0.124 | -| value_loss | 2.99e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7458 | -| time_elapsed | 47873 | -| total_timesteps | 954624 | -| train/ | | -| approx_kl | 0.01842777 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 74570 | -| policy_gradient_loss | -0.00936 | -| std | 0.124 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7459 | -| time_elapsed | 47875 | -| total_timesteps | 954752 | -| train/ | | -| approx_kl | 0.02776964 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.00701 | -| n_updates | 74580 | -| policy_gradient_loss | 2.06e-05 | -| std | 0.124 | -| value_loss | 1.42e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7460 | -| time_elapsed | 47879 | -| total_timesteps | 954880 | -| train/ | | -| approx_kl | 0.013884524 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 74590 | -| policy_gradient_loss | 0.00389 | -| std | 0.124 | -| value_loss | 9.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7461 | -| time_elapsed | 47883 | -| total_timesteps | 955008 | -| train/ | | -| approx_kl | 0.023584733 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.000866 | -| n_updates | 74600 | -| policy_gradient_loss | -0.00092 | -| std | 0.124 | -| value_loss | 5.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7462 | -| time_elapsed | 47893 | -| total_timesteps | 955136 | -| train/ | | -| approx_kl | 0.03940525 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | 0.657 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 74610 | -| policy_gradient_loss | -0.00924 | -| std | 0.124 | -| value_loss | 0.00158 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7463 | -| time_elapsed | 47895 | -| total_timesteps | 955264 | -| train/ | | -| approx_kl | 0.0017159511 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | 0.102 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 74620 | -| policy_gradient_loss | -0.000419 | -| std | 0.124 | -| value_loss | 2.41e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7464 | -| time_elapsed | 47899 | -| total_timesteps | 955392 | -| train/ | | -| approx_kl | 0.009939266 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.397 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 74630 | -| policy_gradient_loss | 0.00202 | -| std | 0.124 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7465 | -| time_elapsed | 47902 | -| total_timesteps | 955520 | -| train/ | | -| approx_kl | 0.016405374 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 74640 | -| policy_gradient_loss | -0.000447 | -| std | 0.124 | -| value_loss | 6.55e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7466 | -| time_elapsed | 47904 | -| total_timesteps | 955648 | -| train/ | | -| approx_kl | 0.03758059 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 74650 | -| policy_gradient_loss | -0.0103 | -| std | 0.124 | -| value_loss | 4.47e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7467 | -| time_elapsed | 47908 | -| total_timesteps | 955776 | -| train/ | | -| approx_kl | 0.009393204 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 74660 | -| policy_gradient_loss | -0.00901 | -| std | 0.124 | -| value_loss | 2.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 19 | -| iterations | 7468 | -| time_elapsed | 47911 | -| total_timesteps | 955904 | -| train/ | | -| approx_kl | 0.018878162 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.000896 | -| n_updates | 74670 | -| policy_gradient_loss | -0.000439 | -| std | 0.123 | -| value_loss | 2.7e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7469 | -| time_elapsed | 47915 | -| total_timesteps | 956032 | -| train/ | | -| approx_kl | 0.0110478755 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | -0.00704 | -| n_updates | 74680 | -| policy_gradient_loss | -0.00426 | -| std | 0.123 | -| value_loss | 1.37e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7470 | -| time_elapsed | 47922 | -| total_timesteps | 956160 | -| train/ | | -| approx_kl | 0.019720593 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | 0.739 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 74690 | -| policy_gradient_loss | -0.00805 | -| std | 0.123 | -| value_loss | 0.000939 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7471 | -| time_elapsed | 47926 | -| total_timesteps | 956288 | -| train/ | | -| approx_kl | 0.020297198 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 74700 | -| policy_gradient_loss | 0.00041 | -| std | 0.123 | -| value_loss | 2.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7472 | -| time_elapsed | 47929 | -| total_timesteps | 956416 | -| train/ | | -| approx_kl | 0.010456696 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 74710 | -| policy_gradient_loss | -0.00112 | -| std | 0.123 | -| value_loss | 1.16e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7473 | -| time_elapsed | 47932 | -| total_timesteps | 956544 | -| train/ | | -| approx_kl | 0.0031698276 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 74720 | -| policy_gradient_loss | 0.00691 | -| std | 0.123 | -| value_loss | 4.94e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7474 | -| time_elapsed | 47935 | -| total_timesteps | 956672 | -| train/ | | -| approx_kl | 0.02673927 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | -0.004 | -| n_updates | 74730 | -| policy_gradient_loss | -0.00504 | -| std | 0.123 | -| value_loss | 5.29e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7475 | -| time_elapsed | 47938 | -| total_timesteps | 956800 | -| train/ | | -| approx_kl | 0.01878454 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 74740 | -| policy_gradient_loss | -0.00298 | -| std | 0.123 | -| value_loss | 1.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7476 | -| time_elapsed | 47943 | -| total_timesteps | 956928 | -| train/ | | -| approx_kl | 0.020614643 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 74750 | -| policy_gradient_loss | -0.0023 | -| std | 0.123 | -| value_loss | 1.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7477 | -| time_elapsed | 47946 | -| total_timesteps | 957056 | -| train/ | | -| approx_kl | 0.0036028698 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 74760 | -| policy_gradient_loss | -0.000875 | -| std | 0.123 | -| value_loss | 9.61e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7478 | -| time_elapsed | 47951 | -| total_timesteps | 957184 | -| train/ | | -| approx_kl | 0.025030335 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | 0.387 | -| learning_rate | 0.0003 | -| loss | 0.000693 | -| n_updates | 74770 | -| policy_gradient_loss | -0.00457 | -| std | 0.123 | -| value_loss | 0.0125 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7479 | -| time_elapsed | 47955 | -| total_timesteps | 957312 | -| train/ | | -| approx_kl | 0.014953697 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.00965 | -| n_updates | 74780 | -| policy_gradient_loss | -0.00615 | -| std | 0.123 | -| value_loss | 1.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7480 | -| time_elapsed | 47957 | -| total_timesteps | 957440 | -| train/ | | -| approx_kl | 0.029734256 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 74790 | -| policy_gradient_loss | -0.00639 | -| std | 0.123 | -| value_loss | 5.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7481 | -| time_elapsed | 47960 | -| total_timesteps | 957568 | -| train/ | | -| approx_kl | 0.008858232 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 74800 | -| policy_gradient_loss | 0.00444 | -| std | 0.123 | -| value_loss | 6e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7482 | -| time_elapsed | 47962 | -| total_timesteps | 957696 | -| train/ | | -| approx_kl | 0.0075227604 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.000179 | -| n_updates | 74810 | -| policy_gradient_loss | -6.94e-05 | -| std | 0.123 | -| value_loss | 1.01e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7483 | -| time_elapsed | 47965 | -| total_timesteps | 957824 | -| train/ | | -| approx_kl | 0.024532922 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.00899 | -| learning_rate | 0.0003 | -| loss | 0.00347 | -| n_updates | 74820 | -| policy_gradient_loss | 0.000249 | -| std | 0.123 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 19 | -| iterations | 7484 | -| time_elapsed | 47967 | -| total_timesteps | 957952 | -| train/ | | -| approx_kl | 0.025811294 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | -0.00486 | -| n_updates | 74830 | -| policy_gradient_loss | -0.00521 | -| std | 0.123 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7485 | -| time_elapsed | 47970 | -| total_timesteps | 958080 | -| train/ | | -| approx_kl | 0.019767385 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 74840 | -| policy_gradient_loss | -0.0023 | -| std | 0.123 | -| value_loss | 3.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7486 | -| time_elapsed | 47974 | -| total_timesteps | 958208 | -| train/ | | -| approx_kl | 0.10559572 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.00886 | -| n_updates | 74850 | -| policy_gradient_loss | 0.00155 | -| std | 0.123 | -| value_loss | 0.000137 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7487 | -| time_elapsed | 47976 | -| total_timesteps | 958336 | -| train/ | | -| approx_kl | 0.023674957 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | -1.21 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 74860 | -| policy_gradient_loss | -0.00375 | -| std | 0.123 | -| value_loss | 7.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7488 | -| time_elapsed | 47980 | -| total_timesteps | 958464 | -| train/ | | -| approx_kl | 0.01375404 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 0.674 | -| explained_variance | -1.92 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 74870 | -| policy_gradient_loss | -0.00179 | -| std | 0.123 | -| value_loss | 4.78e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7489 | -| time_elapsed | 47983 | -| total_timesteps | 958592 | -| train/ | | -| approx_kl | 0.0027397615 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | -0.476 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 74880 | -| policy_gradient_loss | 0.000143 | -| std | 0.123 | -| value_loss | 1.21e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7490 | -| time_elapsed | 47987 | -| total_timesteps | 958720 | -| train/ | | -| approx_kl | 0.0075183245 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 74890 | -| policy_gradient_loss | -0.0125 | -| std | 0.123 | -| value_loss | 1.46e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7491 | -| time_elapsed | 47990 | -| total_timesteps | 958848 | -| train/ | | -| approx_kl | 0.0005202913 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | 0.00868 | -| learning_rate | 0.0003 | -| loss | -0.00028 | -| n_updates | 74900 | -| policy_gradient_loss | 0.00035 | -| std | 0.123 | -| value_loss | 8.38e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7492 | -| time_elapsed | 47992 | -| total_timesteps | 958976 | -| train/ | | -| approx_kl | 0.0046238755 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | 0.00165 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 74910 | -| policy_gradient_loss | -0.000881 | -| std | 0.124 | -| value_loss | 1.89e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7493 | -| time_elapsed | 47995 | -| total_timesteps | 959104 | -| train/ | | -| approx_kl | 0.0031001582 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.00528 | -| learning_rate | 0.0003 | -| loss | -0.00704 | -| n_updates | 74920 | -| policy_gradient_loss | -0.00488 | -| std | 0.124 | -| value_loss | 5.14e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7494 | -| time_elapsed | 48004 | -| total_timesteps | 959232 | -| train/ | | -| approx_kl | 0.04321816 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | -0.0294 | -| n_updates | 74930 | -| policy_gradient_loss | -0.0222 | -| std | 0.124 | -| value_loss | 0.000136 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7495 | -| time_elapsed | 48007 | -| total_timesteps | 959360 | -| train/ | | -| approx_kl | 0.022848183 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 74940 | -| policy_gradient_loss | -0.00551 | -| std | 0.124 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7496 | -| time_elapsed | 48011 | -| total_timesteps | 959488 | -| train/ | | -| approx_kl | 0.0007250793 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.000531 | -| n_updates | 74950 | -| policy_gradient_loss | -2.29e-05 | -| std | 0.124 | -| value_loss | 1.09e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7497 | -| time_elapsed | 48013 | -| total_timesteps | 959616 | -| train/ | | -| approx_kl | 0.0033418587 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | 0.00988 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 74960 | -| policy_gradient_loss | 0.00184 | -| std | 0.123 | -| value_loss | 4.19e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7498 | -| time_elapsed | 48016 | -| total_timesteps | 959744 | -| train/ | | -| approx_kl | 0.030843515 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | 0.00762 | -| learning_rate | 0.0003 | -| loss | 0.00369 | -| n_updates | 74970 | -| policy_gradient_loss | -0.00178 | -| std | 0.123 | -| value_loss | 6.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7499 | -| time_elapsed | 48020 | -| total_timesteps | 959872 | -| train/ | | -| approx_kl | 0.004879737 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | -0.00907 | -| n_updates | 74980 | -| policy_gradient_loss | -0.0069 | -| std | 0.123 | -| value_loss | 3.63e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7500 | -| time_elapsed | 48023 | -| total_timesteps | 960000 | -| train/ | | -| approx_kl | 0.0048844083 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 74990 | -| policy_gradient_loss | -0.000588 | -| std | 0.123 | -| value_loss | 3.63e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7501 | -| time_elapsed | 48027 | -| total_timesteps | 960128 | -| train/ | | -| approx_kl | 0.036773726 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | 0.00402 | -| learning_rate | 0.0003 | -| loss | -0.00973 | -| n_updates | 75000 | -| policy_gradient_loss | -0.00749 | -| std | 0.123 | -| value_loss | 2.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7502 | -| time_elapsed | 48035 | -| total_timesteps | 960256 | -| train/ | | -| approx_kl | 0.016733553 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.679 | -| explained_variance | 0.568 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 75010 | -| policy_gradient_loss | -0.0153 | -| std | 0.123 | -| value_loss | 0.00384 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7503 | -| time_elapsed | 48040 | -| total_timesteps | 960384 | -| train/ | | -| approx_kl | 0.051965084 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 0.679 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.00836 | -| n_updates | 75020 | -| policy_gradient_loss | -0.00911 | -| std | 0.123 | -| value_loss | 5.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7504 | -| time_elapsed | 48043 | -| total_timesteps | 960512 | -| train/ | | -| approx_kl | 0.021453116 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -50.7 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 75030 | -| policy_gradient_loss | -0.00176 | -| std | 0.123 | -| value_loss | 3.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7505 | -| time_elapsed | 48047 | -| total_timesteps | 960640 | -| train/ | | -| approx_kl | 0.04233446 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 75040 | -| policy_gradient_loss | -0.00476 | -| std | 0.123 | -| value_loss | 5.97e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7506 | -| time_elapsed | 48051 | -| total_timesteps | 960768 | -| train/ | | -| approx_kl | 0.05013988 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -2.45 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 75050 | -| policy_gradient_loss | -0.00643 | -| std | 0.123 | -| value_loss | 8.1e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7507 | -| time_elapsed | 48054 | -| total_timesteps | 960896 | -| train/ | | -| approx_kl | 0.023977978 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | -0.679 | -| learning_rate | 0.0003 | -| loss | -9.45e-05 | -| n_updates | 75060 | -| policy_gradient_loss | -0.0014 | -| std | 0.123 | -| value_loss | 4.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7508 | -| time_elapsed | 48058 | -| total_timesteps | 961024 | -| train/ | | -| approx_kl | 0.0022472492 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | -0.00015 | -| n_updates | 75070 | -| policy_gradient_loss | -0.000109 | -| std | 0.123 | -| value_loss | 7.31e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7509 | -| time_elapsed | 48066 | -| total_timesteps | 961152 | -| train/ | | -| approx_kl | 0.011836227 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.675 | -| explained_variance | 0.472 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 75080 | -| policy_gradient_loss | -0.00169 | -| std | 0.123 | -| value_loss | 0.00859 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7510 | -| time_elapsed | 48071 | -| total_timesteps | 961280 | -| train/ | | -| approx_kl | 0.024911173 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | -0.000927 | -| n_updates | 75090 | -| policy_gradient_loss | -0.000657 | -| std | 0.123 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7511 | -| time_elapsed | 48075 | -| total_timesteps | 961408 | -| train/ | | -| approx_kl | 0.021188483 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -106 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 75100 | -| policy_gradient_loss | -0.0065 | -| std | 0.123 | -| value_loss | 1.58e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 19 | -| iterations | 7512 | -| time_elapsed | 48079 | -| total_timesteps | 961536 | -| train/ | | -| approx_kl | 0.13611317 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -31 | -| learning_rate | 0.0003 | -| loss | 0.0028 | -| n_updates | 75110 | -| policy_gradient_loss | -0.00289 | -| std | 0.123 | -| value_loss | 2.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7513 | -| time_elapsed | 48082 | -| total_timesteps | 961664 | -| train/ | | -| approx_kl | 0.023104228 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -5.27 | -| learning_rate | 0.0003 | -| loss | -0.000248 | -| n_updates | 75120 | -| policy_gradient_loss | -0.000303 | -| std | 0.123 | -| value_loss | 3.07e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7514 | -| time_elapsed | 48085 | -| total_timesteps | 961792 | -| train/ | | -| approx_kl | 0.00504682 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 75130 | -| policy_gradient_loss | -0.000787 | -| std | 0.123 | -| value_loss | 1.31e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7515 | -| time_elapsed | 48088 | -| total_timesteps | 961920 | -| train/ | | -| approx_kl | 0.021667652 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.441 | -| learning_rate | 0.0003 | -| loss | -0.00773 | -| n_updates | 75140 | -| policy_gradient_loss | -0.00353 | -| std | 0.123 | -| value_loss | 2.75e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7516 | -| time_elapsed | 48091 | -| total_timesteps | 962048 | -| train/ | | -| approx_kl | 0.00079280324 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.000276 | -| n_updates | 75150 | -| policy_gradient_loss | 0.00291 | -| std | 0.123 | -| value_loss | 1.45e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7517 | -| time_elapsed | 48097 | -| total_timesteps | 962176 | -| train/ | | -| approx_kl | 0.089641735 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | 0.579 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 75160 | -| policy_gradient_loss | -0.0196 | -| std | 0.123 | -| value_loss | 0.00589 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7518 | -| time_elapsed | 48101 | -| total_timesteps | 962304 | -| train/ | | -| approx_kl | 0.0058128447 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -220 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 75170 | -| policy_gradient_loss | -0.000701 | -| std | 0.123 | -| value_loss | 5.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7519 | -| time_elapsed | 48104 | -| total_timesteps | 962432 | -| train/ | | -| approx_kl | 0.049364567 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -371 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 75180 | -| policy_gradient_loss | -0.00177 | -| std | 0.123 | -| value_loss | 4.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7520 | -| time_elapsed | 48107 | -| total_timesteps | 962560 | -| train/ | | -| approx_kl | 0.03136623 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 0.674 | -| explained_variance | -38 | -| learning_rate | 0.0003 | -| loss | 0.000834 | -| n_updates | 75190 | -| policy_gradient_loss | -0.000954 | -| std | 0.123 | -| value_loss | 8.8e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7521 | -| time_elapsed | 48110 | -| total_timesteps | 962688 | -| train/ | | -| approx_kl | 0.09928273 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 0.674 | -| explained_variance | -237 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 75200 | -| policy_gradient_loss | -0.00594 | -| std | 0.123 | -| value_loss | 1.61e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7522 | -| time_elapsed | 48112 | -| total_timesteps | 962816 | -| train/ | | -| approx_kl | 0.06221932 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 75210 | -| policy_gradient_loss | -0.0042 | -| std | 0.124 | -| value_loss | 3.93e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7523 | -| time_elapsed | 48115 | -| total_timesteps | 962944 | -| train/ | | -| approx_kl | 0.006056792 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -60.6 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 75220 | -| policy_gradient_loss | -0.00246 | -| std | 0.124 | -| value_loss | 5.7e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7524 | -| time_elapsed | 48118 | -| total_timesteps | 963072 | -| train/ | | -| approx_kl | 0.039038718 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | -5.15 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 75230 | -| policy_gradient_loss | -0.0112 | -| std | 0.123 | -| value_loss | 4.17e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7525 | -| time_elapsed | 48124 | -| total_timesteps | 963200 | -| train/ | | -| approx_kl | 0.027008567 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.0323 | -| n_updates | 75240 | -| policy_gradient_loss | -0.0218 | -| std | 0.123 | -| value_loss | 0.000418 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7526 | -| time_elapsed | 48128 | -| total_timesteps | 963328 | -| train/ | | -| approx_kl | 0.04429645 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 0.674 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 75250 | -| policy_gradient_loss | -0.00635 | -| std | 0.123 | -| value_loss | 7.14e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7527 | -| time_elapsed | 48132 | -| total_timesteps | 963456 | -| train/ | | -| approx_kl | 0.0045073405 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 75260 | -| policy_gradient_loss | -0.00394 | -| std | 0.123 | -| value_loss | 5.62e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7528 | -| time_elapsed | 48135 | -| total_timesteps | 963584 | -| train/ | | -| approx_kl | 0.0024621538 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.612 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 75270 | -| policy_gradient_loss | -0.00116 | -| std | 0.124 | -| value_loss | 3.46e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7529 | -| time_elapsed | 48139 | -| total_timesteps | 963712 | -| train/ | | -| approx_kl | 0.008402281 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.000499 | -| n_updates | 75280 | -| policy_gradient_loss | 0.00182 | -| std | 0.123 | -| value_loss | 6.62e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7530 | -| time_elapsed | 48144 | -| total_timesteps | 963840 | -| train/ | | -| approx_kl | 0.001630927 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 0.674 | -| explained_variance | -0.711 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 75290 | -| policy_gradient_loss | 0.00154 | -| std | 0.123 | -| value_loss | 3.11e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 20 | -| iterations | 7531 | -| time_elapsed | 48148 | -| total_timesteps | 963968 | -| train/ | | -| approx_kl | 0.016197229 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.0009 | -| n_updates | 75300 | -| policy_gradient_loss | -1.4e-06 | -| std | 0.123 | -| value_loss | 8.78e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7532 | -| time_elapsed | 48151 | -| total_timesteps | 964096 | -| train/ | | -| approx_kl | 0.024736036 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.00333 | -| learning_rate | 0.0003 | -| loss | 0.00382 | -| n_updates | 75310 | -| policy_gradient_loss | 6.91e-05 | -| std | 0.123 | -| value_loss | 1.08e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7533 | -| time_elapsed | 48159 | -| total_timesteps | 964224 | -| train/ | | -| approx_kl | 0.08260434 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | -0.0303 | -| n_updates | 75320 | -| policy_gradient_loss | -0.0212 | -| std | 0.123 | -| value_loss | 0.000324 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7534 | -| time_elapsed | 48164 | -| total_timesteps | 964352 | -| train/ | | -| approx_kl | 0.027675305 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.00673 | -| n_updates | 75330 | -| policy_gradient_loss | 0.000559 | -| std | 0.123 | -| value_loss | 3.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7535 | -| time_elapsed | 48166 | -| total_timesteps | 964480 | -| train/ | | -| approx_kl | 0.009586648 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.641 | -| learning_rate | 0.0003 | -| loss | 0.000134 | -| n_updates | 75340 | -| policy_gradient_loss | 0.00199 | -| std | 0.123 | -| value_loss | 2.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7536 | -| time_elapsed | 48170 | -| total_timesteps | 964608 | -| train/ | | -| approx_kl | 0.043044288 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.615 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 75350 | -| policy_gradient_loss | -0.00831 | -| std | 0.123 | -| value_loss | 3.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7537 | -| time_elapsed | 48173 | -| total_timesteps | 964736 | -| train/ | | -| approx_kl | 0.034374185 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.096 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 75360 | -| policy_gradient_loss | -0.0102 | -| std | 0.123 | -| value_loss | 1.98e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7538 | -| time_elapsed | 48177 | -| total_timesteps | 964864 | -| train/ | | -| approx_kl | 0.0019947174 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 75370 | -| policy_gradient_loss | 0.000455 | -| std | 0.123 | -| value_loss | 1.7e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7539 | -| time_elapsed | 48179 | -| total_timesteps | 964992 | -| train/ | | -| approx_kl | 0.028210197 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 75380 | -| policy_gradient_loss | -0.00542 | -| std | 0.124 | -| value_loss | 1.08e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7540 | -| time_elapsed | 48182 | -| total_timesteps | 965120 | -| train/ | | -| approx_kl | 0.0027838736 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | 0.00432 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 75390 | -| policy_gradient_loss | -0.00203 | -| std | 0.124 | -| value_loss | 1.12e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7541 | -| time_elapsed | 48191 | -| total_timesteps | 965248 | -| train/ | | -| approx_kl | 0.046972238 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 75400 | -| policy_gradient_loss | -0.0155 | -| std | 0.124 | -| value_loss | 0.001 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7542 | -| time_elapsed | 48195 | -| total_timesteps | 965376 | -| train/ | | -| approx_kl | 0.0041500265 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | -0.532 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 75410 | -| policy_gradient_loss | -0.000681 | -| std | 0.124 | -| value_loss | 1.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7543 | -| time_elapsed | 48198 | -| total_timesteps | 965504 | -| train/ | | -| approx_kl | 0.0028332002 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.416 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 75420 | -| policy_gradient_loss | -0.00101 | -| std | 0.124 | -| value_loss | 8.62e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7544 | -| time_elapsed | 48200 | -| total_timesteps | 965632 | -| train/ | | -| approx_kl | 0.04409646 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 75430 | -| policy_gradient_loss | -0.0157 | -| std | 0.124 | -| value_loss | 1.47e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7545 | -| time_elapsed | 48202 | -| total_timesteps | 965760 | -| train/ | | -| approx_kl | 0.0031252592 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00746 | -| n_updates | 75440 | -| policy_gradient_loss | -0.00413 | -| std | 0.124 | -| value_loss | 7.06e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7546 | -| time_elapsed | 48205 | -| total_timesteps | 965888 | -| train/ | | -| approx_kl | 0.013720102 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | -0.00076 | -| n_updates | 75450 | -| policy_gradient_loss | -0.000427 | -| std | 0.124 | -| value_loss | 5.1e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7547 | -| time_elapsed | 48209 | -| total_timesteps | 966016 | -| train/ | | -| approx_kl | 0.05471215 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 0.671 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 75460 | -| policy_gradient_loss | -0.0109 | -| std | 0.124 | -| value_loss | 4.73e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7548 | -| time_elapsed | 48216 | -| total_timesteps | 966144 | -| train/ | | -| approx_kl | 0.040714577 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 75470 | -| policy_gradient_loss | -0.00971 | -| std | 0.124 | -| value_loss | 0.000964 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7549 | -| time_elapsed | 48220 | -| total_timesteps | 966272 | -| train/ | | -| approx_kl | 0.04442468 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 0.673 | -| explained_variance | -0.536 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 75480 | -| policy_gradient_loss | -0.0176 | -| std | 0.123 | -| value_loss | 2.35e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7550 | -| time_elapsed | 48224 | -| total_timesteps | 966400 | -| train/ | | -| approx_kl | 6.1889645e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 75490 | -| policy_gradient_loss | -0.00111 | -| std | 0.122 | -| value_loss | 4.1e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7551 | -| time_elapsed | 48227 | -| total_timesteps | 966528 | -| train/ | | -| approx_kl | 0.0011939988 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 0.685 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.00095 | -| n_updates | 75500 | -| policy_gradient_loss | -0.000609 | -| std | 0.122 | -| value_loss | 4.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7552 | -| time_elapsed | 48230 | -| total_timesteps | 966656 | -| train/ | | -| approx_kl | 0.0063537587 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.69 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.00465 | -| n_updates | 75510 | -| policy_gradient_loss | 0.000692 | -| std | 0.121 | -| value_loss | 6.16e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7553 | -| time_elapsed | 48233 | -| total_timesteps | 966784 | -| train/ | | -| approx_kl | 0.02852873 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.691 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 75520 | -| policy_gradient_loss | -0.00162 | -| std | 0.121 | -| value_loss | 1.97e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 20 | -| iterations | 7554 | -| time_elapsed | 48236 | -| total_timesteps | 966912 | -| train/ | | -| approx_kl | 0.009384988 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.692 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 75530 | -| policy_gradient_loss | -0.000528 | -| std | 0.121 | -| value_loss | 1.58e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7555 | -| time_elapsed | 48240 | -| total_timesteps | 967040 | -| train/ | | -| approx_kl | 0.020996826 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 0.692 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 75540 | -| policy_gradient_loss | -0.0068 | -| std | 0.121 | -| value_loss | 1.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7556 | -| time_elapsed | 48247 | -| total_timesteps | 967168 | -| train/ | | -| approx_kl | 0.024886096 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.692 | -| explained_variance | 0.707 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 75550 | -| policy_gradient_loss | -0.0148 | -| std | 0.121 | -| value_loss | 0.00315 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7557 | -| time_elapsed | 48252 | -| total_timesteps | 967296 | -| train/ | | -| approx_kl | 0.005783385 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.691 | -| explained_variance | -15 | -| learning_rate | 0.0003 | -| loss | -0.000564 | -| n_updates | 75560 | -| policy_gradient_loss | 0.00124 | -| std | 0.121 | -| value_loss | 4.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7558 | -| time_elapsed | 48255 | -| total_timesteps | 967424 | -| train/ | | -| approx_kl | 0.027132723 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.69 | -| explained_variance | -63.2 | -| learning_rate | 0.0003 | -| loss | -0.00642 | -| n_updates | 75570 | -| policy_gradient_loss | -0.000855 | -| std | 0.121 | -| value_loss | 3.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7559 | -| time_elapsed | 48259 | -| total_timesteps | 967552 | -| train/ | | -| approx_kl | 0.094449036 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 0.69 | -| explained_variance | -9.92 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 75580 | -| policy_gradient_loss | -0.00504 | -| std | 0.121 | -| value_loss | 7.43e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7560 | -| time_elapsed | 48263 | -| total_timesteps | 967680 | -| train/ | | -| approx_kl | 0.004682281 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 0.689 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 75590 | -| policy_gradient_loss | -0.00145 | -| std | 0.122 | -| value_loss | 2.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7561 | -| time_elapsed | 48266 | -| total_timesteps | 967808 | -| train/ | | -| approx_kl | 0.034659717 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 0.687 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 75600 | -| policy_gradient_loss | -0.00109 | -| std | 0.122 | -| value_loss | 4.68e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7562 | -| time_elapsed | 48270 | -| total_timesteps | 967936 | -| train/ | | -| approx_kl | 0.0011582565 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.686 | -| explained_variance | -0.00504 | -| learning_rate | 0.0003 | -| loss | -0.000878 | -| n_updates | 75610 | -| policy_gradient_loss | -7.45e-05 | -| std | 0.122 | -| value_loss | 9.59e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7563 | -| time_elapsed | 48274 | -| total_timesteps | 968064 | -| train/ | | -| approx_kl | 0.01405092 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.684 | -| explained_variance | 0.00199 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 75620 | -| policy_gradient_loss | -0.000919 | -| std | 0.122 | -| value_loss | 5.54e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7564 | -| time_elapsed | 48279 | -| total_timesteps | 968192 | -| train/ | | -| approx_kl | 0.028479427 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.683 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 75630 | -| policy_gradient_loss | -0.017 | -| std | 0.122 | -| value_loss | 0.00122 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7565 | -| time_elapsed | 48282 | -| total_timesteps | 968320 | -| train/ | | -| approx_kl | 0.012742775 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 0.684 | -| explained_variance | -5.51 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 75640 | -| policy_gradient_loss | -0.00122 | -| std | 0.122 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7566 | -| time_elapsed | 48285 | -| total_timesteps | 968448 | -| train/ | | -| approx_kl | 0.043363918 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 0.684 | -| explained_variance | -7.11 | -| learning_rate | 0.0003 | -| loss | -0.00846 | -| n_updates | 75650 | -| policy_gradient_loss | -0.00331 | -| std | 0.122 | -| value_loss | 4.98e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7567 | -| time_elapsed | 48288 | -| total_timesteps | 968576 | -| train/ | | -| approx_kl | 0.012198052 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 0.684 | -| explained_variance | -1.95 | -| learning_rate | 0.0003 | -| loss | -0.000857 | -| n_updates | 75660 | -| policy_gradient_loss | 0.000352 | -| std | 0.122 | -| value_loss | 1.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7568 | -| time_elapsed | 48291 | -| total_timesteps | 968704 | -| train/ | | -| approx_kl | 0.008770512 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 0.683 | -| explained_variance | -0.319 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 75670 | -| policy_gradient_loss | 0.000605 | -| std | 0.122 | -| value_loss | 8.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7569 | -| time_elapsed | 48293 | -| total_timesteps | 968832 | -| train/ | | -| approx_kl | 0.037739083 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 0.682 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 75680 | -| policy_gradient_loss | -0.00804 | -| std | 0.122 | -| value_loss | 1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 20 | -| iterations | 7570 | -| time_elapsed | 48297 | -| total_timesteps | 968960 | -| train/ | | -| approx_kl | 0.012985564 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 0.681 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.000441 | -| n_updates | 75690 | -| policy_gradient_loss | -0.000356 | -| std | 0.123 | -| value_loss | 3.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7571 | -| time_elapsed | 48299 | -| total_timesteps | 969088 | -| train/ | | -| approx_kl | 0.0011687619 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.676 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 75700 | -| policy_gradient_loss | -0.00178 | -| std | 0.123 | -| value_loss | 1.63e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7572 | -| time_elapsed | 48306 | -| total_timesteps | 969216 | -| train/ | | -| approx_kl | 0.017354384 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.672 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 75710 | -| policy_gradient_loss | -0.0161 | -| std | 0.124 | -| value_loss | 0.00436 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7573 | -| time_elapsed | 48311 | -| total_timesteps | 969344 | -| train/ | | -| approx_kl | 0.015582468 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 0.669 | -| explained_variance | -153 | -| learning_rate | 0.0003 | -| loss | -0.000483 | -| n_updates | 75720 | -| policy_gradient_loss | -0.000411 | -| std | 0.124 | -| value_loss | 7.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7574 | -| time_elapsed | 48314 | -| total_timesteps | 969472 | -| train/ | | -| approx_kl | 0.071418315 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 0.666 | -| explained_variance | -54.6 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 75730 | -| policy_gradient_loss | -0.00522 | -| std | 0.124 | -| value_loss | 5.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7575 | -| time_elapsed | 48318 | -| total_timesteps | 969600 | -| train/ | | -| approx_kl | 0.033291526 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 0.665 | -| explained_variance | -12.7 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 75740 | -| policy_gradient_loss | -0.0024 | -| std | 0.125 | -| value_loss | 1.46e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7576 | -| time_elapsed | 48323 | -| total_timesteps | 969728 | -| train/ | | -| approx_kl | 0.0065373564 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.665 | -| explained_variance | -0.799 | -| learning_rate | 0.0003 | -| loss | -0.000496 | -| n_updates | 75750 | -| policy_gradient_loss | 0.000364 | -| std | 0.124 | -| value_loss | 2.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7577 | -| time_elapsed | 48325 | -| total_timesteps | 969856 | -| train/ | | -| approx_kl | 0.009444089 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.667 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.00265 | -| n_updates | 75760 | -| policy_gradient_loss | 0.001 | -| std | 0.124 | -| value_loss | 1.93e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7578 | -| time_elapsed | 48328 | -| total_timesteps | 969984 | -| train/ | | -| approx_kl | 0.008456089 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | 0.00638 | -| learning_rate | 0.0003 | -| loss | -0.000502 | -| n_updates | 75770 | -| policy_gradient_loss | -6.54e-05 | -| std | 0.124 | -| value_loss | 2.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7579 | -| time_elapsed | 48331 | -| total_timesteps | 970112 | -| train/ | | -| approx_kl | 0.037597686 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.00838 | -| n_updates | 75780 | -| policy_gradient_loss | -0.00603 | -| std | 0.124 | -| value_loss | 2.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7580 | -| time_elapsed | 48339 | -| total_timesteps | 970240 | -| train/ | | -| approx_kl | 0.077917986 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.669 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | -0.0258 | -| n_updates | 75790 | -| policy_gradient_loss | -0.0175 | -| std | 0.124 | -| value_loss | 0.00168 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7581 | -| time_elapsed | 48343 | -| total_timesteps | 970368 | -| train/ | | -| approx_kl | 0.00018742029 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 0.669 | -| explained_variance | -2.57 | -| learning_rate | 0.0003 | -| loss | -0.000611 | -| n_updates | 75800 | -| policy_gradient_loss | 0.00664 | -| std | 0.124 | -| value_loss | 2.94e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7582 | -| time_elapsed | 48347 | -| total_timesteps | 970496 | -| train/ | | -| approx_kl | 0.0243676 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | -9.17 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 75810 | -| policy_gradient_loss | -0.00166 | -| std | 0.124 | -| value_loss | 2.05e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7583 | -| time_elapsed | 48350 | -| total_timesteps | 970624 | -| train/ | | -| approx_kl | 0.0001369887 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.67 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 75820 | -| policy_gradient_loss | 0.000411 | -| std | 0.124 | -| value_loss | 2.59e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7584 | -| time_elapsed | 48354 | -| total_timesteps | 970752 | -| train/ | | -| approx_kl | 0.0005545961 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.674 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 75830 | -| policy_gradient_loss | -0.000654 | -| std | 0.123 | -| value_loss | 1.24e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7585 | -| time_elapsed | 48358 | -| total_timesteps | 970880 | -| train/ | | -| approx_kl | 0.0046917098 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.677 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 75840 | -| policy_gradient_loss | -0.0022 | -| std | 0.123 | -| value_loss | 1e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7586 | -| time_elapsed | 48361 | -| total_timesteps | 971008 | -| train/ | | -| approx_kl | 0.0023572012 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | -0.000603 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 75850 | -| policy_gradient_loss | -0.00142 | -| std | 0.123 | -| value_loss | 5.34e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7587 | -| time_elapsed | 48371 | -| total_timesteps | 971136 | -| train/ | | -| approx_kl | 0.10736832 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.678 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 75860 | -| policy_gradient_loss | -0.00987 | -| std | 0.123 | -| value_loss | 0.00143 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7588 | -| time_elapsed | 48375 | -| total_timesteps | 971264 | -| train/ | | -| approx_kl | 0.038999215 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.679 | -| explained_variance | 0.927 | -| learning_rate | 0.0003 | -| loss | 0.00249 | -| n_updates | 75870 | -| policy_gradient_loss | -0.000143 | -| std | 0.123 | -| value_loss | 5.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7589 | -| time_elapsed | 48378 | -| total_timesteps | 971392 | -| train/ | | -| approx_kl | 0.122224346 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -24.4 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 75880 | -| policy_gradient_loss | -0.00662 | -| std | 0.123 | -| value_loss | 6.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7590 | -| time_elapsed | 48382 | -| total_timesteps | 971520 | -| train/ | | -| approx_kl | 0.019199632 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -6.84 | -| learning_rate | 0.0003 | -| loss | -0.00635 | -| n_updates | 75890 | -| policy_gradient_loss | -0.00453 | -| std | 0.123 | -| value_loss | 5.8e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7591 | -| time_elapsed | 48385 | -| total_timesteps | 971648 | -| train/ | | -| approx_kl | 0.0023265262 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 75900 | -| policy_gradient_loss | 0.00295 | -| std | 0.123 | -| value_loss | 2.16e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7592 | -| time_elapsed | 48388 | -| total_timesteps | 971776 | -| train/ | | -| approx_kl | 0.031241843 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | 0.00614 | -| n_updates | 75910 | -| policy_gradient_loss | 0.000964 | -| std | 0.123 | -| value_loss | 8.95e-10 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7593 | -| time_elapsed | 48392 | -| total_timesteps | 971904 | -| train/ | | -| approx_kl | 0.0211 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00527 | -| n_updates | 75920 | -| policy_gradient_loss | -0.00373 | -| std | 0.123 | -| value_loss | 1.58e-09 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7594 | -| time_elapsed | 48396 | -| total_timesteps | 972032 | -| train/ | | -| approx_kl | 0.0010311631 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 75930 | -| policy_gradient_loss | 0.000219 | -| std | 0.123 | -| value_loss | 1.29e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7595 | -| time_elapsed | 48403 | -| total_timesteps | 972160 | -| train/ | | -| approx_kl | 0.053710118 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 0.681 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 75940 | -| policy_gradient_loss | -0.0157 | -| std | 0.122 | -| value_loss | 0.000269 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7596 | -| time_elapsed | 48406 | -| total_timesteps | 972288 | -| train/ | | -| approx_kl | 0.004229221 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.681 | -| explained_variance | -7.16 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 75950 | -| policy_gradient_loss | -0.00302 | -| std | 0.122 | -| value_loss | 7.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7597 | -| time_elapsed | 48408 | -| total_timesteps | 972416 | -| train/ | | -| approx_kl | 0.03814237 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.681 | -| explained_variance | -15.7 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 75960 | -| policy_gradient_loss | -0.00943 | -| std | 0.123 | -| value_loss | 4.51e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7598 | -| time_elapsed | 48411 | -| total_timesteps | 972544 | -| train/ | | -| approx_kl | 0.0026609753 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.681 | -| explained_variance | -3.12 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 75970 | -| policy_gradient_loss | -0.00824 | -| std | 0.123 | -| value_loss | 1.85e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7599 | -| time_elapsed | 48413 | -| total_timesteps | 972672 | -| train/ | | -| approx_kl | 0.017233256 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -0.605 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 75980 | -| policy_gradient_loss | -0.0064 | -| std | 0.123 | -| value_loss | 1.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7600 | -| time_elapsed | 48416 | -| total_timesteps | 972800 | -| train/ | | -| approx_kl | 0.011038516 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -2.66 | -| learning_rate | 0.0003 | -| loss | -0.00722 | -| n_updates | 75990 | -| policy_gradient_loss | -0.00255 | -| std | 0.123 | -| value_loss | 1.07e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7601 | -| time_elapsed | 48419 | -| total_timesteps | 972928 | -| train/ | | -| approx_kl | 0.0074769775 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 0.679 | -| explained_variance | 0.00602 | -| learning_rate | 0.0003 | -| loss | -0.00675 | -| n_updates | 76000 | -| policy_gradient_loss | -0.00104 | -| std | 0.123 | -| value_loss | 4.54e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7602 | -| time_elapsed | 48422 | -| total_timesteps | 973056 | -| train/ | | -| approx_kl | 0.020344295 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.679 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 76010 | -| policy_gradient_loss | 0.000849 | -| std | 0.123 | -| value_loss | 2.3e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7603 | -| time_elapsed | 48427 | -| total_timesteps | 973184 | -| train/ | | -| approx_kl | 0.057843708 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | 0.696 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 76020 | -| policy_gradient_loss | -0.0156 | -| std | 0.123 | -| value_loss | 0.00464 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7604 | -| time_elapsed | 48430 | -| total_timesteps | 973312 | -| train/ | | -| approx_kl | 0.063167624 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -1.15e+03 | -| learning_rate | 0.0003 | -| loss | -0.000219 | -| n_updates | 76030 | -| policy_gradient_loss | -0.00283 | -| std | 0.123 | -| value_loss | 1.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7605 | -| time_elapsed | 48433 | -| total_timesteps | 973440 | -| train/ | | -| approx_kl | 0.06769746 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -843 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 76040 | -| policy_gradient_loss | -0.0032 | -| std | 0.123 | -| value_loss | 7.86e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7606 | -| time_elapsed | 48437 | -| total_timesteps | 973568 | -| train/ | | -| approx_kl | 0.004545568 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -199 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 76050 | -| policy_gradient_loss | -0.00969 | -| std | 0.123 | -| value_loss | 8.57e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7607 | -| time_elapsed | 48440 | -| total_timesteps | 973696 | -| train/ | | -| approx_kl | 0.0127640385 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.68 | -| explained_variance | -29.3 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 76060 | -| policy_gradient_loss | -0.00208 | -| std | 0.123 | -| value_loss | 8.99e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7608 | -| time_elapsed | 48442 | -| total_timesteps | 973824 | -| train/ | | -| approx_kl | 0.016831031 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.681 | -| explained_variance | -3.14 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 76070 | -| policy_gradient_loss | -0.00141 | -| std | 0.122 | -| value_loss | 2.18e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 20 | -| iterations | 7609 | -| time_elapsed | 48445 | -| total_timesteps | 973952 | -| train/ | | -| approx_kl | 0.0002679266 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.682 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 76080 | -| policy_gradient_loss | -0.00132 | -| std | 0.122 | -| value_loss | 1.9e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7610 | -| time_elapsed | 48449 | -| total_timesteps | 974080 | -| train/ | | -| approx_kl | 0.004104327 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.683 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 76090 | -| policy_gradient_loss | -0.00332 | -| std | 0.122 | -| value_loss | 8.92e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7611 | -| time_elapsed | 48455 | -| total_timesteps | 974208 | -| train/ | | -| approx_kl | 0.008081925 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | 0.682 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 76100 | -| policy_gradient_loss | -0.0142 | -| std | 0.122 | -| value_loss | 0.00178 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7612 | -| time_elapsed | 48459 | -| total_timesteps | 974336 | -| train/ | | -| approx_kl | 0.034995947 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.682 | -| explained_variance | -27.6 | -| learning_rate | 0.0003 | -| loss | -0.000547 | -| n_updates | 76110 | -| policy_gradient_loss | -0.000567 | -| std | 0.122 | -| value_loss | 1.67e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7613 | -| time_elapsed | 48462 | -| total_timesteps | 974464 | -| train/ | | -| approx_kl | 0.0005929833 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.683 | -| explained_variance | -62.3 | -| learning_rate | 0.0003 | -| loss | -0.000453 | -| n_updates | 76120 | -| policy_gradient_loss | -0.00022 | -| std | 0.122 | -| value_loss | 1.09e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7614 | -| time_elapsed | 48466 | -| total_timesteps | 974592 | -| train/ | | -| approx_kl | 0.004816067 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 0.686 | -| explained_variance | -6.99 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 76130 | -| policy_gradient_loss | -0.00173 | -| std | 0.122 | -| value_loss | 2.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7615 | -| time_elapsed | 48469 | -| total_timesteps | 974720 | -| train/ | | -| approx_kl | 0.03299254 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.687 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 76140 | -| policy_gradient_loss | -0.0142 | -| std | 0.122 | -| value_loss | 1.64e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7616 | -| time_elapsed | 48473 | -| total_timesteps | 974848 | -| train/ | | -| approx_kl | 0.0023384634 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 0.688 | -| explained_variance | -0.0743 | -| learning_rate | 0.0003 | -| loss | -0.000501 | -| n_updates | 76150 | -| policy_gradient_loss | 2.61e-05 | -| std | 0.122 | -| value_loss | 1.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 20 | -| iterations | 7617 | -| time_elapsed | 48476 | -| total_timesteps | 974976 | -| train/ | | -| approx_kl | 0.01477379 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.689 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.000729 | -| n_updates | 76160 | -| policy_gradient_loss | 0.000587 | -| std | 0.121 | -| value_loss | 2.33e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7618 | -| time_elapsed | 48479 | -| total_timesteps | 975104 | -| train/ | | -| approx_kl | 0.0007134224 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.689 | -| explained_variance | 0.00809 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 76170 | -| policy_gradient_loss | -0.000341 | -| std | 0.122 | -| value_loss | 8.87e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7619 | -| time_elapsed | 48488 | -| total_timesteps | 975232 | -| train/ | | -| approx_kl | 0.021251023 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 0.688 | -| explained_variance | -2.46 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 76180 | -| policy_gradient_loss | -0.0165 | -| std | 0.122 | -| value_loss | 0.00162 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7620 | -| time_elapsed | 48491 | -| total_timesteps | 975360 | -| train/ | | -| approx_kl | 0.042130277 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.689 | -| explained_variance | -16.4 | -| learning_rate | 0.0003 | -| loss | -0.00718 | -| n_updates | 76190 | -| policy_gradient_loss | -0.00458 | -| std | 0.122 | -| value_loss | 6.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7621 | -| time_elapsed | 48495 | -| total_timesteps | 975488 | -| train/ | | -| approx_kl | 0.006832277 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 0.689 | -| explained_variance | -5.97 | -| learning_rate | 0.0003 | -| loss | -0.00759 | -| n_updates | 76200 | -| policy_gradient_loss | -0.00524 | -| std | 0.121 | -| value_loss | 3.93e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7622 | -| time_elapsed | 48499 | -| total_timesteps | 975616 | -| train/ | | -| approx_kl | 0.00044263108 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.69 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.000679 | -| n_updates | 76210 | -| policy_gradient_loss | -0.000344 | -| std | 0.121 | -| value_loss | 9.2e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7623 | -| time_elapsed | 48502 | -| total_timesteps | 975744 | -| train/ | | -| approx_kl | 0.0011051092 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.694 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 76220 | -| policy_gradient_loss | -0.000353 | -| std | 0.121 | -| value_loss | 1.6e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7624 | -| time_elapsed | 48506 | -| total_timesteps | 975872 | -| train/ | | -| approx_kl | 0.010561392 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.697 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 76230 | -| policy_gradient_loss | -0.00172 | -| std | 0.12 | -| value_loss | 1.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7625 | -| time_elapsed | 48510 | -| total_timesteps | 976000 | -| train/ | | -| approx_kl | 0.022047434 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | -0.0826 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 76240 | -| policy_gradient_loss | -0.00833 | -| std | 0.12 | -| value_loss | 2.61e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7626 | -| time_elapsed | 48514 | -| total_timesteps | 976128 | -| train/ | | -| approx_kl | 0.00482799 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | 0.00472 | -| learning_rate | 0.0003 | -| loss | -0.00831 | -| n_updates | 76250 | -| policy_gradient_loss | -0.00286 | -| std | 0.12 | -| value_loss | 7.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7627 | -| time_elapsed | 48522 | -| total_timesteps | 976256 | -| train/ | | -| approx_kl | 0.011826048 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 76260 | -| policy_gradient_loss | -0.00739 | -| std | 0.12 | -| value_loss | 0.000175 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7628 | -| time_elapsed | 48525 | -| total_timesteps | 976384 | -| train/ | | -| approx_kl | 0.052392006 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.698 | -| explained_variance | -6.23 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 76270 | -| policy_gradient_loss | -0.00323 | -| std | 0.12 | -| value_loss | 7.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7629 | -| time_elapsed | 48528 | -| total_timesteps | 976512 | -| train/ | | -| approx_kl | 6.83479e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.7 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | -0.000734 | -| n_updates | 76280 | -| policy_gradient_loss | -0.000317 | -| std | 0.12 | -| value_loss | 1.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7630 | -| time_elapsed | 48531 | -| total_timesteps | 976640 | -| train/ | | -| approx_kl | 0.006586035 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.706 | -| explained_variance | -0.584 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 76290 | -| policy_gradient_loss | -0.0009 | -| std | 0.119 | -| value_loss | 5.68e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7631 | -| time_elapsed | 48536 | -| total_timesteps | 976768 | -| train/ | | -| approx_kl | 0.0018190322 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 76300 | -| policy_gradient_loss | -0.000844 | -| std | 0.119 | -| value_loss | 1.96e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7632 | -| time_elapsed | 48539 | -| total_timesteps | 976896 | -| train/ | | -| approx_kl | 0.020037074 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 0.709 | -| explained_variance | -0.00474 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 76310 | -| policy_gradient_loss | -0.00637 | -| std | 0.119 | -| value_loss | 6.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7633 | -| time_elapsed | 48543 | -| total_timesteps | 977024 | -| train/ | | -| approx_kl | 0.008275315 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -24.9 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 76320 | -| policy_gradient_loss | -0.00012 | -| std | 0.119 | -| value_loss | 8.89e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7634 | -| time_elapsed | 48551 | -| total_timesteps | 977152 | -| train/ | | -| approx_kl | 0.02389705 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 0.709 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 76330 | -| policy_gradient_loss | -0.0151 | -| std | 0.119 | -| value_loss | 0.000911 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7635 | -| time_elapsed | 48554 | -| total_timesteps | 977280 | -| train/ | | -| approx_kl | 0.030791573 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 0.709 | -| explained_variance | 0.515 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 76340 | -| policy_gradient_loss | -0.00361 | -| std | 0.119 | -| value_loss | 1.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7636 | -| time_elapsed | 48558 | -| total_timesteps | 977408 | -| train/ | | -| approx_kl | 0.09515547 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 0.709 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 76350 | -| policy_gradient_loss | -0.0026 | -| std | 0.119 | -| value_loss | 1.26e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7637 | -| time_elapsed | 48562 | -| total_timesteps | 977536 | -| train/ | | -| approx_kl | 0.07604541 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.709 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.00606 | -| n_updates | 76360 | -| policy_gradient_loss | -0.00533 | -| std | 0.119 | -| value_loss | 1.77e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7638 | -| time_elapsed | 48566 | -| total_timesteps | 977664 | -| train/ | | -| approx_kl | 0.007695582 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -2.47 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 76370 | -| policy_gradient_loss | -0.00246 | -| std | 0.119 | -| value_loss | 2.65e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7639 | -| time_elapsed | 48569 | -| total_timesteps | 977792 | -| train/ | | -| approx_kl | 0.016696317 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | 0.00203 | -| n_updates | 76380 | -| policy_gradient_loss | 3.1e-05 | -| std | 0.119 | -| value_loss | 1.98e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 20 | -| iterations | 7640 | -| time_elapsed | 48572 | -| total_timesteps | 977920 | -| train/ | | -| approx_kl | 0.019693473 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 76390 | -| policy_gradient_loss | -0.00723 | -| std | 0.119 | -| value_loss | 1.78e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7641 | -| time_elapsed | 48576 | -| total_timesteps | 978048 | -| train/ | | -| approx_kl | 0.028681343 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 76400 | -| policy_gradient_loss | -0.00702 | -| std | 0.119 | -| value_loss | 5.42e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7642 | -| time_elapsed | 48583 | -| total_timesteps | 978176 | -| train/ | | -| approx_kl | 0.022081826 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 0.709 | -| explained_variance | 0.675 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 76410 | -| policy_gradient_loss | -0.00491 | -| std | 0.119 | -| value_loss | 0.00533 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7643 | -| time_elapsed | 48586 | -| total_timesteps | 978304 | -| train/ | | -| approx_kl | 0.009044628 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.71 | -| explained_variance | -1.6e+03 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 76420 | -| policy_gradient_loss | -0.0147 | -| std | 0.119 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7644 | -| time_elapsed | 48589 | -| total_timesteps | 978432 | -| train/ | | -| approx_kl | 0.0059855985 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.71 | -| explained_variance | -555 | -| learning_rate | 0.0003 | -| loss | -0.00054 | -| n_updates | 76430 | -| policy_gradient_loss | -0.000221 | -| std | 0.119 | -| value_loss | 4.98e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7645 | -| time_elapsed | 48592 | -| total_timesteps | 978560 | -| train/ | | -| approx_kl | 0.15708259 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 0.708 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.000128 | -| n_updates | 76440 | -| policy_gradient_loss | -0.00497 | -| std | 0.119 | -| value_loss | 1.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7646 | -| time_elapsed | 48595 | -| total_timesteps | 978688 | -| train/ | | -| approx_kl | 0.039462514 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.706 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.00995 | -| n_updates | 76450 | -| policy_gradient_loss | -0.00888 | -| std | 0.12 | -| value_loss | 1.9e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7647 | -| time_elapsed | 48598 | -| total_timesteps | 978816 | -| train/ | | -| approx_kl | 0.0016254801 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.705 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 76460 | -| policy_gradient_loss | -0.002 | -| std | 0.12 | -| value_loss | 2.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 20 | -| iterations | 7648 | -| time_elapsed | 48602 | -| total_timesteps | 978944 | -| train/ | | -| approx_kl | 0.0053158947 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.703 | -| explained_variance | -0.00314 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 76470 | -| policy_gradient_loss | -0.00721 | -| std | 0.12 | -| value_loss | 2.69e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7649 | -| time_elapsed | 48606 | -| total_timesteps | 979072 | -| train/ | | -| approx_kl | 0.02529832 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.7 | -| explained_variance | 0.00619 | -| learning_rate | 0.0003 | -| loss | 0.00353 | -| n_updates | 76480 | -| policy_gradient_loss | 0.000178 | -| std | 0.12 | -| value_loss | 1.02e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7650 | -| time_elapsed | 48614 | -| total_timesteps | 979200 | -| train/ | | -| approx_kl | 0.050739586 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 76490 | -| policy_gradient_loss | -0.0137 | -| std | 0.12 | -| value_loss | 0.000167 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7651 | -| time_elapsed | 48618 | -| total_timesteps | 979328 | -| train/ | | -| approx_kl | 0.00081638386 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 0.698 | -| explained_variance | -5.12 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 76500 | -| policy_gradient_loss | -0.0073 | -| std | 0.12 | -| value_loss | 2.18e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7652 | -| time_elapsed | 48621 | -| total_timesteps | 979456 | -| train/ | | -| approx_kl | 0.032816414 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.698 | -| explained_variance | -2.79 | -| learning_rate | 0.0003 | -| loss | 0.00231 | -| n_updates | 76510 | -| policy_gradient_loss | -0.000507 | -| std | 0.12 | -| value_loss | 2.12e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7653 | -| time_elapsed | 48624 | -| total_timesteps | 979584 | -| train/ | | -| approx_kl | 0.0028539146 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.698 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 76520 | -| policy_gradient_loss | -0.002 | -| std | 0.12 | -| value_loss | 4.18e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7654 | -| time_elapsed | 48628 | -| total_timesteps | 979712 | -| train/ | | -| approx_kl | 0.0010452387 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | -0.0743 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 76530 | -| policy_gradient_loss | 0.00149 | -| std | 0.12 | -| value_loss | 5.14e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7655 | -| time_elapsed | 48631 | -| total_timesteps | 979840 | -| train/ | | -| approx_kl | 0.012729583 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | -0.00271 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 76540 | -| policy_gradient_loss | -0.00869 | -| std | 0.12 | -| value_loss | 1.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7656 | -| time_elapsed | 48634 | -| total_timesteps | 979968 | -| train/ | | -| approx_kl | 0.018602036 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 76550 | -| policy_gradient_loss | -0.00117 | -| std | 0.12 | -| value_loss | 7.5e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7657 | -| time_elapsed | 48637 | -| total_timesteps | 980096 | -| train/ | | -| approx_kl | 0.0052025183 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.7 | -| explained_variance | -0.0737 | -| learning_rate | 0.0003 | -| loss | -0.00629 | -| n_updates | 76560 | -| policy_gradient_loss | -0.00394 | -| std | 0.12 | -| value_loss | 1.67e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7658 | -| time_elapsed | 48644 | -| total_timesteps | 980224 | -| train/ | | -| approx_kl | 0.022457777 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.701 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 76570 | -| policy_gradient_loss | -0.0159 | -| std | 0.12 | -| value_loss | 0.000187 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7659 | -| time_elapsed | 48647 | -| total_timesteps | 980352 | -| train/ | | -| approx_kl | 0.047445174 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 0.701 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 76580 | -| policy_gradient_loss | -0.00625 | -| std | 0.12 | -| value_loss | 2.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7660 | -| time_elapsed | 48651 | -| total_timesteps | 980480 | -| train/ | | -| approx_kl | 0.020081963 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.702 | -| explained_variance | -16.3 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 76590 | -| policy_gradient_loss | -0.000334 | -| std | 0.12 | -| value_loss | 6.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7661 | -| time_elapsed | 48655 | -| total_timesteps | 980608 | -| train/ | | -| approx_kl | 0.036533564 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.702 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 76600 | -| policy_gradient_loss | 0.00027 | -| std | 0.12 | -| value_loss | 1.49e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7662 | -| time_elapsed | 48660 | -| total_timesteps | 980736 | -| train/ | | -| approx_kl | 0.0145646185 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 0.701 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | 0.000734 | -| n_updates | 76610 | -| policy_gradient_loss | 0.00267 | -| std | 0.12 | -| value_loss | 2.37e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7663 | -| time_elapsed | 48664 | -| total_timesteps | 980864 | -| train/ | | -| approx_kl | 0.029918289 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.699 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 76620 | -| policy_gradient_loss | -0.00272 | -| std | 0.12 | -| value_loss | 1.81e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 20 | -| iterations | 7664 | -| time_elapsed | 48668 | -| total_timesteps | 980992 | -| train/ | | -| approx_kl | 0.00023964792 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 0.7 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 76630 | -| policy_gradient_loss | -0.000652 | -| std | 0.12 | -| value_loss | 5.87e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7665 | -| time_elapsed | 48673 | -| total_timesteps | 981120 | -| train/ | | -| approx_kl | 0.021640921 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 0.707 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 76640 | -| policy_gradient_loss | -0.00661 | -| std | 0.119 | -| value_loss | 2.62e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7666 | -| time_elapsed | 48682 | -| total_timesteps | 981248 | -| train/ | | -| approx_kl | 0.048064057 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.71 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 76650 | -| policy_gradient_loss | -0.0173 | -| std | 0.119 | -| value_loss | 0.000532 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7667 | -| time_elapsed | 48686 | -| total_timesteps | 981376 | -| train/ | | -| approx_kl | 0.0064188377 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 0.712 | -| explained_variance | -61.5 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 76660 | -| policy_gradient_loss | -0.00223 | -| std | 0.119 | -| value_loss | 7.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7668 | -| time_elapsed | 48690 | -| total_timesteps | 981504 | -| train/ | | -| approx_kl | 0.020188963 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.714 | -| explained_variance | -98.8 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 76670 | -| policy_gradient_loss | -0.00144 | -| std | 0.118 | -| value_loss | 4.9e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7669 | -| time_elapsed | 48694 | -| total_timesteps | 981632 | -| train/ | | -| approx_kl | 0.0710742 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.716 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 76680 | -| policy_gradient_loss | -0.00339 | -| std | 0.118 | -| value_loss | 1.87e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7670 | -| time_elapsed | 48697 | -| total_timesteps | 981760 | -| train/ | | -| approx_kl | 0.0080971075 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.718 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00945 | -| n_updates | 76690 | -| policy_gradient_loss | -0.00428 | -| std | 0.118 | -| value_loss | 6.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7671 | -| time_elapsed | 48701 | -| total_timesteps | 981888 | -| train/ | | -| approx_kl | 0.010194689 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 0.718 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | -0.004 | -| n_updates | 76700 | -| policy_gradient_loss | 0.00416 | -| std | 0.118 | -| value_loss | 3.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7672 | -| time_elapsed | 48705 | -| total_timesteps | 982016 | -| train/ | | -| approx_kl | 0.015391986 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.719 | -| explained_variance | -0.357 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 76710 | -| policy_gradient_loss | -0.000625 | -| std | 0.118 | -| value_loss | 2.26e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7673 | -| time_elapsed | 48714 | -| total_timesteps | 982144 | -| train/ | | -| approx_kl | 0.03772756 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.719 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.0246 | -| n_updates | 76720 | -| policy_gradient_loss | -0.0198 | -| std | 0.118 | -| value_loss | 0.00028 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7674 | -| time_elapsed | 48717 | -| total_timesteps | 982272 | -| train/ | | -| approx_kl | 0.0035546888 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.72 | -| explained_variance | -0.456 | -| learning_rate | 0.0003 | -| loss | -0.000604 | -| n_updates | 76730 | -| policy_gradient_loss | 9.07e-05 | -| std | 0.118 | -| value_loss | 2.18e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7675 | -| time_elapsed | 48720 | -| total_timesteps | 982400 | -| train/ | | -| approx_kl | 0.016920809 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 0.721 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 76740 | -| policy_gradient_loss | -0.00877 | -| std | 0.118 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7676 | -| time_elapsed | 48723 | -| total_timesteps | 982528 | -| train/ | | -| approx_kl | 0.009015828 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -0.235 | -| learning_rate | 0.0003 | -| loss | -0.000658 | -| n_updates | 76750 | -| policy_gradient_loss | 0.00818 | -| std | 0.118 | -| value_loss | 3.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7677 | -| time_elapsed | 48727 | -| total_timesteps | 982656 | -| train/ | | -| approx_kl | 0.06398984 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -0.453 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 76760 | -| policy_gradient_loss | -0.0124 | -| std | 0.118 | -| value_loss | 4.72e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7678 | -| time_elapsed | 48729 | -| total_timesteps | 982784 | -| train/ | | -| approx_kl | 0.0023224084 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 76770 | -| policy_gradient_loss | 0.00739 | -| std | 0.117 | -| value_loss | 2.43e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7679 | -| time_elapsed | 48733 | -| total_timesteps | 982912 | -| train/ | | -| approx_kl | 0.013891671 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 76780 | -| policy_gradient_loss | -0.000953 | -| std | 0.117 | -| value_loss | 2.67e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7680 | -| time_elapsed | 48736 | -| total_timesteps | 983040 | -| train/ | | -| approx_kl | 0.03789208 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | -0.0279 | -| n_updates | 76790 | -| policy_gradient_loss | -0.00786 | -| std | 0.117 | -| value_loss | 1.98e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7681 | -| time_elapsed | 48743 | -| total_timesteps | 983168 | -| train/ | | -| approx_kl | 0.027491713 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 76800 | -| policy_gradient_loss | -0.00848 | -| std | 0.117 | -| value_loss | 0.000611 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7682 | -| time_elapsed | 48745 | -| total_timesteps | 983296 | -| train/ | | -| approx_kl | 0.0013880995 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | -8.59 | -| learning_rate | 0.0003 | -| loss | -0.000775 | -| n_updates | 76810 | -| policy_gradient_loss | -0.000368 | -| std | 0.117 | -| value_loss | 2.5e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7683 | -| time_elapsed | 48749 | -| total_timesteps | 983424 | -| train/ | | -| approx_kl | 0.1389677 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -50.5 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 76820 | -| policy_gradient_loss | -0.00488 | -| std | 0.118 | -| value_loss | 9.74e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7684 | -| time_elapsed | 48751 | -| total_timesteps | 983552 | -| train/ | | -| approx_kl | 0.0027831509 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.721 | -| explained_variance | -31.1 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 76830 | -| policy_gradient_loss | -0.0106 | -| std | 0.118 | -| value_loss | 6.21e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7685 | -| time_elapsed | 48754 | -| total_timesteps | 983680 | -| train/ | | -| approx_kl | 0.013454481 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -4.94 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 76840 | -| policy_gradient_loss | -0.0135 | -| std | 0.118 | -| value_loss | 1.72e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7686 | -| time_elapsed | 48757 | -| total_timesteps | 983808 | -| train/ | | -| approx_kl | 0.009026889 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00843 | -| n_updates | 76850 | -| policy_gradient_loss | -0.00346 | -| std | 0.118 | -| value_loss | 4.02e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7687 | -| time_elapsed | 48760 | -| total_timesteps | 983936 | -| train/ | | -| approx_kl | 0.0023035798 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 0.722 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | -0.000468 | -| n_updates | 76860 | -| policy_gradient_loss | 0.00249 | -| std | 0.118 | -| value_loss | 1.34e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7688 | -| time_elapsed | 48763 | -| total_timesteps | 984064 | -| train/ | | -| approx_kl | 0.016569903 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 0.72 | -| explained_variance | -0.000442 | -| learning_rate | 0.0003 | -| loss | -0.00766 | -| n_updates | 76870 | -| policy_gradient_loss | -0.0044 | -| std | 0.118 | -| value_loss | 4.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7689 | -| time_elapsed | 48769 | -| total_timesteps | 984192 | -| train/ | | -| approx_kl | 0.037145138 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.72 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 76880 | -| policy_gradient_loss | -0.00477 | -| std | 0.118 | -| value_loss | 0.000193 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7690 | -| time_elapsed | 48772 | -| total_timesteps | 984320 | -| train/ | | -| approx_kl | 0.0010583033 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.72 | -| explained_variance | -0.6 | -| learning_rate | 0.0003 | -| loss | -0.00041 | -| n_updates | 76890 | -| policy_gradient_loss | 0.000224 | -| std | 0.118 | -| value_loss | 1.17e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7691 | -| time_elapsed | 48774 | -| total_timesteps | 984448 | -| train/ | | -| approx_kl | 0.003851288 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 0.721 | -| explained_variance | -0.379 | -| learning_rate | 0.0003 | -| loss | -0.000142 | -| n_updates | 76900 | -| policy_gradient_loss | -0.000212 | -| std | 0.118 | -| value_loss | 1.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7692 | -| time_elapsed | 48777 | -| total_timesteps | 984576 | -| train/ | | -| approx_kl | 0.0062654684 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 76910 | -| policy_gradient_loss | -0.00192 | -| std | 0.117 | -| value_loss | 1.44e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7693 | -| time_elapsed | 48780 | -| total_timesteps | 984704 | -| train/ | | -| approx_kl | 0.0049665975 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 76920 | -| policy_gradient_loss | -0.00638 | -| std | 0.117 | -| value_loss | 3.17e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7694 | -| time_elapsed | 48782 | -| total_timesteps | 984832 | -| train/ | | -| approx_kl | 0.0032236772 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.00557 | -| n_updates | 76930 | -| policy_gradient_loss | -0.00438 | -| std | 0.117 | -| value_loss | 1.74e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7695 | -| time_elapsed | 48786 | -| total_timesteps | 984960 | -| train/ | | -| approx_kl | 0.0019365628 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.723 | -| explained_variance | 0.00836 | -| learning_rate | 0.0003 | -| loss | -0.000823 | -| n_updates | 76940 | -| policy_gradient_loss | -2.4e-05 | -| std | 0.117 | -| value_loss | 1.06e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7696 | -| time_elapsed | 48788 | -| total_timesteps | 985088 | -| train/ | | -| approx_kl | 0.00050570443 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 0.726 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 76950 | -| policy_gradient_loss | -0.000762 | -| std | 0.116 | -| value_loss | 1.14e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7697 | -| time_elapsed | 48795 | -| total_timesteps | 985216 | -| train/ | | -| approx_kl | 0.038833953 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.735 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 76960 | -| policy_gradient_loss | -0.0167 | -| std | 0.116 | -| value_loss | 0.00097 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7698 | -| time_elapsed | 48799 | -| total_timesteps | 985344 | -| train/ | | -| approx_kl | 0.054335743 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.739 | -| explained_variance | -25.9 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 76970 | -| policy_gradient_loss | -0.00519 | -| std | 0.115 | -| value_loss | 7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7699 | -| time_elapsed | 48802 | -| total_timesteps | 985472 | -| train/ | | -| approx_kl | 0.012210869 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.74 | -| explained_variance | -6.18 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 76980 | -| policy_gradient_loss | -0.00235 | -| std | 0.115 | -| value_loss | 2.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7700 | -| time_elapsed | 48805 | -| total_timesteps | 985600 | -| train/ | | -| approx_kl | 0.004425192 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.742 | -| explained_variance | -1.76 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 76990 | -| policy_gradient_loss | -0.00747 | -| std | 0.115 | -| value_loss | 7.26e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7701 | -| time_elapsed | 48809 | -| total_timesteps | 985728 | -| train/ | | -| approx_kl | 0.00411182 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -17.8 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 77000 | -| policy_gradient_loss | -0.0137 | -| std | 0.115 | -| value_loss | 2.3e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7702 | -| time_elapsed | 48813 | -| total_timesteps | 985856 | -| train/ | | -| approx_kl | 0.0023376527 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 77010 | -| policy_gradient_loss | -0.00312 | -| std | 0.115 | -| value_loss | 7.92e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7703 | -| time_elapsed | 48816 | -| total_timesteps | 985984 | -| train/ | | -| approx_kl | 0.0024282224 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 77020 | -| policy_gradient_loss | -0.00682 | -| std | 0.115 | -| value_loss | 2.34e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7704 | -| time_elapsed | 48820 | -| total_timesteps | 986112 | -| train/ | | -| approx_kl | 0.0006550485 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 77030 | -| policy_gradient_loss | 0.00338 | -| std | 0.115 | -| value_loss | 9.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7705 | -| time_elapsed | 48830 | -| total_timesteps | 986240 | -| train/ | | -| approx_kl | 0.029285736 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.746 | -| explained_variance | 0.66 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 77040 | -| policy_gradient_loss | -0.0139 | -| std | 0.115 | -| value_loss | 0.00607 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7706 | -| time_elapsed | 48833 | -| total_timesteps | 986368 | -| train/ | | -| approx_kl | 0.24066098 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 0.746 | -| explained_variance | -111 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 77050 | -| policy_gradient_loss | -0.00655 | -| std | 0.115 | -| value_loss | 5.66e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7707 | -| time_elapsed | 48837 | -| total_timesteps | 986496 | -| train/ | | -| approx_kl | 0.0072823605 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.746 | -| explained_variance | -479 | -| learning_rate | 0.0003 | -| loss | -0.00641 | -| n_updates | 77060 | -| policy_gradient_loss | -0.00525 | -| std | 0.115 | -| value_loss | 3.64e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7708 | -| time_elapsed | 48841 | -| total_timesteps | 986624 | -| train/ | | -| approx_kl | 0.0013838387 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -186 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 77070 | -| policy_gradient_loss | -0.0127 | -| std | 0.115 | -| value_loss | 5.34e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7709 | -| time_elapsed | 48845 | -| total_timesteps | 986752 | -| train/ | | -| approx_kl | 0.00015919749 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -3.68 | -| learning_rate | 0.0003 | -| loss | 0.0004 | -| n_updates | 77080 | -| policy_gradient_loss | -0.000401 | -| std | 0.115 | -| value_loss | 2.38e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 20 | -| iterations | 7710 | -| time_elapsed | 48849 | -| total_timesteps | 986880 | -| train/ | | -| approx_kl | 0.00086928904 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 77090 | -| policy_gradient_loss | -0.00225 | -| std | 0.115 | -| value_loss | 6.7e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7711 | -| time_elapsed | 48853 | -| total_timesteps | 987008 | -| train/ | | -| approx_kl | 0.0053028017 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 77100 | -| policy_gradient_loss | -0.00631 | -| std | 0.115 | -| value_loss | 1.37e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7712 | -| time_elapsed | 48863 | -| total_timesteps | 987136 | -| train/ | | -| approx_kl | 0.02966887 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | 0.864 | -| learning_rate | 0.0003 | -| loss | -0.00581 | -| n_updates | 77110 | -| policy_gradient_loss | -0.00419 | -| std | 0.115 | -| value_loss | 0.00158 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7713 | -| time_elapsed | 48865 | -| total_timesteps | 987264 | -| train/ | | -| approx_kl | 0.2015028 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -9.07 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 77120 | -| policy_gradient_loss | -0.00205 | -| std | 0.115 | -| value_loss | 2.15e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7714 | -| time_elapsed | 48867 | -| total_timesteps | 987392 | -| train/ | | -| approx_kl | 0.15644604 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -298 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 77130 | -| policy_gradient_loss | -0.00387 | -| std | 0.115 | -| value_loss | 1.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7715 | -| time_elapsed | 48871 | -| total_timesteps | 987520 | -| train/ | | -| approx_kl | 0.00236521 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -18.9 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 77140 | -| policy_gradient_loss | -0.00104 | -| std | 0.115 | -| value_loss | 9.04e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7716 | -| time_elapsed | 48875 | -| total_timesteps | 987648 | -| train/ | | -| approx_kl | 0.0006435951 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 77150 | -| policy_gradient_loss | -0.000733 | -| std | 0.115 | -| value_loss | 2.13e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7717 | -| time_elapsed | 48877 | -| total_timesteps | 987776 | -| train/ | | -| approx_kl | 3.1512696e-05 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.00017 | -| n_updates | 77160 | -| policy_gradient_loss | 0.000442 | -| std | 0.115 | -| value_loss | 3.01e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7718 | -| time_elapsed | 48880 | -| total_timesteps | 987904 | -| train/ | | -| approx_kl | 0.0074807354 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.0066 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 77170 | -| policy_gradient_loss | -0.00297 | -| std | 0.115 | -| value_loss | 2.35e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7719 | -| time_elapsed | 48883 | -| total_timesteps | 988032 | -| train/ | | -| approx_kl | 9.889761e-05 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.00801 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 77180 | -| policy_gradient_loss | 0.000497 | -| std | 0.115 | -| value_loss | 8.65e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7720 | -| time_elapsed | 48892 | -| total_timesteps | 988160 | -| train/ | | -| approx_kl | 0.074404575 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | -0.0256 | -| n_updates | 77190 | -| policy_gradient_loss | -0.0177 | -| std | 0.115 | -| value_loss | 0.000662 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7721 | -| time_elapsed | 48894 | -| total_timesteps | 988288 | -| train/ | | -| approx_kl | 0.028068256 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -16 | -| learning_rate | 0.0003 | -| loss | -0.00495 | -| n_updates | 77200 | -| policy_gradient_loss | -0.00301 | -| std | 0.115 | -| value_loss | 2.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7722 | -| time_elapsed | 48896 | -| total_timesteps | 988416 | -| train/ | | -| approx_kl | 0.0026920112 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -25.6 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 77210 | -| policy_gradient_loss | -0.0165 | -| std | 0.115 | -| value_loss | 1.04e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7723 | -| time_elapsed | 48899 | -| total_timesteps | 988544 | -| train/ | | -| approx_kl | 0.00035930425 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 77220 | -| policy_gradient_loss | 0.00052 | -| std | 0.115 | -| value_loss | 5.05e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7724 | -| time_elapsed | 48902 | -| total_timesteps | 988672 | -| train/ | | -| approx_kl | 0.067434065 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 77230 | -| policy_gradient_loss | -0.0126 | -| std | 0.115 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7725 | -| time_elapsed | 48904 | -| total_timesteps | 988800 | -| train/ | | -| approx_kl | 0.011302034 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 77240 | -| policy_gradient_loss | -0.00262 | -| std | 0.115 | -| value_loss | 1.66e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7726 | -| time_elapsed | 48906 | -| total_timesteps | 988928 | -| train/ | | -| approx_kl | 0.00030713202 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.000996 | -| n_updates | 77250 | -| policy_gradient_loss | 0.00202 | -| std | 0.115 | -| value_loss | 2.04e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7727 | -| time_elapsed | 48910 | -| total_timesteps | 989056 | -| train/ | | -| approx_kl | 0.0105649475 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.00066 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 77260 | -| policy_gradient_loss | -0.00535 | -| std | 0.115 | -| value_loss | 1.08e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7728 | -| time_elapsed | 48915 | -| total_timesteps | 989184 | -| train/ | | -| approx_kl | 0.023296349 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0302 | -| n_updates | 77270 | -| policy_gradient_loss | -0.0158 | -| std | 0.115 | -| value_loss | 0.000409 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7729 | -| time_elapsed | 48917 | -| total_timesteps | 989312 | -| train/ | | -| approx_kl | 0.0043231007 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 77280 | -| policy_gradient_loss | 0.00163 | -| std | 0.115 | -| value_loss | 1.38e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7730 | -| time_elapsed | 48920 | -| total_timesteps | 989440 | -| train/ | | -| approx_kl | 0.01296002 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -58.4 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 77290 | -| policy_gradient_loss | -0.00181 | -| std | 0.115 | -| value_loss | 7e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7731 | -| time_elapsed | 48922 | -| total_timesteps | 989568 | -| train/ | | -| approx_kl | 0.0005784449 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.742 | -| explained_variance | -3.21 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 77300 | -| policy_gradient_loss | 0.00362 | -| std | 0.115 | -| value_loss | 1.43e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7732 | -| time_elapsed | 48925 | -| total_timesteps | 989696 | -| train/ | | -| approx_kl | 0.02718665 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.742 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.00901 | -| n_updates | 77310 | -| policy_gradient_loss | -0.00535 | -| std | 0.115 | -| value_loss | 1.03e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7733 | -| time_elapsed | 48926 | -| total_timesteps | 989824 | -| train/ | | -| approx_kl | 9.636581e-05 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.741 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.000496 | -| n_updates | 77320 | -| policy_gradient_loss | 0.0026 | -| std | 0.115 | -| value_loss | 9.01e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7734 | -| time_elapsed | 48929 | -| total_timesteps | 989952 | -| train/ | | -| approx_kl | 0.00012800656 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.742 | -| explained_variance | -0.00334 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 77330 | -| policy_gradient_loss | 0.000728 | -| std | 0.115 | -| value_loss | 4.71e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7735 | -| time_elapsed | 48932 | -| total_timesteps | 990080 | -| train/ | | -| approx_kl | 0.003082327 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | 0.00507 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 77340 | -| policy_gradient_loss | -0.000915 | -| std | 0.115 | -| value_loss | 4.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7736 | -| time_elapsed | 48937 | -| total_timesteps | 990208 | -| train/ | | -| approx_kl | 0.040198486 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 77350 | -| policy_gradient_loss | -0.0148 | -| std | 0.115 | -| value_loss | 0.00021 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7737 | -| time_elapsed | 48940 | -| total_timesteps | 990336 | -| train/ | | -| approx_kl | 0.0060505215 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.742 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 77360 | -| policy_gradient_loss | -0.00239 | -| std | 0.115 | -| value_loss | 2.75e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7738 | -| time_elapsed | 48943 | -| total_timesteps | 990464 | -| train/ | | -| approx_kl | 5.3897966e-05 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.741 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | -9.82e-05 | -| n_updates | 77370 | -| policy_gradient_loss | 0.00056 | -| std | 0.115 | -| value_loss | 3.21e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7739 | -| time_elapsed | 48945 | -| total_timesteps | 990592 | -| train/ | | -| approx_kl | 0.053138297 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 0.742 | -| explained_variance | -0.532 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 77380 | -| policy_gradient_loss | -0.0083 | -| std | 0.115 | -| value_loss | 6.17e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7740 | -| time_elapsed | 48947 | -| total_timesteps | 990720 | -| train/ | | -| approx_kl | 0.0101686325 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.743 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 77390 | -| policy_gradient_loss | -0.0013 | -| std | 0.115 | -| value_loss | 2.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7741 | -| time_elapsed | 48951 | -| total_timesteps | 990848 | -| train/ | | -| approx_kl | 0.004850779 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 77400 | -| policy_gradient_loss | -0.00219 | -| std | 0.115 | -| value_loss | 2.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7742 | -| time_elapsed | 48954 | -| total_timesteps | 990976 | -| train/ | | -| approx_kl | 0.033040825 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 0.744 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 77410 | -| policy_gradient_loss | -0.0114 | -| std | 0.115 | -| value_loss | 2.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7743 | -| time_elapsed | 48958 | -| total_timesteps | 991104 | -| train/ | | -| approx_kl | 0.025654763 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 77420 | -| policy_gradient_loss | 0.000185 | -| std | 0.115 | -| value_loss | 7.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7744 | -| time_elapsed | 48964 | -| total_timesteps | 991232 | -| train/ | | -| approx_kl | 0.058734838 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.745 | -| explained_variance | -3.31 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 77430 | -| policy_gradient_loss | -0.0137 | -| std | 0.115 | -| value_loss | 0.0032 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7745 | -| time_elapsed | 48967 | -| total_timesteps | 991360 | -| train/ | | -| approx_kl | 0.0005584657 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.746 | -| explained_variance | -145 | -| learning_rate | 0.0003 | -| loss | -0.000474 | -| n_updates | 77440 | -| policy_gradient_loss | -0.000369 | -| std | 0.115 | -| value_loss | 1.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7746 | -| time_elapsed | 48970 | -| total_timesteps | 991488 | -| train/ | | -| approx_kl | 0.0023371559 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 0.749 | -| explained_variance | -1.74e+03 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 77450 | -| policy_gradient_loss | -0.000766 | -| std | 0.114 | -| value_loss | 6.77e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7747 | -| time_elapsed | 48972 | -| total_timesteps | 991616 | -| train/ | | -| approx_kl | 0.007991176 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.752 | -| explained_variance | -4 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 77460 | -| policy_gradient_loss | -0.00241 | -| std | 0.114 | -| value_loss | 3.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7748 | -| time_elapsed | 48975 | -| total_timesteps | 991744 | -| train/ | | -| approx_kl | 0.0006939331 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.754 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | -0.000219 | -| n_updates | 77470 | -| policy_gradient_loss | 0.000185 | -| std | 0.114 | -| value_loss | 3.01e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7749 | -| time_elapsed | 48977 | -| total_timesteps | 991872 | -| train/ | | -| approx_kl | 0.004024977 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.754 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 77480 | -| policy_gradient_loss | -0.0111 | -| std | 0.114 | -| value_loss | 2.23e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7750 | -| time_elapsed | 48980 | -| total_timesteps | 992000 | -| train/ | | -| approx_kl | 0.00035129534 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 0.754 | -| explained_variance | -0.712 | -| learning_rate | 0.0003 | -| loss | -0.000611 | -| n_updates | 77490 | -| policy_gradient_loss | 0.000219 | -| std | 0.114 | -| value_loss | 3.6e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7751 | -| time_elapsed | 48982 | -| total_timesteps | 992128 | -| train/ | | -| approx_kl | 0.0007368922 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.756 | -| explained_variance | 0.00191 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 77500 | -| policy_gradient_loss | 0.000753 | -| std | 0.113 | -| value_loss | 3.44e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7752 | -| time_elapsed | 48989 | -| total_timesteps | 992256 | -| train/ | | -| approx_kl | 0.028157026 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.758 | -| explained_variance | -3.96 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 77510 | -| policy_gradient_loss | -0.0121 | -| std | 0.113 | -| value_loss | 0.00282 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7753 | -| time_elapsed | 48992 | -| total_timesteps | 992384 | -| train/ | | -| approx_kl | 0.0024139103 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 0.76 | -| explained_variance | -17.9 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 77520 | -| policy_gradient_loss | -0.00462 | -| std | 0.113 | -| value_loss | 5.06e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7754 | -| time_elapsed | 48996 | -| total_timesteps | 992512 | -| train/ | | -| approx_kl | 0.013898604 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 0.761 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.00769 | -| n_updates | 77530 | -| policy_gradient_loss | -0.00415 | -| std | 0.113 | -| value_loss | 8.47e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7755 | -| time_elapsed | 49000 | -| total_timesteps | 992640 | -| train/ | | -| approx_kl | 0.00014285697 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.762 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | 0.00276 | -| n_updates | 77540 | -| policy_gradient_loss | -0.00295 | -| std | 0.113 | -| value_loss | 2.38e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7756 | -| time_elapsed | 49003 | -| total_timesteps | 992768 | -| train/ | | -| approx_kl | 0.0026741745 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 0.762 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 77550 | -| policy_gradient_loss | -0.00122 | -| std | 0.113 | -| value_loss | 1.41e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 20 | -| iterations | 7757 | -| time_elapsed | 49006 | -| total_timesteps | 992896 | -| train/ | | -| approx_kl | 0.0004238682 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.762 | -| explained_variance | -0.0998 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 77560 | -| policy_gradient_loss | -0.00214 | -| std | 0.113 | -| value_loss | 1.35e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7758 | -| time_elapsed | 49010 | -| total_timesteps | 993024 | -| train/ | | -| approx_kl | 0.00011972571 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.763 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.000284 | -| n_updates | 77570 | -| policy_gradient_loss | 0.000772 | -| std | 0.113 | -| value_loss | 3.34e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7759 | -| time_elapsed | 49017 | -| total_timesteps | 993152 | -| train/ | | -| approx_kl | 0.21823251 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 77580 | -| policy_gradient_loss | -0.0142 | -| std | 0.113 | -| value_loss | 0.00113 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7760 | -| time_elapsed | 49020 | -| total_timesteps | 993280 | -| train/ | | -| approx_kl | 0.0038822554 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -2.71 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 77590 | -| policy_gradient_loss | -0.0127 | -| std | 0.113 | -| value_loss | 2.37e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7761 | -| time_elapsed | 49025 | -| total_timesteps | 993408 | -| train/ | | -| approx_kl | 0.035520334 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -17.2 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 77600 | -| policy_gradient_loss | 0.000246 | -| std | 0.113 | -| value_loss | 5.92e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7762 | -| time_elapsed | 49029 | -| total_timesteps | 993536 | -| train/ | | -| approx_kl | 0.00016470114 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | 0.000178 | -| n_updates | 77610 | -| policy_gradient_loss | 0.000408 | -| std | 0.113 | -| value_loss | 8.23e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7763 | -| time_elapsed | 49032 | -| total_timesteps | 993664 | -| train/ | | -| approx_kl | 0.0045294566 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.765 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 77620 | -| policy_gradient_loss | 0.00442 | -| std | 0.113 | -| value_loss | 9.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7764 | -| time_elapsed | 49036 | -| total_timesteps | 993792 | -| train/ | | -| approx_kl | 0.024875466 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 77630 | -| policy_gradient_loss | -0.0183 | -| std | 0.113 | -| value_loss | 9.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7765 | -| time_elapsed | 49040 | -| total_timesteps | 993920 | -| train/ | | -| approx_kl | 0.010686012 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 77640 | -| policy_gradient_loss | 0.00648 | -| std | 0.113 | -| value_loss | 1.05e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7766 | -| time_elapsed | 49043 | -| total_timesteps | 994048 | -| train/ | | -| approx_kl | 0.024124451 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.763 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.00618 | -| n_updates | 77650 | -| policy_gradient_loss | 0.00142 | -| std | 0.113 | -| value_loss | 2.12e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7767 | -| time_elapsed | 49049 | -| total_timesteps | 994176 | -| train/ | | -| approx_kl | 22.911867 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 0.763 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 77660 | -| policy_gradient_loss | -0.00732 | -| std | 0.113 | -| value_loss | 0.000183 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7768 | -| time_elapsed | 49053 | -| total_timesteps | 994304 | -| train/ | | -| approx_kl | 0.006560826 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 77670 | -| policy_gradient_loss | -0.00216 | -| std | 0.113 | -| value_loss | 6.33e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7769 | -| time_elapsed | 49057 | -| total_timesteps | 994432 | -| train/ | | -| approx_kl | 0.0018296517 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 0.762 | -| explained_variance | -2.07 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 77680 | -| policy_gradient_loss | 0.0039 | -| std | 0.113 | -| value_loss | 4.06e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7770 | -| time_elapsed | 49061 | -| total_timesteps | 994560 | -| train/ | | -| approx_kl | 0.0058112205 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 0.763 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 77690 | -| policy_gradient_loss | 0.0122 | -| std | 0.113 | -| value_loss | 2.89e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7771 | -| time_elapsed | 49064 | -| total_timesteps | 994688 | -| train/ | | -| approx_kl | 0.00012265705 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 0.764 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | 0.000618 | -| n_updates | 77700 | -| policy_gradient_loss | -0.000787 | -| std | 0.113 | -| value_loss | 8.64e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7772 | -| time_elapsed | 49069 | -| total_timesteps | 994816 | -| train/ | | -| approx_kl | 0.0032356777 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 0.765 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 77710 | -| policy_gradient_loss | -0.00172 | -| std | 0.113 | -| value_loss | 7.52e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7773 | -| time_elapsed | 49073 | -| total_timesteps | 994944 | -| train/ | | -| approx_kl | 0.017458819 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.765 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 77720 | -| policy_gradient_loss | -0.00183 | -| std | 0.113 | -| value_loss | 1.28e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7774 | -| time_elapsed | 49077 | -| total_timesteps | 995072 | -| train/ | | -| approx_kl | 0.00042241905 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 0.765 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.000205 | -| n_updates | 77730 | -| policy_gradient_loss | 0.000593 | -| std | 0.112 | -| value_loss | 3.27e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7775 | -| time_elapsed | 49083 | -| total_timesteps | 995200 | -| train/ | | -| approx_kl | 0.007942875 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.769 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 77740 | -| policy_gradient_loss | -0.00428 | -| std | 0.112 | -| value_loss | 0.00143 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7776 | -| time_elapsed | 49088 | -| total_timesteps | 995328 | -| train/ | | -| approx_kl | 0.09653411 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 0.773 | -| explained_variance | -3.4e+03 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 77750 | -| policy_gradient_loss | -0.00627 | -| std | 0.112 | -| value_loss | 3.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7777 | -| time_elapsed | 49092 | -| total_timesteps | 995456 | -| train/ | | -| approx_kl | 0.083523534 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 0.774 | -| explained_variance | -3.52e+03 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 77760 | -| policy_gradient_loss | -0.00231 | -| std | 0.112 | -| value_loss | 1.83e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7778 | -| time_elapsed | 49095 | -| total_timesteps | 995584 | -| train/ | | -| approx_kl | 0.028622638 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 0.773 | -| explained_variance | -288 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 77770 | -| policy_gradient_loss | -0.00642 | -| std | 0.112 | -| value_loss | 1.13e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7779 | -| time_elapsed | 49099 | -| total_timesteps | 995712 | -| train/ | | -| approx_kl | 5.1092356e-06 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.772 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 77780 | -| policy_gradient_loss | 0.000299 | -| std | 0.112 | -| value_loss | 7.97e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7780 | -| time_elapsed | 49103 | -| total_timesteps | 995840 | -| train/ | | -| approx_kl | 0.002079958 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.772 | -| explained_variance | -3.13 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 77790 | -| policy_gradient_loss | -0.00171 | -| std | 0.112 | -| value_loss | 3.2e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 20 | -| iterations | 7781 | -| time_elapsed | 49106 | -| total_timesteps | 995968 | -| train/ | | -| approx_kl | 0.006371876 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.771 | -| explained_variance | -2.43 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 77800 | -| policy_gradient_loss | -0.0117 | -| std | 0.112 | -| value_loss | 1.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7782 | -| time_elapsed | 49109 | -| total_timesteps | 996096 | -| train/ | | -| approx_kl | 0.00634335 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.77 | -| explained_variance | -0.391 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 77810 | -| policy_gradient_loss | -0.0031 | -| std | 0.112 | -| value_loss | 8.6e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7783 | -| time_elapsed | 49117 | -| total_timesteps | 996224 | -| train/ | | -| approx_kl | 0.28370914 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.77 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 77820 | -| policy_gradient_loss | -0.0128 | -| std | 0.112 | -| value_loss | 0.00134 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7784 | -| time_elapsed | 49121 | -| total_timesteps | 996352 | -| train/ | | -| approx_kl | 0.00016839383 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.769 | -| explained_variance | -5.86e+03 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 77830 | -| policy_gradient_loss | -0.0101 | -| std | 0.112 | -| value_loss | 1.78e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7785 | -| time_elapsed | 49124 | -| total_timesteps | 996480 | -| train/ | | -| approx_kl | 0.0082807625 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.769 | -| explained_variance | -3.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 77840 | -| policy_gradient_loss | -0.00912 | -| std | 0.112 | -| value_loss | 1.33e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7786 | -| time_elapsed | 49128 | -| total_timesteps | 996608 | -| train/ | | -| approx_kl | 0.23169516 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 0.769 | -| explained_variance | -373 | -| learning_rate | 0.0003 | -| loss | -0.000804 | -| n_updates | 77850 | -| policy_gradient_loss | -0.00659 | -| std | 0.112 | -| value_loss | 1.25e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7787 | -| time_elapsed | 49132 | -| total_timesteps | 996736 | -| train/ | | -| approx_kl | 0.003463463 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.769 | -| explained_variance | -54.5 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 77860 | -| policy_gradient_loss | -0.00133 | -| std | 0.112 | -| value_loss | 1.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7788 | -| time_elapsed | 49135 | -| total_timesteps | 996864 | -| train/ | | -| approx_kl | 0.025394352 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 0.769 | -| explained_variance | -3.04 | -| learning_rate | 0.0003 | -| loss | 0.00966 | -| n_updates | 77870 | -| policy_gradient_loss | 0.0174 | -| std | 0.112 | -| value_loss | 6.42e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7789 | -| time_elapsed | 49139 | -| total_timesteps | 996992 | -| train/ | | -| approx_kl | 0.0051483964 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.77 | -| explained_variance | -0.0845 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 77880 | -| policy_gradient_loss | -0.000159 | -| std | 0.112 | -| value_loss | 2.29e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7790 | -| time_elapsed | 49142 | -| total_timesteps | 997120 | -| train/ | | -| approx_kl | 0.0019412194 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.773 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.00674 | -| n_updates | 77890 | -| policy_gradient_loss | -0.00372 | -| std | 0.112 | -| value_loss | 5.15e-07 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7791 | -| time_elapsed | 49152 | -| total_timesteps | 997248 | -| train/ | | -| approx_kl | 5.552474 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.774 | -| explained_variance | 0.711 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 77900 | -| policy_gradient_loss | -0.0161 | -| std | 0.111 | -| value_loss | 0.000855 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7792 | -| time_elapsed | 49156 | -| total_timesteps | 997376 | -| train/ | | -| approx_kl | 0.07385521 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 77910 | -| policy_gradient_loss | -0.0081 | -| std | 0.111 | -| value_loss | 1.31e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7793 | -| time_elapsed | 49159 | -| total_timesteps | 997504 | -| train/ | | -| approx_kl | 0.008802298 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.776 | -| explained_variance | -19.8 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 77920 | -| policy_gradient_loss | -0.00732 | -| std | 0.111 | -| value_loss | 4.34e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7794 | -| time_elapsed | 49163 | -| total_timesteps | 997632 | -| train/ | | -| approx_kl | 0.054750443 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -9.96 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 77930 | -| policy_gradient_loss | -0.0052 | -| std | 0.111 | -| value_loss | 5.5e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7795 | -| time_elapsed | 49167 | -| total_timesteps | 997760 | -| train/ | | -| approx_kl | 0.004874567 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.625 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 77940 | -| policy_gradient_loss | -0.00565 | -| std | 0.111 | -| value_loss | 1.71e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 20 | -| iterations | 7796 | -| time_elapsed | 49170 | -| total_timesteps | 997888 | -| train/ | | -| approx_kl | 0.0017755846 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.00765 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 77950 | -| policy_gradient_loss | -0.00187 | -| std | 0.111 | -| value_loss | 3.1e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7797 | -| time_elapsed | 49173 | -| total_timesteps | 998016 | -| train/ | | -| approx_kl | 0.013320292 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 77960 | -| policy_gradient_loss | 0.00112 | -| std | 0.111 | -| value_loss | 3.13e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7798 | -| time_elapsed | 49181 | -| total_timesteps | 998144 | -| train/ | | -| approx_kl | 2.4330404 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 77970 | -| policy_gradient_loss | -0.0105 | -| std | 0.111 | -| value_loss | 0.00154 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7799 | -| time_elapsed | 49185 | -| total_timesteps | 998272 | -| train/ | | -| approx_kl | 0.012789087 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -744 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 77980 | -| policy_gradient_loss | -0.00972 | -| std | 0.111 | -| value_loss | 1.61e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7800 | -| time_elapsed | 49188 | -| total_timesteps | 998400 | -| train/ | | -| approx_kl | 0.08110638 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -1.65e+03 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 77990 | -| policy_gradient_loss | -0.000629 | -| std | 0.111 | -| value_loss | 6.52e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7801 | -| time_elapsed | 49192 | -| total_timesteps | 998528 | -| train/ | | -| approx_kl | 0.04247678 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 0.776 | -| explained_variance | -58.1 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 78000 | -| policy_gradient_loss | -0.00574 | -| std | 0.111 | -| value_loss | 3.59e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7802 | -| time_elapsed | 49195 | -| total_timesteps | 998656 | -| train/ | | -| approx_kl | 0.034014672 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 0.778 | -| explained_variance | -6.2 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 78010 | -| policy_gradient_loss | -0.00367 | -| std | 0.111 | -| value_loss | 5.27e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7803 | -| time_elapsed | 49199 | -| total_timesteps | 998784 | -| train/ | | -| approx_kl | 0.001348427 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 0.778 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 78020 | -| policy_gradient_loss | -0.00078 | -| std | 0.111 | -| value_loss | 2.85e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 20 | -| iterations | 7804 | -| time_elapsed | 49203 | -| total_timesteps | 998912 | -| train/ | | -| approx_kl | 0.03882522 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 0.777 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0262 | -| n_updates | 78030 | -| policy_gradient_loss | -0.0197 | -| std | 0.111 | -| value_loss | 1.11e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7805 | -| time_elapsed | 49205 | -| total_timesteps | 999040 | -| train/ | | -| approx_kl | 0.023839168 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.776 | -| explained_variance | -0.000565 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 78040 | -| policy_gradient_loss | 0.00358 | -| std | 0.111 | -| value_loss | 1.05e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7806 | -| time_elapsed | 49210 | -| total_timesteps | 999168 | -| train/ | | -| approx_kl | 2.4580405 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 78050 | -| policy_gradient_loss | -0.0136 | -| std | 0.111 | -| value_loss | 0.000173 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7807 | -| time_elapsed | 49213 | -| total_timesteps | 999296 | -| train/ | | -| approx_kl | 0.011035526 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -4.17 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 78060 | -| policy_gradient_loss | -0.00589 | -| std | 0.111 | -| value_loss | 2.07e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7808 | -| time_elapsed | 49215 | -| total_timesteps | 999424 | -| train/ | | -| approx_kl | 0.02792905 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -7.25 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 78070 | -| policy_gradient_loss | -0.0104 | -| std | 0.111 | -| value_loss | 2.51e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7809 | -| time_elapsed | 49218 | -| total_timesteps | 999552 | -| train/ | | -| approx_kl | 0.0012761038 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.624 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 78080 | -| policy_gradient_loss | -0.00581 | -| std | 0.111 | -| value_loss | 1.77e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7810 | -| time_elapsed | 49221 | -| total_timesteps | 999680 | -| train/ | | -| approx_kl | 0.049616918 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.00481 | -| n_updates | 78090 | -| policy_gradient_loss | -0.00128 | -| std | 0.112 | -| value_loss | 1.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7811 | -| time_elapsed | 49225 | -| total_timesteps | 999808 | -| train/ | | -| approx_kl | 0.009256102 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.334 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 78100 | -| policy_gradient_loss | -0.0102 | -| std | 0.112 | -| value_loss | 1.62e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 20 | -| iterations | 7812 | -| time_elapsed | 49228 | -| total_timesteps | 999936 | -| train/ | | -| approx_kl | 0.0016624411 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.775 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 78110 | -| policy_gradient_loss | -0.00109 | -| std | 0.111 | -| value_loss | 6.51e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7813 | -| time_elapsed | 49232 | -| total_timesteps | 1000064 | -| train/ | | -| approx_kl | 0.00034421356 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.776 | -| explained_variance | -0.00643 | -| learning_rate | 0.0003 | -| loss | -0.000748 | -| n_updates | 78120 | -| policy_gradient_loss | -0.000346 | -| std | 0.111 | -| value_loss | 2.88e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7814 | -| time_elapsed | 49238 | -| total_timesteps | 1000192 | -| train/ | | -| approx_kl | 3.3629467 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.779 | -| explained_variance | 0.783 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 78130 | -| policy_gradient_loss | -0.0168 | -| std | 0.111 | -| value_loss | 0.000484 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7815 | -| time_elapsed | 49242 | -| total_timesteps | 1000320 | -| train/ | | -| approx_kl | 0.0006565843 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.78 | -| explained_variance | -23.1 | -| learning_rate | 0.0003 | -| loss | -0.000734 | -| n_updates | 78140 | -| policy_gradient_loss | -0.000178 | -| std | 0.111 | -| value_loss | 8.26e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7816 | -| time_elapsed | 49246 | -| total_timesteps | 1000448 | -| train/ | | -| approx_kl | 0.0839249 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 0.782 | -| explained_variance | -97.9 | -| learning_rate | 0.0003 | -| loss | -0.00726 | -| n_updates | 78150 | -| policy_gradient_loss | -0.00673 | -| std | 0.111 | -| value_loss | 5.71e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7817 | -| time_elapsed | 49249 | -| total_timesteps | 1000576 | -| train/ | | -| approx_kl | 0.03053282 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.783 | -| explained_variance | -8.64 | -| learning_rate | 0.0003 | -| loss | -0.00713 | -| n_updates | 78160 | -| policy_gradient_loss | -0.00386 | -| std | 0.111 | -| value_loss | 7.21e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7818 | -| time_elapsed | 49254 | -| total_timesteps | 1000704 | -| train/ | | -| approx_kl | 0.008908009 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 0.783 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 78170 | -| policy_gradient_loss | 0.00127 | -| std | 0.111 | -| value_loss | 1.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7819 | -| time_elapsed | 49257 | -| total_timesteps | 1000832 | -| train/ | | -| approx_kl | 0.013167691 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 0.783 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 78180 | -| policy_gradient_loss | -8.05e-05 | -| std | 0.111 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 20 | -| iterations | 7820 | -| time_elapsed | 49260 | -| total_timesteps | 1000960 | -| train/ | | -| approx_kl | 0.0033447267 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 0.784 | -| explained_variance | -2.41 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 78190 | -| policy_gradient_loss | -0.00715 | -| std | 0.11 | -| value_loss | 2.84e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7821 | -| time_elapsed | 49264 | -| total_timesteps | 1001088 | -| train/ | | -| approx_kl | 0.0031183953 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.784 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | -0.00453 | -| n_updates | 78200 | -| policy_gradient_loss | -0.00324 | -| std | 0.11 | -| value_loss | 6.73e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7822 | -| time_elapsed | 49270 | -| total_timesteps | 1001216 | -| train/ | | -| approx_kl | 0.039568942 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 0.784 | -| explained_variance | -0.778 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 78210 | -| policy_gradient_loss | -0.0109 | -| std | 0.11 | -| value_loss | 0.00129 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7823 | -| time_elapsed | 49273 | -| total_timesteps | 1001344 | -| train/ | | -| approx_kl | 0.01155193 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.784 | -| explained_variance | -72.6 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 78220 | -| policy_gradient_loss | -0.0135 | -| std | 0.11 | -| value_loss | 3.96e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7824 | -| time_elapsed | 49276 | -| total_timesteps | 1001472 | -| train/ | | -| approx_kl | 0.01797964 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.784 | -| explained_variance | -31.4 | -| learning_rate | 0.0003 | -| loss | -0.000455 | -| n_updates | 78230 | -| policy_gradient_loss | 1.47e-05 | -| std | 0.11 | -| value_loss | 6e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7825 | -| time_elapsed | 49280 | -| total_timesteps | 1001600 | -| train/ | | -| approx_kl | 9.751413e-06 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.786 | -| explained_variance | -4.27 | -| learning_rate | 0.0003 | -| loss | -0.000328 | -| n_updates | 78240 | -| policy_gradient_loss | 0.00119 | -| std | 0.11 | -| value_loss | 2.63e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7826 | -| time_elapsed | 49284 | -| total_timesteps | 1001728 | -| train/ | | -| approx_kl | 0.0179323 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.788 | -| explained_variance | -0.0865 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 78250 | -| policy_gradient_loss | -0.00423 | -| std | 0.11 | -| value_loss | 1.65e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7827 | -| time_elapsed | 49288 | -| total_timesteps | 1001856 | -| train/ | | -| approx_kl | 0.005715218 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 0.79 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 78260 | -| policy_gradient_loss | -0.0104 | -| std | 0.11 | -| value_loss | 5.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 20 | -| iterations | 7828 | -| time_elapsed | 49290 | -| total_timesteps | 1001984 | -| train/ | | -| approx_kl | 0.0001828121 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 0.791 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | -1.76e-05 | -| n_updates | 78270 | -| policy_gradient_loss | 0.000197 | -| std | 0.11 | -| value_loss | 3.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7829 | -| time_elapsed | 49294 | -| total_timesteps | 1002112 | -| train/ | | -| approx_kl | 0.001145198 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.79 | -| explained_variance | 0.00569 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 78280 | -| policy_gradient_loss | -0.00305 | -| std | 0.11 | -| value_loss | 8.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7830 | -| time_elapsed | 49303 | -| total_timesteps | 1002240 | -| train/ | | -| approx_kl | 0.031014046 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.789 | -| explained_variance | 0.748 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 78290 | -| policy_gradient_loss | -0.0161 | -| std | 0.11 | -| value_loss | 0.00336 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7831 | -| time_elapsed | 49306 | -| total_timesteps | 1002368 | -| train/ | | -| approx_kl | 0.0071804533 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.789 | -| explained_variance | -8.25 | -| learning_rate | 0.0003 | -| loss | -0.0093 | -| n_updates | 78300 | -| policy_gradient_loss | -0.00675 | -| std | 0.11 | -| value_loss | 0.000244 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7832 | -| time_elapsed | 49309 | -| total_timesteps | 1002496 | -| train/ | | -| approx_kl | 0.0363645 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 0.79 | -| explained_variance | -3.14 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 78310 | -| policy_gradient_loss | -0.00336 | -| std | 0.11 | -| value_loss | 0.00134 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7833 | -| time_elapsed | 49311 | -| total_timesteps | 1002624 | -| train/ | | -| approx_kl | 0.04252389 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 0.791 | -| explained_variance | -0.323 | -| learning_rate | 0.0003 | -| loss | -0.00765 | -| n_updates | 78320 | -| policy_gradient_loss | -0.00621 | -| std | 0.11 | -| value_loss | 0.000159 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7834 | -| time_elapsed | 49314 | -| total_timesteps | 1002752 | -| train/ | | -| approx_kl | 0.0018353187 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.792 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 78330 | -| policy_gradient_loss | -0.00223 | -| std | 0.11 | -| value_loss | 5.51e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 20 | -| iterations | 7835 | -| time_elapsed | 49317 | -| total_timesteps | 1002880 | -| train/ | | -| approx_kl | 0.015590645 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.793 | -| explained_variance | 0.00535 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 78340 | -| policy_gradient_loss | -0.00892 | -| std | 0.109 | -| value_loss | 2.74e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7836 | -| time_elapsed | 49320 | -| total_timesteps | 1003008 | -| train/ | | -| approx_kl | 0.0057910765 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.794 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.00269 | -| n_updates | 78350 | -| policy_gradient_loss | -0.000712 | -| std | 0.109 | -| value_loss | 1.2e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7837 | -| time_elapsed | 49330 | -| total_timesteps | 1003136 | -| train/ | | -| approx_kl | 0.046223763 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.794 | -| explained_variance | 0.168 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 78360 | -| policy_gradient_loss | -0.00833 | -| std | 0.109 | -| value_loss | 0.00111 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7838 | -| time_elapsed | 49334 | -| total_timesteps | 1003264 | -| train/ | | -| approx_kl | 0.00825779 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.794 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | -0.00391 | -| n_updates | 78370 | -| policy_gradient_loss | 0.000876 | -| std | 0.109 | -| value_loss | 1.51e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7839 | -| time_elapsed | 49338 | -| total_timesteps | 1003392 | -| train/ | | -| approx_kl | 0.04969556 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.794 | -| explained_variance | -0.456 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 78380 | -| policy_gradient_loss | -0.00665 | -| std | 0.109 | -| value_loss | 4.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7840 | -| time_elapsed | 49342 | -| total_timesteps | 1003520 | -| train/ | | -| approx_kl | 0.015213709 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 0.794 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 78390 | -| policy_gradient_loss | -0.00739 | -| std | 0.109 | -| value_loss | 4.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7841 | -| time_elapsed | 49345 | -| total_timesteps | 1003648 | -| train/ | | -| approx_kl | 0.025844084 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 0.794 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 78400 | -| policy_gradient_loss | 0.00242 | -| std | 0.109 | -| value_loss | 2.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7842 | -| time_elapsed | 49349 | -| total_timesteps | 1003776 | -| train/ | | -| approx_kl | 0.01848942 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 0.793 | -| explained_variance | -0.00987 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 78410 | -| policy_gradient_loss | -0.00769 | -| std | 0.11 | -| value_loss | 1.32e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 20 | -| iterations | 7843 | -| time_elapsed | 49353 | -| total_timesteps | 1003904 | -| train/ | | -| approx_kl | 0.015293505 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.792 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 78420 | -| policy_gradient_loss | 0.000731 | -| std | 0.11 | -| value_loss | 5.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7844 | -| time_elapsed | 49357 | -| total_timesteps | 1004032 | -| train/ | | -| approx_kl | 0.005921375 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 0.792 | -| explained_variance | -0.00773 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 78430 | -| policy_gradient_loss | 0.00261 | -| std | 0.11 | -| value_loss | 6.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7845 | -| time_elapsed | 49364 | -| total_timesteps | 1004160 | -| train/ | | -| approx_kl | 0.045202285 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 0.793 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 78440 | -| policy_gradient_loss | -0.013 | -| std | 0.11 | -| value_loss | 0.000598 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7846 | -| time_elapsed | 49367 | -| total_timesteps | 1004288 | -| train/ | | -| approx_kl | 0.061392844 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.793 | -| explained_variance | -6.74 | -| learning_rate | 0.0003 | -| loss | -0.00957 | -| n_updates | 78450 | -| policy_gradient_loss | -0.00555 | -| std | 0.11 | -| value_loss | 4.51e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7847 | -| time_elapsed | 49371 | -| total_timesteps | 1004416 | -| train/ | | -| approx_kl | 0.0008185208 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.792 | -| explained_variance | -79.9 | -| learning_rate | 0.0003 | -| loss | -0.000527 | -| n_updates | 78460 | -| policy_gradient_loss | -0.000254 | -| std | 0.11 | -| value_loss | 4.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7848 | -| time_elapsed | 49374 | -| total_timesteps | 1004544 | -| train/ | | -| approx_kl | 0.0011554915 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.789 | -| explained_variance | -3.53 | -| learning_rate | 0.0003 | -| loss | -0.00557 | -| n_updates | 78470 | -| policy_gradient_loss | -0.00661 | -| std | 0.11 | -| value_loss | 1.31e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7849 | -| time_elapsed | 49378 | -| total_timesteps | 1004672 | -| train/ | | -| approx_kl | 0.0014348379 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 0.787 | -| explained_variance | -0.0689 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 78480 | -| policy_gradient_loss | -0.00155 | -| std | 0.11 | -| value_loss | 2.24e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7850 | -| time_elapsed | 49382 | -| total_timesteps | 1004800 | -| train/ | | -| approx_kl | 1.8866267e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.789 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | -0.000493 | -| n_updates | 78490 | -| policy_gradient_loss | -0.000194 | -| std | 0.11 | -| value_loss | 3.63e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 20 | -| iterations | 7851 | -| time_elapsed | 49386 | -| total_timesteps | 1004928 | -| train/ | | -| approx_kl | 0.012391848 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 0.793 | -| explained_variance | -0.0032 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 78500 | -| policy_gradient_loss | -0.00596 | -| std | 0.109 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7852 | -| time_elapsed | 49389 | -| total_timesteps | 1005056 | -| train/ | | -| approx_kl | 0.006591142 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 0.796 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 78510 | -| policy_gradient_loss | 0.0022 | -| std | 0.109 | -| value_loss | 6.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7853 | -| time_elapsed | 49394 | -| total_timesteps | 1005184 | -| train/ | | -| approx_kl | 0.004896946 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.796 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 78520 | -| policy_gradient_loss | -0.0113 | -| std | 0.109 | -| value_loss | 0.00129 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7854 | -| time_elapsed | 49398 | -| total_timesteps | 1005312 | -| train/ | | -| approx_kl | 0.0292994 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.796 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | 0.0056 | -| n_updates | 78530 | -| policy_gradient_loss | 0.00123 | -| std | 0.109 | -| value_loss | 6.73e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7855 | -| time_elapsed | 49401 | -| total_timesteps | 1005440 | -| train/ | | -| approx_kl | 0.083058596 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 0.796 | -| explained_variance | -292 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 78540 | -| policy_gradient_loss | -0.00911 | -| std | 0.109 | -| value_loss | 2.86e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7856 | -| time_elapsed | 49403 | -| total_timesteps | 1005568 | -| train/ | | -| approx_kl | 0.0014943955 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.797 | -| explained_variance | -68.2 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 78550 | -| policy_gradient_loss | -0.00143 | -| std | 0.109 | -| value_loss | 3.26e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7857 | -| time_elapsed | 49406 | -| total_timesteps | 1005696 | -| train/ | | -| approx_kl | 0.0012096078 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.798 | -| explained_variance | -5.35 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 78560 | -| policy_gradient_loss | -0.000666 | -| std | 0.109 | -| value_loss | 4.2e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7858 | -| time_elapsed | 49409 | -| total_timesteps | 1005824 | -| train/ | | -| approx_kl | 0.007075876 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | -0.00687 | -| n_updates | 78570 | -| policy_gradient_loss | -0.0049 | -| std | 0.109 | -| value_loss | 2.47e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 20 | -| iterations | 7859 | -| time_elapsed | 49413 | -| total_timesteps | 1005952 | -| train/ | | -| approx_kl | 0.0012258342 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -0.0812 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 78580 | -| policy_gradient_loss | -0.00115 | -| std | 0.109 | -| value_loss | 1.53e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7860 | -| time_elapsed | 49414 | -| total_timesteps | 1006080 | -| train/ | | -| approx_kl | 0.003100343 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.799 | -| explained_variance | -0.000692 | -| learning_rate | 0.0003 | -| loss | -0.00577 | -| n_updates | 78590 | -| policy_gradient_loss | -0.00503 | -| std | 0.109 | -| value_loss | 2.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7861 | -| time_elapsed | 49421 | -| total_timesteps | 1006208 | -| train/ | | -| approx_kl | 0.012040643 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 0.799 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 78600 | -| policy_gradient_loss | -0.0168 | -| std | 0.109 | -| value_loss | 0.000139 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7862 | -| time_elapsed | 49422 | -| total_timesteps | 1006336 | -| train/ | | -| approx_kl | 0.00864581 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.798 | -| explained_variance | -8.82 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 78610 | -| policy_gradient_loss | -0.00358 | -| std | 0.109 | -| value_loss | 4.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7863 | -| time_elapsed | 49425 | -| total_timesteps | 1006464 | -| train/ | | -| approx_kl | 0.020576604 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 0.798 | -| explained_variance | -22.3 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 78620 | -| policy_gradient_loss | -0.000814 | -| std | 0.109 | -| value_loss | 2.95e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7864 | -| time_elapsed | 49428 | -| total_timesteps | 1006592 | -| train/ | | -| approx_kl | 0.0037085167 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 0.799 | -| explained_variance | -2.68 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 78630 | -| policy_gradient_loss | -0.00509 | -| std | 0.109 | -| value_loss | 2.71e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7865 | -| time_elapsed | 49432 | -| total_timesteps | 1006720 | -| train/ | | -| approx_kl | 0.004301781 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 78640 | -| policy_gradient_loss | -0.00918 | -| std | 0.109 | -| value_loss | 6.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7866 | -| time_elapsed | 49435 | -| total_timesteps | 1006848 | -| train/ | | -| approx_kl | 0.01858742 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -0.0732 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 78650 | -| policy_gradient_loss | -0.00806 | -| std | 0.109 | -| value_loss | 4.48e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 20 | -| iterations | 7867 | -| time_elapsed | 49439 | -| total_timesteps | 1006976 | -| train/ | | -| approx_kl | 0.03181051 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 78660 | -| policy_gradient_loss | -0.00128 | -| std | 0.109 | -| value_loss | 1.33e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7868 | -| time_elapsed | 49442 | -| total_timesteps | 1007104 | -| train/ | | -| approx_kl | 0.0014442243 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.801 | -| explained_variance | 0.0059 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 78670 | -| policy_gradient_loss | -0.00178 | -| std | 0.109 | -| value_loss | 8.23e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7869 | -| time_elapsed | 49450 | -| total_timesteps | 1007232 | -| train/ | | -| approx_kl | 0.19047248 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 78680 | -| policy_gradient_loss | -0.0161 | -| std | 0.109 | -| value_loss | 0.00072 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7870 | -| time_elapsed | 49453 | -| total_timesteps | 1007360 | -| train/ | | -| approx_kl | 0.008876966 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -38.7 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 78690 | -| policy_gradient_loss | -0.00619 | -| std | 0.109 | -| value_loss | 6.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7871 | -| time_elapsed | 49456 | -| total_timesteps | 1007488 | -| train/ | | -| approx_kl | 0.058274046 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 0.8 | -| explained_variance | -74.9 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 78700 | -| policy_gradient_loss | -0.00494 | -| std | 0.109 | -| value_loss | 1.77e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7872 | -| time_elapsed | 49459 | -| total_timesteps | 1007616 | -| train/ | | -| approx_kl | 0.00017539226 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.799 | -| explained_variance | -15.7 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 78710 | -| policy_gradient_loss | -0.00012 | -| std | 0.109 | -| value_loss | 9.67e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7873 | -| time_elapsed | 49462 | -| total_timesteps | 1007744 | -| train/ | | -| approx_kl | 0.0015299777 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | 0.801 | -| explained_variance | -0.0954 | -| learning_rate | 0.0003 | -| loss | -0.000375 | -| n_updates | 78720 | -| policy_gradient_loss | -0.000295 | -| std | 0.108 | -| value_loss | 2.95e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 20 | -| iterations | 7874 | -| time_elapsed | 49465 | -| total_timesteps | 1007872 | -| train/ | | -| approx_kl | 0.0141616985 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | -0.0604 | -| learning_rate | 0.0003 | -| loss | -0.0074 | -| n_updates | 78730 | -| policy_gradient_loss | -0.00357 | -| std | 0.108 | -| value_loss | 1.57e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7875 | -| time_elapsed | 49468 | -| total_timesteps | 1008000 | -| train/ | | -| approx_kl | 0.0144701665 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | -0.000465 | -| n_updates | 78740 | -| policy_gradient_loss | -0.000119 | -| std | 0.108 | -| value_loss | 7.2e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7876 | -| time_elapsed | 49471 | -| total_timesteps | 1008128 | -| train/ | | -| approx_kl | 0.011168221 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | 0.0026 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 78750 | -| policy_gradient_loss | -0.00709 | -| std | 0.108 | -| value_loss | 3.32e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7877 | -| time_elapsed | 49477 | -| total_timesteps | 1008256 | -| train/ | | -| approx_kl | 0.28249085 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | 0.557 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 78760 | -| policy_gradient_loss | -0.0123 | -| std | 0.108 | -| value_loss | 0.000687 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7878 | -| time_elapsed | 49481 | -| total_timesteps | 1008384 | -| train/ | | -| approx_kl | 0.08051525 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | -8.53 | -| learning_rate | 0.0003 | -| loss | 0.00082 | -| n_updates | 78770 | -| policy_gradient_loss | 0.000305 | -| std | 0.108 | -| value_loss | 2.88e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7879 | -| time_elapsed | 49484 | -| total_timesteps | 1008512 | -| train/ | | -| approx_kl | 0.016159082 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | -13.1 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 78780 | -| policy_gradient_loss | -0.00101 | -| std | 0.108 | -| value_loss | 1.54e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7880 | -| time_elapsed | 49487 | -| total_timesteps | 1008640 | -| train/ | | -| approx_kl | 0.00025417004 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | -3.36 | -| learning_rate | 0.0003 | -| loss | -0.0043 | -| n_updates | 78790 | -| policy_gradient_loss | -0.00761 | -| std | 0.108 | -| value_loss | 1.94e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7881 | -| time_elapsed | 49490 | -| total_timesteps | 1008768 | -| train/ | | -| approx_kl | 0.02160963 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 78800 | -| policy_gradient_loss | -0.00591 | -| std | 0.108 | -| value_loss | 2.17e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 20 | -| iterations | 7882 | -| time_elapsed | 49493 | -| total_timesteps | 1008896 | -| train/ | | -| approx_kl | 0.03237805 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | 0.00827 | -| n_updates | 78810 | -| policy_gradient_loss | 0.00141 | -| std | 0.108 | -| value_loss | 1.16e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7883 | -| time_elapsed | 49497 | -| total_timesteps | 1009024 | -| train/ | | -| approx_kl | 0.038617577 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | 0.000917 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 78820 | -| policy_gradient_loss | -0.0139 | -| std | 0.108 | -| value_loss | 7.12e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7884 | -| time_elapsed | 49504 | -| total_timesteps | 1009152 | -| train/ | | -| approx_kl | 0.06468951 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 78830 | -| policy_gradient_loss | -0.0138 | -| std | 0.108 | -| value_loss | 4.34e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7885 | -| time_elapsed | 49507 | -| total_timesteps | 1009280 | -| train/ | | -| approx_kl | 0.00024393946 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | 0.000673 | -| learning_rate | 0.0003 | -| loss | -0.000596 | -| n_updates | 78840 | -| policy_gradient_loss | 0.00592 | -| std | 0.108 | -| value_loss | 6.95e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7886 | -| time_elapsed | 49510 | -| total_timesteps | 1009408 | -| train/ | | -| approx_kl | 0.001195793 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | -6.03 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 78850 | -| policy_gradient_loss | -0.00149 | -| std | 0.108 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7887 | -| time_elapsed | 49513 | -| total_timesteps | 1009536 | -| train/ | | -| approx_kl | 0.009441019 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 78860 | -| policy_gradient_loss | -0.0104 | -| std | 0.108 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7888 | -| time_elapsed | 49517 | -| total_timesteps | 1009664 | -| train/ | | -| approx_kl | 0.026105355 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 78870 | -| policy_gradient_loss | -0.00543 | -| std | 0.108 | -| value_loss | 4.76e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7889 | -| time_elapsed | 49520 | -| total_timesteps | 1009792 | -| train/ | | -| approx_kl | 0.0002152957 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | -0.0704 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 78880 | -| policy_gradient_loss | 0.0022 | -| std | 0.108 | -| value_loss | 2.3e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 20 | -| iterations | 7890 | -| time_elapsed | 49523 | -| total_timesteps | 1009920 | -| train/ | | -| approx_kl | 0.0056654788 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.807 | -| explained_variance | 0.00553 | -| learning_rate | 0.0003 | -| loss | -0.000264 | -| n_updates | 78890 | -| policy_gradient_loss | -8.02e-05 | -| std | 0.108 | -| value_loss | 9.78e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7891 | -| time_elapsed | 49526 | -| total_timesteps | 1010048 | -| train/ | | -| approx_kl | 0.0018733218 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.809 | -| explained_variance | 0.00385 | -| learning_rate | 0.0003 | -| loss | -0.00629 | -| n_updates | 78900 | -| policy_gradient_loss | -0.00727 | -| std | 0.108 | -| value_loss | 9.1e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7892 | -| time_elapsed | 49532 | -| total_timesteps | 1010176 | -| train/ | | -| approx_kl | 0.6930421 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 0.809 | -| explained_variance | 0.668 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 78910 | -| policy_gradient_loss | -0.00671 | -| std | 0.108 | -| value_loss | 0.00666 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7893 | -| time_elapsed | 49535 | -| total_timesteps | 1010304 | -| train/ | | -| approx_kl | 0.012860811 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 0.808 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.0235 | -| n_updates | 78920 | -| policy_gradient_loss | -0.0166 | -| std | 0.108 | -| value_loss | 9.51e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7894 | -| time_elapsed | 49537 | -| total_timesteps | 1010432 | -| train/ | | -| approx_kl | 0.005401532 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 0.807 | -| explained_variance | -70.2 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 78930 | -| policy_gradient_loss | -0.000806 | -| std | 0.108 | -| value_loss | 0.000148 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7895 | -| time_elapsed | 49540 | -| total_timesteps | 1010560 | -| train/ | | -| approx_kl | 0.0086800335 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.806 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 78940 | -| policy_gradient_loss | -0.00596 | -| std | 0.108 | -| value_loss | 0.00079 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7896 | -| time_elapsed | 49544 | -| total_timesteps | 1010688 | -| train/ | | -| approx_kl | 0.0032753637 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | -0.326 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 78950 | -| policy_gradient_loss | -0.00367 | -| std | 0.108 | -| value_loss | 0.000419 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7897 | -| time_elapsed | 49548 | -| total_timesteps | 1010816 | -| train/ | | -| approx_kl | 0.0014995555 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | 0.0028 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 78960 | -| policy_gradient_loss | -0.00134 | -| std | 0.108 | -| value_loss | 0.00025 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7898 | -| time_elapsed | 49553 | -| total_timesteps | 1010944 | -| train/ | | -| approx_kl | 0.018370777 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | -0.0898 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 78970 | -| policy_gradient_loss | -0.0165 | -| std | 0.108 | -| value_loss | 9.17e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7899 | -| time_elapsed | 49556 | -| total_timesteps | 1011072 | -| train/ | | -| approx_kl | 0.0014193854 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 78980 | -| policy_gradient_loss | 0.00165 | -| std | 0.108 | -| value_loss | 0.000706 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7900 | -| time_elapsed | 49563 | -| total_timesteps | 1011200 | -| train/ | | -| approx_kl | 0.0018755742 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 0.804 | -| explained_variance | 0.949 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 78990 | -| policy_gradient_loss | -0.00632 | -| std | 0.108 | -| value_loss | 0.000683 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7901 | -| time_elapsed | 49567 | -| total_timesteps | 1011328 | -| train/ | | -| approx_kl | 0.095811434 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | -37.2 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 79000 | -| policy_gradient_loss | -0.00566 | -| std | 0.108 | -| value_loss | 4.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7902 | -| time_elapsed | 49570 | -| total_timesteps | 1011456 | -| train/ | | -| approx_kl | 0.012646538 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 0.803 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 79010 | -| policy_gradient_loss | -0.00741 | -| std | 0.108 | -| value_loss | 4.85e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7903 | -| time_elapsed | 49574 | -| total_timesteps | 1011584 | -| train/ | | -| approx_kl | 9.3369745e-05 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | 0.805 | -| explained_variance | -0.086 | -| learning_rate | 0.0003 | -| loss | -0.000899 | -| n_updates | 79020 | -| policy_gradient_loss | -0.000218 | -| std | 0.108 | -| value_loss | 4.95e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7904 | -| time_elapsed | 49578 | -| total_timesteps | 1011712 | -| train/ | | -| approx_kl | 0.003017276 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.811 | -| explained_variance | -0.262 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 79030 | -| policy_gradient_loss | -0.00103 | -| std | 0.107 | -| value_loss | 3.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7905 | -| time_elapsed | 49582 | -| total_timesteps | 1011840 | -| train/ | | -| approx_kl | 0.008467751 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 0.815 | -| explained_variance | -0.39 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 79040 | -| policy_gradient_loss | -0.00648 | -| std | 0.107 | -| value_loss | 9.11e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 20 | -| iterations | 7906 | -| time_elapsed | 49585 | -| total_timesteps | 1011968 | -| train/ | | -| approx_kl | 7.2414055e-05 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.816 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.000693 | -| n_updates | 79050 | -| policy_gradient_loss | -0.00267 | -| std | 0.107 | -| value_loss | 8.52e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7907 | -| time_elapsed | 49587 | -| total_timesteps | 1012096 | -| train/ | | -| approx_kl | 0.0011317427 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.818 | -| explained_variance | 0.00583 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 79060 | -| policy_gradient_loss | -0.00509 | -| std | 0.107 | -| value_loss | 1.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7908 | -| time_elapsed | 49592 | -| total_timesteps | 1012224 | -| train/ | | -| approx_kl | 0.002657684 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | 0.319 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 79070 | -| policy_gradient_loss | -0.00936 | -| std | 0.107 | -| value_loss | 0.00101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7909 | -| time_elapsed | 49596 | -| total_timesteps | 1012352 | -| train/ | | -| approx_kl | 0.020591523 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -381 | -| learning_rate | 0.0003 | -| loss | -0.00997 | -| n_updates | 79080 | -| policy_gradient_loss | -0.00624 | -| std | 0.107 | -| value_loss | 9.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7910 | -| time_elapsed | 49600 | -| total_timesteps | 1012480 | -| train/ | | -| approx_kl | 0.005388457 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -183 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 79090 | -| policy_gradient_loss | -0.012 | -| std | 0.107 | -| value_loss | 2.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7911 | -| time_elapsed | 49604 | -| total_timesteps | 1012608 | -| train/ | | -| approx_kl | 0.10224563 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -358 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 79100 | -| policy_gradient_loss | -0.00654 | -| std | 0.106 | -| value_loss | 2.27e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7912 | -| time_elapsed | 49609 | -| total_timesteps | 1012736 | -| train/ | | -| approx_kl | 0.03835552 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 0.821 | -| explained_variance | -755 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 79110 | -| policy_gradient_loss | -0.00877 | -| std | 0.106 | -| value_loss | 1.28e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7913 | -| time_elapsed | 49611 | -| total_timesteps | 1012864 | -| train/ | | -| approx_kl | 0.051451236 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.822 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | -0.00636 | -| n_updates | 79120 | -| policy_gradient_loss | -0.00287 | -| std | 0.106 | -| value_loss | 1.09e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7914 | -| time_elapsed | 49614 | -| total_timesteps | 1012992 | -| train/ | | -| approx_kl | 0.014862955 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 0.822 | -| explained_variance | -4.74 | -| learning_rate | 0.0003 | -| loss | -0.00955 | -| n_updates | 79130 | -| policy_gradient_loss | -0.00421 | -| std | 0.106 | -| value_loss | 1.9e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7915 | -| time_elapsed | 49617 | -| total_timesteps | 1013120 | -| train/ | | -| approx_kl | 0.0014583701 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 0.821 | -| explained_variance | -0.643 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 79140 | -| policy_gradient_loss | 0.00589 | -| std | 0.107 | -| value_loss | 6.28e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7916 | -| time_elapsed | 49627 | -| total_timesteps | 1013248 | -| train/ | | -| approx_kl | 0.10182675 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | 0.877 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 79150 | -| policy_gradient_loss | -0.00115 | -| std | 0.107 | -| value_loss | 0.00122 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7917 | -| time_elapsed | 49631 | -| total_timesteps | 1013376 | -| train/ | | -| approx_kl | 0.051091343 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 0.821 | -| explained_variance | -474 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 79160 | -| policy_gradient_loss | -0.00896 | -| std | 0.106 | -| value_loss | 3.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7918 | -| time_elapsed | 49635 | -| total_timesteps | 1013504 | -| train/ | | -| approx_kl | 0.12742491 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.821 | -| explained_variance | -430 | -| learning_rate | 0.0003 | -| loss | -0.000509 | -| n_updates | 79170 | -| policy_gradient_loss | -0.00166 | -| std | 0.106 | -| value_loss | 1.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7919 | -| time_elapsed | 49639 | -| total_timesteps | 1013632 | -| train/ | | -| approx_kl | 0.046932757 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 79180 | -| policy_gradient_loss | -0.00806 | -| std | 0.107 | -| value_loss | 1.47e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7920 | -| time_elapsed | 49643 | -| total_timesteps | 1013760 | -| train/ | | -| approx_kl | 0.04123448 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 79190 | -| policy_gradient_loss | -0.00299 | -| std | 0.107 | -| value_loss | 1.2e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 20 | -| iterations | 7921 | -| time_elapsed | 49646 | -| total_timesteps | 1013888 | -| train/ | | -| approx_kl | 0.00023958273 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.819 | -| explained_variance | -0.332 | -| learning_rate | 0.0003 | -| loss | -0.000829 | -| n_updates | 79200 | -| policy_gradient_loss | -0.000666 | -| std | 0.107 | -| value_loss | 7.4e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7922 | -| time_elapsed | 49649 | -| total_timesteps | 1014016 | -| train/ | | -| approx_kl | 0.0004092236 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.819 | -| explained_variance | -0.0499 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 79210 | -| policy_gradient_loss | -0.00333 | -| std | 0.107 | -| value_loss | 7.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7923 | -| time_elapsed | 49658 | -| total_timesteps | 1014144 | -| train/ | | -| approx_kl | 0.019722428 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.818 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 79220 | -| policy_gradient_loss | -0.00987 | -| std | 0.107 | -| value_loss | 0.000289 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7924 | -| time_elapsed | 49661 | -| total_timesteps | 1014272 | -| train/ | | -| approx_kl | 0.0035093538 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 0.818 | -| explained_variance | 0.354 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 79230 | -| policy_gradient_loss | -0.00535 | -| std | 0.107 | -| value_loss | 1.94e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7925 | -| time_elapsed | 49665 | -| total_timesteps | 1014400 | -| train/ | | -| approx_kl | 0.053352572 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 0.818 | -| explained_variance | -43.4 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 79240 | -| policy_gradient_loss | -0.00973 | -| std | 0.107 | -| value_loss | 5.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7926 | -| time_elapsed | 49668 | -| total_timesteps | 1014528 | -| train/ | | -| approx_kl | 0.012083981 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.819 | -| explained_variance | -4.68 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 79250 | -| policy_gradient_loss | -0.0063 | -| std | 0.107 | -| value_loss | 1.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7927 | -| time_elapsed | 49672 | -| total_timesteps | 1014656 | -| train/ | | -| approx_kl | 0.0018776776 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.819 | -| explained_variance | -0.978 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 79260 | -| policy_gradient_loss | -0.000306 | -| std | 0.107 | -| value_loss | 5.62e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7928 | -| time_elapsed | 49676 | -| total_timesteps | 1014784 | -| train/ | | -| approx_kl | 0.009766253 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 79270 | -| policy_gradient_loss | -0.0116 | -| std | 0.107 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 20 | -| iterations | 7929 | -| time_elapsed | 49680 | -| total_timesteps | 1014912 | -| train/ | | -| approx_kl | 0.006292527 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 79280 | -| policy_gradient_loss | 0.00498 | -| std | 0.107 | -| value_loss | 9.6e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7930 | -| time_elapsed | 49683 | -| total_timesteps | 1015040 | -| train/ | | -| approx_kl | 0.005675488 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | -0.00151 | -| learning_rate | 0.0003 | -| loss | -0.00922 | -| n_updates | 79290 | -| policy_gradient_loss | -0.00184 | -| std | 0.107 | -| value_loss | 1.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7931 | -| time_elapsed | 49693 | -| total_timesteps | 1015168 | -| train/ | | -| approx_kl | 0.23674838 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 0.82 | -| explained_variance | 0.951 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 79300 | -| policy_gradient_loss | -0.011 | -| std | 0.107 | -| value_loss | 0.000519 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7932 | -| time_elapsed | 49698 | -| total_timesteps | 1015296 | -| train/ | | -| approx_kl | 0.19930784 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 0.819 | -| explained_variance | -51 | -| learning_rate | 0.0003 | -| loss | 0.00098 | -| n_updates | 79310 | -| policy_gradient_loss | -0.00388 | -| std | 0.107 | -| value_loss | 2.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7933 | -| time_elapsed | 49702 | -| total_timesteps | 1015424 | -| train/ | | -| approx_kl | 0.08330828 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 0.818 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 79320 | -| policy_gradient_loss | -0.000895 | -| std | 0.107 | -| value_loss | 1.24e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7934 | -| time_elapsed | 49705 | -| total_timesteps | 1015552 | -| train/ | | -| approx_kl | 0.0055276575 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.814 | -| explained_variance | -5.56 | -| learning_rate | 0.0003 | -| loss | -0.00798 | -| n_updates | 79330 | -| policy_gradient_loss | -0.0063 | -| std | 0.107 | -| value_loss | 1.19e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7935 | -| time_elapsed | 49708 | -| total_timesteps | 1015680 | -| train/ | | -| approx_kl | 0.00019595493 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 0.812 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 79340 | -| policy_gradient_loss | -0.00312 | -| std | 0.107 | -| value_loss | 2.43e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7936 | -| time_elapsed | 49713 | -| total_timesteps | 1015808 | -| train/ | | -| approx_kl | 0.011446467 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.813 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 79350 | -| policy_gradient_loss | -0.00125 | -| std | 0.107 | -| value_loss | 5.57e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 20 | -| iterations | 7937 | -| time_elapsed | 49717 | -| total_timesteps | 1015936 | -| train/ | | -| approx_kl | 0.0364848 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 0.814 | -| explained_variance | -111 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 79360 | -| policy_gradient_loss | -0.00112 | -| std | 0.107 | -| value_loss | 3.56e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7938 | -| time_elapsed | 49721 | -| total_timesteps | 1016064 | -| train/ | | -| approx_kl | 0.004958271 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 0.814 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 79370 | -| policy_gradient_loss | -0.00563 | -| std | 0.107 | -| value_loss | 3.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7939 | -| time_elapsed | 49727 | -| total_timesteps | 1016192 | -| train/ | | -| approx_kl | 0.008576667 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.815 | -| explained_variance | 0.039 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 79380 | -| policy_gradient_loss | -0.0106 | -| std | 0.107 | -| value_loss | 0.00173 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7940 | -| time_elapsed | 49731 | -| total_timesteps | 1016320 | -| train/ | | -| approx_kl | 0.021101674 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.814 | -| explained_variance | -91.7 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 79390 | -| policy_gradient_loss | -0.00977 | -| std | 0.107 | -| value_loss | 4.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7941 | -| time_elapsed | 49735 | -| total_timesteps | 1016448 | -| train/ | | -| approx_kl | 0.025630284 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.815 | -| explained_variance | -1.17e+03 | -| learning_rate | 0.0003 | -| loss | -0.000599 | -| n_updates | 79400 | -| policy_gradient_loss | -0.000619 | -| std | 0.107 | -| value_loss | 2.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7942 | -| time_elapsed | 49738 | -| total_timesteps | 1016576 | -| train/ | | -| approx_kl | 0.11132314 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 0.816 | -| explained_variance | -121 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 79410 | -| policy_gradient_loss | -0.00741 | -| std | 0.107 | -| value_loss | 1.69e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7943 | -| time_elapsed | 49742 | -| total_timesteps | 1016704 | -| train/ | | -| approx_kl | 0.06457834 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 0.817 | -| explained_variance | -8.13 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 79420 | -| policy_gradient_loss | -0.0178 | -| std | 0.107 | -| value_loss | 1.99e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7944 | -| time_elapsed | 49745 | -| total_timesteps | 1016832 | -| train/ | | -| approx_kl | 0.00031887088 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 0.818 | -| explained_variance | -0.379 | -| learning_rate | 0.0003 | -| loss | -0.000514 | -| n_updates | 79430 | -| policy_gradient_loss | 0.000532 | -| std | 0.107 | -| value_loss | 3.52e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7945 | -| time_elapsed | 49749 | -| total_timesteps | 1016960 | -| train/ | | -| approx_kl | 0.0026836633 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.821 | -| explained_variance | 0.00345 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 79440 | -| policy_gradient_loss | -0.0115 | -| std | 0.106 | -| value_loss | 6.12e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7946 | -| time_elapsed | 49754 | -| total_timesteps | 1017088 | -| train/ | | -| approx_kl | 0.00013582129 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 0.823 | -| explained_variance | -0.00603 | -| learning_rate | 0.0003 | -| loss | -0.000644 | -| n_updates | 79450 | -| policy_gradient_loss | -0.000825 | -| std | 0.106 | -| value_loss | 7.44e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7947 | -| time_elapsed | 49760 | -| total_timesteps | 1017216 | -| train/ | | -| approx_kl | 0.014996944 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.825 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 79460 | -| policy_gradient_loss | -0.0123 | -| std | 0.106 | -| value_loss | 0.000139 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7948 | -| time_elapsed | 49763 | -| total_timesteps | 1017344 | -| train/ | | -| approx_kl | 0.004069732 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.825 | -| explained_variance | -6.51 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 79470 | -| policy_gradient_loss | -0.0106 | -| std | 0.106 | -| value_loss | 1.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7949 | -| time_elapsed | 49767 | -| total_timesteps | 1017472 | -| train/ | | -| approx_kl | 0.05383593 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 0.825 | -| explained_variance | -14.9 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 79480 | -| policy_gradient_loss | -0.0168 | -| std | 0.106 | -| value_loss | 1.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7950 | -| time_elapsed | 49770 | -| total_timesteps | 1017600 | -| train/ | | -| approx_kl | 0.016021283 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 0.824 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00871 | -| n_updates | 79490 | -| policy_gradient_loss | -0.00342 | -| std | 0.106 | -| value_loss | 2.62e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7951 | -| time_elapsed | 49774 | -| total_timesteps | 1017728 | -| train/ | | -| approx_kl | 0.0074861962 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 0.824 | -| explained_variance | -0.657 | -| learning_rate | 0.0003 | -| loss | -0.00889 | -| n_updates | 79500 | -| policy_gradient_loss | -0.00495 | -| std | 0.106 | -| value_loss | 6.69e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7952 | -| time_elapsed | 49779 | -| total_timesteps | 1017856 | -| train/ | | -| approx_kl | 0.01968416 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 0.823 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 79510 | -| policy_gradient_loss | 0.00152 | -| std | 0.106 | -| value_loss | 5.66e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 20 | -| iterations | 7953 | -| time_elapsed | 49782 | -| total_timesteps | 1017984 | -| train/ | | -| approx_kl | 0.0045717615 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 0.824 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 79520 | -| policy_gradient_loss | -0.000877 | -| std | 0.106 | -| value_loss | 2.82e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7954 | -| time_elapsed | 49786 | -| total_timesteps | 1018112 | -| train/ | | -| approx_kl | 0.0014188383 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.825 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 79530 | -| policy_gradient_loss | -0.00324 | -| std | 0.106 | -| value_loss | 5.86e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7955 | -| time_elapsed | 49795 | -| total_timesteps | 1018240 | -| train/ | | -| approx_kl | 0.016672587 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.826 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 79540 | -| policy_gradient_loss | -0.0159 | -| std | 0.106 | -| value_loss | 9.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7956 | -| time_elapsed | 49799 | -| total_timesteps | 1018368 | -| train/ | | -| approx_kl | 0.047599413 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 0.827 | -| explained_variance | -3 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 79550 | -| policy_gradient_loss | -0.00676 | -| std | 0.106 | -| value_loss | 1.3e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7957 | -| time_elapsed | 49803 | -| total_timesteps | 1018496 | -| train/ | | -| approx_kl | 3.8506463e-05 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 0.829 | -| explained_variance | -6.28 | -| learning_rate | 0.0003 | -| loss | -0.000847 | -| n_updates | 79560 | -| policy_gradient_loss | -0.000292 | -| std | 0.105 | -| value_loss | 4.25e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7958 | -| time_elapsed | 49806 | -| total_timesteps | 1018624 | -| train/ | | -| approx_kl | 0.016770978 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 0.834 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 79570 | -| policy_gradient_loss | -0.016 | -| std | 0.105 | -| value_loss | 1.74e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7959 | -| time_elapsed | 49810 | -| total_timesteps | 1018752 | -| train/ | | -| approx_kl | 0.022005923 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 0.838 | -| explained_variance | -0.0833 | -| learning_rate | 0.0003 | -| loss | 0.00786 | -| n_updates | 79580 | -| policy_gradient_loss | 0.00161 | -| std | 0.105 | -| value_loss | 9.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 20 | -| iterations | 7960 | -| time_elapsed | 49814 | -| total_timesteps | 1018880 | -| train/ | | -| approx_kl | 0.017441923 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 79590 | -| policy_gradient_loss | -0.00851 | -| std | 0.104 | -| value_loss | 1.62e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7961 | -| time_elapsed | 49817 | -| total_timesteps | 1019008 | -| train/ | | -| approx_kl | 0.03482989 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.841 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.00484 | -| n_updates | 79600 | -| policy_gradient_loss | -0.000513 | -| std | 0.104 | -| value_loss | 1.58e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7962 | -| time_elapsed | 49824 | -| total_timesteps | 1019136 | -| train/ | | -| approx_kl | 0.040618125 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.841 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 79610 | -| policy_gradient_loss | -0.00825 | -| std | 0.104 | -| value_loss | 0.000519 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7963 | -| time_elapsed | 49827 | -| total_timesteps | 1019264 | -| train/ | | -| approx_kl | 0.0029632645 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | -6.11 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 79620 | -| policy_gradient_loss | -0.00205 | -| std | 0.104 | -| value_loss | 2.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7964 | -| time_elapsed | 49831 | -| total_timesteps | 1019392 | -| train/ | | -| approx_kl | 0.073995195 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | -1.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 79630 | -| policy_gradient_loss | -0.0101 | -| std | 0.104 | -| value_loss | 2.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7965 | -| time_elapsed | 49835 | -| total_timesteps | 1019520 | -| train/ | | -| approx_kl | 0.033412933 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | -89.6 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 79640 | -| policy_gradient_loss | -0.011 | -| std | 0.104 | -| value_loss | 2.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7966 | -| time_elapsed | 49839 | -| total_timesteps | 1019648 | -| train/ | | -| approx_kl | 0.04002666 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | -8.19 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 79650 | -| policy_gradient_loss | -0.00201 | -| std | 0.104 | -| value_loss | 2.78e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7967 | -| time_elapsed | 49842 | -| total_timesteps | 1019776 | -| train/ | | -| approx_kl | 0.010438852 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 0.841 | -| explained_variance | -0.623 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 79660 | -| policy_gradient_loss | -0.0112 | -| std | 0.104 | -| value_loss | 1.53e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 20 | -| iterations | 7968 | -| time_elapsed | 49845 | -| total_timesteps | 1019904 | -| train/ | | -| approx_kl | 0.024916355 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 79670 | -| policy_gradient_loss | 0.000811 | -| std | 0.105 | -| value_loss | 1e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7969 | -| time_elapsed | 49848 | -| total_timesteps | 1020032 | -| train/ | | -| approx_kl | 0.04011274 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00865 | -| n_updates | 79680 | -| policy_gradient_loss | -0.00695 | -| std | 0.105 | -| value_loss | 4.33e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7970 | -| time_elapsed | 49855 | -| total_timesteps | 1020160 | -| train/ | | -| approx_kl | 0.1432937 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 79690 | -| policy_gradient_loss | -0.00762 | -| std | 0.105 | -| value_loss | 0.000149 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7971 | -| time_elapsed | 49859 | -| total_timesteps | 1020288 | -| train/ | | -| approx_kl | 0.0064185984 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.838 | -| explained_variance | -75.4 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 79700 | -| policy_gradient_loss | -0.0159 | -| std | 0.105 | -| value_loss | 1.57e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7972 | -| time_elapsed | 49862 | -| total_timesteps | 1020416 | -| train/ | | -| approx_kl | 0.01761321 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -35.6 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 79710 | -| policy_gradient_loss | -0.00649 | -| std | 0.105 | -| value_loss | 1.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7973 | -| time_elapsed | 49864 | -| total_timesteps | 1020544 | -| train/ | | -| approx_kl | 0.07962186 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -13.3 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 79720 | -| policy_gradient_loss | -0.00303 | -| std | 0.105 | -| value_loss | 1.5e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7974 | -| time_elapsed | 49868 | -| total_timesteps | 1020672 | -| train/ | | -| approx_kl | 0.012668553 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.837 | -| explained_variance | -0.664 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 79730 | -| policy_gradient_loss | -0.0019 | -| std | 0.105 | -| value_loss | 7.91e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7975 | -| time_elapsed | 49873 | -| total_timesteps | 1020800 | -| train/ | | -| approx_kl | 0.00017908448 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.838 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | -0.000107 | -| n_updates | 79740 | -| policy_gradient_loss | 0.00138 | -| std | 0.105 | -| value_loss | 9.46e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 20 | -| iterations | 7976 | -| time_elapsed | 49876 | -| total_timesteps | 1020928 | -| train/ | | -| approx_kl | 0.0032415674 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | -0.00866 | -| n_updates | 79750 | -| policy_gradient_loss | -0.00885 | -| std | 0.104 | -| value_loss | 3.85e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7977 | -| time_elapsed | 49881 | -| total_timesteps | 1021056 | -| train/ | | -| approx_kl | 0.00033892505 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 0.841 | -| explained_variance | -0.00375 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 79760 | -| policy_gradient_loss | -0.00191 | -| std | 0.104 | -| value_loss | 1.67e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7978 | -| time_elapsed | 49886 | -| total_timesteps | 1021184 | -| train/ | | -| approx_kl | 0.034021813 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 79770 | -| policy_gradient_loss | -0.00446 | -| std | 0.104 | -| value_loss | 0.000263 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7979 | -| time_elapsed | 49891 | -| total_timesteps | 1021312 | -| train/ | | -| approx_kl | 0.022703836 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | -661 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 79780 | -| policy_gradient_loss | -0.0012 | -| std | 0.104 | -| value_loss | 5.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7980 | -| time_elapsed | 49895 | -| total_timesteps | 1021440 | -| train/ | | -| approx_kl | 0.09980457 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 0.841 | -| explained_variance | -265 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 79790 | -| policy_gradient_loss | -0.0031 | -| std | 0.104 | -| value_loss | 1.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7981 | -| time_elapsed | 49899 | -| total_timesteps | 1021568 | -| train/ | | -| approx_kl | 0.030316366 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -4.5 | -| learning_rate | 0.0003 | -| loss | -0.00606 | -| n_updates | 79800 | -| policy_gradient_loss | -0.00463 | -| std | 0.104 | -| value_loss | 5.39e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7982 | -| time_elapsed | 49903 | -| total_timesteps | 1021696 | -| train/ | | -| approx_kl | 0.00081407465 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 79810 | -| policy_gradient_loss | -0.000815 | -| std | 0.104 | -| value_loss | 1.9e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7983 | -| time_elapsed | 49906 | -| total_timesteps | 1021824 | -| train/ | | -| approx_kl | 0.0029320405 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 79820 | -| policy_gradient_loss | -0.00148 | -| std | 0.104 | -| value_loss | 1.5e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 20 | -| iterations | 7984 | -| time_elapsed | 49911 | -| total_timesteps | 1021952 | -| train/ | | -| approx_kl | 0.016925847 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 79830 | -| policy_gradient_loss | -0.00173 | -| std | 0.105 | -| value_loss | 1.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7985 | -| time_elapsed | 49915 | -| total_timesteps | 1022080 | -| train/ | | -| approx_kl | 0.019774292 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 79840 | -| policy_gradient_loss | -0.000851 | -| std | 0.104 | -| value_loss | 8.2e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7986 | -| time_elapsed | 49922 | -| total_timesteps | 1022208 | -| train/ | | -| approx_kl | 0.038224377 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 0.84 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 79850 | -| policy_gradient_loss | -0.00746 | -| std | 0.105 | -| value_loss | 0.00203 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7987 | -| time_elapsed | 49925 | -| total_timesteps | 1022336 | -| train/ | | -| approx_kl | 0.05235114 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | -143 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 79860 | -| policy_gradient_loss | -0.00807 | -| std | 0.105 | -| value_loss | 1.02e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7988 | -| time_elapsed | 49928 | -| total_timesteps | 1022464 | -| train/ | | -| approx_kl | 0.005741339 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | -1.3e+03 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 79870 | -| policy_gradient_loss | -0.0134 | -| std | 0.105 | -| value_loss | 2.67e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7989 | -| time_elapsed | 49931 | -| total_timesteps | 1022592 | -| train/ | | -| approx_kl | 0.0033318931 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | -22.4 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 79880 | -| policy_gradient_loss | -0.00158 | -| std | 0.105 | -| value_loss | 2.81e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7990 | -| time_elapsed | 49935 | -| total_timesteps | 1022720 | -| train/ | | -| approx_kl | 0.008408217 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | -0.356 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 79890 | -| policy_gradient_loss | 8.09e-05 | -| std | 0.105 | -| value_loss | 3.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7991 | -| time_elapsed | 49937 | -| total_timesteps | 1022848 | -| train/ | | -| approx_kl | 0.03436515 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.839 | -| explained_variance | 0.000191 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 79900 | -| policy_gradient_loss | -6.59e-05 | -| std | 0.105 | -| value_loss | 2.01e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 20 | -| iterations | 7992 | -| time_elapsed | 49941 | -| total_timesteps | 1022976 | -| train/ | | -| approx_kl | 4.1691586e-05 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 0.838 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 79910 | -| policy_gradient_loss | 0.00271 | -| std | 0.105 | -| value_loss | 1.84e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7993 | -| time_elapsed | 49945 | -| total_timesteps | 1023104 | -| train/ | | -| approx_kl | 0.0011130194 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.837 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 79920 | -| policy_gradient_loss | -0.00148 | -| std | 0.105 | -| value_loss | 4.08e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7994 | -| time_elapsed | 49955 | -| total_timesteps | 1023232 | -| train/ | | -| approx_kl | 0.046985235 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 0.837 | -| explained_variance | 0.888 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 79930 | -| policy_gradient_loss | -0.0157 | -| std | 0.105 | -| value_loss | 0.00104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7995 | -| time_elapsed | 49959 | -| total_timesteps | 1023360 | -| train/ | | -| approx_kl | 0.049342442 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -85.9 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 79940 | -| policy_gradient_loss | -0.000169 | -| std | 0.105 | -| value_loss | 1.83e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7996 | -| time_elapsed | 49963 | -| total_timesteps | 1023488 | -| train/ | | -| approx_kl | 0.06623505 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 0.835 | -| explained_variance | -357 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 79950 | -| policy_gradient_loss | -0.00187 | -| std | 0.105 | -| value_loss | 1.25e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7997 | -| time_elapsed | 49967 | -| total_timesteps | 1023616 | -| train/ | | -| approx_kl | 0.01348742 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 0.835 | -| explained_variance | -42.3 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 79960 | -| policy_gradient_loss | -0.00948 | -| std | 0.105 | -| value_loss | 1.96e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7998 | -| time_elapsed | 49970 | -| total_timesteps | 1023744 | -| train/ | | -| approx_kl | 0.030161548 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 0.835 | -| explained_variance | -8.16 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 79970 | -| policy_gradient_loss | -0.0113 | -| std | 0.105 | -| value_loss | 4.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 7999 | -| time_elapsed | 49973 | -| total_timesteps | 1023872 | -| train/ | | -| approx_kl | 0.011123611 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.835 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | 0.00188 | -| n_updates | 79980 | -| policy_gradient_loss | 0.000739 | -| std | 0.105 | -| value_loss | 5.8e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8000 | -| time_elapsed | 49976 | -| total_timesteps | 1024000 | -| train/ | | -| approx_kl | 0.0015466004 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -0.38 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 79990 | -| policy_gradient_loss | -0.00476 | -| std | 0.105 | -| value_loss | 1.28e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8001 | -| time_elapsed | 49979 | -| total_timesteps | 1024128 | -| train/ | | -| approx_kl | 0.009609205 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | 0.0012 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 80000 | -| policy_gradient_loss | -0.0021 | -| std | 0.105 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8002 | -| time_elapsed | 49985 | -| total_timesteps | 1024256 | -| train/ | | -| approx_kl | 0.004267363 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -2.87 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 80010 | -| policy_gradient_loss | -0.00848 | -| std | 0.105 | -| value_loss | 0.00237 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8003 | -| time_elapsed | 49988 | -| total_timesteps | 1024384 | -| train/ | | -| approx_kl | 0.064741075 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 80020 | -| policy_gradient_loss | -0.00463 | -| std | 0.105 | -| value_loss | 3.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8004 | -| time_elapsed | 49992 | -| total_timesteps | 1024512 | -| train/ | | -| approx_kl | 0.003920349 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.836 | -| explained_variance | -1.01e+04 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 80030 | -| policy_gradient_loss | -0.0013 | -| std | 0.105 | -| value_loss | 1.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8005 | -| time_elapsed | 49995 | -| total_timesteps | 1024640 | -| train/ | | -| approx_kl | 0.000419111 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.838 | -| explained_variance | -3.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.000218 | -| n_updates | 80040 | -| policy_gradient_loss | -9.89e-05 | -| std | 0.104 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8006 | -| time_elapsed | 49998 | -| total_timesteps | 1024768 | -| train/ | | -| approx_kl | 0.021090839 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 0.842 | -| explained_variance | -84.2 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 80050 | -| policy_gradient_loss | -0.00109 | -| std | 0.104 | -| value_loss | 2.06e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 20 | -| iterations | 8007 | -| time_elapsed | 50001 | -| total_timesteps | 1024896 | -| train/ | | -| approx_kl | 0.002992249 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 0.846 | -| explained_variance | -4.54 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 80060 | -| policy_gradient_loss | 0.000986 | -| std | 0.104 | -| value_loss | 7.59e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8008 | -| time_elapsed | 50004 | -| total_timesteps | 1025024 | -| train/ | | -| approx_kl | 0.014549316 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.847 | -| explained_variance | -0.917 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 80070 | -| policy_gradient_loss | -0.00432 | -| std | 0.104 | -| value_loss | 1.86e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8009 | -| time_elapsed | 50012 | -| total_timesteps | 1025152 | -| train/ | | -| approx_kl | 0.058911484 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 0.847 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0299 | -| n_updates | 80080 | -| policy_gradient_loss | -0.0224 | -| std | 0.104 | -| value_loss | 4.29e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8010 | -| time_elapsed | 50015 | -| total_timesteps | 1025280 | -| train/ | | -| approx_kl | 0.11526073 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 0.848 | -| explained_variance | -54 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 80090 | -| policy_gradient_loss | -0.00304 | -| std | 0.104 | -| value_loss | 5.2e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8011 | -| time_elapsed | 50018 | -| total_timesteps | 1025408 | -| train/ | | -| approx_kl | 0.078100026 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.848 | -| explained_variance | -69.3 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 80100 | -| policy_gradient_loss | -0.00854 | -| std | 0.104 | -| value_loss | 3.1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8012 | -| time_elapsed | 50021 | -| total_timesteps | 1025536 | -| train/ | | -| approx_kl | 0.11669937 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 0.847 | -| explained_variance | -9.48 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 80110 | -| policy_gradient_loss | -0.0084 | -| std | 0.104 | -| value_loss | 3.22e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8013 | -| time_elapsed | 50024 | -| total_timesteps | 1025664 | -| train/ | | -| approx_kl | 0.0007726946 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.846 | -| explained_variance | -0.892 | -| learning_rate | 0.0003 | -| loss | -0.000616 | -| n_updates | 80120 | -| policy_gradient_loss | 0.00129 | -| std | 0.104 | -| value_loss | 1.92e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8014 | -| time_elapsed | 50027 | -| total_timesteps | 1025792 | -| train/ | | -| approx_kl | 0.005411708 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.846 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 80130 | -| policy_gradient_loss | -0.00553 | -| std | 0.104 | -| value_loss | 3.19e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 20 | -| iterations | 8015 | -| time_elapsed | 50030 | -| total_timesteps | 1025920 | -| train/ | | -| approx_kl | 0.011603673 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 0.846 | -| explained_variance | -0.00833 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 80140 | -| policy_gradient_loss | -0.00923 | -| std | 0.104 | -| value_loss | 5.79e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8016 | -| time_elapsed | 50034 | -| total_timesteps | 1026048 | -| train/ | | -| approx_kl | 0.000938287 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.848 | -| explained_variance | -0.00989 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 80150 | -| policy_gradient_loss | -0.000506 | -| std | 0.103 | -| value_loss | 8e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8017 | -| time_elapsed | 50040 | -| total_timesteps | 1026176 | -| train/ | | -| approx_kl | 0.032220177 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.856 | -| explained_variance | 0.769 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 80160 | -| policy_gradient_loss | -0.00684 | -| std | 0.102 | -| value_loss | 0.00351 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8018 | -| time_elapsed | 50044 | -| total_timesteps | 1026304 | -| train/ | | -| approx_kl | 0.00544724 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.861 | -| explained_variance | -203 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 80170 | -| policy_gradient_loss | -0.00944 | -| std | 0.102 | -| value_loss | 7.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8019 | -| time_elapsed | 50045 | -| total_timesteps | 1026432 | -| train/ | | -| approx_kl | 0.061248366 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 0.863 | -| explained_variance | -5.47e+03 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 80180 | -| policy_gradient_loss | -0.00242 | -| std | 0.102 | -| value_loss | 3.61e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8020 | -| time_elapsed | 50048 | -| total_timesteps | 1026560 | -| train/ | | -| approx_kl | 0.0037255036 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.863 | -| explained_variance | -1.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 80190 | -| policy_gradient_loss | -0.0131 | -| std | 0.102 | -| value_loss | 1.53e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8021 | -| time_elapsed | 50051 | -| total_timesteps | 1026688 | -| train/ | | -| approx_kl | 0.028749619 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 0.863 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 80200 | -| policy_gradient_loss | -0.00988 | -| std | 0.102 | -| value_loss | 1.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8022 | -| time_elapsed | 50055 | -| total_timesteps | 1026816 | -| train/ | | -| approx_kl | 0.027956858 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.864 | -| explained_variance | -7.24 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 80210 | -| policy_gradient_loss | -0.00993 | -| std | 0.102 | -| value_loss | 6.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 20 | -| iterations | 8023 | -| time_elapsed | 50059 | -| total_timesteps | 1026944 | -| train/ | | -| approx_kl | 0.008568818 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 0.864 | -| explained_variance | -0.0888 | -| learning_rate | 0.0003 | -| loss | -0.00675 | -| n_updates | 80220 | -| policy_gradient_loss | 0.000589 | -| std | 0.102 | -| value_loss | 4.53e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8024 | -| time_elapsed | 50063 | -| total_timesteps | 1027072 | -| train/ | | -| approx_kl | 0.020040104 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 0.864 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 80230 | -| policy_gradient_loss | 0.00113 | -| std | 0.102 | -| value_loss | 2.93e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8025 | -| time_elapsed | 50070 | -| total_timesteps | 1027200 | -| train/ | | -| approx_kl | 0.0138558075 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 0.864 | -| explained_variance | 0.673 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 80240 | -| policy_gradient_loss | -0.0111 | -| std | 0.102 | -| value_loss | 0.000881 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8026 | -| time_elapsed | 50074 | -| total_timesteps | 1027328 | -| train/ | | -| approx_kl | 0.03279941 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.864 | -| explained_variance | -212 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 80250 | -| policy_gradient_loss | 0.000494 | -| std | 0.102 | -| value_loss | 3.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8027 | -| time_elapsed | 50078 | -| total_timesteps | 1027456 | -| train/ | | -| approx_kl | 0.018116932 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 0.866 | -| explained_variance | -56.5 | -| learning_rate | 0.0003 | -| loss | -0.00987 | -| n_updates | 80260 | -| policy_gradient_loss | -0.00602 | -| std | 0.102 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8028 | -| time_elapsed | 50082 | -| total_timesteps | 1027584 | -| train/ | | -| approx_kl | 0.0028315391 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 0.866 | -| explained_variance | -4.18 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 80270 | -| policy_gradient_loss | -0.00712 | -| std | 0.102 | -| value_loss | 2.04e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8029 | -| time_elapsed | 50086 | -| total_timesteps | 1027712 | -| train/ | | -| approx_kl | 0.0009416044 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 0.866 | -| explained_variance | -0.351 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 80280 | -| policy_gradient_loss | -0.000961 | -| std | 0.102 | -| value_loss | 7.32e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8030 | -| time_elapsed | 50089 | -| total_timesteps | 1027840 | -| train/ | | -| approx_kl | 0.0006579859 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.868 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 80290 | -| policy_gradient_loss | -0.00456 | -| std | 0.102 | -| value_loss | 1.05e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8031 | -| time_elapsed | 50093 | -| total_timesteps | 1027968 | -| train/ | | -| approx_kl | 0.008815306 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.869 | -| explained_variance | 0.0026 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 80300 | -| policy_gradient_loss | 0.0015 | -| std | 0.101 | -| value_loss | 7.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8032 | -| time_elapsed | 50097 | -| total_timesteps | 1028096 | -| train/ | | -| approx_kl | 0.025974032 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.87 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.00812 | -| n_updates | 80310 | -| policy_gradient_loss | 0.00173 | -| std | 0.101 | -| value_loss | 1.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8033 | -| time_elapsed | 50103 | -| total_timesteps | 1028224 | -| train/ | | -| approx_kl | 0.01876116 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 0.87 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0338 | -| n_updates | 80320 | -| policy_gradient_loss | -0.025 | -| std | 0.101 | -| value_loss | 4.6e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8034 | -| time_elapsed | 50107 | -| total_timesteps | 1028352 | -| train/ | | -| approx_kl | 0.023237843 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.87 | -| explained_variance | -3.42 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 80330 | -| policy_gradient_loss | -0.00309 | -| std | 0.101 | -| value_loss | 2.31e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8035 | -| time_elapsed | 50112 | -| total_timesteps | 1028480 | -| train/ | | -| approx_kl | 0.00023423322 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 0.871 | -| explained_variance | -59.2 | -| learning_rate | 0.0003 | -| loss | -0.000171 | -| n_updates | 80340 | -| policy_gradient_loss | 0.000152 | -| std | 0.101 | -| value_loss | 3e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8036 | -| time_elapsed | 50116 | -| total_timesteps | 1028608 | -| train/ | | -| approx_kl | 0.0026309523 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 0.874 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 80350 | -| policy_gradient_loss | -0.00632 | -| std | 0.101 | -| value_loss | 1.85e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8037 | -| time_elapsed | 50119 | -| total_timesteps | 1028736 | -| train/ | | -| approx_kl | 0.018520232 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 0.877 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.000115 | -| n_updates | 80360 | -| policy_gradient_loss | 0.00125 | -| std | 0.101 | -| value_loss | 4.09e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8038 | -| time_elapsed | 50123 | -| total_timesteps | 1028864 | -| train/ | | -| approx_kl | 0.0029744375 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.879 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 80370 | -| policy_gradient_loss | 0.00159 | -| std | 0.1 | -| value_loss | 4.42e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 20 | -| iterations | 8039 | -| time_elapsed | 50126 | -| total_timesteps | 1028992 | -| train/ | | -| approx_kl | 0.00047064945 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.879 | -| explained_variance | 0.00642 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 80380 | -| policy_gradient_loss | -0.00059 | -| std | 0.1 | -| value_loss | 1.35e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8040 | -| time_elapsed | 50130 | -| total_timesteps | 1029120 | -| train/ | | -| approx_kl | 0.011495758 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 0.88 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.0077 | -| n_updates | 80390 | -| policy_gradient_loss | -0.00145 | -| std | 0.1 | -| value_loss | 5.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8041 | -| time_elapsed | 50137 | -| total_timesteps | 1029248 | -| train/ | | -| approx_kl | 0.008318698 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 0.881 | -| explained_variance | 0.6 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 80400 | -| policy_gradient_loss | -0.00946 | -| std | 0.1 | -| value_loss | 0.000923 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8042 | -| time_elapsed | 50140 | -| total_timesteps | 1029376 | -| train/ | | -| approx_kl | 0.021899927 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 0.882 | -| explained_variance | -2.27e+03 | -| learning_rate | 0.0003 | -| loss | -0.000879 | -| n_updates | 80410 | -| policy_gradient_loss | 0.00179 | -| std | 0.1 | -| value_loss | 7.8e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8043 | -| time_elapsed | 50143 | -| total_timesteps | 1029504 | -| train/ | | -| approx_kl | 0.04394303 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.884 | -| explained_variance | -898 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 80420 | -| policy_gradient_loss | -0.00295 | -| std | 0.1 | -| value_loss | 5.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8044 | -| time_elapsed | 50147 | -| total_timesteps | 1029632 | -| train/ | | -| approx_kl | 0.026172783 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.884 | -| explained_variance | -9.28e+03 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 80430 | -| policy_gradient_loss | -0.0115 | -| std | 0.1 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8045 | -| time_elapsed | 50150 | -| total_timesteps | 1029760 | -| train/ | | -| approx_kl | 0.005330506 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.884 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 80440 | -| policy_gradient_loss | -0.000268 | -| std | 0.0999 | -| value_loss | 2.62e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 20 | -| iterations | 8046 | -| time_elapsed | 50154 | -| total_timesteps | 1029888 | -| train/ | | -| approx_kl | 0.0013446626 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.885 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 80450 | -| policy_gradient_loss | 0.000227 | -| std | 0.0998 | -| value_loss | 3.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8047 | -| time_elapsed | 50158 | -| total_timesteps | 1030016 | -| train/ | | -| approx_kl | 0.033914357 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 0.886 | -| explained_variance | -3.36e+03 | -| learning_rate | 0.0003 | -| loss | -0.000615 | -| n_updates | 80460 | -| policy_gradient_loss | -0.000761 | -| std | 0.0996 | -| value_loss | 5.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8048 | -| time_elapsed | 50167 | -| total_timesteps | 1030144 | -| train/ | | -| approx_kl | 0.006625347 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 80470 | -| policy_gradient_loss | -0.00899 | -| std | 0.0996 | -| value_loss | 0.000111 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8049 | -| time_elapsed | 50170 | -| total_timesteps | 1030272 | -| train/ | | -| approx_kl | 0.02015145 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | -26.5 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 80480 | -| policy_gradient_loss | -0.00398 | -| std | 0.0996 | -| value_loss | 6.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8050 | -| time_elapsed | 50173 | -| total_timesteps | 1030400 | -| train/ | | -| approx_kl | 0.019048536 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | -1.3e+03 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 80490 | -| policy_gradient_loss | -0.00642 | -| std | 0.0996 | -| value_loss | 3.16e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8051 | -| time_elapsed | 50176 | -| total_timesteps | 1030528 | -| train/ | | -| approx_kl | 0.00015198812 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | -3.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.000805 | -| n_updates | 80500 | -| policy_gradient_loss | -0.00229 | -| std | 0.0996 | -| value_loss | 2.79e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8052 | -| time_elapsed | 50180 | -| total_timesteps | 1030656 | -| train/ | | -| approx_kl | 0.025953108 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | -1.11e+03 | -| learning_rate | 0.0003 | -| loss | -0.00943 | -| n_updates | 80510 | -| policy_gradient_loss | -0.00544 | -| std | 0.0995 | -| value_loss | 1.75e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8053 | -| time_elapsed | 50184 | -| total_timesteps | 1030784 | -| train/ | | -| approx_kl | 0.023048615 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -69.7 | -| learning_rate | 0.0003 | -| loss | -0.0097 | -| n_updates | 80520 | -| policy_gradient_loss | -0.00625 | -| std | 0.0995 | -| value_loss | 7.91e-12 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 20 | -| iterations | 8054 | -| time_elapsed | 50187 | -| total_timesteps | 1030912 | -| train/ | | -| approx_kl | 0.039690822 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -9.08 | -| learning_rate | 0.0003 | -| loss | -0.000401 | -| n_updates | 80530 | -| policy_gradient_loss | -0.00231 | -| std | 0.0995 | -| value_loss | 9.96e-13 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8055 | -| time_elapsed | 50190 | -| total_timesteps | 1031040 | -| train/ | | -| approx_kl | 0.0020361142 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -1.75 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 80540 | -| policy_gradient_loss | -0.000738 | -| std | 0.0996 | -| value_loss | 2.94e-13 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8056 | -| time_elapsed | 50197 | -| total_timesteps | 1031168 | -| train/ | | -| approx_kl | 0.00712883 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 0.887 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 80550 | -| policy_gradient_loss | -0.0149 | -| std | 0.0997 | -| value_loss | 0.000319 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8057 | -| time_elapsed | 50200 | -| total_timesteps | 1031296 | -| train/ | | -| approx_kl | 0.052407034 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 0.886 | -| explained_variance | -81.8 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 80560 | -| policy_gradient_loss | -0.0187 | -| std | 0.0998 | -| value_loss | 1.88e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8058 | -| time_elapsed | 50204 | -| total_timesteps | 1031424 | -| train/ | | -| approx_kl | 0.0061634914 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 0.884 | -| explained_variance | -35.3 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 80570 | -| policy_gradient_loss | -0.0148 | -| std | 0.1 | -| value_loss | 2.56e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8059 | -| time_elapsed | 50208 | -| total_timesteps | 1031552 | -| train/ | | -| approx_kl | 0.03950318 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.882 | -| explained_variance | -8.2 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 80580 | -| policy_gradient_loss | -0.00153 | -| std | 0.1 | -| value_loss | 2.05e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8060 | -| time_elapsed | 50211 | -| total_timesteps | 1031680 | -| train/ | | -| approx_kl | 0.04819863 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 0.881 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 80590 | -| policy_gradient_loss | -0.00907 | -| std | 0.1 | -| value_loss | 6.35e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8061 | -| time_elapsed | 50213 | -| total_timesteps | 1031808 | -| train/ | | -| approx_kl | 0.0034993468 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 0.881 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 80600 | -| policy_gradient_loss | -0.00156 | -| std | 0.1 | -| value_loss | 2e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 20 | -| iterations | 8062 | -| time_elapsed | 50216 | -| total_timesteps | 1031936 | -| train/ | | -| approx_kl | 0.0047558504 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 0.88 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 80610 | -| policy_gradient_loss | -0.00477 | -| std | 0.1 | -| value_loss | 3.06e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8063 | -| time_elapsed | 50220 | -| total_timesteps | 1032064 | -| train/ | | -| approx_kl | 7.7357516e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 0.882 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.000785 | -| n_updates | 80620 | -| policy_gradient_loss | -0.000302 | -| std | 0.0997 | -| value_loss | 3.5e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8064 | -| time_elapsed | 50225 | -| total_timesteps | 1032192 | -| train/ | | -| approx_kl | 0.00045246072 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 80630 | -| policy_gradient_loss | -0.00405 | -| std | 0.0991 | -| value_loss | 0.00455 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8065 | -| time_elapsed | 50230 | -| total_timesteps | 1032320 | -| train/ | | -| approx_kl | 0.030035703 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 0.894 | -| explained_variance | -172 | -| learning_rate | 0.0003 | -| loss | -0.0043 | -| n_updates | 80640 | -| policy_gradient_loss | -0.00282 | -| std | 0.0989 | -| value_loss | 8.55e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8066 | -| time_elapsed | 50235 | -| total_timesteps | 1032448 | -| train/ | | -| approx_kl | 0.26374903 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 0.895 | -| explained_variance | -319 | -| learning_rate | 0.0003 | -| loss | 0.00285 | -| n_updates | 80650 | -| policy_gradient_loss | -0.000603 | -| std | 0.0989 | -| value_loss | 3.84e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8067 | -| time_elapsed | 50238 | -| total_timesteps | 1032576 | -| train/ | | -| approx_kl | 0.12749618 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 0.894 | -| explained_variance | -37.7 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 80660 | -| policy_gradient_loss | -0.0035 | -| std | 0.099 | -| value_loss | 1.75e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8068 | -| time_elapsed | 50241 | -| total_timesteps | 1032704 | -| train/ | | -| approx_kl | 0.0028143874 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -1.22 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 80670 | -| policy_gradient_loss | -0.000903 | -| std | 0.099 | -| value_loss | 3.91e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8069 | -| time_elapsed | 50245 | -| total_timesteps | 1032832 | -| train/ | | -| approx_kl | 1.3045501e-05 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.000332 | -| n_updates | 80680 | -| policy_gradient_loss | -0.000162 | -| std | 0.099 | -| value_loss | 2.78e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8070 | -| time_elapsed | 50249 | -| total_timesteps | 1032960 | -| train/ | | -| approx_kl | 0.0008849376 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 80690 | -| policy_gradient_loss | 0.00185 | -| std | 0.0991 | -| value_loss | 6.82e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8071 | -| time_elapsed | 50253 | -| total_timesteps | 1033088 | -| train/ | | -| approx_kl | 8.440111e-05 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 80700 | -| policy_gradient_loss | -0.00222 | -| std | 0.0991 | -| value_loss | 4.8e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8072 | -| time_elapsed | 50260 | -| total_timesteps | 1033216 | -| train/ | | -| approx_kl | 0.01369155 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.892 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 80710 | -| policy_gradient_loss | -0.00376 | -| std | 0.0991 | -| value_loss | 0.00144 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8073 | -| time_elapsed | 50263 | -| total_timesteps | 1033344 | -| train/ | | -| approx_kl | 0.00078847446 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -5.29e+03 | -| learning_rate | 0.0003 | -| loss | -0.000144 | -| n_updates | 80720 | -| policy_gradient_loss | -3.2e-05 | -| std | 0.0991 | -| value_loss | 3.49e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8074 | -| time_elapsed | 50266 | -| total_timesteps | 1033472 | -| train/ | | -| approx_kl | 0.03425012 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.892 | -| explained_variance | -6.51e+03 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 80730 | -| policy_gradient_loss | -0.0081 | -| std | 0.0993 | -| value_loss | 1.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8075 | -| time_elapsed | 50269 | -| total_timesteps | 1033600 | -| train/ | | -| approx_kl | 0.044140756 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.891 | -| explained_variance | -155 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 80740 | -| policy_gradient_loss | -0.00497 | -| std | 0.0993 | -| value_loss | 5.44e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8076 | -| time_elapsed | 50273 | -| total_timesteps | 1033728 | -| train/ | | -| approx_kl | 0.02701212 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 0.891 | -| explained_variance | -20.9 | -| learning_rate | 0.0003 | -| loss | -0.00588 | -| n_updates | 80750 | -| policy_gradient_loss | -0.00369 | -| std | 0.0993 | -| value_loss | 4.51e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8077 | -| time_elapsed | 50277 | -| total_timesteps | 1033856 | -| train/ | | -| approx_kl | 0.0065253316 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 0.891 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 80760 | -| policy_gradient_loss | 0.00168 | -| std | 0.0993 | -| value_loss | 1.88e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8078 | -| time_elapsed | 50279 | -| total_timesteps | 1033984 | -| train/ | | -| approx_kl | 0.034395024 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.891 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 80770 | -| policy_gradient_loss | -0.00127 | -| std | 0.0993 | -| value_loss | 2.92e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8079 | -| time_elapsed | 50283 | -| total_timesteps | 1034112 | -| train/ | | -| approx_kl | 0.05708597 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | 0.00903 | -| n_updates | 80780 | -| policy_gradient_loss | -0.00284 | -| std | 0.0996 | -| value_loss | 2.62e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8080 | -| time_elapsed | 50291 | -| total_timesteps | 1034240 | -| train/ | | -| approx_kl | 0.0042053047 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.887 | -| explained_variance | -6.02 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 80790 | -| policy_gradient_loss | -0.0115 | -| std | 0.0998 | -| value_loss | 0.00505 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8081 | -| time_elapsed | 50295 | -| total_timesteps | 1034368 | -| train/ | | -| approx_kl | 0.0829641 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 0.886 | -| explained_variance | -36.3 | -| learning_rate | 0.0003 | -| loss | 0.00468 | -| n_updates | 80800 | -| policy_gradient_loss | 0.00325 | -| std | 0.0998 | -| value_loss | 2.13e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8082 | -| time_elapsed | 50299 | -| total_timesteps | 1034496 | -| train/ | | -| approx_kl | 0.0018663001 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.886 | -| explained_variance | -68.9 | -| learning_rate | 0.0003 | -| loss | -0.000741 | -| n_updates | 80810 | -| policy_gradient_loss | 0.000316 | -| std | 0.0997 | -| value_loss | 9.34e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8083 | -| time_elapsed | 50303 | -| total_timesteps | 1034624 | -| train/ | | -| approx_kl | 0.01008998 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | -54.3 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 80820 | -| policy_gradient_loss | -0.00961 | -| std | 0.0995 | -| value_loss | 7.5e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8084 | -| time_elapsed | 50306 | -| total_timesteps | 1034752 | -| train/ | | -| approx_kl | 0.00030151708 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | 0.000276 | -| n_updates | 80830 | -| policy_gradient_loss | 0.00237 | -| std | 0.0995 | -| value_loss | 3.56e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 20 | -| iterations | 8085 | -| time_elapsed | 50309 | -| total_timesteps | 1034880 | -| train/ | | -| approx_kl | 0.0059651774 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 80840 | -| policy_gradient_loss | -0.00404 | -| std | 0.0996 | -| value_loss | 2.01e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8086 | -| time_elapsed | 50312 | -| total_timesteps | 1035008 | -| train/ | | -| approx_kl | 0.0018341336 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.887 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 80850 | -| policy_gradient_loss | -0.000483 | -| std | 0.0998 | -| value_loss | 6.82e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8087 | -| time_elapsed | 50320 | -| total_timesteps | 1035136 | -| train/ | | -| approx_kl | 0.0061607324 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 0.885 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 80860 | -| policy_gradient_loss | -0.0105 | -| std | 0.0999 | -| value_loss | 0.000449 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8088 | -| time_elapsed | 50324 | -| total_timesteps | 1035264 | -| train/ | | -| approx_kl | 0.035634037 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 0.885 | -| explained_variance | -821 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 80870 | -| policy_gradient_loss | -0.00087 | -| std | 0.0999 | -| value_loss | 4.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8089 | -| time_elapsed | 50327 | -| total_timesteps | 1035392 | -| train/ | | -| approx_kl | 0.14067662 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 0.885 | -| explained_variance | -2.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 80880 | -| policy_gradient_loss | -0.0104 | -| std | 0.0998 | -| value_loss | 1.66e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8090 | -| time_elapsed | 50330 | -| total_timesteps | 1035520 | -| train/ | | -| approx_kl | 0.10356456 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 0.886 | -| explained_variance | -1.81e+03 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 80890 | -| policy_gradient_loss | -0.00378 | -| std | 0.0997 | -| value_loss | 9.49e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8091 | -| time_elapsed | 50333 | -| total_timesteps | 1035648 | -| train/ | | -| approx_kl | 0.115317345 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 0.887 | -| explained_variance | -2.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.00995 | -| n_updates | 80900 | -| policy_gradient_loss | -0.00689 | -| std | 0.0996 | -| value_loss | 9.77e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8092 | -| time_elapsed | 50337 | -| total_timesteps | 1035776 | -| train/ | | -| approx_kl | 0.037688807 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 0.888 | -| explained_variance | -3.61e+03 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 80910 | -| policy_gradient_loss | -0.00969 | -| std | 0.0995 | -| value_loss | 2.8e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8093 | -| time_elapsed | 50341 | -| total_timesteps | 1035904 | -| train/ | | -| approx_kl | 0.008684069 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 80920 | -| policy_gradient_loss | -4.1e-05 | -| std | 0.0995 | -| value_loss | 7.37e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8094 | -| time_elapsed | 50345 | -| total_timesteps | 1036032 | -| train/ | | -| approx_kl | 0.00059450883 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 0.889 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 80930 | -| policy_gradient_loss | -0.000533 | -| std | 0.0994 | -| value_loss | 3.43e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8095 | -| time_elapsed | 50352 | -| total_timesteps | 1036160 | -| train/ | | -| approx_kl | 0.011159521 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 0.89 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 80940 | -| policy_gradient_loss | -0.00223 | -| std | 0.0992 | -| value_loss | 0.00288 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8096 | -| time_elapsed | 50356 | -| total_timesteps | 1036288 | -| train/ | | -| approx_kl | 0.1266412 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -3.67e+03 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 80950 | -| policy_gradient_loss | -0.00197 | -| std | 0.099 | -| value_loss | 2.07e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8097 | -| time_elapsed | 50357 | -| total_timesteps | 1036416 | -| train/ | | -| approx_kl | 0.0056265653 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -2.67e+03 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 80960 | -| policy_gradient_loss | -0.00918 | -| std | 0.099 | -| value_loss | 9.06e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8098 | -| time_elapsed | 50360 | -| total_timesteps | 1036544 | -| train/ | | -| approx_kl | 0.0021844716 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.894 | -| explained_variance | -247 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 80970 | -| policy_gradient_loss | -0.0129 | -| std | 0.0989 | -| value_loss | 2.95e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8099 | -| time_elapsed | 50363 | -| total_timesteps | 1036672 | -| train/ | | -| approx_kl | 0.004453661 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.894 | -| explained_variance | -0.409 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 80980 | -| policy_gradient_loss | -0.00889 | -| std | 0.099 | -| value_loss | 4.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8100 | -| time_elapsed | 50365 | -| total_timesteps | 1036800 | -| train/ | | -| approx_kl | 0.005192134 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.894 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 80990 | -| policy_gradient_loss | -0.0105 | -| std | 0.099 | -| value_loss | 3.86e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 20 | -| iterations | 8101 | -| time_elapsed | 50368 | -| total_timesteps | 1036928 | -| train/ | | -| approx_kl | 0.015588269 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -0.321 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 81000 | -| policy_gradient_loss | -0.0122 | -| std | 0.0991 | -| value_loss | 6.44e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8102 | -| time_elapsed | 50370 | -| total_timesteps | 1037056 | -| train/ | | -| approx_kl | 0.024950752 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -45.8 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 81010 | -| policy_gradient_loss | -0.0176 | -| std | 0.099 | -| value_loss | 0.000129 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8103 | -| time_elapsed | 50375 | -| total_timesteps | 1037184 | -| train/ | | -| approx_kl | 0.083200894 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 0.893 | -| explained_variance | -0.332 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 81020 | -| policy_gradient_loss | -0.0068 | -| std | 0.0991 | -| value_loss | 0.00309 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8104 | -| time_elapsed | 50380 | -| total_timesteps | 1037312 | -| train/ | | -| approx_kl | 0.026742402 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 0.892 | -| explained_variance | -91.4 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 81030 | -| policy_gradient_loss | -0.00737 | -| std | 0.0992 | -| value_loss | 0.00114 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8105 | -| time_elapsed | 50383 | -| total_timesteps | 1037440 | -| train/ | | -| approx_kl | 7.589487e-05 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 0.892 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | 9.85e-05 | -| n_updates | 81040 | -| policy_gradient_loss | 0.000205 | -| std | 0.0991 | -| value_loss | 2.73e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8106 | -| time_elapsed | 50387 | -| total_timesteps | 1037568 | -| train/ | | -| approx_kl | 0.0013010935 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 0.894 | -| explained_variance | -0.313 | -| learning_rate | 0.0003 | -| loss | -0.000833 | -| n_updates | 81050 | -| policy_gradient_loss | -0.000509 | -| std | 0.0989 | -| value_loss | 2.04e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8107 | -| time_elapsed | 50390 | -| total_timesteps | 1037696 | -| train/ | | -| approx_kl | 0.0009626015 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 0.895 | -| explained_variance | -0.0877 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 81060 | -| policy_gradient_loss | -0.00195 | -| std | 0.0989 | -| value_loss | 8.35e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8108 | -| time_elapsed | 50392 | -| total_timesteps | 1037824 | -| train/ | | -| approx_kl | 0.02873683 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 0.895 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 81070 | -| policy_gradient_loss | -0.0114 | -| std | 0.0989 | -| value_loss | 6.28e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 20 | -| iterations | 8109 | -| time_elapsed | 50396 | -| total_timesteps | 1037952 | -| train/ | | -| approx_kl | 0.0008992362 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.895 | -| explained_variance | -0.0732 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 81080 | -| policy_gradient_loss | 0.00297 | -| std | 0.0988 | -| value_loss | 2.75e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8110 | -| time_elapsed | 50400 | -| total_timesteps | 1038080 | -| train/ | | -| approx_kl | 0.0018505491 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.896 | -| explained_variance | -0.00125 | -| learning_rate | 0.0003 | -| loss | -0.000596 | -| n_updates | 81090 | -| policy_gradient_loss | -8.74e-05 | -| std | 0.0987 | -| value_loss | 2.44e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8111 | -| time_elapsed | 50406 | -| total_timesteps | 1038208 | -| train/ | | -| approx_kl | 0.008000765 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 0.897 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 81100 | -| policy_gradient_loss | -0.0153 | -| std | 0.0986 | -| value_loss | 0.002 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8112 | -| time_elapsed | 50409 | -| total_timesteps | 1038336 | -| train/ | | -| approx_kl | 0.000786352 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 0.898 | -| explained_variance | -17.3 | -| learning_rate | 0.0003 | -| loss | -0.000922 | -| n_updates | 81110 | -| policy_gradient_loss | -0.000803 | -| std | 0.0985 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8113 | -| time_elapsed | 50413 | -| total_timesteps | 1038464 | -| train/ | | -| approx_kl | 0.0018378026 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 0.9 | -| explained_variance | -127 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 81120 | -| policy_gradient_loss | -0.0111 | -| std | 0.0983 | -| value_loss | 4.56e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8114 | -| time_elapsed | 50417 | -| total_timesteps | 1038592 | -| train/ | | -| approx_kl | 0.06598319 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 0.901 | -| explained_variance | -34.5 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 81130 | -| policy_gradient_loss | -0.00227 | -| std | 0.0982 | -| value_loss | 2.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8115 | -| time_elapsed | 50421 | -| total_timesteps | 1038720 | -| train/ | | -| approx_kl | 0.027728483 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 0.902 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 81140 | -| policy_gradient_loss | -0.00761 | -| std | 0.0981 | -| value_loss | 7.55e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8116 | -| time_elapsed | 50424 | -| total_timesteps | 1038848 | -| train/ | | -| approx_kl | 0.04285316 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 0.903 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.00591 | -| n_updates | 81150 | -| policy_gradient_loss | 1.39e-05 | -| std | 0.0981 | -| value_loss | 2.59e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 20 | -| iterations | 8117 | -| time_elapsed | 50428 | -| total_timesteps | 1038976 | -| train/ | | -| approx_kl | 0.0021873685 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 0.903 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 81160 | -| policy_gradient_loss | -0.00474 | -| std | 0.0981 | -| value_loss | 1.03e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8118 | -| time_elapsed | 50431 | -| total_timesteps | 1039104 | -| train/ | | -| approx_kl | 0.0058409 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 0.902 | -| explained_variance | -0.00416 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 81170 | -| policy_gradient_loss | -0.0104 | -| std | 0.0982 | -| value_loss | 2.64e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8119 | -| time_elapsed | 50438 | -| total_timesteps | 1039232 | -| train/ | | -| approx_kl | 0.042055853 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 0.902 | -| explained_variance | 0.818 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 81180 | -| policy_gradient_loss | -0.0153 | -| std | 0.0983 | -| value_loss | 0.00247 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8120 | -| time_elapsed | 50441 | -| total_timesteps | 1039360 | -| train/ | | -| approx_kl | 0.09673004 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 0.901 | -| explained_variance | -369 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 81190 | -| policy_gradient_loss | -0.00393 | -| std | 0.0984 | -| value_loss | 7.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8121 | -| time_elapsed | 50444 | -| total_timesteps | 1039488 | -| train/ | | -| approx_kl | 0.041229498 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 0.9 | -| explained_variance | -7.87e+03 | -| learning_rate | 0.0003 | -| loss | -0.00922 | -| n_updates | 81200 | -| policy_gradient_loss | -0.00666 | -| std | 0.0984 | -| value_loss | 4.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8122 | -| time_elapsed | 50447 | -| total_timesteps | 1039616 | -| train/ | | -| approx_kl | 0.122836456 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 0.9 | -| explained_variance | -426 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 81210 | -| policy_gradient_loss | -0.00314 | -| std | 0.0985 | -| value_loss | 4.21e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8123 | -| time_elapsed | 50452 | -| total_timesteps | 1039744 | -| train/ | | -| approx_kl | 0.08418638 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 0.899 | -| explained_variance | -32.8 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 81220 | -| policy_gradient_loss | -0.00824 | -| std | 0.0985 | -| value_loss | 3.1e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 20 | -| iterations | 8124 | -| time_elapsed | 50454 | -| total_timesteps | 1039872 | -| train/ | | -| approx_kl | 0.03257157 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 0.899 | -| explained_variance | -2.2 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 81230 | -| policy_gradient_loss | -0.00712 | -| std | 0.0985 | -| value_loss | 1.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8125 | -| time_elapsed | 50457 | -| total_timesteps | 1040000 | -| train/ | | -| approx_kl | 0.02037693 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 0.898 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.00136 | -| n_updates | 81240 | -| policy_gradient_loss | -0.000209 | -| std | 0.0985 | -| value_loss | 2.55e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8126 | -| time_elapsed | 50461 | -| total_timesteps | 1040128 | -| train/ | | -| approx_kl | 0.0005931286 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.899 | -| explained_variance | -0.00278 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 81250 | -| policy_gradient_loss | -0.00134 | -| std | 0.0985 | -| value_loss | 7.36e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8127 | -| time_elapsed | 50469 | -| total_timesteps | 1040256 | -| train/ | | -| approx_kl | 0.020258775 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 0.899 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 81260 | -| policy_gradient_loss | -0.00467 | -| std | 0.0983 | -| value_loss | 0.000665 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8128 | -| time_elapsed | 50473 | -| total_timesteps | 1040384 | -| train/ | | -| approx_kl | 0.018479062 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 0.901 | -| explained_variance | -1.99e+04 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 81270 | -| policy_gradient_loss | -0.0114 | -| std | 0.0982 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8129 | -| time_elapsed | 50476 | -| total_timesteps | 1040512 | -| train/ | | -| approx_kl | 0.024756085 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.902 | -| explained_variance | -6.06e+03 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 81280 | -| policy_gradient_loss | -0.00316 | -| std | 0.0981 | -| value_loss | 4.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8130 | -| time_elapsed | 50479 | -| total_timesteps | 1040640 | -| train/ | | -| approx_kl | 0.08178189 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 0.902 | -| explained_variance | -168 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 81290 | -| policy_gradient_loss | -0.00137 | -| std | 0.0982 | -| value_loss | 3.59e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8131 | -| time_elapsed | 50483 | -| total_timesteps | 1040768 | -| train/ | | -| approx_kl | 0.022815604 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 0.901 | -| explained_variance | -5.6 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 81300 | -| policy_gradient_loss | -0.000289 | -| std | 0.0983 | -| value_loss | 2.6e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8132 | -| time_elapsed | 50486 | -| total_timesteps | 1040896 | -| train/ | | -| approx_kl | 0.009690478 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 0.901 | -| explained_variance | -0.723 | -| learning_rate | 0.0003 | -| loss | -0.006 | -| n_updates | 81310 | -| policy_gradient_loss | 0.000362 | -| std | 0.0983 | -| value_loss | 2.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8133 | -| time_elapsed | 50489 | -| total_timesteps | 1041024 | -| train/ | | -| approx_kl | 0.013692714 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 0.9 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.000551 | -| n_updates | 81320 | -| policy_gradient_loss | 0.000562 | -| std | 0.0983 | -| value_loss | 2.33e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8134 | -| time_elapsed | 50497 | -| total_timesteps | 1041152 | -| train/ | | -| approx_kl | 0.0051964168 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 0.902 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 81330 | -| policy_gradient_loss | -0.00237 | -| std | 0.0979 | -| value_loss | 0.00158 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8135 | -| time_elapsed | 50500 | -| total_timesteps | 1041280 | -| train/ | | -| approx_kl | 0.18167365 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 0.906 | -| explained_variance | -1.47e+04 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 81340 | -| policy_gradient_loss | -0.00537 | -| std | 0.0977 | -| value_loss | 1.82e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8136 | -| time_elapsed | 50503 | -| total_timesteps | 1041408 | -| train/ | | -| approx_kl | 0.16276217 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 0.908 | -| explained_variance | -1.16e+03 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 81350 | -| policy_gradient_loss | -0.00428 | -| std | 0.0976 | -| value_loss | 7.05e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8137 | -| time_elapsed | 50506 | -| total_timesteps | 1041536 | -| train/ | | -| approx_kl | 0.018480485 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.908 | -| explained_variance | -51.7 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 81360 | -| policy_gradient_loss | -0.0114 | -| std | 0.0976 | -| value_loss | 3.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8138 | -| time_elapsed | 50509 | -| total_timesteps | 1041664 | -| train/ | | -| approx_kl | 0.01164029 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 0.909 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 81370 | -| policy_gradient_loss | 0.000862 | -| std | 0.0973 | -| value_loss | 4.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8139 | -| time_elapsed | 50513 | -| total_timesteps | 1041792 | -| train/ | | -| approx_kl | 0.016315037 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.912 | -| explained_variance | -0.65 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 81380 | -| policy_gradient_loss | -0.00272 | -| std | 0.0972 | -| value_loss | 8.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 20 | -| iterations | 8140 | -| time_elapsed | 50516 | -| total_timesteps | 1041920 | -| train/ | | -| approx_kl | 0.004213155 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 0.913 | -| explained_variance | -0.474 | -| learning_rate | 0.0003 | -| loss | -0.00405 | -| n_updates | 81390 | -| policy_gradient_loss | -0.00169 | -| std | 0.0971 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8141 | -| time_elapsed | 50520 | -| total_timesteps | 1042048 | -| train/ | | -| approx_kl | 0.0015044292 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 0.914 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 81400 | -| policy_gradient_loss | -0.00213 | -| std | 0.0969 | -| value_loss | 1.09e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8142 | -| time_elapsed | 50526 | -| total_timesteps | 1042176 | -| train/ | | -| approx_kl | 0.008042313 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 0.916 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.0277 | -| n_updates | 81410 | -| policy_gradient_loss | -0.0166 | -| std | 0.0968 | -| value_loss | 0.000123 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8143 | -| time_elapsed | 50530 | -| total_timesteps | 1042304 | -| train/ | | -| approx_kl | 0.0052505443 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -4.39 | -| learning_rate | 0.0003 | -| loss | -0.00957 | -| n_updates | 81420 | -| policy_gradient_loss | -0.00719 | -| std | 0.0967 | -| value_loss | 3.78e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8144 | -| time_elapsed | 50532 | -| total_timesteps | 1042432 | -| train/ | | -| approx_kl | 0.032236535 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -5.29 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 81430 | -| policy_gradient_loss | -0.00467 | -| std | 0.0966 | -| value_loss | 2.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8145 | -| time_elapsed | 50535 | -| total_timesteps | 1042560 | -| train/ | | -| approx_kl | 0.022852061 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 0.918 | -| explained_variance | -2.65 | -| learning_rate | 0.0003 | -| loss | -0.00464 | -| n_updates | 81440 | -| policy_gradient_loss | -0.00278 | -| std | 0.0966 | -| value_loss | 2.03e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8146 | -| time_elapsed | 50538 | -| total_timesteps | 1042688 | -| train/ | | -| approx_kl | 0.00068528065 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -0.642 | -| learning_rate | 0.0003 | -| loss | -0.000112 | -| n_updates | 81450 | -| policy_gradient_loss | 3.45e-06 | -| std | 0.0968 | -| value_loss | 1.15e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8147 | -| time_elapsed | 50541 | -| total_timesteps | 1042816 | -| train/ | | -| approx_kl | 0.003438111 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.914 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 81460 | -| policy_gradient_loss | -0.0012 | -| std | 0.0971 | -| value_loss | 8.22e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 20 | -| iterations | 8148 | -| time_elapsed | 50544 | -| total_timesteps | 1042944 | -| train/ | | -| approx_kl | 0.027304737 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.913 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 81470 | -| policy_gradient_loss | -0.00754 | -| std | 0.0972 | -| value_loss | 7.8e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8149 | -| time_elapsed | 50547 | -| total_timesteps | 1043072 | -| train/ | | -| approx_kl | 0.0022593988 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 0.912 | -| explained_variance | 0.00316 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 81480 | -| policy_gradient_loss | -0.0051 | -| std | 0.0972 | -| value_loss | 1.92e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8150 | -| time_elapsed | 50554 | -| total_timesteps | 1043200 | -| train/ | | -| approx_kl | 0.016317816 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 0.913 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 81490 | -| policy_gradient_loss | -0.0135 | -| std | 0.0971 | -| value_loss | 0.000785 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8151 | -| time_elapsed | 50558 | -| total_timesteps | 1043328 | -| train/ | | -| approx_kl | 0.0974475 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 0.913 | -| explained_variance | -346 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 81500 | -| policy_gradient_loss | -0.002 | -| std | 0.0971 | -| value_loss | 1.65e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8152 | -| time_elapsed | 50561 | -| total_timesteps | 1043456 | -| train/ | | -| approx_kl | 0.013004173 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 0.914 | -| explained_variance | -243 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 81510 | -| policy_gradient_loss | -0.00153 | -| std | 0.0969 | -| value_loss | 7.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8153 | -| time_elapsed | 50566 | -| total_timesteps | 1043584 | -| train/ | | -| approx_kl | 0.048530858 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 0.916 | -| explained_variance | -4.44 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 81520 | -| policy_gradient_loss | -0.00251 | -| std | 0.0967 | -| value_loss | 6.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8154 | -| time_elapsed | 50570 | -| total_timesteps | 1043712 | -| train/ | | -| approx_kl | 0.015648093 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 0.918 | -| explained_variance | -0.095 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 81530 | -| policy_gradient_loss | 0.00128 | -| std | 0.0966 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8155 | -| time_elapsed | 50575 | -| total_timesteps | 1043840 | -| train/ | | -| approx_kl | 0.0015251143 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 0.919 | -| explained_variance | -0.00103 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 81540 | -| policy_gradient_loss | -0.00148 | -| std | 0.0965 | -| value_loss | 1.05e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 20 | -| iterations | 8156 | -| time_elapsed | 50578 | -| total_timesteps | 1043968 | -| train/ | | -| approx_kl | 0.0003706119 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 0.919 | -| explained_variance | -0.00866 | -| learning_rate | 0.0003 | -| loss | -0.000115 | -| n_updates | 81550 | -| policy_gradient_loss | 0.000244 | -| std | 0.0966 | -| value_loss | 2.12e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8157 | -| time_elapsed | 50582 | -| total_timesteps | 1044096 | -| train/ | | -| approx_kl | 0.0044817077 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 81560 | -| policy_gradient_loss | -0.00376 | -| std | 0.0968 | -| value_loss | 1.01e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8158 | -| time_elapsed | 50592 | -| total_timesteps | 1044224 | -| train/ | | -| approx_kl | 0.016435396 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.916 | -| explained_variance | -1.84 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 81570 | -| policy_gradient_loss | -0.00432 | -| std | 0.0969 | -| value_loss | 0.00454 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8159 | -| time_elapsed | 50595 | -| total_timesteps | 1044352 | -| train/ | | -| approx_kl | 0.06554639 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 0.916 | -| explained_variance | -1.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 81580 | -| policy_gradient_loss | -0.00325 | -| std | 0.0968 | -| value_loss | 2.6e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8160 | -| time_elapsed | 50599 | -| total_timesteps | 1044480 | -| train/ | | -| approx_kl | 0.024799446 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -2.42e+03 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 81590 | -| policy_gradient_loss | -0.0153 | -| std | 0.0968 | -| value_loss | 1.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8161 | -| time_elapsed | 50602 | -| total_timesteps | 1044608 | -| train/ | | -| approx_kl | 0.037531745 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -25.5 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 81600 | -| policy_gradient_loss | -0.000593 | -| std | 0.0967 | -| value_loss | 5.53e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8162 | -| time_elapsed | 50606 | -| total_timesteps | 1044736 | -| train/ | | -| approx_kl | 0.00035145506 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | -0.000749 | -| n_updates | 81610 | -| policy_gradient_loss | -0.000516 | -| std | 0.0967 | -| value_loss | 3.5e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8163 | -| time_elapsed | 50611 | -| total_timesteps | 1044864 | -| train/ | | -| approx_kl | 0.0008733906 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 81620 | -| policy_gradient_loss | -0.00489 | -| std | 0.0967 | -| value_loss | 5.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 20 | -| iterations | 8164 | -| time_elapsed | 50615 | -| total_timesteps | 1044992 | -| train/ | | -| approx_kl | 0.016203366 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 81630 | -| policy_gradient_loss | 0.000472 | -| std | 0.0967 | -| value_loss | 5.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8165 | -| time_elapsed | 50617 | -| total_timesteps | 1045120 | -| train/ | | -| approx_kl | 0.014560118 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -0.00134 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 81640 | -| policy_gradient_loss | -0.00279 | -| std | 0.0967 | -| value_loss | 8.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8166 | -| time_elapsed | 50625 | -| total_timesteps | 1045248 | -| train/ | | -| approx_kl | 0.020469217 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -3.27 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 81650 | -| policy_gradient_loss | -0.0142 | -| std | 0.0967 | -| value_loss | 0.00335 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8167 | -| time_elapsed | 50629 | -| total_timesteps | 1045376 | -| train/ | | -| approx_kl | 0.044987176 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 0.917 | -| explained_variance | -4.56e+03 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 81660 | -| policy_gradient_loss | -0.0157 | -| std | 0.0968 | -| value_loss | 5.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8168 | -| time_elapsed | 50632 | -| total_timesteps | 1045504 | -| train/ | | -| approx_kl | 0.031855933 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 0.916 | -| explained_variance | -1.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 81670 | -| policy_gradient_loss | -0.00692 | -| std | 0.0969 | -| value_loss | 5.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8169 | -| time_elapsed | 50636 | -| total_timesteps | 1045632 | -| train/ | | -| approx_kl | 0.0068213013 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 0.916 | -| explained_variance | -36.2 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 81680 | -| policy_gradient_loss | -0.00262 | -| std | 0.0967 | -| value_loss | 5.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8170 | -| time_elapsed | 50639 | -| total_timesteps | 1045760 | -| train/ | | -| approx_kl | 0.11226537 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 0.918 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 81690 | -| policy_gradient_loss | -0.00602 | -| std | 0.0965 | -| value_loss | 5.59e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 20 | -| iterations | 8171 | -| time_elapsed | 50644 | -| total_timesteps | 1045888 | -| train/ | | -| approx_kl | 0.003493507 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 0.92 | -| explained_variance | -0.713 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 81700 | -| policy_gradient_loss | -0.00277 | -| std | 0.0964 | -| value_loss | 2.22e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8172 | -| time_elapsed | 50646 | -| total_timesteps | 1046016 | -| train/ | | -| approx_kl | 0.0065700924 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 0.921 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 81710 | -| policy_gradient_loss | -0.0107 | -| std | 0.0963 | -| value_loss | 2.8e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8173 | -| time_elapsed | 50654 | -| total_timesteps | 1046144 | -| train/ | | -| approx_kl | 0.0065062274 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.922 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 81720 | -| policy_gradient_loss | -0.00431 | -| std | 0.0961 | -| value_loss | 0.00113 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8174 | -| time_elapsed | 50658 | -| total_timesteps | 1046272 | -| train/ | | -| approx_kl | 0.020797942 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 0.925 | -| explained_variance | -2.8e+03 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 81730 | -| policy_gradient_loss | -0.0159 | -| std | 0.0958 | -| value_loss | 5.92e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8175 | -| time_elapsed | 50661 | -| total_timesteps | 1046400 | -| train/ | | -| approx_kl | 0.08365311 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 0.927 | -| explained_variance | -8.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.00827 | -| n_updates | 81740 | -| policy_gradient_loss | -0.00789 | -| std | 0.0957 | -| value_loss | 4.33e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8176 | -| time_elapsed | 50663 | -| total_timesteps | 1046528 | -| train/ | | -| approx_kl | 0.0032919827 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 0.928 | -| explained_variance | -29.8 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 81750 | -| policy_gradient_loss | -0.00853 | -| std | 0.0957 | -| value_loss | 2.88e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8177 | -| time_elapsed | 50666 | -| total_timesteps | 1046656 | -| train/ | | -| approx_kl | 0.0005248962 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 0.928 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 81760 | -| policy_gradient_loss | -0.00072 | -| std | 0.0956 | -| value_loss | 5.33e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8178 | -| time_elapsed | 50669 | -| total_timesteps | 1046784 | -| train/ | | -| approx_kl | 0.0014985534 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 0.929 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.000649 | -| n_updates | 81770 | -| policy_gradient_loss | -0.000187 | -| std | 0.0955 | -| value_loss | 1.97e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 20 | -| iterations | 8179 | -| time_elapsed | 50672 | -| total_timesteps | 1046912 | -| train/ | | -| approx_kl | 0.001087999 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.93 | -| explained_variance | 0.000475 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 81780 | -| policy_gradient_loss | 0.000412 | -| std | 0.0955 | -| value_loss | 3.09e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8180 | -| time_elapsed | 50676 | -| total_timesteps | 1047040 | -| train/ | | -| approx_kl | 0.0021236995 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 0.93 | -| explained_variance | 0.00262 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 81790 | -| policy_gradient_loss | 0.000505 | -| std | 0.0955 | -| value_loss | 7.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8181 | -| time_elapsed | 50681 | -| total_timesteps | 1047168 | -| train/ | | -| approx_kl | 0.010136196 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 0.931 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 81800 | -| policy_gradient_loss | -0.0152 | -| std | 0.0953 | -| value_loss | 2.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8182 | -| time_elapsed | 50684 | -| total_timesteps | 1047296 | -| train/ | | -| approx_kl | 0.04652955 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 0.932 | -| explained_variance | -0.611 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 81810 | -| policy_gradient_loss | -0.0108 | -| std | 0.0953 | -| value_loss | 2.62e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8183 | -| time_elapsed | 50688 | -| total_timesteps | 1047424 | -| train/ | | -| approx_kl | 0.0056863977 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 0.932 | -| explained_variance | -0.34 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 81820 | -| policy_gradient_loss | -0.00565 | -| std | 0.0953 | -| value_loss | 6.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8184 | -| time_elapsed | 50691 | -| total_timesteps | 1047552 | -| train/ | | -| approx_kl | 0.0043309596 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.932 | -| explained_variance | 0.000331 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 81830 | -| policy_gradient_loss | -0.00362 | -| std | 0.0953 | -| value_loss | 7.46e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8185 | -| time_elapsed | 50696 | -| total_timesteps | 1047680 | -| train/ | | -| approx_kl | 0.00068300357 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 0.932 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 81840 | -| policy_gradient_loss | -0.0082 | -| std | 0.0953 | -| value_loss | 1.76e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8186 | -| time_elapsed | 50699 | -| total_timesteps | 1047808 | -| train/ | | -| approx_kl | 0.00012289826 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 0.932 | -| explained_variance | -0.00286 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 81850 | -| policy_gradient_loss | -0.00591 | -| std | 0.0953 | -| value_loss | 5.57e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 20 | -| iterations | 8187 | -| time_elapsed | 50702 | -| total_timesteps | 1047936 | -| train/ | | -| approx_kl | 0.0010099523 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 0.932 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 81860 | -| policy_gradient_loss | -0.00235 | -| std | 0.0952 | -| value_loss | 1.74e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8188 | -| time_elapsed | 50706 | -| total_timesteps | 1048064 | -| train/ | | -| approx_kl | 0.0012127021 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 0.934 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 81870 | -| policy_gradient_loss | -0.00532 | -| std | 0.095 | -| value_loss | 2.76e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8189 | -| time_elapsed | 50712 | -| total_timesteps | 1048192 | -| train/ | | -| approx_kl | 0.04434799 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.935 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 81880 | -| policy_gradient_loss | -0.0143 | -| std | 0.095 | -| value_loss | 0.00012 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8190 | -| time_elapsed | 50715 | -| total_timesteps | 1048320 | -| train/ | | -| approx_kl | 0.07463981 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 0.935 | -| explained_variance | -61 | -| learning_rate | 0.0003 | -| loss | -0.00642 | -| n_updates | 81890 | -| policy_gradient_loss | -0.00576 | -| std | 0.095 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8191 | -| time_elapsed | 50719 | -| total_timesteps | 1048448 | -| train/ | | -| approx_kl | 0.01712689 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 0.935 | -| explained_variance | -247 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 81900 | -| policy_gradient_loss | -0.00207 | -| std | 0.0949 | -| value_loss | 1.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8192 | -| time_elapsed | 50722 | -| total_timesteps | 1048576 | -| train/ | | -| approx_kl | 0.0053902534 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 0.937 | -| explained_variance | -11.6 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 81910 | -| policy_gradient_loss | 0.000639 | -| std | 0.0947 | -| value_loss | 4.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8193 | -| time_elapsed | 50725 | -| total_timesteps | 1048704 | -| train/ | | -| approx_kl | 0.009681337 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.939 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 81920 | -| policy_gradient_loss | -0.00633 | -| std | 0.0946 | -| value_loss | 1.09e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8194 | -| time_elapsed | 50729 | -| total_timesteps | 1048832 | -| train/ | | -| approx_kl | 0.00053886324 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 0.939 | -| explained_variance | -0.544 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 81930 | -| policy_gradient_loss | -0.00226 | -| std | 0.0946 | -| value_loss | 1.22e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 20 | -| iterations | 8195 | -| time_elapsed | 50731 | -| total_timesteps | 1048960 | -| train/ | | -| approx_kl | 0.0011184281 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 0.939 | -| explained_variance | -0.00964 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 81940 | -| policy_gradient_loss | -0.000271 | -| std | 0.0946 | -| value_loss | 1.66e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8196 | -| time_elapsed | 50735 | -| total_timesteps | 1049088 | -| train/ | | -| approx_kl | 0.0022025793 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.939 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | -0.000987 | -| n_updates | 81950 | -| policy_gradient_loss | 0.00152 | -| std | 0.0946 | -| value_loss | 3.6e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8197 | -| time_elapsed | 50743 | -| total_timesteps | 1049216 | -| train/ | | -| approx_kl | 0.02602204 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.939 | -| explained_variance | -0.952 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 81960 | -| policy_gradient_loss | -0.0167 | -| std | 0.0946 | -| value_loss | 0.00213 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8198 | -| time_elapsed | 50747 | -| total_timesteps | 1049344 | -| train/ | | -| approx_kl | 0.033204608 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 0.939 | -| explained_variance | -4.37e+03 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 81970 | -| policy_gradient_loss | -0.0026 | -| std | 0.0945 | -| value_loss | 9.63e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8199 | -| time_elapsed | 50748 | -| total_timesteps | 1049472 | -| train/ | | -| approx_kl | 0.14545895 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 0.941 | -| explained_variance | -632 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 81980 | -| policy_gradient_loss | -0.00407 | -| std | 0.0944 | -| value_loss | 7.62e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8200 | -| time_elapsed | 50751 | -| total_timesteps | 1049600 | -| train/ | | -| approx_kl | 0.03433556 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.942 | -| explained_variance | -22 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 81990 | -| policy_gradient_loss | -0.00675 | -| std | 0.0943 | -| value_loss | 7.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8201 | -| time_elapsed | 50755 | -| total_timesteps | 1049728 | -| train/ | | -| approx_kl | 0.00765792 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 0.942 | -| explained_variance | -34.5 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 82000 | -| policy_gradient_loss | -0.00894 | -| std | 0.0943 | -| value_loss | 2.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8202 | -| time_elapsed | 50759 | -| total_timesteps | 1049856 | -| train/ | | -| approx_kl | 0.053975392 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.942 | -| explained_variance | -1.29 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 82010 | -| policy_gradient_loss | -0.00603 | -| std | 0.0943 | -| value_loss | 4.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 20 | -| iterations | 8203 | -| time_elapsed | 50762 | -| total_timesteps | 1049984 | -| train/ | | -| approx_kl | 0.02926195 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.942 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 82020 | -| policy_gradient_loss | -0.01 | -| std | 0.0943 | -| value_loss | 1.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8204 | -| time_elapsed | 50766 | -| total_timesteps | 1050112 | -| train/ | | -| approx_kl | 0.031715818 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 0.942 | -| explained_variance | -0.51 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 82030 | -| policy_gradient_loss | -0.0035 | -| std | 0.0943 | -| value_loss | 7.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8205 | -| time_elapsed | 50774 | -| total_timesteps | 1050240 | -| train/ | | -| approx_kl | 0.008141849 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.941 | -| explained_variance | -5.09 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 82040 | -| policy_gradient_loss | -0.00723 | -| std | 0.0945 | -| value_loss | 0.00178 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8206 | -| time_elapsed | 50777 | -| total_timesteps | 1050368 | -| train/ | | -| approx_kl | 0.06447877 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 0.94 | -| explained_variance | -2.84e+04 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 82050 | -| policy_gradient_loss | -0.00387 | -| std | 0.0945 | -| value_loss | 9.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8207 | -| time_elapsed | 50780 | -| total_timesteps | 1050496 | -| train/ | | -| approx_kl | 0.087078094 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 0.941 | -| explained_variance | -65.7 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 82060 | -| policy_gradient_loss | -0.0109 | -| std | 0.0944 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8208 | -| time_elapsed | 50783 | -| total_timesteps | 1050624 | -| train/ | | -| approx_kl | 0.02506065 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 0.942 | -| explained_variance | -9.76 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 82070 | -| policy_gradient_loss | 0.000201 | -| std | 0.0942 | -| value_loss | 1.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8209 | -| time_elapsed | 50787 | -| total_timesteps | 1050752 | -| train/ | | -| approx_kl | 0.020765929 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 0.944 | -| explained_variance | -0.758 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 82080 | -| policy_gradient_loss | -0.00134 | -| std | 0.094 | -| value_loss | 2.69e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 20 | -| iterations | 8210 | -| time_elapsed | 50790 | -| total_timesteps | 1050880 | -| train/ | | -| approx_kl | 0.00015615998 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 0.946 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | -0.000675 | -| n_updates | 82090 | -| policy_gradient_loss | 0.00392 | -| std | 0.0939 | -| value_loss | 3.88e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8211 | -| time_elapsed | 50793 | -| total_timesteps | 1051008 | -| train/ | | -| approx_kl | 0.00036634784 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 0.948 | -| explained_variance | -0.000323 | -| learning_rate | 0.0003 | -| loss | -0.00014 | -| n_updates | 82100 | -| policy_gradient_loss | 3.82e-05 | -| std | 0.0936 | -| value_loss | 3.47e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8212 | -| time_elapsed | 50803 | -| total_timesteps | 1051136 | -| train/ | | -| approx_kl | 0.14438665 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 0.951 | -| explained_variance | 0.679 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 82110 | -| policy_gradient_loss | -0.00662 | -| std | 0.0934 | -| value_loss | 0.000331 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8213 | -| time_elapsed | 50806 | -| total_timesteps | 1051264 | -| train/ | | -| approx_kl | 0.00048757344 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 0.952 | -| explained_variance | -85.3 | -| learning_rate | 0.0003 | -| loss | -0.00591 | -| n_updates | 82120 | -| policy_gradient_loss | -0.0118 | -| std | 0.0934 | -| value_loss | 4.92e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8214 | -| time_elapsed | 50809 | -| total_timesteps | 1051392 | -| train/ | | -| approx_kl | 0.082882516 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 0.952 | -| explained_variance | -130 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 82130 | -| policy_gradient_loss | -0.00445 | -| std | 0.0933 | -| value_loss | 7.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8215 | -| time_elapsed | 50812 | -| total_timesteps | 1051520 | -| train/ | | -| approx_kl | 0.017108306 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.953 | -| explained_variance | -4.39 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 82140 | -| policy_gradient_loss | -0.00163 | -| std | 0.0933 | -| value_loss | 5.36e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8216 | -| time_elapsed | 50817 | -| total_timesteps | 1051648 | -| train/ | | -| approx_kl | 0.0027884403 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.954 | -| explained_variance | -0.426 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 82150 | -| policy_gradient_loss | -0.00858 | -| std | 0.0932 | -| value_loss | 4.59e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8217 | -| time_elapsed | 50819 | -| total_timesteps | 1051776 | -| train/ | | -| approx_kl | 1.5926082e-05 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.955 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.00021 | -| n_updates | 82160 | -| policy_gradient_loss | -0.000219 | -| std | 0.093 | -| value_loss | 2.3e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8218 | -| time_elapsed | 50823 | -| total_timesteps | 1051904 | -| train/ | | -| approx_kl | 0.023545668 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 0.958 | -| explained_variance | -0.00154 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 82170 | -| policy_gradient_loss | -0.00536 | -| std | 0.0927 | -| value_loss | 2.64e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8219 | -| time_elapsed | 50827 | -| total_timesteps | 1052032 | -| train/ | | -| approx_kl | 0.0049306704 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 0.96 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 82180 | -| policy_gradient_loss | 0.00364 | -| std | 0.0926 | -| value_loss | 1.32e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8220 | -| time_elapsed | 50836 | -| total_timesteps | 1052160 | -| train/ | | -| approx_kl | 0.15408131 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.961 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 82190 | -| policy_gradient_loss | -0.00382 | -| std | 0.0925 | -| value_loss | 0.00145 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8221 | -| time_elapsed | 50840 | -| total_timesteps | 1052288 | -| train/ | | -| approx_kl | 0.04014268 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 0.963 | -| explained_variance | -48.3 | -| learning_rate | 0.0003 | -| loss | 0.00244 | -| n_updates | 82200 | -| policy_gradient_loss | 0.000187 | -| std | 0.0923 | -| value_loss | 8.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8222 | -| time_elapsed | 50843 | -| total_timesteps | 1052416 | -| train/ | | -| approx_kl | 0.021002002 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 0.965 | -| explained_variance | -35 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 82210 | -| policy_gradient_loss | -0.00282 | -| std | 0.0921 | -| value_loss | 3.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8223 | -| time_elapsed | 50845 | -| total_timesteps | 1052544 | -| train/ | | -| approx_kl | 0.012359952 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 0.965 | -| explained_variance | -7.71 | -| learning_rate | 0.0003 | -| loss | -0.000825 | -| n_updates | 82220 | -| policy_gradient_loss | -0.000325 | -| std | 0.0923 | -| value_loss | 5.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8224 | -| time_elapsed | 50848 | -| total_timesteps | 1052672 | -| train/ | | -| approx_kl | 0.016875774 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.963 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | 0.00307 | -| n_updates | 82230 | -| policy_gradient_loss | 0.00201 | -| std | 0.0924 | -| value_loss | 1.86e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8225 | -| time_elapsed | 50851 | -| total_timesteps | 1052800 | -| train/ | | -| approx_kl | 0.0058002416 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 0.963 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | -0.000152 | -| n_updates | 82240 | -| policy_gradient_loss | 0.00113 | -| std | 0.0923 | -| value_loss | 3.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 20 | -| iterations | 8226 | -| time_elapsed | 50854 | -| total_timesteps | 1052928 | -| train/ | | -| approx_kl | 0.004445115 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 0.964 | -| explained_variance | -0.00482 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 82250 | -| policy_gradient_loss | -0.00612 | -| std | 0.0922 | -| value_loss | 3.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8227 | -| time_elapsed | 50858 | -| total_timesteps | 1053056 | -| train/ | | -| approx_kl | 0.003454185 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 0.965 | -| explained_variance | 0.0041 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 82260 | -| policy_gradient_loss | -0.00145 | -| std | 0.092 | -| value_loss | 2.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8228 | -| time_elapsed | 50863 | -| total_timesteps | 1053184 | -| train/ | | -| approx_kl | 0.09591302 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 0.968 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 82270 | -| policy_gradient_loss | -0.00279 | -| std | 0.0917 | -| value_loss | 0.000878 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8229 | -| time_elapsed | 50866 | -| total_timesteps | 1053312 | -| train/ | | -| approx_kl | 0.08728611 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | -25.4 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 82280 | -| policy_gradient_loss | -0.00637 | -| std | 0.0915 | -| value_loss | 9.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8230 | -| time_elapsed | 50868 | -| total_timesteps | 1053440 | -| train/ | | -| approx_kl | 0.056058995 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -35.1 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 82290 | -| policy_gradient_loss | -0.00262 | -| std | 0.0915 | -| value_loss | 5.26e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8231 | -| time_elapsed | 50873 | -| total_timesteps | 1053568 | -| train/ | | -| approx_kl | 0.00017885724 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 0.973 | -| explained_variance | -5.32 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 82300 | -| policy_gradient_loss | -0.013 | -| std | 0.0915 | -| value_loss | 1.62e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8232 | -| time_elapsed | 50877 | -| total_timesteps | 1053696 | -| train/ | | -| approx_kl | 0.010549666 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.973 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | -0.00788 | -| n_updates | 82310 | -| policy_gradient_loss | -0.00504 | -| std | 0.0915 | -| value_loss | 2.14e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8233 | -| time_elapsed | 50881 | -| total_timesteps | 1053824 | -| train/ | | -| approx_kl | 0.0061029745 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.00922 | -| n_updates | 82320 | -| policy_gradient_loss | -0.00594 | -| std | 0.0916 | -| value_loss | 2.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8234 | -| time_elapsed | 50886 | -| total_timesteps | 1053952 | -| train/ | | -| approx_kl | 0.0012031677 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.000848 | -| n_updates | 82330 | -| policy_gradient_loss | 0.000777 | -| std | 0.0916 | -| value_loss | 5.52e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8235 | -| time_elapsed | 50889 | -| total_timesteps | 1054080 | -| train/ | | -| approx_kl | 0.012940533 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | -0.0013 | -| learning_rate | 0.0003 | -| loss | -0.00655 | -| n_updates | 82340 | -| policy_gradient_loss | -0.00153 | -| std | 0.0916 | -| value_loss | 2.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8236 | -| time_elapsed | 50894 | -| total_timesteps | 1054208 | -| train/ | | -| approx_kl | 0.020977665 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | 0.366 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 82350 | -| policy_gradient_loss | -0.00831 | -| std | 0.0917 | -| value_loss | 0.000695 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8237 | -| time_elapsed | 50898 | -| total_timesteps | 1054336 | -| train/ | | -| approx_kl | 0.005022376 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 0.97 | -| explained_variance | -19.5 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 82360 | -| policy_gradient_loss | -0.00944 | -| std | 0.0917 | -| value_loss | 2.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8238 | -| time_elapsed | 50901 | -| total_timesteps | 1054464 | -| train/ | | -| approx_kl | 0.076309636 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 0.97 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.00726 | -| n_updates | 82370 | -| policy_gradient_loss | -0.00498 | -| std | 0.0917 | -| value_loss | 8.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8239 | -| time_elapsed | 50904 | -| total_timesteps | 1054592 | -| train/ | | -| approx_kl | 0.013857112 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 82380 | -| policy_gradient_loss | -0.000248 | -| std | 0.0916 | -| value_loss | 4.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8240 | -| time_elapsed | 50906 | -| total_timesteps | 1054720 | -| train/ | | -| approx_kl | 0.034233164 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 82390 | -| policy_gradient_loss | -0.000752 | -| std | 0.0916 | -| value_loss | 1.98e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8241 | -| time_elapsed | 50909 | -| total_timesteps | 1054848 | -| train/ | | -| approx_kl | 0.0140666235 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 82400 | -| policy_gradient_loss | -0.00349 | -| std | 0.0916 | -| value_loss | 8.13e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8242 | -| time_elapsed | 50912 | -| total_timesteps | 1054976 | -| train/ | | -| approx_kl | 0.014000462 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 0.971 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 82410 | -| policy_gradient_loss | -0.00214 | -| std | 0.0916 | -| value_loss | 7.45e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8243 | -| time_elapsed | 50914 | -| total_timesteps | 1055104 | -| train/ | | -| approx_kl | 0.0012084413 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 82420 | -| policy_gradient_loss | -0.00195 | -| std | 0.0915 | -| value_loss | 4.81e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8244 | -| time_elapsed | 50922 | -| total_timesteps | 1055232 | -| train/ | | -| approx_kl | 0.0022912053 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | 0.888 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 82430 | -| policy_gradient_loss | -0.0121 | -| std | 0.0915 | -| value_loss | 0.000207 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8245 | -| time_elapsed | 50926 | -| total_timesteps | 1055360 | -| train/ | | -| approx_kl | 0.0010521561 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -6.6 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 82440 | -| policy_gradient_loss | -0.00902 | -| std | 0.0915 | -| value_loss | 1.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8246 | -| time_elapsed | 50929 | -| total_timesteps | 1055488 | -| train/ | | -| approx_kl | 0.050425727 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -1.12e+04 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 82450 | -| policy_gradient_loss | -0.0109 | -| std | 0.0916 | -| value_loss | 2.62e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8247 | -| time_elapsed | 50933 | -| total_timesteps | 1055616 | -| train/ | | -| approx_kl | 0.03451608 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -42.2 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 82460 | -| policy_gradient_loss | -0.00108 | -| std | 0.0915 | -| value_loss | 8.32e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8248 | -| time_elapsed | 50936 | -| total_timesteps | 1055744 | -| train/ | | -| approx_kl | 0.009805984 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 0.973 | -| explained_variance | -15 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 82470 | -| policy_gradient_loss | -0.00134 | -| std | 0.0914 | -| value_loss | 4.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8249 | -| time_elapsed | 50940 | -| total_timesteps | 1055872 | -| train/ | | -| approx_kl | 0.016101079 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 0.975 | -| explained_variance | -61.9 | -| learning_rate | 0.0003 | -| loss | -0.000337 | -| n_updates | 82480 | -| policy_gradient_loss | -0.000114 | -| std | 0.0911 | -| value_loss | 2.34e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8250 | -| time_elapsed | 50944 | -| total_timesteps | 1056000 | -| train/ | | -| approx_kl | 0.00024500675 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 0.978 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 82490 | -| policy_gradient_loss | -0.0145 | -| std | 0.091 | -| value_loss | 1.93e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8251 | -| time_elapsed | 50949 | -| total_timesteps | 1056128 | -| train/ | | -| approx_kl | 0.0037182975 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | -0.00263 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 82500 | -| policy_gradient_loss | -0.0094 | -| std | 0.0909 | -| value_loss | 9.67e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8252 | -| time_elapsed | 50958 | -| total_timesteps | 1056256 | -| train/ | | -| approx_kl | 0.005211685 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | 0.634 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 82510 | -| policy_gradient_loss | -0.0149 | -| std | 0.0909 | -| value_loss | 0.000413 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8253 | -| time_elapsed | 50961 | -| total_timesteps | 1056384 | -| train/ | | -| approx_kl | 0.021359894 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | -45.1 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 82520 | -| policy_gradient_loss | -0.00175 | -| std | 0.0909 | -| value_loss | 4.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8254 | -| time_elapsed | 50965 | -| total_timesteps | 1056512 | -| train/ | | -| approx_kl | 0.02279709 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | -0.000738 | -| n_updates | 82530 | -| policy_gradient_loss | -0.000287 | -| std | 0.0908 | -| value_loss | 2.7e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8255 | -| time_elapsed | 50968 | -| total_timesteps | 1056640 | -| train/ | | -| approx_kl | 0.0013159933 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -16.2 | -| learning_rate | 0.0003 | -| loss | -0.000752 | -| n_updates | 82540 | -| policy_gradient_loss | -0.000521 | -| std | 0.0905 | -| value_loss | 3.67e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8256 | -| time_elapsed | 50971 | -| total_timesteps | 1056768 | -| train/ | | -| approx_kl | 0.0021232218 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 0.985 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 82550 | -| policy_gradient_loss | -0.00106 | -| std | 0.0902 | -| value_loss | 2.18e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8257 | -| time_elapsed | 50975 | -| total_timesteps | 1056896 | -| train/ | | -| approx_kl | 0.00033645006 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 0.988 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | -0.000526 | -| n_updates | 82560 | -| policy_gradient_loss | 8.91e-05 | -| std | 0.09 | -| value_loss | 6.05e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8258 | -| time_elapsed | 50978 | -| total_timesteps | 1057024 | -| train/ | | -| approx_kl | 0.00030669663 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 0.991 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 82570 | -| policy_gradient_loss | 0.000796 | -| std | 0.0897 | -| value_loss | 4.51e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8259 | -| time_elapsed | 50986 | -| total_timesteps | 1057152 | -| train/ | | -| approx_kl | 0.0028783265 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 0.994 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 82580 | -| policy_gradient_loss | -0.00812 | -| std | 0.0895 | -| value_loss | 0.000112 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8260 | -| time_elapsed | 50989 | -| total_timesteps | 1057280 | -| train/ | | -| approx_kl | 0.0017521782 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 0.995 | -| explained_variance | -0.478 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 82590 | -| policy_gradient_loss | -0.00328 | -| std | 0.0894 | -| value_loss | 1.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8261 | -| time_elapsed | 50992 | -| total_timesteps | 1057408 | -| train/ | | -| approx_kl | 0.0046509113 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 0.996 | -| explained_variance | -0.804 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 82600 | -| policy_gradient_loss | -0.00193 | -| std | 0.0893 | -| value_loss | 2.78e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8262 | -| time_elapsed | 50996 | -| total_timesteps | 1057536 | -| train/ | | -| approx_kl | 0.003984889 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.996 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.00592 | -| n_updates | 82610 | -| policy_gradient_loss | -0.0038 | -| std | 0.0894 | -| value_loss | 1.05e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8263 | -| time_elapsed | 50998 | -| total_timesteps | 1057664 | -| train/ | | -| approx_kl | 0.0026478688 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 0.995 | -| explained_variance | -0.00406 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 82620 | -| policy_gradient_loss | -0.00247 | -| std | 0.0895 | -| value_loss | 7.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8264 | -| time_elapsed | 51001 | -| total_timesteps | 1057792 | -| train/ | | -| approx_kl | 0.0043759854 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 0.993 | -| explained_variance | -0.00334 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 82630 | -| policy_gradient_loss | -0.00103 | -| std | 0.0899 | -| value_loss | 1.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8265 | -| time_elapsed | 51003 | -| total_timesteps | 1057920 | -| train/ | | -| approx_kl | 0.0008653975 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.988 | -| explained_variance | -0.00672 | -| learning_rate | 0.0003 | -| loss | -0.000418 | -| n_updates | 82640 | -| policy_gradient_loss | -6.89e-05 | -| std | 0.0903 | -| value_loss | 8.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8266 | -| time_elapsed | 51007 | -| total_timesteps | 1058048 | -| train/ | | -| approx_kl | 0.040617686 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | 0.0047 | -| learning_rate | 0.0003 | -| loss | -0.0097 | -| n_updates | 82650 | -| policy_gradient_loss | -0.00789 | -| std | 0.0906 | -| value_loss | 1.49e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8267 | -| time_elapsed | 51012 | -| total_timesteps | 1058176 | -| train/ | | -| approx_kl | 0.0010968754 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 82660 | -| policy_gradient_loss | -0.0079 | -| std | 0.0906 | -| value_loss | 5.49e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8268 | -| time_elapsed | 51016 | -| total_timesteps | 1058304 | -| train/ | | -| approx_kl | 0.012374969 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -826 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 82670 | -| policy_gradient_loss | -0.00316 | -| std | 0.0906 | -| value_loss | 3.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8269 | -| time_elapsed | 51019 | -| total_timesteps | 1058432 | -| train/ | | -| approx_kl | 0.045791708 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -49.7 | -| learning_rate | 0.0003 | -| loss | 0.000576 | -| n_updates | 82680 | -| policy_gradient_loss | -0.0011 | -| std | 0.0906 | -| value_loss | 7.19e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8270 | -| time_elapsed | 51022 | -| total_timesteps | 1058560 | -| train/ | | -| approx_kl | 0.14004207 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -1.71e+03 | -| learning_rate | 0.0003 | -| loss | 0.00293 | -| n_updates | 82690 | -| policy_gradient_loss | -0.000989 | -| std | 0.0907 | -| value_loss | 4.82e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8271 | -| time_elapsed | 51026 | -| total_timesteps | 1058688 | -| train/ | | -| approx_kl | 0.14803295 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -1.94e+03 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 82700 | -| policy_gradient_loss | -0.00743 | -| std | 0.0907 | -| value_loss | 3.61e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8272 | -| time_elapsed | 51030 | -| total_timesteps | 1058816 | -| train/ | | -| approx_kl | 0.02994802 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | -12.3 | -| learning_rate | 0.0003 | -| loss | -0.00453 | -| n_updates | 82710 | -| policy_gradient_loss | -0.00306 | -| std | 0.0907 | -| value_loss | 6.41e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.8 | -| time/ | | -| fps | 20 | -| iterations | 8273 | -| time_elapsed | 51032 | -| total_timesteps | 1058944 | -| train/ | | -| approx_kl | 0.0011221725 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | 0.000659 | -| learning_rate | 0.0003 | -| loss | -0.000254 | -| n_updates | 82720 | -| policy_gradient_loss | 0.000446 | -| std | 0.0907 | -| value_loss | 1.44e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8274 | -| time_elapsed | 51034 | -| total_timesteps | 1059072 | -| train/ | | -| approx_kl | 0.011474148 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -0.00219 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 82730 | -| policy_gradient_loss | -0.0117 | -| std | 0.0907 | -| value_loss | 5.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8275 | -| time_elapsed | 51039 | -| total_timesteps | 1059200 | -| train/ | | -| approx_kl | 0.039451152 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | 0.7 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 82740 | -| policy_gradient_loss | -0.00432 | -| std | 0.0906 | -| value_loss | 0.00352 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8276 | -| time_elapsed | 51042 | -| total_timesteps | 1059328 | -| train/ | | -| approx_kl | 0.024444845 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -40.4 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 82750 | -| policy_gradient_loss | -0.0152 | -| std | 0.0905 | -| value_loss | 5.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8277 | -| time_elapsed | 51046 | -| total_timesteps | 1059456 | -| train/ | | -| approx_kl | 0.17441219 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | -19.9 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 82760 | -| policy_gradient_loss | -0.00584 | -| std | 0.0905 | -| value_loss | 7.17e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8278 | -| time_elapsed | 51049 | -| total_timesteps | 1059584 | -| train/ | | -| approx_kl | 0.0046352386 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 82770 | -| policy_gradient_loss | -0.0109 | -| std | 0.0905 | -| value_loss | 7.07e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8279 | -| time_elapsed | 51052 | -| total_timesteps | 1059712 | -| train/ | | -| approx_kl | 0.0010555359 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | -2.05 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 82780 | -| policy_gradient_loss | -0.0011 | -| std | 0.0905 | -| value_loss | 6.19e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8280 | -| time_elapsed | 51056 | -| total_timesteps | 1059840 | -| train/ | | -| approx_kl | 0.025009746 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -12.9 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 82790 | -| policy_gradient_loss | -0.00788 | -| std | 0.0905 | -| value_loss | 2.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.803 | -| time/ | | -| fps | 20 | -| iterations | 8281 | -| time_elapsed | 51059 | -| total_timesteps | 1059968 | -| train/ | | -| approx_kl | 0.001508534 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 82800 | -| policy_gradient_loss | -0.0047 | -| std | 0.0905 | -| value_loss | 3.1e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8282 | -| time_elapsed | 51062 | -| total_timesteps | 1060096 | -| train/ | | -| approx_kl | 0.0023794095 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | -0.0845 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 82810 | -| policy_gradient_loss | -0.00619 | -| std | 0.0904 | -| value_loss | 8.56e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8283 | -| time_elapsed | 51071 | -| total_timesteps | 1060224 | -| train/ | | -| approx_kl | 0.003558415 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 0.985 | -| explained_variance | 0.749 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 82820 | -| policy_gradient_loss | -0.00872 | -| std | 0.0903 | -| value_loss | 0.00342 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8284 | -| time_elapsed | 51075 | -| total_timesteps | 1060352 | -| train/ | | -| approx_kl | 0.016042158 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 0.985 | -| explained_variance | -45 | -| learning_rate | 0.0003 | -| loss | -0.000744 | -| n_updates | 82830 | -| policy_gradient_loss | -0.0004 | -| std | 0.0905 | -| value_loss | 1.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8285 | -| time_elapsed | 51079 | -| total_timesteps | 1060480 | -| train/ | | -| approx_kl | 0.055345573 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | -204 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 82840 | -| policy_gradient_loss | -0.000986 | -| std | 0.091 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8286 | -| time_elapsed | 51082 | -| total_timesteps | 1060608 | -| train/ | | -| approx_kl | 0.030239932 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 0.976 | -| explained_variance | -14.6 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 82850 | -| policy_gradient_loss | -0.00278 | -| std | 0.0913 | -| value_loss | 5.58e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8287 | -| time_elapsed | 51087 | -| total_timesteps | 1060736 | -| train/ | | -| approx_kl | 0.00016271835 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 0.974 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 82860 | -| policy_gradient_loss | 0.0031 | -| std | 0.0914 | -| value_loss | 1.04e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8288 | -| time_elapsed | 51091 | -| total_timesteps | 1060864 | -| train/ | | -| approx_kl | 0.020149373 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -0.00776 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 82870 | -| policy_gradient_loss | -0.000935 | -| std | 0.0916 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8289 | -| time_elapsed | 51094 | -| total_timesteps | 1060992 | -| train/ | | -| approx_kl | 0.0019782656 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -0.87 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 82880 | -| policy_gradient_loss | 0.000606 | -| std | 0.0916 | -| value_loss | 3.27e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8290 | -| time_elapsed | 51099 | -| total_timesteps | 1061120 | -| train/ | | -| approx_kl | 0.002024856 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 0.972 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 82890 | -| policy_gradient_loss | -0.00235 | -| std | 0.0915 | -| value_loss | 1.79e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8291 | -| time_elapsed | 51109 | -| total_timesteps | 1061248 | -| train/ | | -| approx_kl | 0.18028395 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 0.974 | -| explained_variance | 0.867 | -| learning_rate | 0.0003 | -| loss | -0.000848 | -| n_updates | 82900 | -| policy_gradient_loss | -0.000785 | -| std | 0.0912 | -| value_loss | 0.0014 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8292 | -| time_elapsed | 51113 | -| total_timesteps | 1061376 | -| train/ | | -| approx_kl | 0.11643692 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 0.977 | -| explained_variance | -970 | -| learning_rate | 0.0003 | -| loss | -0.00835 | -| n_updates | 82910 | -| policy_gradient_loss | -0.00691 | -| std | 0.091 | -| value_loss | 8.38e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8293 | -| time_elapsed | 51116 | -| total_timesteps | 1061504 | -| train/ | | -| approx_kl | 0.0060663945 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | -4.29e+03 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 82920 | -| policy_gradient_loss | -0.00105 | -| std | 0.0908 | -| value_loss | 3.29e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8294 | -| time_elapsed | 51121 | -| total_timesteps | 1061632 | -| train/ | | -| approx_kl | 0.0072045047 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 0.98 | -| explained_variance | -611 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 82930 | -| policy_gradient_loss | -0.0149 | -| std | 0.0907 | -| value_loss | 1.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8295 | -| time_elapsed | 51124 | -| total_timesteps | 1061760 | -| train/ | | -| approx_kl | 0.015395487 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | -3.54 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 82940 | -| policy_gradient_loss | 0.00113 | -| std | 0.0906 | -| value_loss | 3.11e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8296 | -| time_elapsed | 51126 | -| total_timesteps | 1061888 | -| train/ | | -| approx_kl | 2.9291958e-05 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -1.18e-05 | -| n_updates | 82950 | -| policy_gradient_loss | 0.0044 | -| std | 0.0907 | -| value_loss | 8.95e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8297 | -| time_elapsed | 51130 | -| total_timesteps | 1062016 | -| train/ | | -| approx_kl | 0.0054214057 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 82960 | -| policy_gradient_loss | -0.0123 | -| std | 0.0908 | -| value_loss | 1.06e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8298 | -| time_elapsed | 51139 | -| total_timesteps | 1062144 | -| train/ | | -| approx_kl | 0.022506367 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 0.98 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 82970 | -| policy_gradient_loss | -0.0134 | -| std | 0.0908 | -| value_loss | 0.000322 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8299 | -| time_elapsed | 51142 | -| total_timesteps | 1062272 | -| train/ | | -| approx_kl | 0.009666818 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 0.98 | -| explained_variance | -0.867 | -| learning_rate | 0.0003 | -| loss | -0.03 | -| n_updates | 82980 | -| policy_gradient_loss | -0.0247 | -| std | 0.0908 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8300 | -| time_elapsed | 51145 | -| total_timesteps | 1062400 | -| train/ | | -| approx_kl | 0.0024299668 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 0.98 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -0.00045 | -| n_updates | 82990 | -| policy_gradient_loss | -0.000401 | -| std | 0.091 | -| value_loss | 4.97e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8301 | -| time_elapsed | 51148 | -| total_timesteps | 1062528 | -| train/ | | -| approx_kl | 0.00625707 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 0.978 | -| explained_variance | -0.4 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 83000 | -| policy_gradient_loss | -0.0132 | -| std | 0.091 | -| value_loss | 3.03e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8302 | -| time_elapsed | 51151 | -| total_timesteps | 1062656 | -| train/ | | -| approx_kl | 0.0012011691 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.00734 | -| n_updates | 83010 | -| policy_gradient_loss | -0.00988 | -| std | 0.0908 | -| value_loss | 1.18e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8303 | -| time_elapsed | 51155 | -| total_timesteps | 1062784 | -| train/ | | -| approx_kl | 0.0022537126 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | 0.0062 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 83020 | -| policy_gradient_loss | -0.000748 | -| std | 0.0906 | -| value_loss | 1.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8304 | -| time_elapsed | 51158 | -| total_timesteps | 1062912 | -| train/ | | -| approx_kl | 0.0111559555 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | -343 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 83030 | -| policy_gradient_loss | -0.00183 | -| std | 0.0905 | -| value_loss | 4.68e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8305 | -| time_elapsed | 51162 | -| total_timesteps | 1063040 | -| train/ | | -| approx_kl | 0.0046544503 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 83040 | -| policy_gradient_loss | -0.0036 | -| std | 0.0905 | -| value_loss | 3.72e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8306 | -| time_elapsed | 51168 | -| total_timesteps | 1063168 | -| train/ | | -| approx_kl | 0.15749438 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.00766 | -| n_updates | 83050 | -| policy_gradient_loss | -0.0113 | -| std | 0.0905 | -| value_loss | 0.0018 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8307 | -| time_elapsed | 51171 | -| total_timesteps | 1063296 | -| train/ | | -| approx_kl | 0.07891529 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -1.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 83060 | -| policy_gradient_loss | -0.00139 | -| std | 0.0907 | -| value_loss | 1.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8308 | -| time_elapsed | 51174 | -| total_timesteps | 1063424 | -| train/ | | -| approx_kl | 0.026108434 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.98 | -| explained_variance | -1.73e+03 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 83070 | -| policy_gradient_loss | -0.00679 | -| std | 0.0909 | -| value_loss | 3.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8309 | -| time_elapsed | 51178 | -| total_timesteps | 1063552 | -| train/ | | -| approx_kl | 0.0076145115 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 0.979 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 83080 | -| policy_gradient_loss | -0.000463 | -| std | 0.0908 | -| value_loss | 4.14e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8310 | -| time_elapsed | 51182 | -| total_timesteps | 1063680 | -| train/ | | -| approx_kl | 0.007851327 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 0.98 | -| explained_variance | -4.51 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 83090 | -| policy_gradient_loss | -0.00198 | -| std | 0.0907 | -| value_loss | 3.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8311 | -| time_elapsed | 51185 | -| total_timesteps | 1063808 | -| train/ | | -| approx_kl | 0.012328326 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | -0.874 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 83100 | -| policy_gradient_loss | -0.00476 | -| std | 0.0907 | -| value_loss | 1.39e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8312 | -| time_elapsed | 51188 | -| total_timesteps | 1063936 | -| train/ | | -| approx_kl | 0.0023318673 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 83110 | -| policy_gradient_loss | -0.0056 | -| std | 0.0906 | -| value_loss | 6.38e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8313 | -| time_elapsed | 51191 | -| total_timesteps | 1064064 | -| train/ | | -| approx_kl | 0.0017659995 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | 0.000642 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 83120 | -| policy_gradient_loss | -8.5e-05 | -| std | 0.0906 | -| value_loss | 5.08e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8314 | -| time_elapsed | 51197 | -| total_timesteps | 1064192 | -| train/ | | -| approx_kl | 0.025717761 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.484 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 83130 | -| policy_gradient_loss | -0.00762 | -| std | 0.0906 | -| value_loss | 0.00296 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8315 | -| time_elapsed | 51201 | -| total_timesteps | 1064320 | -| train/ | | -| approx_kl | 0.00061497977 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -5.53e+03 | -| learning_rate | 0.0003 | -| loss | 0.00647 | -| n_updates | 83140 | -| policy_gradient_loss | -0.00949 | -| std | 0.0906 | -| value_loss | 1.29e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8316 | -| time_elapsed | 51204 | -| total_timesteps | 1064448 | -| train/ | | -| approx_kl | 0.029543007 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -106 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 83150 | -| policy_gradient_loss | -0.0125 | -| std | 0.0906 | -| value_loss | 5.94e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8317 | -| time_elapsed | 51207 | -| total_timesteps | 1064576 | -| train/ | | -| approx_kl | 0.0030086064 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -5.18 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 83160 | -| policy_gradient_loss | 0.00175 | -| std | 0.0905 | -| value_loss | 1.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8318 | -| time_elapsed | 51209 | -| total_timesteps | 1064704 | -| train/ | | -| approx_kl | 0.0107346745 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 83170 | -| policy_gradient_loss | -0.00107 | -| std | 0.0904 | -| value_loss | 1.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8319 | -| time_elapsed | 51213 | -| total_timesteps | 1064832 | -| train/ | | -| approx_kl | 0.024593048 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 0.984 | -| explained_variance | -0.00562 | -| learning_rate | 0.0003 | -| loss | 0.00572 | -| n_updates | 83180 | -| policy_gradient_loss | 0.00113 | -| std | 0.0904 | -| value_loss | 2.02e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 20 | -| iterations | 8320 | -| time_elapsed | 51217 | -| total_timesteps | 1064960 | -| train/ | | -| approx_kl | 0.0025797863 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | 0.00104 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 83190 | -| policy_gradient_loss | -0.00659 | -| std | 0.0906 | -| value_loss | 4.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8321 | -| time_elapsed | 51220 | -| total_timesteps | 1065088 | -| train/ | | -| approx_kl | 0.0015950762 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 83200 | -| policy_gradient_loss | -0.00149 | -| std | 0.0907 | -| value_loss | 3.98e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8322 | -| time_elapsed | 51228 | -| total_timesteps | 1065216 | -| train/ | | -| approx_kl | 0.013865961 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 0.981 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 83210 | -| policy_gradient_loss | -0.00675 | -| std | 0.0907 | -| value_loss | 0.00137 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8323 | -| time_elapsed | 51230 | -| total_timesteps | 1065344 | -| train/ | | -| approx_kl | 0.0064011947 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -9.19 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 83220 | -| policy_gradient_loss | -0.0132 | -| std | 0.0906 | -| value_loss | 4.06e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8324 | -| time_elapsed | 51233 | -| total_timesteps | 1065472 | -| train/ | | -| approx_kl | 0.09716693 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 83230 | -| policy_gradient_loss | -0.00378 | -| std | 0.0906 | -| value_loss | 1.39e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8325 | -| time_elapsed | 51236 | -| total_timesteps | 1065600 | -| train/ | | -| approx_kl | 0.0032792063 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -30.6 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 83240 | -| policy_gradient_loss | -0.0121 | -| std | 0.0906 | -| value_loss | 5.71e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8326 | -| time_elapsed | 51239 | -| total_timesteps | 1065728 | -| train/ | | -| approx_kl | 0.0073456313 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.42 | -| learning_rate | 0.0003 | -| loss | -0.00791 | -| n_updates | 83250 | -| policy_gradient_loss | -0.00602 | -| std | 0.0905 | -| value_loss | 1.29e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8327 | -| time_elapsed | 51242 | -| total_timesteps | 1065856 | -| train/ | | -| approx_kl | 0.020603037 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.0652 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 83260 | -| policy_gradient_loss | 0.00131 | -| std | 0.0905 | -| value_loss | 9.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.819 | -| time/ | | -| fps | 20 | -| iterations | 8328 | -| time_elapsed | 51245 | -| total_timesteps | 1065984 | -| train/ | | -| approx_kl | 0.030521285 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00295 | -| n_updates | 83270 | -| policy_gradient_loss | -0.000608 | -| std | 0.0906 | -| value_loss | 2.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8329 | -| time_elapsed | 51248 | -| total_timesteps | 1066112 | -| train/ | | -| approx_kl | 0.015274894 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -0.00076 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 83280 | -| policy_gradient_loss | -0.00276 | -| std | 0.0906 | -| value_loss | 1.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8330 | -| time_elapsed | 51257 | -| total_timesteps | 1066240 | -| train/ | | -| approx_kl | 0.059587464 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 83290 | -| policy_gradient_loss | -0.0103 | -| std | 0.0906 | -| value_loss | 8.8e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8331 | -| time_elapsed | 51260 | -| total_timesteps | 1066368 | -| train/ | | -| approx_kl | 0.0025780825 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -0.442 | -| learning_rate | 0.0003 | -| loss | -0.000612 | -| n_updates | 83300 | -| policy_gradient_loss | 0.00816 | -| std | 0.0907 | -| value_loss | 4.8e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8332 | -| time_elapsed | 51263 | -| total_timesteps | 1066496 | -| train/ | | -| approx_kl | 0.0005777846 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 0.982 | -| explained_variance | -4.76 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 83310 | -| policy_gradient_loss | -0.00398 | -| std | 0.0907 | -| value_loss | 0.000133 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8333 | -| time_elapsed | 51266 | -| total_timesteps | 1066624 | -| train/ | | -| approx_kl | 0.0036838627 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 0.983 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 83320 | -| policy_gradient_loss | -0.00124 | -| std | 0.0903 | -| value_loss | 0.00022 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8334 | -| time_elapsed | 51269 | -| total_timesteps | 1066752 | -| train/ | | -| approx_kl | 0.0005113841 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 0.988 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.000763 | -| n_updates | 83330 | -| policy_gradient_loss | -8.06e-05 | -| std | 0.0897 | -| value_loss | 0.000276 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 20 | -| iterations | 8335 | -| time_elapsed | 51273 | -| total_timesteps | 1066880 | -| train/ | | -| approx_kl | 0.010185247 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 0.994 | -| explained_variance | -2.84 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 83340 | -| policy_gradient_loss | -0.0064 | -| std | 0.0894 | -| value_loss | 0.00155 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8336 | -| time_elapsed | 51276 | -| total_timesteps | 1067008 | -| train/ | | -| approx_kl | 1.2226868e-05 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 0.997 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.000127 | -| n_updates | 83350 | -| policy_gradient_loss | 0.00142 | -| std | 0.0892 | -| value_loss | 0.000265 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8337 | -| time_elapsed | 51287 | -| total_timesteps | 1067136 | -| train/ | | -| approx_kl | 0.03776687 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 0.998 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 83360 | -| policy_gradient_loss | -0.015 | -| std | 0.0892 | -| value_loss | 0.00217 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8338 | -| time_elapsed | 51290 | -| total_timesteps | 1067264 | -| train/ | | -| approx_kl | 0.07333635 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 0.998 | -| explained_variance | 0.0661 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 83370 | -| policy_gradient_loss | -0.0129 | -| std | 0.0892 | -| value_loss | 0.00123 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8339 | -| time_elapsed | 51295 | -| total_timesteps | 1067392 | -| train/ | | -| approx_kl | 0.0037272372 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 0.998 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 83380 | -| policy_gradient_loss | -0.0104 | -| std | 0.0892 | -| value_loss | 0.000607 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8340 | -| time_elapsed | 51297 | -| total_timesteps | 1067520 | -| train/ | | -| approx_kl | 0.016641425 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 0.999 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | 3.32e-05 | -| n_updates | 83390 | -| policy_gradient_loss | 8.04e-05 | -| std | 0.0891 | -| value_loss | 0.000301 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8341 | -| time_elapsed | 51300 | -| total_timesteps | 1067648 | -| train/ | | -| approx_kl | 0.03918268 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 0.999 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.00736 | -| n_updates | 83400 | -| policy_gradient_loss | 7.93e-05 | -| std | 0.0891 | -| value_loss | 0.000184 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8342 | -| time_elapsed | 51302 | -| total_timesteps | 1067776 | -| train/ | | -| approx_kl | 0.0016442821 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 0.999 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | -0.00988 | -| n_updates | 83410 | -| policy_gradient_loss | -0.00653 | -| std | 0.0891 | -| value_loss | 0.000142 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 20 | -| iterations | 8343 | -| time_elapsed | 51306 | -| total_timesteps | 1067904 | -| train/ | | -| approx_kl | 0.001101065 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 0.999 | -| explained_variance | 0.00476 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 83420 | -| policy_gradient_loss | -0.00417 | -| std | 0.0891 | -| value_loss | 5.23e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8344 | -| time_elapsed | 51310 | -| total_timesteps | 1068032 | -| train/ | | -| approx_kl | 1.7988496e-06 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 0.999 | -| explained_variance | 0.00462 | -| learning_rate | 0.0003 | -| loss | 0.000141 | -| n_updates | 83430 | -| policy_gradient_loss | -0.0022 | -| std | 0.0891 | -| value_loss | 2.47e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8345 | -| time_elapsed | 51318 | -| total_timesteps | 1068160 | -| train/ | | -| approx_kl | 0.008686595 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1 | -| explained_variance | 0.629 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 83440 | -| policy_gradient_loss | -0.0125 | -| std | 0.089 | -| value_loss | 0.00117 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8346 | -| time_elapsed | 51322 | -| total_timesteps | 1068288 | -| train/ | | -| approx_kl | 0.0009643873 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 1 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 83450 | -| policy_gradient_loss | -0.00387 | -| std | 0.089 | -| value_loss | 0.000111 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8347 | -| time_elapsed | 51325 | -| total_timesteps | 1068416 | -| train/ | | -| approx_kl | 0.013928158 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.00699 | -| n_updates | 83460 | -| policy_gradient_loss | -0.00389 | -| std | 0.0889 | -| value_loss | 1.38e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8348 | -| time_elapsed | 51327 | -| total_timesteps | 1068544 | -| train/ | | -| approx_kl | 0.00019692117 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 1 | -| explained_variance | -0.0741 | -| learning_rate | 0.0003 | -| loss | 0.000159 | -| n_updates | 83470 | -| policy_gradient_loss | 0.00106 | -| std | 0.0888 | -| value_loss | 2.3e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8349 | -| time_elapsed | 51330 | -| total_timesteps | 1068672 | -| train/ | | -| approx_kl | 0.0067348145 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 1 | -| explained_variance | 0.00271 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 83480 | -| policy_gradient_loss | -0.0143 | -| std | 0.0886 | -| value_loss | 4.61e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8350 | -| time_elapsed | 51333 | -| total_timesteps | 1068800 | -| train/ | | -| approx_kl | 0.0045473534 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 83490 | -| policy_gradient_loss | -0.00148 | -| std | 0.0885 | -| value_loss | 2.26e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 20 | -| iterations | 8351 | -| time_elapsed | 51337 | -| total_timesteps | 1068928 | -| train/ | | -| approx_kl | 0.0007301937 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | 0.00419 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 83500 | -| policy_gradient_loss | -0.00158 | -| std | 0.0883 | -| value_loss | 3.82e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8352 | -| time_elapsed | 51339 | -| total_timesteps | 1069056 | -| train/ | | -| approx_kl | 0.002547285 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 83510 | -| policy_gradient_loss | -0.00444 | -| std | 0.0882 | -| value_loss | 8.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8353 | -| time_elapsed | 51345 | -| total_timesteps | 1069184 | -| train/ | | -| approx_kl | 0.01204161 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -0.8 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 83520 | -| policy_gradient_loss | -0.0117 | -| std | 0.0881 | -| value_loss | 0.00224 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8354 | -| time_elapsed | 51349 | -| total_timesteps | 1069312 | -| train/ | | -| approx_kl | 0.009213829 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -2.69 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 83530 | -| policy_gradient_loss | -0.00709 | -| std | 0.088 | -| value_loss | 1.76e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8355 | -| time_elapsed | 51352 | -| total_timesteps | 1069440 | -| train/ | | -| approx_kl | 0.018983057 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.00814 | -| n_updates | 83540 | -| policy_gradient_loss | -0.00349 | -| std | 0.088 | -| value_loss | 8.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8356 | -| time_elapsed | 51355 | -| total_timesteps | 1069568 | -| train/ | | -| approx_kl | 0.011235196 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 83550 | -| policy_gradient_loss | -0.00134 | -| std | 0.088 | -| value_loss | 4.79e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8357 | -| time_elapsed | 51359 | -| total_timesteps | 1069696 | -| train/ | | -| approx_kl | 0.02525835 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | 0.00173 | -| n_updates | 83560 | -| policy_gradient_loss | 0.013 | -| std | 0.088 | -| value_loss | 1.97e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8358 | -| time_elapsed | 51363 | -| total_timesteps | 1069824 | -| train/ | | -| approx_kl | 0.02319679 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -0.0794 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 83570 | -| policy_gradient_loss | -0.000758 | -| std | 0.088 | -| value_loss | 9.02e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 20 | -| iterations | 8359 | -| time_elapsed | 51367 | -| total_timesteps | 1069952 | -| train/ | | -| approx_kl | 2.9668678e-05 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | 0.000968 | -| learning_rate | 0.0003 | -| loss | -0.000287 | -| n_updates | 83580 | -| policy_gradient_loss | -0.00142 | -| std | 0.088 | -| value_loss | 3.23e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8360 | -| time_elapsed | 51370 | -| total_timesteps | 1070080 | -| train/ | | -| approx_kl | 0.0014832844 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | 0.00253 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 83590 | -| policy_gradient_loss | -0.000347 | -| std | 0.088 | -| value_loss | 3.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8361 | -| time_elapsed | 51377 | -| total_timesteps | 1070208 | -| train/ | | -| approx_kl | 0.010321911 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 83600 | -| policy_gradient_loss | -0.0124 | -| std | 0.088 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8362 | -| time_elapsed | 51381 | -| total_timesteps | 1070336 | -| train/ | | -| approx_kl | 0.0151279345 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -151 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 83610 | -| policy_gradient_loss | -0.0118 | -| std | 0.088 | -| value_loss | 2.03e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8363 | -| time_elapsed | 51385 | -| total_timesteps | 1070464 | -| train/ | | -| approx_kl | 0.0140714105 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -978 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 83620 | -| policy_gradient_loss | 0.000547 | -| std | 0.088 | -| value_loss | 1.56e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8364 | -| time_elapsed | 51389 | -| total_timesteps | 1070592 | -| train/ | | -| approx_kl | 0.10274153 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -126 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 83630 | -| policy_gradient_loss | -0.00531 | -| std | 0.088 | -| value_loss | 1.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8365 | -| time_elapsed | 51392 | -| total_timesteps | 1070720 | -| train/ | | -| approx_kl | 0.04965777 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -12.3 | -| learning_rate | 0.0003 | -| loss | -0.00817 | -| n_updates | 83640 | -| policy_gradient_loss | -0.00495 | -| std | 0.088 | -| value_loss | 1.08e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8366 | -| time_elapsed | 51396 | -| total_timesteps | 1070848 | -| train/ | | -| approx_kl | 0.058626816 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 83650 | -| policy_gradient_loss | -0.00448 | -| std | 0.0879 | -| value_loss | 1.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 20 | -| iterations | 8367 | -| time_elapsed | 51400 | -| total_timesteps | 1070976 | -| train/ | | -| approx_kl | 0.049839575 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 83660 | -| policy_gradient_loss | -0.0029 | -| std | 0.0879 | -| value_loss | 2.26e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8368 | -| time_elapsed | 51404 | -| total_timesteps | 1071104 | -| train/ | | -| approx_kl | 0.00066279806 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -0.95 | -| learning_rate | 0.0003 | -| loss | -0.00031 | -| n_updates | 83670 | -| policy_gradient_loss | 0.00118 | -| std | 0.088 | -| value_loss | 6.09e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8369 | -| time_elapsed | 51412 | -| total_timesteps | 1071232 | -| train/ | | -| approx_kl | 0.003638179 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | 0.727 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 83680 | -| policy_gradient_loss | -0.0115 | -| std | 0.0881 | -| value_loss | 0.000871 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8370 | -| time_elapsed | 51415 | -| total_timesteps | 1071360 | -| train/ | | -| approx_kl | 0.007985892 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -88.3 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 83690 | -| policy_gradient_loss | -0.000418 | -| std | 0.0881 | -| value_loss | 1.57e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8371 | -| time_elapsed | 51418 | -| total_timesteps | 1071488 | -| train/ | | -| approx_kl | 0.0004968513 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | -0.000831 | -| n_updates | 83700 | -| policy_gradient_loss | 4.62e-06 | -| std | 0.0879 | -| value_loss | 8.79e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8372 | -| time_elapsed | 51420 | -| total_timesteps | 1071616 | -| train/ | | -| approx_kl | 0.0055905627 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1.01 | -| explained_variance | -2.68 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 83710 | -| policy_gradient_loss | 0.000346 | -| std | 0.0876 | -| value_loss | 3.03e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8373 | -| time_elapsed | 51423 | -| total_timesteps | 1071744 | -| train/ | | -| approx_kl | 0.0049921297 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.02 | -| explained_variance | -0.0712 | -| learning_rate | 0.0003 | -| loss | -0.0238 | -| n_updates | 83720 | -| policy_gradient_loss | -0.022 | -| std | 0.0875 | -| value_loss | 1.2e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 20 | -| iterations | 8374 | -| time_elapsed | 51426 | -| total_timesteps | 1071872 | -| train/ | | -| approx_kl | 0.012045974 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 1.02 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 83730 | -| policy_gradient_loss | -0.00696 | -| std | 0.0874 | -| value_loss | 1.26e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8375 | -| time_elapsed | 51429 | -| total_timesteps | 1072000 | -| train/ | | -| approx_kl | 0.00010883622 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.02 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.000305 | -| n_updates | 83740 | -| policy_gradient_loss | 0.000141 | -| std | 0.0874 | -| value_loss | 1.35e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8376 | -| time_elapsed | 51433 | -| total_timesteps | 1072128 | -| train/ | | -| approx_kl | 0.0051634153 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.02 | -| explained_variance | -0.00217 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 83750 | -| policy_gradient_loss | -0.000671 | -| std | 0.0874 | -| value_loss | 3.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8377 | -| time_elapsed | 51440 | -| total_timesteps | 1072256 | -| train/ | | -| approx_kl | 0.021257278 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.02 | -| explained_variance | -7.57 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 83760 | -| policy_gradient_loss | -0.0126 | -| std | 0.0873 | -| value_loss | 0.00355 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8378 | -| time_elapsed | 51443 | -| total_timesteps | 1072384 | -| train/ | | -| approx_kl | 0.0003606435 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 1.02 | -| explained_variance | -64.1 | -| learning_rate | 0.0003 | -| loss | -0.000474 | -| n_updates | 83770 | -| policy_gradient_loss | -0.000182 | -| std | 0.087 | -| value_loss | 1.72e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8379 | -| time_elapsed | 51447 | -| total_timesteps | 1072512 | -| train/ | | -| approx_kl | 0.0067016645 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 1.03 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 83780 | -| policy_gradient_loss | -0.00757 | -| std | 0.0866 | -| value_loss | 1.1e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8380 | -| time_elapsed | 51449 | -| total_timesteps | 1072640 | -| train/ | | -| approx_kl | 0.0018182192 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.03 | -| explained_variance | -16.3 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 83790 | -| policy_gradient_loss | -0.00151 | -| std | 0.0865 | -| value_loss | 6.31e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8381 | -| time_elapsed | 51455 | -| total_timesteps | 1072768 | -| train/ | | -| approx_kl | 0.0017014388 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 1.03 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 83800 | -| policy_gradient_loss | -0.000734 | -| std | 0.0858 | -| value_loss | 1.1e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8382 | -| time_elapsed | 51459 | -| total_timesteps | 1072896 | -| train/ | | -| approx_kl | 0.0011150711 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 1.04 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 83810 | -| policy_gradient_loss | -0.00439 | -| std | 0.0852 | -| value_loss | 2.49e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8383 | -| time_elapsed | 51462 | -| total_timesteps | 1073024 | -| train/ | | -| approx_kl | 0.0117535135 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.04 | -| explained_variance | -0.00855 | -| learning_rate | 0.0003 | -| loss | -7.07e-05 | -| n_updates | 83820 | -| policy_gradient_loss | 0.00076 | -| std | 0.0851 | -| value_loss | 7.31e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8384 | -| time_elapsed | 51469 | -| total_timesteps | 1073152 | -| train/ | | -| approx_kl | 0.003838712 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 83830 | -| policy_gradient_loss | -0.0119 | -| std | 0.085 | -| value_loss | 0.000226 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8385 | -| time_elapsed | 51473 | -| total_timesteps | 1073280 | -| train/ | | -| approx_kl | 0.053135738 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -8.56 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 83840 | -| policy_gradient_loss | -0.00772 | -| std | 0.085 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8386 | -| time_elapsed | 51476 | -| total_timesteps | 1073408 | -| train/ | | -| approx_kl | 0.055493515 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -44.5 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 83850 | -| policy_gradient_loss | -0.00754 | -| std | 0.085 | -| value_loss | 9.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8387 | -| time_elapsed | 51479 | -| total_timesteps | 1073536 | -| train/ | | -| approx_kl | 0.04860879 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -15.8 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 83860 | -| policy_gradient_loss | -0.0112 | -| std | 0.085 | -| value_loss | 8.61e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8388 | -| time_elapsed | 51481 | -| total_timesteps | 1073664 | -| train/ | | -| approx_kl | 0.009388007 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 83870 | -| policy_gradient_loss | 0.00786 | -| std | 0.0851 | -| value_loss | 6.47e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8389 | -| time_elapsed | 51483 | -| total_timesteps | 1073792 | -| train/ | | -| approx_kl | 0.048756063 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 1.04 | -| explained_variance | -0.606 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 83880 | -| policy_gradient_loss | -0.0112 | -| std | 0.0852 | -| value_loss | 9.58e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.818 | -| time/ | | -| fps | 20 | -| iterations | 8390 | -| time_elapsed | 51487 | -| total_timesteps | 1073920 | -| train/ | | -| approx_kl | 2.2095628e-06 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.04 | -| explained_variance | -0.0981 | -| learning_rate | 0.0003 | -| loss | -4.42e-05 | -| n_updates | 83890 | -| policy_gradient_loss | -0.000384 | -| std | 0.0852 | -| value_loss | 4.83e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8391 | -| time_elapsed | 51491 | -| total_timesteps | 1074048 | -| train/ | | -| approx_kl | 0.0011962657 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 1.04 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.000712 | -| n_updates | 83900 | -| policy_gradient_loss | -0.000188 | -| std | 0.0852 | -| value_loss | 5.32e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8392 | -| time_elapsed | 51497 | -| total_timesteps | 1074176 | -| train/ | | -| approx_kl | 0.0026368639 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.04 | -| explained_variance | -3.13 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 83910 | -| policy_gradient_loss | -0.0123 | -| std | 0.0851 | -| value_loss | 0.00213 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8393 | -| time_elapsed | 51502 | -| total_timesteps | 1074304 | -| train/ | | -| approx_kl | 0.023905542 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -124 | -| learning_rate | 0.0003 | -| loss | -0.00892 | -| n_updates | 83920 | -| policy_gradient_loss | -0.00669 | -| std | 0.085 | -| value_loss | 2.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8394 | -| time_elapsed | 51506 | -| total_timesteps | 1074432 | -| train/ | | -| approx_kl | 0.018787257 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -215 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 83930 | -| policy_gradient_loss | -0.00573 | -| std | 0.0849 | -| value_loss | 5.01e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8395 | -| time_elapsed | 51509 | -| total_timesteps | 1074560 | -| train/ | | -| approx_kl | 0.0009834496 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -142 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 83940 | -| policy_gradient_loss | -0.0119 | -| std | 0.0849 | -| value_loss | 1.55e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8396 | -| time_elapsed | 51513 | -| total_timesteps | 1074688 | -| train/ | | -| approx_kl | 0.00080728857 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -1.57 | -| learning_rate | 0.0003 | -| loss | -0.000516 | -| n_updates | 83950 | -| policy_gradient_loss | 4.68e-05 | -| std | 0.0848 | -| value_loss | 5.86e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8397 | -| time_elapsed | 51517 | -| total_timesteps | 1074816 | -| train/ | | -| approx_kl | 0.0108197965 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 83960 | -| policy_gradient_loss | -0.00898 | -| std | 0.0846 | -| value_loss | 2.1e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8398 | -| time_elapsed | 51521 | -| total_timesteps | 1074944 | -| train/ | | -| approx_kl | 0.009981656 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -6.42 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 83970 | -| policy_gradient_loss | -0.00559 | -| std | 0.0845 | -| value_loss | 0.00014 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8399 | -| time_elapsed | 51524 | -| total_timesteps | 1075072 | -| train/ | | -| approx_kl | 0.019271966 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 83980 | -| policy_gradient_loss | -0.00213 | -| std | 0.0845 | -| value_loss | 8.5e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8400 | -| time_elapsed | 51530 | -| total_timesteps | 1075200 | -| train/ | | -| approx_kl | 0.005794045 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | 0.0704 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 83990 | -| policy_gradient_loss | -0.0075 | -| std | 0.0845 | -| value_loss | 0.000851 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8401 | -| time_elapsed | 51533 | -| total_timesteps | 1075328 | -| train/ | | -| approx_kl | 0.009427873 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | 0.000819 | -| n_updates | 84000 | -| policy_gradient_loss | 0.000474 | -| std | 0.0845 | -| value_loss | 2.37e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8402 | -| time_elapsed | 51537 | -| total_timesteps | 1075456 | -| train/ | | -| approx_kl | 0.00011498947 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.000875 | -| n_updates | 84010 | -| policy_gradient_loss | -0.000376 | -| std | 0.084 | -| value_loss | 1.67e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8403 | -| time_elapsed | 51541 | -| total_timesteps | 1075584 | -| train/ | | -| approx_kl | 3.545964e-05 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0881 | -| learning_rate | 0.0003 | -| loss | 8.25e-06 | -| n_updates | 84020 | -| policy_gradient_loss | 0.00147 | -| std | 0.0836 | -| value_loss | 2.96e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8404 | -| time_elapsed | 51544 | -| total_timesteps | 1075712 | -| train/ | | -| approx_kl | 0.0032958328 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | 0.000186 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 84030 | -| policy_gradient_loss | -0.0104 | -| std | 0.0835 | -| value_loss | 9.01e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8405 | -| time_elapsed | 51547 | -| total_timesteps | 1075840 | -| train/ | | -| approx_kl | 0.0003134911 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | -0.000328 | -| n_updates | 84040 | -| policy_gradient_loss | 0.00155 | -| std | 0.0835 | -| value_loss | 7.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8406 | -| time_elapsed | 51550 | -| total_timesteps | 1075968 | -| train/ | | -| approx_kl | 0.002971741 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | 0.00373 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 84050 | -| policy_gradient_loss | -0.00073 | -| std | 0.0835 | -| value_loss | 6.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8407 | -| time_elapsed | 51555 | -| total_timesteps | 1076096 | -| train/ | | -| approx_kl | 0.011451691 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0737 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 84060 | -| policy_gradient_loss | 0.00228 | -| std | 0.0834 | -| value_loss | 9.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8408 | -| time_elapsed | 51562 | -| total_timesteps | 1076224 | -| train/ | | -| approx_kl | 0.018501598 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 84070 | -| policy_gradient_loss | -0.0136 | -| std | 0.0834 | -| value_loss | 0.000513 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8409 | -| time_elapsed | 51565 | -| total_timesteps | 1076352 | -| train/ | | -| approx_kl | 0.043167867 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -3.56 | -| learning_rate | 0.0003 | -| loss | 0.00264 | -| n_updates | 84080 | -| policy_gradient_loss | -0.00022 | -| std | 0.0834 | -| value_loss | 1.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8410 | -| time_elapsed | 51569 | -| total_timesteps | 1076480 | -| train/ | | -| approx_kl | 0.026370857 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -9.55 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 84090 | -| policy_gradient_loss | -0.00272 | -| std | 0.0835 | -| value_loss | 8.42e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8411 | -| time_elapsed | 51573 | -| total_timesteps | 1076608 | -| train/ | | -| approx_kl | 0.0053106626 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 84100 | -| policy_gradient_loss | 0.00399 | -| std | 0.0837 | -| value_loss | 1.7e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8412 | -| time_elapsed | 51576 | -| total_timesteps | 1076736 | -| train/ | | -| approx_kl | 0.0056329933 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 84110 | -| policy_gradient_loss | 0.000668 | -| std | 0.0836 | -| value_loss | 8.1e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8413 | -| time_elapsed | 51580 | -| total_timesteps | 1076864 | -| train/ | | -| approx_kl | 0.0069388184 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | 0.0039 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 84120 | -| policy_gradient_loss | -0.0109 | -| std | 0.0835 | -| value_loss | 1.5e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.811 | -| time/ | | -| fps | 20 | -| iterations | 8414 | -| time_elapsed | 51583 | -| total_timesteps | 1076992 | -| train/ | | -| approx_kl | 0.01110053 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.00699 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 84130 | -| policy_gradient_loss | -0.00186 | -| std | 0.0833 | -| value_loss | 4.51e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8415 | -| time_elapsed | 51586 | -| total_timesteps | 1077120 | -| train/ | | -| approx_kl | 0.0024324805 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.00223 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 84140 | -| policy_gradient_loss | -0.00668 | -| std | 0.0832 | -| value_loss | 2.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8416 | -| time_elapsed | 51595 | -| total_timesteps | 1077248 | -| train/ | | -| approx_kl | 0.019943433 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.423 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 84150 | -| policy_gradient_loss | -0.0159 | -| std | 0.0831 | -| value_loss | 0.000989 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8417 | -| time_elapsed | 51597 | -| total_timesteps | 1077376 | -| train/ | | -| approx_kl | 0.00067530666 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -297 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 84160 | -| policy_gradient_loss | -0.00264 | -| std | 0.083 | -| value_loss | 4.17e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8418 | -| time_elapsed | 51601 | -| total_timesteps | 1077504 | -| train/ | | -| approx_kl | 0.050079197 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -15.5 | -| learning_rate | 0.0003 | -| loss | -0.00718 | -| n_updates | 84170 | -| policy_gradient_loss | -0.00562 | -| std | 0.0828 | -| value_loss | 4.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8419 | -| time_elapsed | 51604 | -| total_timesteps | 1077632 | -| train/ | | -| approx_kl | 0.008828914 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -6.33 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 84180 | -| policy_gradient_loss | -0.0152 | -| std | 0.0829 | -| value_loss | 2.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8420 | -| time_elapsed | 51607 | -| total_timesteps | 1077760 | -| train/ | | -| approx_kl | 0.01676181 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 84190 | -| policy_gradient_loss | -0.00181 | -| std | 0.0829 | -| value_loss | 4.5e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 20 | -| iterations | 8421 | -| time_elapsed | 51610 | -| total_timesteps | 1077888 | -| train/ | | -| approx_kl | 0.0035558958 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | -0.000423 | -| n_updates | 84200 | -| policy_gradient_loss | 5.87e-05 | -| std | 0.0831 | -| value_loss | 7.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8422 | -| time_elapsed | 51614 | -| total_timesteps | 1078016 | -| train/ | | -| approx_kl | 0.010077253 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.0815 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 84210 | -| policy_gradient_loss | 0.000367 | -| std | 0.0833 | -| value_loss | 2.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8423 | -| time_elapsed | 51622 | -| total_timesteps | 1078144 | -| train/ | | -| approx_kl | 0.011687269 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | 0.687 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 84220 | -| policy_gradient_loss | -0.00975 | -| std | 0.0833 | -| value_loss | 0.00406 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8424 | -| time_elapsed | 51625 | -| total_timesteps | 1078272 | -| train/ | | -| approx_kl | 0.0692756 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -65.6 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 84230 | -| policy_gradient_loss | -0.00158 | -| std | 0.0834 | -| value_loss | 1.56e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8425 | -| time_elapsed | 51628 | -| total_timesteps | 1078400 | -| train/ | | -| approx_kl | 0.016702544 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -1.57e+03 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 84240 | -| policy_gradient_loss | -0.00143 | -| std | 0.0835 | -| value_loss | 1.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8426 | -| time_elapsed | 51631 | -| total_timesteps | 1078528 | -| train/ | | -| approx_kl | 0.005581429 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -481 | -| learning_rate | 0.0003 | -| loss | -0.000498 | -| n_updates | 84250 | -| policy_gradient_loss | -0.000326 | -| std | 0.0837 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8427 | -| time_elapsed | 51634 | -| total_timesteps | 1078656 | -| train/ | | -| approx_kl | 0.0062371935 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -29.7 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 84260 | -| policy_gradient_loss | -0.0102 | -| std | 0.0839 | -| value_loss | 9.18e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8428 | -| time_elapsed | 51637 | -| total_timesteps | 1078784 | -| train/ | | -| approx_kl | 0.0004538754 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.75 | -| learning_rate | 0.0003 | -| loss | -0.000289 | -| n_updates | 84270 | -| policy_gradient_loss | 0.000196 | -| std | 0.0842 | -| value_loss | 3.39e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.808 | -| time/ | | -| fps | 20 | -| iterations | 8429 | -| time_elapsed | 51641 | -| total_timesteps | 1078912 | -| train/ | | -| approx_kl | 0.0045857276 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 84280 | -| policy_gradient_loss | -0.000709 | -| std | 0.0843 | -| value_loss | 1.81e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8430 | -| time_elapsed | 51644 | -| total_timesteps | 1079040 | -| train/ | | -| approx_kl | 0.0076667266 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | 0.00398 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 84290 | -| policy_gradient_loss | -0.0033 | -| std | 0.0842 | -| value_loss | 2.74e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8431 | -| time_elapsed | 51653 | -| total_timesteps | 1079168 | -| train/ | | -| approx_kl | 0.09440142 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | 0.609 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 84300 | -| policy_gradient_loss | -0.0103 | -| std | 0.0842 | -| value_loss | 0.000515 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8432 | -| time_elapsed | 51656 | -| total_timesteps | 1079296 | -| train/ | | -| approx_kl | 0.00036183465 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -53.2 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 84310 | -| policy_gradient_loss | -0.0124 | -| std | 0.0842 | -| value_loss | 7.26e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8433 | -| time_elapsed | 51660 | -| total_timesteps | 1079424 | -| train/ | | -| approx_kl | 1.8835533e-05 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -163 | -| learning_rate | 0.0003 | -| loss | -0.000236 | -| n_updates | 84320 | -| policy_gradient_loss | -8.21e-05 | -| std | 0.0839 | -| value_loss | 2.9e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8434 | -| time_elapsed | 51664 | -| total_timesteps | 1079552 | -| train/ | | -| approx_kl | 0.004379759 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -16.7 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 84330 | -| policy_gradient_loss | -0.0111 | -| std | 0.0837 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8435 | -| time_elapsed | 51667 | -| total_timesteps | 1079680 | -| train/ | | -| approx_kl | 0.004911372 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -9.93 | -| learning_rate | 0.0003 | -| loss | -0.00978 | -| n_updates | 84340 | -| policy_gradient_loss | -0.00657 | -| std | 0.0837 | -| value_loss | 3.58e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8436 | -| time_elapsed | 51671 | -| total_timesteps | 1079808 | -| train/ | | -| approx_kl | 0.0010921573 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.851 | -| learning_rate | 0.0003 | -| loss | -0.000446 | -| n_updates | 84350 | -| policy_gradient_loss | -0.000367 | -| std | 0.0837 | -| value_loss | 2.59e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8437 | -| time_elapsed | 51673 | -| total_timesteps | 1079936 | -| train/ | | -| approx_kl | 0.013846586 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.00687 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 84360 | -| policy_gradient_loss | -0.00485 | -| std | 0.0837 | -| value_loss | 4.06e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8438 | -| time_elapsed | 51676 | -| total_timesteps | 1080064 | -| train/ | | -| approx_kl | 0.0068727164 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.000729 | -| n_updates | 84370 | -| policy_gradient_loss | 0.00074 | -| std | 0.0837 | -| value_loss | 1.8e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8439 | -| time_elapsed | 51680 | -| total_timesteps | 1080192 | -| train/ | | -| approx_kl | 0.02317356 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | 0.698 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 84380 | -| policy_gradient_loss | -0.012 | -| std | 0.0837 | -| value_loss | 0.00452 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8440 | -| time_elapsed | 51685 | -| total_timesteps | 1080320 | -| train/ | | -| approx_kl | 0.0029635727 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -80.9 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 84390 | -| policy_gradient_loss | -0.0123 | -| std | 0.0837 | -| value_loss | 4.18e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8441 | -| time_elapsed | 51689 | -| total_timesteps | 1080448 | -| train/ | | -| approx_kl | 0.26486763 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -5.46e+03 | -| learning_rate | 0.0003 | -| loss | -0.000928 | -| n_updates | 84400 | -| policy_gradient_loss | -0.00368 | -| std | 0.0838 | -| value_loss | 2.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8442 | -| time_elapsed | 51692 | -| total_timesteps | 1080576 | -| train/ | | -| approx_kl | 0.124579966 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -1.09e+03 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 84410 | -| policy_gradient_loss | -0.0103 | -| std | 0.0838 | -| value_loss | 2.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8443 | -| time_elapsed | 51695 | -| total_timesteps | 1080704 | -| train/ | | -| approx_kl | 0.061421696 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 84420 | -| policy_gradient_loss | -0.00202 | -| std | 0.0839 | -| value_loss | 1.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8444 | -| time_elapsed | 51698 | -| total_timesteps | 1080832 | -| train/ | | -| approx_kl | 0.02423473 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -8.56 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 84430 | -| policy_gradient_loss | -0.00204 | -| std | 0.0841 | -| value_loss | 7.42e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.804 | -| time/ | | -| fps | 20 | -| iterations | 8445 | -| time_elapsed | 51701 | -| total_timesteps | 1080960 | -| train/ | | -| approx_kl | 0.008002963 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 84440 | -| policy_gradient_loss | -0.0015 | -| std | 0.0843 | -| value_loss | 4.59e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8446 | -| time_elapsed | 51704 | -| total_timesteps | 1081088 | -| train/ | | -| approx_kl | 0.0013646367 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 84450 | -| policy_gradient_loss | 0.00419 | -| std | 0.0844 | -| value_loss | 3.99e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8447 | -| time_elapsed | 51711 | -| total_timesteps | 1081216 | -| train/ | | -| approx_kl | 0.012292605 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -8.51 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 84460 | -| policy_gradient_loss | -0.0104 | -| std | 0.0844 | -| value_loss | 0.00261 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8448 | -| time_elapsed | 51714 | -| total_timesteps | 1081344 | -| train/ | | -| approx_kl | 0.11186673 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -33 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 84470 | -| policy_gradient_loss | -0.00954 | -| std | 0.0844 | -| value_loss | 3.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8449 | -| time_elapsed | 51717 | -| total_timesteps | 1081472 | -| train/ | | -| approx_kl | 0.04989908 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -134 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 84480 | -| policy_gradient_loss | -0.0165 | -| std | 0.0844 | -| value_loss | 1.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8450 | -| time_elapsed | 51719 | -| total_timesteps | 1081600 | -| train/ | | -| approx_kl | 0.017141415 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 1.05 | -| explained_variance | -796 | -| learning_rate | 0.0003 | -| loss | -0.000692 | -| n_updates | 84490 | -| policy_gradient_loss | -0.000119 | -| std | 0.0843 | -| value_loss | 3.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8451 | -| time_elapsed | 51723 | -| total_timesteps | 1081728 | -| train/ | | -| approx_kl | 0.005482232 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -25.3 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 84500 | -| policy_gradient_loss | -0.00214 | -| std | 0.0841 | -| value_loss | 1.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8452 | -| time_elapsed | 51726 | -| total_timesteps | 1081856 | -| train/ | | -| approx_kl | 0.019477073 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.75 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 84510 | -| policy_gradient_loss | -0.000768 | -| std | 0.084 | -| value_loss | 1.16e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.81 | -| time/ | | -| fps | 20 | -| iterations | 8453 | -| time_elapsed | 51730 | -| total_timesteps | 1081984 | -| train/ | | -| approx_kl | 0.00040533347 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 84520 | -| policy_gradient_loss | 0.00423 | -| std | 0.0839 | -| value_loss | 8.54e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8454 | -| time_elapsed | 51733 | -| total_timesteps | 1082112 | -| train/ | | -| approx_kl | 0.0077783274 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -0.0051 | -| learning_rate | 0.0003 | -| loss | -0.000739 | -| n_updates | 84530 | -| policy_gradient_loss | 0.000663 | -| std | 0.0838 | -| value_loss | 9.9e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8455 | -| time_elapsed | 51739 | -| total_timesteps | 1082240 | -| train/ | | -| approx_kl | 0.004997322 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -1.64 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 84540 | -| policy_gradient_loss | -0.0121 | -| std | 0.0837 | -| value_loss | 0.0015 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8456 | -| time_elapsed | 51741 | -| total_timesteps | 1082368 | -| train/ | | -| approx_kl | 0.006319737 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -80.5 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 84550 | -| policy_gradient_loss | -0.00155 | -| std | 0.0835 | -| value_loss | 5.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8457 | -| time_elapsed | 51744 | -| total_timesteps | 1082496 | -| train/ | | -| approx_kl | 0.01145138 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 1.06 | -| explained_variance | -1.77e+03 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 84560 | -| policy_gradient_loss | 0.000516 | -| std | 0.0834 | -| value_loss | 3.79e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8458 | -| time_elapsed | 51747 | -| total_timesteps | 1082624 | -| train/ | | -| approx_kl | 0.09591443 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -129 | -| learning_rate | 0.0003 | -| loss | 0.00838 | -| n_updates | 84570 | -| policy_gradient_loss | 0.00573 | -| std | 0.0833 | -| value_loss | 3.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8459 | -| time_elapsed | 51750 | -| total_timesteps | 1082752 | -| train/ | | -| approx_kl | 0.029805604 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | 0.000416 | -| n_updates | 84580 | -| policy_gradient_loss | -0.000187 | -| std | 0.0832 | -| value_loss | 4.59e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8460 | -| time_elapsed | 51753 | -| total_timesteps | 1082880 | -| train/ | | -| approx_kl | 0.0047632963 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 84590 | -| policy_gradient_loss | -0.00348 | -| std | 0.0832 | -| value_loss | 1.79e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8461 | -| time_elapsed | 51755 | -| total_timesteps | 1083008 | -| train/ | | -| approx_kl | 4.0675048e-05 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.364 | -| learning_rate | 0.0003 | -| loss | -0.000378 | -| n_updates | 84600 | -| policy_gradient_loss | -0.00109 | -| std | 0.0832 | -| value_loss | 7.9e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8462 | -| time_elapsed | 51764 | -| total_timesteps | 1083136 | -| train/ | | -| approx_kl | 0.0016158833 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 84610 | -| policy_gradient_loss | -0.0108 | -| std | 0.0831 | -| value_loss | 0.00152 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8463 | -| time_elapsed | 51766 | -| total_timesteps | 1083264 | -| train/ | | -| approx_kl | 0.040220965 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -35 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 84620 | -| policy_gradient_loss | -0.0127 | -| std | 0.0831 | -| value_loss | 5.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8464 | -| time_elapsed | 51769 | -| total_timesteps | 1083392 | -| train/ | | -| approx_kl | 0.004499528 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -6.5e+03 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 84630 | -| policy_gradient_loss | 7.81e-05 | -| std | 0.0831 | -| value_loss | 5.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8465 | -| time_elapsed | 51772 | -| total_timesteps | 1083520 | -| train/ | | -| approx_kl | 0.048794318 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -7.45e+03 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 84640 | -| policy_gradient_loss | -0.0126 | -| std | 0.0831 | -| value_loss | 3.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8466 | -| time_elapsed | 51774 | -| total_timesteps | 1083648 | -| train/ | | -| approx_kl | 0.049867947 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 84650 | -| policy_gradient_loss | -0.00131 | -| std | 0.0831 | -| value_loss | 8.73e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8467 | -| time_elapsed | 51777 | -| total_timesteps | 1083776 | -| train/ | | -| approx_kl | 0.025904264 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 84660 | -| policy_gradient_loss | -0.00608 | -| std | 0.0832 | -| value_loss | 1.11e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.805 | -| time/ | | -| fps | 20 | -| iterations | 8468 | -| time_elapsed | 51779 | -| total_timesteps | 1083904 | -| train/ | | -| approx_kl | 0.018647673 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.00605 | -| n_updates | 84670 | -| policy_gradient_loss | 0.00197 | -| std | 0.0832 | -| value_loss | 4.89e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8469 | -| time_elapsed | 51781 | -| total_timesteps | 1084032 | -| train/ | | -| approx_kl | 0.015296172 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 84680 | -| policy_gradient_loss | -0.00668 | -| std | 0.0832 | -| value_loss | 7.12e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8470 | -| time_elapsed | 51789 | -| total_timesteps | 1084160 | -| train/ | | -| approx_kl | 0.016829766 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 84690 | -| policy_gradient_loss | -0.0102 | -| std | 0.0833 | -| value_loss | 0.000595 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8471 | -| time_elapsed | 51793 | -| total_timesteps | 1084288 | -| train/ | | -| approx_kl | 0.03341244 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -65.5 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 84700 | -| policy_gradient_loss | -0.00591 | -| std | 0.0833 | -| value_loss | 2.71e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8472 | -| time_elapsed | 51797 | -| total_timesteps | 1084416 | -| train/ | | -| approx_kl | 0.00072759483 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -76.9 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 84710 | -| policy_gradient_loss | 0.00266 | -| std | 0.0831 | -| value_loss | 1.41e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8473 | -| time_elapsed | 51801 | -| total_timesteps | 1084544 | -| train/ | | -| approx_kl | 0.007521515 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 84720 | -| policy_gradient_loss | -0.0115 | -| std | 0.0829 | -| value_loss | 5.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8474 | -| time_elapsed | 51805 | -| total_timesteps | 1084672 | -| train/ | | -| approx_kl | 0.010907181 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 84730 | -| policy_gradient_loss | -0.01 | -| std | 0.0828 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8475 | -| time_elapsed | 51809 | -| total_timesteps | 1084800 | -| train/ | | -| approx_kl | 0.022164926 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | 0.00741 | -| n_updates | 84740 | -| policy_gradient_loss | 0.00468 | -| std | 0.0828 | -| value_loss | 5.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.807 | -| time/ | | -| fps | 20 | -| iterations | 8476 | -| time_elapsed | 51812 | -| total_timesteps | 1084928 | -| train/ | | -| approx_kl | 0.00557567 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00646 | -| n_updates | 84750 | -| policy_gradient_loss | -0.00255 | -| std | 0.0828 | -| value_loss | 9.71e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8477 | -| time_elapsed | 51816 | -| total_timesteps | 1085056 | -| train/ | | -| approx_kl | 0.0005746139 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 84760 | -| policy_gradient_loss | 0.000845 | -| std | 0.0828 | -| value_loss | 3.83e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8478 | -| time_elapsed | 51823 | -| total_timesteps | 1085184 | -| train/ | | -| approx_kl | 0.02981212 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 84770 | -| policy_gradient_loss | -0.00168 | -| std | 0.0826 | -| value_loss | 0.00054 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8479 | -| time_elapsed | 51828 | -| total_timesteps | 1085312 | -| train/ | | -| approx_kl | 0.15783001 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | 0.000274 | -| n_updates | 84780 | -| policy_gradient_loss | -0.00182 | -| std | 0.0826 | -| value_loss | 7.75e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8480 | -| time_elapsed | 51831 | -| total_timesteps | 1085440 | -| train/ | | -| approx_kl | 0.0010105227 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 84790 | -| policy_gradient_loss | -0.0124 | -| std | 0.0825 | -| value_loss | 3.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8481 | -| time_elapsed | 51833 | -| total_timesteps | 1085568 | -| train/ | | -| approx_kl | 0.0021078251 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -12.7 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 84800 | -| policy_gradient_loss | -0.008 | -| std | 0.0825 | -| value_loss | 9.61e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8482 | -| time_elapsed | 51836 | -| total_timesteps | 1085696 | -| train/ | | -| approx_kl | 0.08175324 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -5.33 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 84810 | -| policy_gradient_loss | -0.00161 | -| std | 0.0825 | -| value_loss | 1.14e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8483 | -| time_elapsed | 51840 | -| total_timesteps | 1085824 | -| train/ | | -| approx_kl | 0.0052372306 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.357 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 84820 | -| policy_gradient_loss | 9.89e-05 | -| std | 0.0825 | -| value_loss | 1.16e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8484 | -| time_elapsed | 51843 | -| total_timesteps | 1085952 | -| train/ | | -| approx_kl | 0.00103187 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 84830 | -| policy_gradient_loss | -0.0061 | -| std | 0.0826 | -| value_loss | 4.78e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8485 | -| time_elapsed | 51845 | -| total_timesteps | 1086080 | -| train/ | | -| approx_kl | 0.00618149 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 84840 | -| policy_gradient_loss | -0.00562 | -| std | 0.0826 | -| value_loss | 1.29e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8486 | -| time_elapsed | 51853 | -| total_timesteps | 1086208 | -| train/ | | -| approx_kl | 0.017736156 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 84850 | -| policy_gradient_loss | -0.00507 | -| std | 0.0825 | -| value_loss | 0.00136 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8487 | -| time_elapsed | 51856 | -| total_timesteps | 1086336 | -| train/ | | -| approx_kl | 0.116037734 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -388 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 84860 | -| policy_gradient_loss | 0.00175 | -| std | 0.0824 | -| value_loss | 5.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8488 | -| time_elapsed | 51860 | -| total_timesteps | 1086464 | -| train/ | | -| approx_kl | 0.12577385 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -599 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 84870 | -| policy_gradient_loss | -0.00424 | -| std | 0.0824 | -| value_loss | 2.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8489 | -| time_elapsed | 51863 | -| total_timesteps | 1086592 | -| train/ | | -| approx_kl | 0.23035316 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -84.4 | -| learning_rate | 0.0003 | -| loss | 0.00868 | -| n_updates | 84880 | -| policy_gradient_loss | 0.00166 | -| std | 0.0825 | -| value_loss | 2.51e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8490 | -| time_elapsed | 51867 | -| total_timesteps | 1086720 | -| train/ | | -| approx_kl | 0.04531256 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -6.71 | -| learning_rate | 0.0003 | -| loss | 0.00329 | -| n_updates | 84890 | -| policy_gradient_loss | 0.0006 | -| std | 0.0825 | -| value_loss | 2.66e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8491 | -| time_elapsed | 51869 | -| total_timesteps | 1086848 | -| train/ | | -| approx_kl | 0.009410737 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.852 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 84900 | -| policy_gradient_loss | -0.00731 | -| std | 0.0824 | -| value_loss | 2.01e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8492 | -| time_elapsed | 51873 | -| total_timesteps | 1086976 | -| train/ | | -| approx_kl | 0.00015199045 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.295 | -| learning_rate | 0.0003 | -| loss | -0.00041 | -| n_updates | 84910 | -| policy_gradient_loss | 0.00516 | -| std | 0.0823 | -| value_loss | 5.69e-09 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8493 | -| time_elapsed | 51876 | -| total_timesteps | 1087104 | -| train/ | | -| approx_kl | 0.046607 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.00503 | -| learning_rate | 0.0003 | -| loss | 0.00264 | -| n_updates | 84920 | -| policy_gradient_loss | -0.00241 | -| std | 0.0821 | -| value_loss | 2.68e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8494 | -| time_elapsed | 51884 | -| total_timesteps | 1087232 | -| train/ | | -| approx_kl | 0.02713236 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 84930 | -| policy_gradient_loss | -0.0127 | -| std | 0.0821 | -| value_loss | 0.00299 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8495 | -| time_elapsed | 51888 | -| total_timesteps | 1087360 | -| train/ | | -| approx_kl | 0.16113853 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -397 | -| learning_rate | 0.0003 | -| loss | -0.0072 | -| n_updates | 84940 | -| policy_gradient_loss | -0.00312 | -| std | 0.0822 | -| value_loss | 4.16e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8496 | -| time_elapsed | 51891 | -| total_timesteps | 1087488 | -| train/ | | -| approx_kl | 0.16826068 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -3.38e+03 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 84950 | -| policy_gradient_loss | -0.00785 | -| std | 0.0823 | -| value_loss | 2.75e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8497 | -| time_elapsed | 51894 | -| total_timesteps | 1087616 | -| train/ | | -| approx_kl | 0.0019156081 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -413 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 84960 | -| policy_gradient_loss | -0.0126 | -| std | 0.0824 | -| value_loss | 1.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8498 | -| time_elapsed | 51898 | -| total_timesteps | 1087744 | -| train/ | | -| approx_kl | 0.002740249 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -38.9 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 84970 | -| policy_gradient_loss | -0.0123 | -| std | 0.0824 | -| value_loss | 1.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.813 | -| time/ | | -| fps | 20 | -| iterations | 8499 | -| time_elapsed | 51900 | -| total_timesteps | 1087872 | -| train/ | | -| approx_kl | 0.001983548 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -9.76 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 84980 | -| policy_gradient_loss | -0.000887 | -| std | 0.0825 | -| value_loss | 1.22e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8500 | -| time_elapsed | 51904 | -| total_timesteps | 1088000 | -| train/ | | -| approx_kl | 0.0006964044 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.331 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 84990 | -| policy_gradient_loss | -0.00222 | -| std | 0.0826 | -| value_loss | 2.51e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8501 | -| time_elapsed | 51906 | -| total_timesteps | 1088128 | -| train/ | | -| approx_kl | 0.00015193364 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.00568 | -| learning_rate | 0.0003 | -| loss | -0.000476 | -| n_updates | 85000 | -| policy_gradient_loss | 0.00115 | -| std | 0.0827 | -| value_loss | 2.16e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8502 | -| time_elapsed | 51913 | -| total_timesteps | 1088256 | -| train/ | | -| approx_kl | 0.0024967957 | -| clip_fraction | 0.0133 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 85010 | -| policy_gradient_loss | -0.00644 | -| std | 0.0827 | -| value_loss | 0.00235 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8503 | -| time_elapsed | 51917 | -| total_timesteps | 1088384 | -| train/ | | -| approx_kl | 0.107497774 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -109 | -| learning_rate | 0.0003 | -| loss | -0.00848 | -| n_updates | 85020 | -| policy_gradient_loss | -0.00731 | -| std | 0.0827 | -| value_loss | 1.29e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8504 | -| time_elapsed | 51921 | -| total_timesteps | 1088512 | -| train/ | | -| approx_kl | 0.081372 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -788 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 85030 | -| policy_gradient_loss | -0.00321 | -| std | 0.0826 | -| value_loss | 1.06e-06 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8505 | -| time_elapsed | 51924 | -| total_timesteps | 1088640 | -| train/ | | -| approx_kl | 0.0023450828 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 1.07 | -| explained_variance | -16.6 | -| learning_rate | 0.0003 | -| loss | -0.000182 | -| n_updates | 85040 | -| policy_gradient_loss | 1.23e-05 | -| std | 0.0825 | -| value_loss | 1.39e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8506 | -| time_elapsed | 51928 | -| total_timesteps | 1088768 | -| train/ | | -| approx_kl | 0.0005455846 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.000382 | -| n_updates | 85050 | -| policy_gradient_loss | 0.00379 | -| std | 0.0823 | -| value_loss | 1.08e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8507 | -| time_elapsed | 51932 | -| total_timesteps | 1088896 | -| train/ | | -| approx_kl | 0.0012773522 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.00266 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 85060 | -| policy_gradient_loss | -0.000787 | -| std | 0.0821 | -| value_loss | 4.65e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8508 | -| time_elapsed | 51935 | -| total_timesteps | 1089024 | -| train/ | | -| approx_kl | 0.0015650461 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.00939 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 85070 | -| policy_gradient_loss | -0.00397 | -| std | 0.0821 | -| value_loss | 3.49e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8509 | -| time_elapsed | 51943 | -| total_timesteps | 1089152 | -| train/ | | -| approx_kl | 0.023871273 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 85080 | -| policy_gradient_loss | -0.0132 | -| std | 0.0822 | -| value_loss | 0.0014 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8510 | -| time_elapsed | 51947 | -| total_timesteps | 1089280 | -| train/ | | -| approx_kl | 0.14161722 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -486 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 85090 | -| policy_gradient_loss | -0.00934 | -| std | 0.0822 | -| value_loss | 3.28e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8511 | -| time_elapsed | 51951 | -| total_timesteps | 1089408 | -| train/ | | -| approx_kl | 0.0022288552 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 85100 | -| policy_gradient_loss | -0.0167 | -| std | 0.0822 | -| value_loss | 2.87e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8512 | -| time_elapsed | 51954 | -| total_timesteps | 1089536 | -| train/ | | -| approx_kl | 0.0021569664 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -24.2 | -| learning_rate | 0.0003 | -| loss | -0.000834 | -| n_updates | 85110 | -| policy_gradient_loss | -0.000557 | -| std | 0.0823 | -| value_loss | 2.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8513 | -| time_elapsed | 51957 | -| total_timesteps | 1089664 | -| train/ | | -| approx_kl | 0.002333674 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.473 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 85120 | -| policy_gradient_loss | -0.000932 | -| std | 0.0823 | -| value_loss | 3.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8514 | -| time_elapsed | 51959 | -| total_timesteps | 1089792 | -| train/ | | -| approx_kl | 0.031072475 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.662 | -| learning_rate | 0.0003 | -| loss | 0.00174 | -| n_updates | 85130 | -| policy_gradient_loss | -0.000247 | -| std | 0.0822 | -| value_loss | 8.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.809 | -| time/ | | -| fps | 20 | -| iterations | 8515 | -| time_elapsed | 51963 | -| total_timesteps | 1089920 | -| train/ | | -| approx_kl | 0.015945503 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 85140 | -| policy_gradient_loss | -0.0106 | -| std | 0.0822 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8516 | -| time_elapsed | 51966 | -| total_timesteps | 1090048 | -| train/ | | -| approx_kl | 0.026035063 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -4.66e-05 | -| n_updates | 85150 | -| policy_gradient_loss | -0.000337 | -| std | 0.0823 | -| value_loss | 3.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8517 | -| time_elapsed | 51974 | -| total_timesteps | 1090176 | -| train/ | | -| approx_kl | 0.016631907 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.744 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 85160 | -| policy_gradient_loss | -0.00775 | -| std | 0.0824 | -| value_loss | 0.00324 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8518 | -| time_elapsed | 51977 | -| total_timesteps | 1090304 | -| train/ | | -| approx_kl | 0.024990924 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -88.3 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 85170 | -| policy_gradient_loss | -0.00195 | -| std | 0.0824 | -| value_loss | 6.82e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8519 | -| time_elapsed | 51981 | -| total_timesteps | 1090432 | -| train/ | | -| approx_kl | 7.357029e-05 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -50 | -| learning_rate | 0.0003 | -| loss | -0.000432 | -| n_updates | 85180 | -| policy_gradient_loss | 0.000122 | -| std | 0.0822 | -| value_loss | 1.68e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8520 | -| time_elapsed | 51984 | -| total_timesteps | 1090560 | -| train/ | | -| approx_kl | 0.01942195 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -1.61 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 85190 | -| policy_gradient_loss | -0.000144 | -| std | 0.082 | -| value_loss | 1.4e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8521 | -| time_elapsed | 51987 | -| total_timesteps | 1090688 | -| train/ | | -| approx_kl | 0.018205615 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.000609 | -| learning_rate | 0.0003 | -| loss | 0.000777 | -| n_updates | 85200 | -| policy_gradient_loss | 0.000186 | -| std | 0.0819 | -| value_loss | 7.82e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8522 | -| time_elapsed | 51990 | -| total_timesteps | 1090816 | -| train/ | | -| approx_kl | 0.00040392485 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | -0.000386 | -| n_updates | 85210 | -| policy_gradient_loss | -0.000326 | -| std | 0.0819 | -| value_loss | 2.64e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.816 | -| time/ | | -| fps | 20 | -| iterations | 8523 | -| time_elapsed | 51993 | -| total_timesteps | 1090944 | -| train/ | | -| approx_kl | 2.0977575e-05 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.00134 | -| learning_rate | 0.0003 | -| loss | -0.000382 | -| n_updates | 85220 | -| policy_gradient_loss | -0.00196 | -| std | 0.0819 | -| value_loss | 1.92e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8524 | -| time_elapsed | 51997 | -| total_timesteps | 1091072 | -| train/ | | -| approx_kl | 0.0060319463 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.000643 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 85230 | -| policy_gradient_loss | -0.00652 | -| std | 0.0818 | -| value_loss | 2.3e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8525 | -| time_elapsed | 52003 | -| total_timesteps | 1091200 | -| train/ | | -| approx_kl | 0.004653758 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 85240 | -| policy_gradient_loss | -0.0167 | -| std | 0.0818 | -| value_loss | 0.000419 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8526 | -| time_elapsed | 52006 | -| total_timesteps | 1091328 | -| train/ | | -| approx_kl | 0.0029080133 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -3.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.000528 | -| n_updates | 85250 | -| policy_gradient_loss | -0.00031 | -| std | 0.0821 | -| value_loss | 6.91e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8527 | -| time_elapsed | 52010 | -| total_timesteps | 1091456 | -| train/ | | -| approx_kl | 0.00955705 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -722 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 85260 | -| policy_gradient_loss | -0.0136 | -| std | 0.0822 | -| value_loss | 5.35e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8528 | -| time_elapsed | 52014 | -| total_timesteps | 1091584 | -| train/ | | -| approx_kl | 0.0011524246 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.624 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 85270 | -| policy_gradient_loss | 0.00185 | -| std | 0.0822 | -| value_loss | 3.11e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8529 | -| time_elapsed | 52017 | -| total_timesteps | 1091712 | -| train/ | | -| approx_kl | 0.010641204 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -2.93 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 85280 | -| policy_gradient_loss | -0.00878 | -| std | 0.0822 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8530 | -| time_elapsed | 52021 | -| total_timesteps | 1091840 | -| train/ | | -| approx_kl | 0.004328202 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.000891 | -| n_updates | 85290 | -| policy_gradient_loss | 0.00108 | -| std | 0.0821 | -| value_loss | 3.38e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.812 | -| time/ | | -| fps | 20 | -| iterations | 8531 | -| time_elapsed | 52024 | -| total_timesteps | 1091968 | -| train/ | | -| approx_kl | 0.00232328 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | -0.000776 | -| n_updates | 85300 | -| policy_gradient_loss | -4.21e-05 | -| std | 0.0821 | -| value_loss | 3.72e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8532 | -| time_elapsed | 52027 | -| total_timesteps | 1092096 | -| train/ | | -| approx_kl | 0.007593462 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 85310 | -| policy_gradient_loss | -0.00707 | -| std | 0.0821 | -| value_loss | 2.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8533 | -| time_elapsed | 52034 | -| total_timesteps | 1092224 | -| train/ | | -| approx_kl | 0.026430227 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 85320 | -| policy_gradient_loss | -0.0134 | -| std | 0.0821 | -| value_loss | 4.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8534 | -| time_elapsed | 52037 | -| total_timesteps | 1092352 | -| train/ | | -| approx_kl | 0.022974513 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 85330 | -| policy_gradient_loss | -0.00336 | -| std | 0.0821 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8535 | -| time_elapsed | 52040 | -| total_timesteps | 1092480 | -| train/ | | -| approx_kl | 0.005527256 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -6.8 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 85340 | -| policy_gradient_loss | -0.00554 | -| std | 0.0821 | -| value_loss | 6.53e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8536 | -| time_elapsed | 52043 | -| total_timesteps | 1092608 | -| train/ | | -| approx_kl | 0.0055496367 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.792 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 85350 | -| policy_gradient_loss | 9.1e-05 | -| std | 0.0821 | -| value_loss | 3.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8537 | -| time_elapsed | 52047 | -| total_timesteps | 1092736 | -| train/ | | -| approx_kl | 0.020008117 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 85360 | -| policy_gradient_loss | -0.00301 | -| std | 0.0821 | -| value_loss | 3.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8538 | -| time_elapsed | 52050 | -| total_timesteps | 1092864 | -| train/ | | -| approx_kl | 0.032646395 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.00363 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 85370 | -| policy_gradient_loss | 0.00318 | -| std | 0.0821 | -| value_loss | 6.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 20 | -| iterations | 8539 | -| time_elapsed | 52055 | -| total_timesteps | 1092992 | -| train/ | | -| approx_kl | 0.000256937 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.474 | -| learning_rate | 0.0003 | -| loss | 1.67e-05 | -| n_updates | 85380 | -| policy_gradient_loss | 0.000434 | -| std | 0.082 | -| value_loss | 2.4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 20 | -| iterations | 8540 | -| time_elapsed | 52058 | -| total_timesteps | 1093120 | -| train/ | | -| approx_kl | 0.004152435 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 85390 | -| policy_gradient_loss | -0.00797 | -| std | 0.0819 | -| value_loss | 1.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 20 | -| iterations | 8541 | -| time_elapsed | 52068 | -| total_timesteps | 1093248 | -| train/ | | -| approx_kl | 0.040919654 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.08 | -| explained_variance | 0.126 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 85400 | -| policy_gradient_loss | -0.011 | -| std | 0.0818 | -| value_loss | 0.00207 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 20 | -| iterations | 8542 | -| time_elapsed | 52072 | -| total_timesteps | 1093376 | -| train/ | | -| approx_kl | 0.014490169 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -264 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 85410 | -| policy_gradient_loss | -0.00118 | -| std | 0.0817 | -| value_loss | 1.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 20 | -| iterations | 8543 | -| time_elapsed | 52076 | -| total_timesteps | 1093504 | -| train/ | | -| approx_kl | 0.07951715 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -311 | -| learning_rate | 0.0003 | -| loss | -0.00755 | -| n_updates | 85420 | -| policy_gradient_loss | -0.0038 | -| std | 0.0815 | -| value_loss | 9.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 20 | -| iterations | 8544 | -| time_elapsed | 52080 | -| total_timesteps | 1093632 | -| train/ | | -| approx_kl | 0.04286955 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -3.47 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 85430 | -| policy_gradient_loss | -0.0056 | -| std | 0.0813 | -| value_loss | 7.48e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 20 | -| iterations | 8545 | -| time_elapsed | 52083 | -| total_timesteps | 1093760 | -| train/ | | -| approx_kl | 0.0034318464 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 85440 | -| policy_gradient_loss | -0.00311 | -| std | 0.0813 | -| value_loss | 4.65e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.83 | -| time/ | | -| fps | 21 | -| iterations | 8546 | -| time_elapsed | 52086 | -| total_timesteps | 1093888 | -| train/ | | -| approx_kl | 0.0005626255 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 85450 | -| policy_gradient_loss | -0.0056 | -| std | 0.0813 | -| value_loss | 9.11e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8547 | -| time_elapsed | 52090 | -| total_timesteps | 1094016 | -| train/ | | -| approx_kl | 0.0023986609 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 85460 | -| policy_gradient_loss | -0.000575 | -| std | 0.0814 | -| value_loss | 8.65e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8548 | -| time_elapsed | 52098 | -| total_timesteps | 1094144 | -| train/ | | -| approx_kl | 0.0030373312 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -1.83 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 85470 | -| policy_gradient_loss | -0.0114 | -| std | 0.0815 | -| value_loss | 0.00287 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8549 | -| time_elapsed | 52102 | -| total_timesteps | 1094272 | -| train/ | | -| approx_kl | 0.0019111279 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -1e+03 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 85480 | -| policy_gradient_loss | -0.000767 | -| std | 0.0814 | -| value_loss | 8.9e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8550 | -| time_elapsed | 52105 | -| total_timesteps | 1094400 | -| train/ | | -| approx_kl | 0.047347106 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -5.51e+03 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 85490 | -| policy_gradient_loss | -0.00786 | -| std | 0.0812 | -| value_loss | 4.69e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8551 | -| time_elapsed | 52108 | -| total_timesteps | 1094528 | -| train/ | | -| approx_kl | 0.05470071 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -1.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.00894 | -| n_updates | 85500 | -| policy_gradient_loss | -0.00605 | -| std | 0.0812 | -| value_loss | 2.97e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8552 | -| time_elapsed | 52110 | -| total_timesteps | 1094656 | -| train/ | | -| approx_kl | 0.00014017709 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 1.09 | -| explained_variance | -103 | -| learning_rate | 0.0003 | -| loss | -0.000538 | -| n_updates | 85510 | -| policy_gradient_loss | -0.000379 | -| std | 0.0809 | -| value_loss | 2.74e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8553 | -| time_elapsed | 52114 | -| total_timesteps | 1094784 | -| train/ | | -| approx_kl | 0.023585893 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -12.1 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 85520 | -| policy_gradient_loss | -0.00382 | -| std | 0.0807 | -| value_loss | 6.69e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8554 | -| time_elapsed | 52116 | -| total_timesteps | 1094912 | -| train/ | | -| approx_kl | 0.00043295743 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.535 | -| learning_rate | 0.0003 | -| loss | 0.00116 | -| n_updates | 85530 | -| policy_gradient_loss | 0.00013 | -| std | 0.0806 | -| value_loss | 2.33e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8555 | -| time_elapsed | 52119 | -| total_timesteps | 1095040 | -| train/ | | -| approx_kl | 0.0037862938 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 85540 | -| policy_gradient_loss | -0.000163 | -| std | 0.0807 | -| value_loss | 1.43e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8556 | -| time_elapsed | 52126 | -| total_timesteps | 1095168 | -| train/ | | -| approx_kl | 0.011489651 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | 0.576 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 85550 | -| policy_gradient_loss | -0.0118 | -| std | 0.0808 | -| value_loss | 0.000647 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8557 | -| time_elapsed | 52129 | -| total_timesteps | 1095296 | -| train/ | | -| approx_kl | 0.08892207 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -91.1 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 85560 | -| policy_gradient_loss | -0.00786 | -| std | 0.0808 | -| value_loss | 2.46e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8558 | -| time_elapsed | 52132 | -| total_timesteps | 1095424 | -| train/ | | -| approx_kl | 0.0033451477 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -373 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 85570 | -| policy_gradient_loss | -0.0141 | -| std | 0.0808 | -| value_loss | 1.77e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8559 | -| time_elapsed | 52134 | -| total_timesteps | 1095552 | -| train/ | | -| approx_kl | 0.06484522 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 85580 | -| policy_gradient_loss | 0.00213 | -| std | 0.0808 | -| value_loss | 1.2e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8560 | -| time_elapsed | 52137 | -| total_timesteps | 1095680 | -| train/ | | -| approx_kl | 0.02355052 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -670 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 85590 | -| policy_gradient_loss | -0.0131 | -| std | 0.0808 | -| value_loss | 5.9e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8561 | -| time_elapsed | 52141 | -| total_timesteps | 1095808 | -| train/ | | -| approx_kl | 0.0052817403 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -4.59 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 85600 | -| policy_gradient_loss | -0.00156 | -| std | 0.0808 | -| value_loss | 1.2e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 21 | -| iterations | 8562 | -| time_elapsed | 52144 | -| total_timesteps | 1095936 | -| train/ | | -| approx_kl | 0.015648514 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.0956 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 85610 | -| policy_gradient_loss | -0.00718 | -| std | 0.0807 | -| value_loss | 8.29e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8563 | -| time_elapsed | 52146 | -| total_timesteps | 1096064 | -| train/ | | -| approx_kl | 0.025121292 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | -0.00661 | -| n_updates | 85620 | -| policy_gradient_loss | -0.00245 | -| std | 0.0807 | -| value_loss | 1.93e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8564 | -| time_elapsed | 52151 | -| total_timesteps | 1096192 | -| train/ | | -| approx_kl | 0.0039472557 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | 0.843 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 85630 | -| policy_gradient_loss | -0.0149 | -| std | 0.0808 | -| value_loss | 0.00155 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8565 | -| time_elapsed | 52154 | -| total_timesteps | 1096320 | -| train/ | | -| approx_kl | 0.11386275 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -186 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 85640 | -| policy_gradient_loss | -0.00733 | -| std | 0.0808 | -| value_loss | 3.31e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8566 | -| time_elapsed | 52157 | -| total_timesteps | 1096448 | -| train/ | | -| approx_kl | 0.0045315586 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -733 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 85650 | -| policy_gradient_loss | -0.0109 | -| std | 0.0808 | -| value_loss | 2.39e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8567 | -| time_elapsed | 52160 | -| total_timesteps | 1096576 | -| train/ | | -| approx_kl | 0.025285695 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -194 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 85660 | -| policy_gradient_loss | -0.0114 | -| std | 0.0808 | -| value_loss | 2.64e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8568 | -| time_elapsed | 52162 | -| total_timesteps | 1096704 | -| train/ | | -| approx_kl | 0.08986307 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -55.5 | -| learning_rate | 0.0003 | -| loss | -0.00712 | -| n_updates | 85670 | -| policy_gradient_loss | -0.00322 | -| std | 0.0808 | -| value_loss | 2.55e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8569 | -| time_elapsed | 52165 | -| total_timesteps | 1096832 | -| train/ | | -| approx_kl | 0.023663543 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -6.45 | -| learning_rate | 0.0003 | -| loss | -0.00913 | -| n_updates | 85680 | -| policy_gradient_loss | -0.0058 | -| std | 0.0808 | -| value_loss | 1.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.821 | -| time/ | | -| fps | 21 | -| iterations | 8570 | -| time_elapsed | 52167 | -| total_timesteps | 1096960 | -| train/ | | -| approx_kl | 0.009041032 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 85690 | -| policy_gradient_loss | -0.000425 | -| std | 0.0809 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8571 | -| time_elapsed | 52169 | -| total_timesteps | 1097088 | -| train/ | | -| approx_kl | 0.020804925 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.782 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 85700 | -| policy_gradient_loss | 0.00163 | -| std | 0.0808 | -| value_loss | 1.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8572 | -| time_elapsed | 52177 | -| total_timesteps | 1097216 | -| train/ | | -| approx_kl | 0.021743203 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.00725 | -| n_updates | 85710 | -| policy_gradient_loss | -0.00554 | -| std | 0.0806 | -| value_loss | 0.000188 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8573 | -| time_elapsed | 52181 | -| total_timesteps | 1097344 | -| train/ | | -| approx_kl | 0.010185911 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -593 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 85720 | -| policy_gradient_loss | -0.00807 | -| std | 0.0805 | -| value_loss | 2.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8574 | -| time_elapsed | 52184 | -| total_timesteps | 1097472 | -| train/ | | -| approx_kl | 0.042780794 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -3.92e+03 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 85730 | -| policy_gradient_loss | -0.0129 | -| std | 0.0804 | -| value_loss | 1.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8575 | -| time_elapsed | 52187 | -| total_timesteps | 1097600 | -| train/ | | -| approx_kl | 0.045196317 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -2.07e+03 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 85740 | -| policy_gradient_loss | -0.00455 | -| std | 0.0804 | -| value_loss | 1.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8576 | -| time_elapsed | 52190 | -| total_timesteps | 1097728 | -| train/ | | -| approx_kl | 0.11130478 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -1.36e+03 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 85750 | -| policy_gradient_loss | -0.00496 | -| std | 0.0804 | -| value_loss | 1.05e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8577 | -| time_elapsed | 52193 | -| total_timesteps | 1097856 | -| train/ | | -| approx_kl | 0.006418316 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -211 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 85760 | -| policy_gradient_loss | -0.00839 | -| std | 0.0804 | -| value_loss | 9.64e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.82 | -| time/ | | -| fps | 21 | -| iterations | 8578 | -| time_elapsed | 52196 | -| total_timesteps | 1097984 | -| train/ | | -| approx_kl | 0.051433913 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -44.5 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 85770 | -| policy_gradient_loss | -0.00315 | -| std | 0.0805 | -| value_loss | 8.54e-12 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8579 | -| time_elapsed | 52199 | -| total_timesteps | 1098112 | -| train/ | | -| approx_kl | 0.0033829105 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -3.37 | -| learning_rate | 0.0003 | -| loss | -0.00981 | -| n_updates | 85780 | -| policy_gradient_loss | -0.0112 | -| std | 0.0806 | -| value_loss | 7.65e-13 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8580 | -| time_elapsed | 52207 | -| total_timesteps | 1098240 | -| train/ | | -| approx_kl | 0.008941203 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 85790 | -| policy_gradient_loss | -0.0138 | -| std | 0.0806 | -| value_loss | 1.16e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8581 | -| time_elapsed | 52210 | -| total_timesteps | 1098368 | -| train/ | | -| approx_kl | 0.004321335 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -8.74 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 85800 | -| policy_gradient_loss | -0.00136 | -| std | 0.0806 | -| value_loss | 6.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8582 | -| time_elapsed | 52214 | -| total_timesteps | 1098496 | -| train/ | | -| approx_kl | 0.020773144 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -10.7 | -| learning_rate | 0.0003 | -| loss | -0.00898 | -| n_updates | 85810 | -| policy_gradient_loss | -0.00408 | -| std | 0.0805 | -| value_loss | 6.35e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8583 | -| time_elapsed | 52217 | -| total_timesteps | 1098624 | -| train/ | | -| approx_kl | 0.0015160572 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 1.1 | -| explained_variance | -0.85 | -| learning_rate | 0.0003 | -| loss | 3.17e-06 | -| n_updates | 85820 | -| policy_gradient_loss | 0.000867 | -| std | 0.0802 | -| value_loss | 1.83e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8584 | -| time_elapsed | 52220 | -| total_timesteps | 1098752 | -| train/ | | -| approx_kl | 0.005394205 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.0749 | -| learning_rate | 0.0003 | -| loss | -0.00686 | -| n_updates | 85830 | -| policy_gradient_loss | 0.000558 | -| std | 0.08 | -| value_loss | 3.87e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 21 | -| iterations | 8585 | -| time_elapsed | 52223 | -| total_timesteps | 1098880 | -| train/ | | -| approx_kl | 0.00013945764 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.00632 | -| learning_rate | 0.0003 | -| loss | -0.000409 | -| n_updates | 85840 | -| policy_gradient_loss | -0.000188 | -| std | 0.0796 | -| value_loss | 3.48e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8586 | -| time_elapsed | 52226 | -| total_timesteps | 1099008 | -| train/ | | -| approx_kl | 7.7178236e-05 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.661 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 85850 | -| policy_gradient_loss | -0.00266 | -| std | 0.0793 | -| value_loss | 1.72e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8587 | -| time_elapsed | 52235 | -| total_timesteps | 1099136 | -| train/ | | -| approx_kl | 0.019479588 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0276 | -| n_updates | 85860 | -| policy_gradient_loss | -0.0183 | -| std | 0.0791 | -| value_loss | 4.56e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8588 | -| time_elapsed | 52238 | -| total_timesteps | 1099264 | -| train/ | | -| approx_kl | 0.0026450725 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 85870 | -| policy_gradient_loss | -0.0224 | -| std | 0.0791 | -| value_loss | 1.16e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8589 | -| time_elapsed | 52241 | -| total_timesteps | 1099392 | -| train/ | | -| approx_kl | 0.18182059 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -711 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 85880 | -| policy_gradient_loss | -0.00479 | -| std | 0.0791 | -| value_loss | 1.69e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8590 | -| time_elapsed | 52244 | -| total_timesteps | 1099520 | -| train/ | | -| approx_kl | 0.056209233 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -70.4 | -| learning_rate | 0.0003 | -| loss | -0.00981 | -| n_updates | 85890 | -| policy_gradient_loss | -0.00815 | -| std | 0.0791 | -| value_loss | 2.07e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8591 | -| time_elapsed | 52248 | -| total_timesteps | 1099648 | -| train/ | | -| approx_kl | 0.029326053 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -8.93 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 85900 | -| policy_gradient_loss | -0.0182 | -| std | 0.0791 | -| value_loss | 2.64e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8592 | -| time_elapsed | 52250 | -| total_timesteps | 1099776 | -| train/ | | -| approx_kl | 0.014508322 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.993 | -| learning_rate | 0.0003 | -| loss | -0.00362 | -| n_updates | 85910 | -| policy_gradient_loss | 0.00353 | -| std | 0.0791 | -| value_loss | 1.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 21 | -| iterations | 8593 | -| time_elapsed | 52253 | -| total_timesteps | 1099904 | -| train/ | | -| approx_kl | 0.028171834 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 85920 | -| policy_gradient_loss | 0.00238 | -| std | 0.0792 | -| value_loss | 5.39e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8594 | -| time_elapsed | 52256 | -| total_timesteps | 1100032 | -| train/ | | -| approx_kl | 0.002094787 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.00658 | -| n_updates | 85930 | -| policy_gradient_loss | -0.0057 | -| std | 0.0793 | -| value_loss | 5.89e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8595 | -| time_elapsed | 52265 | -| total_timesteps | 1100160 | -| train/ | | -| approx_kl | 0.014094764 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 85940 | -| policy_gradient_loss | -0.0132 | -| std | 0.0793 | -| value_loss | 0.00243 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8596 | -| time_elapsed | 52269 | -| total_timesteps | 1100288 | -| train/ | | -| approx_kl | 0.010624821 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -2.85e+03 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 85950 | -| policy_gradient_loss | -0.000763 | -| std | 0.0794 | -| value_loss | 1.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8597 | -| time_elapsed | 52272 | -| total_timesteps | 1100416 | -| train/ | | -| approx_kl | 0.004615666 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -5.51e+03 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 85960 | -| policy_gradient_loss | -0.00741 | -| std | 0.0794 | -| value_loss | 9.64e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8598 | -| time_elapsed | 52276 | -| total_timesteps | 1100544 | -| train/ | | -| approx_kl | 0.00042267097 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -69.9 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 85970 | -| policy_gradient_loss | 0.000152 | -| std | 0.0795 | -| value_loss | 1.22e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8599 | -| time_elapsed | 52280 | -| total_timesteps | 1100672 | -| train/ | | -| approx_kl | 0.009729446 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -6.05 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 85980 | -| policy_gradient_loss | -0.00773 | -| std | 0.0796 | -| value_loss | 1.69e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8600 | -| time_elapsed | 52284 | -| total_timesteps | 1100800 | -| train/ | | -| approx_kl | 0.0012944937 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.432 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 85990 | -| policy_gradient_loss | 0.0078 | -| std | 0.0796 | -| value_loss | 3.05e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 21 | -| iterations | 8601 | -| time_elapsed | 52287 | -| total_timesteps | 1100928 | -| train/ | | -| approx_kl | 0.03859819 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.00624 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 86000 | -| policy_gradient_loss | 0.00541 | -| std | 0.0796 | -| value_loss | 1.44e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8602 | -| time_elapsed | 52290 | -| total_timesteps | 1101056 | -| train/ | | -| approx_kl | 0.014135197 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -8.5 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 86010 | -| policy_gradient_loss | -0.000986 | -| std | 0.0796 | -| value_loss | 9.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8603 | -| time_elapsed | 52296 | -| total_timesteps | 1101184 | -| train/ | | -| approx_kl | 0.017628597 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 86020 | -| policy_gradient_loss | -0.0114 | -| std | 0.0796 | -| value_loss | 0.000434 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8604 | -| time_elapsed | 52299 | -| total_timesteps | 1101312 | -| train/ | | -| approx_kl | 0.02882842 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -6.01 | -| learning_rate | 0.0003 | -| loss | 0.00346 | -| n_updates | 86030 | -| policy_gradient_loss | 0.000598 | -| std | 0.0796 | -| value_loss | 3.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8605 | -| time_elapsed | 52302 | -| total_timesteps | 1101440 | -| train/ | | -| approx_kl | 0.02386573 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 86040 | -| policy_gradient_loss | -0.00155 | -| std | 0.0796 | -| value_loss | 5.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8606 | -| time_elapsed | 52306 | -| total_timesteps | 1101568 | -| train/ | | -| approx_kl | 0.068651155 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.636 | -| learning_rate | 0.0003 | -| loss | -0.00623 | -| n_updates | 86050 | -| policy_gradient_loss | -0.00495 | -| std | 0.0796 | -| value_loss | 4.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8607 | -| time_elapsed | 52310 | -| total_timesteps | 1101696 | -| train/ | | -| approx_kl | 0.006496681 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -1.43 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 86060 | -| policy_gradient_loss | -0.00539 | -| std | 0.0796 | -| value_loss | 6.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8608 | -| time_elapsed | 52313 | -| total_timesteps | 1101824 | -| train/ | | -| approx_kl | 0.024341904 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 86070 | -| policy_gradient_loss | -0.00294 | -| std | 0.0795 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 8609 | -| time_elapsed | 52316 | -| total_timesteps | 1101952 | -| train/ | | -| approx_kl | 0.0024089012 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.00534 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 86080 | -| policy_gradient_loss | -8.3e-05 | -| std | 0.0796 | -| value_loss | 1.68e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8610 | -| time_elapsed | 52319 | -| total_timesteps | 1102080 | -| train/ | | -| approx_kl | 0.0027893349 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.0044 | -| learning_rate | 0.0003 | -| loss | -0.00594 | -| n_updates | 86090 | -| policy_gradient_loss | -0.0045 | -| std | 0.0796 | -| value_loss | 1.99e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8611 | -| time_elapsed | 52326 | -| total_timesteps | 1102208 | -| train/ | | -| approx_kl | 0.015159187 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -15.8 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 86100 | -| policy_gradient_loss | -0.0137 | -| std | 0.0795 | -| value_loss | 0.00637 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8612 | -| time_elapsed | 52329 | -| total_timesteps | 1102336 | -| train/ | | -| approx_kl | 0.016432244 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -6.73e+03 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 86110 | -| policy_gradient_loss | -0.0099 | -| std | 0.0795 | -| value_loss | 3.09e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8613 | -| time_elapsed | 52333 | -| total_timesteps | 1102464 | -| train/ | | -| approx_kl | 0.082783304 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -1.85e+03 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 86120 | -| policy_gradient_loss | -0.0107 | -| std | 0.0795 | -| value_loss | 1.39e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8614 | -| time_elapsed | 52337 | -| total_timesteps | 1102592 | -| train/ | | -| approx_kl | 0.0552317 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -83.5 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 86130 | -| policy_gradient_loss | -0.00704 | -| std | 0.0796 | -| value_loss | 3.74e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8615 | -| time_elapsed | 52340 | -| total_timesteps | 1102720 | -| train/ | | -| approx_kl | 0.003954342 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 86140 | -| policy_gradient_loss | 0.000636 | -| std | 0.0796 | -| value_loss | 2.03e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8616 | -| time_elapsed | 52344 | -| total_timesteps | 1102848 | -| train/ | | -| approx_kl | 0.0009390493 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 86150 | -| policy_gradient_loss | 0.00384 | -| std | 0.0796 | -| value_loss | 1.16e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 21 | -| iterations | 8617 | -| time_elapsed | 52348 | -| total_timesteps | 1102976 | -| train/ | | -| approx_kl | 0.0028844145 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.0039 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 86160 | -| policy_gradient_loss | -0.00192 | -| std | 0.0796 | -| value_loss | 7.7e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8618 | -| time_elapsed | 52351 | -| total_timesteps | 1103104 | -| train/ | | -| approx_kl | 0.0016034748 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.00149 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 86170 | -| policy_gradient_loss | -0.0028 | -| std | 0.0795 | -| value_loss | 2.86e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8619 | -| time_elapsed | 52360 | -| total_timesteps | 1103232 | -| train/ | | -| approx_kl | 0.011262993 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.785 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 86180 | -| policy_gradient_loss | -0.015 | -| std | 0.0794 | -| value_loss | 0.00328 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8620 | -| time_elapsed | 52363 | -| total_timesteps | 1103360 | -| train/ | | -| approx_kl | 0.098475285 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -211 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 86190 | -| policy_gradient_loss | -0.00179 | -| std | 0.0795 | -| value_loss | 1.33e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8621 | -| time_elapsed | 52366 | -| total_timesteps | 1103488 | -| train/ | | -| approx_kl | 0.050138623 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -607 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 86200 | -| policy_gradient_loss | -0.00305 | -| std | 0.0797 | -| value_loss | 7.32e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8622 | -| time_elapsed | 52369 | -| total_timesteps | 1103616 | -| train/ | | -| approx_kl | 0.201314 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -24.5 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 86210 | -| policy_gradient_loss | -0.00449 | -| std | 0.0799 | -| value_loss | 5.46e-07 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8623 | -| time_elapsed | 52373 | -| total_timesteps | 1103744 | -| train/ | | -| approx_kl | 0.00038228836 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.703 | -| learning_rate | 0.0003 | -| loss | -0.00071 | -| n_updates | 86220 | -| policy_gradient_loss | 0.00507 | -| std | 0.0799 | -| value_loss | 2.12e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8624 | -| time_elapsed | 52376 | -| total_timesteps | 1103872 | -| train/ | | -| approx_kl | 0.002028727 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.005 | -| n_updates | 86230 | -| policy_gradient_loss | -0.00198 | -| std | 0.08 | -| value_loss | 5.37e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8625 | -| time_elapsed | 52380 | -| total_timesteps | 1104000 | -| train/ | | -| approx_kl | 0.00042962655 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | -0.000984 | -| n_updates | 86240 | -| policy_gradient_loss | 7.92e-05 | -| std | 0.08 | -| value_loss | 8.77e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8626 | -| time_elapsed | 52384 | -| total_timesteps | 1104128 | -| train/ | | -| approx_kl | 2.1007843e-05 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -7.03 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 86250 | -| policy_gradient_loss | -0.00606 | -| std | 0.0799 | -| value_loss | 1.48e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8627 | -| time_elapsed | 52389 | -| total_timesteps | 1104256 | -| train/ | | -| approx_kl | 0.10250954 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.566 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 86260 | -| policy_gradient_loss | -0.0117 | -| std | 0.0799 | -| value_loss | 0.00136 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8628 | -| time_elapsed | 52391 | -| total_timesteps | 1104384 | -| train/ | | -| approx_kl | 0.055178426 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -283 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 86270 | -| policy_gradient_loss | -0.003 | -| std | 0.0797 | -| value_loss | 4.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8629 | -| time_elapsed | 52394 | -| total_timesteps | 1104512 | -| train/ | | -| approx_kl | 0.010593372 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -228 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 86280 | -| policy_gradient_loss | -0.00303 | -| std | 0.0796 | -| value_loss | 2.68e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8630 | -| time_elapsed | 52398 | -| total_timesteps | 1104640 | -| train/ | | -| approx_kl | 0.014170479 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -7.99 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 86290 | -| policy_gradient_loss | -0.00867 | -| std | 0.0795 | -| value_loss | 4.36e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8631 | -| time_elapsed | 52402 | -| total_timesteps | 1104768 | -| train/ | | -| approx_kl | 0.00073977606 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 86300 | -| policy_gradient_loss | -0.00332 | -| std | 0.0795 | -| value_loss | 1.29e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 21 | -| iterations | 8632 | -| time_elapsed | 52405 | -| total_timesteps | 1104896 | -| train/ | | -| approx_kl | 1.3454817e-05 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -1.49 | -| learning_rate | 0.0003 | -| loss | -0.000594 | -| n_updates | 86310 | -| policy_gradient_loss | -0.00362 | -| std | 0.0795 | -| value_loss | 8.65e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8633 | -| time_elapsed | 52408 | -| total_timesteps | 1105024 | -| train/ | | -| approx_kl | 0.008205718 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -0.00665 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 86320 | -| policy_gradient_loss | -0.00482 | -| std | 0.0795 | -| value_loss | 6.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8634 | -| time_elapsed | 52416 | -| total_timesteps | 1105152 | -| train/ | | -| approx_kl | 0.032909438 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.649 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 86330 | -| policy_gradient_loss | -0.013 | -| std | 0.0795 | -| value_loss | 0.000996 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8635 | -| time_elapsed | 52420 | -| total_timesteps | 1105280 | -| train/ | | -| approx_kl | 0.0005343701 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | -16 | -| learning_rate | 0.0003 | -| loss | -0.00088 | -| n_updates | 86340 | -| policy_gradient_loss | -0.00087 | -| std | 0.0794 | -| value_loss | 7.07e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8636 | -| time_elapsed | 52422 | -| total_timesteps | 1105408 | -| train/ | | -| approx_kl | 0.0024752761 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -94.2 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 86350 | -| policy_gradient_loss | -0.0109 | -| std | 0.0793 | -| value_loss | 2.62e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8637 | -| time_elapsed | 52425 | -| total_timesteps | 1105536 | -| train/ | | -| approx_kl | 0.0051079853 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 86360 | -| policy_gradient_loss | -0.0068 | -| std | 0.0793 | -| value_loss | 0.000115 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8638 | -| time_elapsed | 52428 | -| total_timesteps | 1105664 | -| train/ | | -| approx_kl | 7.2675757e-06 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.537 | -| learning_rate | 0.0003 | -| loss | 0.0002 | -| n_updates | 86370 | -| policy_gradient_loss | -0.000859 | -| std | 0.0793 | -| value_loss | 0.000322 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8639 | -| time_elapsed | 52432 | -| total_timesteps | 1105792 | -| train/ | | -| approx_kl | 0.003230251 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -3.03 | -| learning_rate | 0.0003 | -| loss | -0.000915 | -| n_updates | 86380 | -| policy_gradient_loss | -0.000404 | -| std | 0.0792 | -| value_loss | 3.78e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 21 | -| iterations | 8640 | -| time_elapsed | 52434 | -| total_timesteps | 1105920 | -| train/ | | -| approx_kl | 0.0073112277 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 86390 | -| policy_gradient_loss | -0.00394 | -| std | 0.0791 | -| value_loss | 9.95e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8641 | -| time_elapsed | 52438 | -| total_timesteps | 1106048 | -| train/ | | -| approx_kl | 0.06158359 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -55.9 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 86400 | -| policy_gradient_loss | -0.00335 | -| std | 0.0791 | -| value_loss | 9.65e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8642 | -| time_elapsed | 52445 | -| total_timesteps | 1106176 | -| train/ | | -| approx_kl | 0.14252666 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.305 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 86410 | -| policy_gradient_loss | -0.00798 | -| std | 0.0791 | -| value_loss | 0.00113 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8643 | -| time_elapsed | 52450 | -| total_timesteps | 1106304 | -| train/ | | -| approx_kl | 0.026266579 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -35.2 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 86420 | -| policy_gradient_loss | -0.00462 | -| std | 0.0792 | -| value_loss | 1.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8644 | -| time_elapsed | 52454 | -| total_timesteps | 1106432 | -| train/ | | -| approx_kl | 0.17031956 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -115 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 86430 | -| policy_gradient_loss | -0.0111 | -| std | 0.0791 | -| value_loss | 7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8645 | -| time_elapsed | 52458 | -| total_timesteps | 1106560 | -| train/ | | -| approx_kl | 0.010951508 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -4.1e+03 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 86440 | -| policy_gradient_loss | -0.0135 | -| std | 0.0791 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8646 | -| time_elapsed | 52460 | -| total_timesteps | 1106688 | -| train/ | | -| approx_kl | 0.027864832 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -4.72 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 86450 | -| policy_gradient_loss | -0.0025 | -| std | 0.0791 | -| value_loss | 4e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8647 | -| time_elapsed | 52465 | -| total_timesteps | 1106816 | -| train/ | | -| approx_kl | 0.0012254957 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 86460 | -| policy_gradient_loss | -0.002 | -| std | 0.0791 | -| value_loss | 4.33e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8648 | -| time_elapsed | 52469 | -| total_timesteps | 1106944 | -| train/ | | -| approx_kl | 0.00021229591 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.00657 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 86470 | -| policy_gradient_loss | -0.00329 | -| std | 0.0792 | -| value_loss | 1e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8649 | -| time_elapsed | 52472 | -| total_timesteps | 1107072 | -| train/ | | -| approx_kl | 0.000702708 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.00463 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 86480 | -| policy_gradient_loss | 0.0012 | -| std | 0.079 | -| value_loss | 7.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8650 | -| time_elapsed | 52479 | -| total_timesteps | 1107200 | -| train/ | | -| approx_kl | 0.03919165 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 86490 | -| policy_gradient_loss | -0.0126 | -| std | 0.0789 | -| value_loss | 0.000817 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8651 | -| time_elapsed | 52483 | -| total_timesteps | 1107328 | -| train/ | | -| approx_kl | 0.15804482 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -244 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 86500 | -| policy_gradient_loss | -0.00536 | -| std | 0.0789 | -| value_loss | 8.7e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8652 | -| time_elapsed | 52486 | -| total_timesteps | 1107456 | -| train/ | | -| approx_kl | 0.047734503 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -299 | -| learning_rate | 0.0003 | -| loss | -0.00066 | -| n_updates | 86510 | -| policy_gradient_loss | -0.00164 | -| std | 0.079 | -| value_loss | 3.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8653 | -| time_elapsed | 52490 | -| total_timesteps | 1107584 | -| train/ | | -| approx_kl | 0.0004451964 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -5.23 | -| learning_rate | 0.0003 | -| loss | -0.0004 | -| n_updates | 86520 | -| policy_gradient_loss | 0.000979 | -| std | 0.079 | -| value_loss | 4.26e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8654 | -| time_elapsed | 52493 | -| total_timesteps | 1107712 | -| train/ | | -| approx_kl | 0.0021428694 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 86530 | -| policy_gradient_loss | -0.000573 | -| std | 0.079 | -| value_loss | 1.38e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8655 | -| time_elapsed | 52497 | -| total_timesteps | 1107840 | -| train/ | | -| approx_kl | 0.0010839296 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.00142 | -| learning_rate | 0.0003 | -| loss | -0.000776 | -| n_updates | 86540 | -| policy_gradient_loss | 0.000131 | -| std | 0.079 | -| value_loss | 4.28e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 8656 | -| time_elapsed | 52500 | -| total_timesteps | 1107968 | -| train/ | | -| approx_kl | 0.007166469 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.00249 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 86550 | -| policy_gradient_loss | -0.00422 | -| std | 0.0792 | -| value_loss | 6.93e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8657 | -| time_elapsed | 52504 | -| total_timesteps | 1108096 | -| train/ | | -| approx_kl | 0.0061878837 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | -0.00647 | -| n_updates | 86560 | -| policy_gradient_loss | -0.00463 | -| std | 0.0793 | -| value_loss | 7.5e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8658 | -| time_elapsed | 52513 | -| total_timesteps | 1108224 | -| train/ | | -| approx_kl | 0.01040443 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.11 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 86570 | -| policy_gradient_loss | -0.0147 | -| std | 0.0794 | -| value_loss | 0.000138 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8659 | -| time_elapsed | 52516 | -| total_timesteps | 1108352 | -| train/ | | -| approx_kl | 0.13381828 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -26.5 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 86580 | -| policy_gradient_loss | -0.00969 | -| std | 0.0793 | -| value_loss | 1.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8660 | -| time_elapsed | 52519 | -| total_timesteps | 1108480 | -| train/ | | -| approx_kl | 0.029358165 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -126 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 86590 | -| policy_gradient_loss | -0.00693 | -| std | 0.0793 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8661 | -| time_elapsed | 52522 | -| total_timesteps | 1108608 | -| train/ | | -| approx_kl | 0.030972552 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -9.78 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 86600 | -| policy_gradient_loss | -0.00471 | -| std | 0.0792 | -| value_loss | 2.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8662 | -| time_elapsed | 52525 | -| total_timesteps | 1108736 | -| train/ | | -| approx_kl | 0.0075047337 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.00284 | -| n_updates | 86610 | -| policy_gradient_loss | 0.00127 | -| std | 0.0789 | -| value_loss | 4.99e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8663 | -| time_elapsed | 52529 | -| total_timesteps | 1108864 | -| train/ | | -| approx_kl | 0.0014125248 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 86620 | -| policy_gradient_loss | -0.00129 | -| std | 0.0787 | -| value_loss | 5.73e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 8664 | -| time_elapsed | 52532 | -| total_timesteps | 1108992 | -| train/ | | -| approx_kl | 0.010816928 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.000956 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 86630 | -| policy_gradient_loss | -0.00165 | -| std | 0.0786 | -| value_loss | 5.27e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8665 | -| time_elapsed | 52535 | -| total_timesteps | 1109120 | -| train/ | | -| approx_kl | 3.3475924e-05 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.000126 | -| n_updates | 86640 | -| policy_gradient_loss | 0.00208 | -| std | 0.0786 | -| value_loss | 1.59e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8666 | -| time_elapsed | 52544 | -| total_timesteps | 1109248 | -| train/ | | -| approx_kl | 0.034419406 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 86650 | -| policy_gradient_loss | -0.0135 | -| std | 0.0786 | -| value_loss | 0.000275 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8667 | -| time_elapsed | 52548 | -| total_timesteps | 1109376 | -| train/ | | -| approx_kl | 0.10967977 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.12 | -| explained_variance | -36.1 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 86660 | -| policy_gradient_loss | -0.00553 | -| std | 0.0785 | -| value_loss | 1.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8668 | -| time_elapsed | 52553 | -| total_timesteps | 1109504 | -| train/ | | -| approx_kl | 0.041671418 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 1.13 | -| explained_variance | -99 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 86670 | -| policy_gradient_loss | -0.014 | -| std | 0.0785 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8669 | -| time_elapsed | 52556 | -| total_timesteps | 1109632 | -| train/ | | -| approx_kl | 0.0058873286 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 1.13 | -| explained_variance | -13.6 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 86680 | -| policy_gradient_loss | -0.00455 | -| std | 0.0785 | -| value_loss | 1.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8670 | -| time_elapsed | 52560 | -| total_timesteps | 1109760 | -| train/ | | -| approx_kl | 0.047392644 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.13 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 86690 | -| policy_gradient_loss | -0.00781 | -| std | 0.0785 | -| value_loss | 5.92e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8671 | -| time_elapsed | 52563 | -| total_timesteps | 1109888 | -| train/ | | -| approx_kl | 0.0024266941 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 1.13 | -| explained_variance | -0.559 | -| learning_rate | 0.0003 | -| loss | -0.000754 | -| n_updates | 86700 | -| policy_gradient_loss | -0.000338 | -| std | 0.0781 | -| value_loss | 2.24e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8672 | -| time_elapsed | 52568 | -| total_timesteps | 1110016 | -| train/ | | -| approx_kl | 0.0077116503 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 1.13 | -| explained_variance | -0.088 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 86710 | -| policy_gradient_loss | -0.00516 | -| std | 0.0778 | -| value_loss | 1.07e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8673 | -| time_elapsed | 52576 | -| total_timesteps | 1110144 | -| train/ | | -| approx_kl | 0.11420196 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | 0.547 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 86720 | -| policy_gradient_loss | -0.0138 | -| std | 0.0777 | -| value_loss | 0.000836 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8674 | -| time_elapsed | 52579 | -| total_timesteps | 1110272 | -| train/ | | -| approx_kl | 0.003113395 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 86730 | -| policy_gradient_loss | -0.0015 | -| std | 0.0775 | -| value_loss | 3.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8675 | -| time_elapsed | 52583 | -| total_timesteps | 1110400 | -| train/ | | -| approx_kl | 0.04734871 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -519 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 86740 | -| policy_gradient_loss | -0.00384 | -| std | 0.0774 | -| value_loss | 2.29e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8676 | -| time_elapsed | 52585 | -| total_timesteps | 1110528 | -| train/ | | -| approx_kl | 0.0016060448 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -61.6 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 86750 | -| policy_gradient_loss | -0.00107 | -| std | 0.0772 | -| value_loss | 2.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8677 | -| time_elapsed | 52587 | -| total_timesteps | 1110656 | -| train/ | | -| approx_kl | 0.013456625 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -6.94 | -| learning_rate | 0.0003 | -| loss | -0.00648 | -| n_updates | 86760 | -| policy_gradient_loss | -0.00463 | -| std | 0.0771 | -| value_loss | 4.41e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8678 | -| time_elapsed | 52589 | -| total_timesteps | 1110784 | -| train/ | | -| approx_kl | 0.0004643863 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -0.726 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 86770 | -| policy_gradient_loss | -0.000625 | -| std | 0.077 | -| value_loss | 1.15e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 8679 | -| time_elapsed | 52591 | -| total_timesteps | 1110912 | -| train/ | | -| approx_kl | 0.00017242273 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.00602 | -| learning_rate | 0.0003 | -| loss | -0.000175 | -| n_updates | 86780 | -| policy_gradient_loss | 5.29e-06 | -| std | 0.0768 | -| value_loss | 4.32e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8680 | -| time_elapsed | 52593 | -| total_timesteps | 1111040 | -| train/ | | -| approx_kl | 0.0019934694 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.00256 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 86790 | -| policy_gradient_loss | 0.000263 | -| std | 0.0767 | -| value_loss | 1.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8681 | -| time_elapsed | 52600 | -| total_timesteps | 1111168 | -| train/ | | -| approx_kl | 0.020025283 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.776 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 86800 | -| policy_gradient_loss | -0.00386 | -| std | 0.0766 | -| value_loss | 0.00366 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8682 | -| time_elapsed | 52604 | -| total_timesteps | 1111296 | -| train/ | | -| approx_kl | 6.788876e-06 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -44.9 | -| learning_rate | 0.0003 | -| loss | -0.000966 | -| n_updates | 86810 | -| policy_gradient_loss | -0.00924 | -| std | 0.0764 | -| value_loss | 1.22e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8683 | -| time_elapsed | 52608 | -| total_timesteps | 1111424 | -| train/ | | -| approx_kl | 0.03593257 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -4.44e+03 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 86820 | -| policy_gradient_loss | -0.0119 | -| std | 0.0763 | -| value_loss | 2.55e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8684 | -| time_elapsed | 52612 | -| total_timesteps | 1111552 | -| train/ | | -| approx_kl | 0.068148024 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -5.26e+03 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 86830 | -| policy_gradient_loss | -0.000674 | -| std | 0.0765 | -| value_loss | 1.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8685 | -| time_elapsed | 52615 | -| total_timesteps | 1111680 | -| train/ | | -| approx_kl | 0.034836948 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -366 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 86840 | -| policy_gradient_loss | 0.00139 | -| std | 0.0767 | -| value_loss | 7.01e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8686 | -| time_elapsed | 52617 | -| total_timesteps | 1111808 | -| train/ | | -| approx_kl | 0.0012313733 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -128 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 86850 | -| policy_gradient_loss | -0.00108 | -| std | 0.0767 | -| value_loss | 1.48e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 8687 | -| time_elapsed | 52620 | -| total_timesteps | 1111936 | -| train/ | | -| approx_kl | 0.007627305 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 86860 | -| policy_gradient_loss | 0.000277 | -| std | 0.0769 | -| value_loss | 2.36e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8688 | -| time_elapsed | 52622 | -| total_timesteps | 1112064 | -| train/ | | -| approx_kl | 0.0023083328 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 86870 | -| policy_gradient_loss | 0.00266 | -| std | 0.0771 | -| value_loss | 2.84e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8689 | -| time_elapsed | 52628 | -| total_timesteps | 1112192 | -| train/ | | -| approx_kl | 0.049245518 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 86880 | -| policy_gradient_loss | -0.00272 | -| std | 0.0771 | -| value_loss | 0.0021 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8690 | -| time_elapsed | 52631 | -| total_timesteps | 1112320 | -| train/ | | -| approx_kl | 0.032190993 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -158 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 86890 | -| policy_gradient_loss | -0.00317 | -| std | 0.0771 | -| value_loss | 2.17e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8691 | -| time_elapsed | 52635 | -| total_timesteps | 1112448 | -| train/ | | -| approx_kl | 0.17069529 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -246 | -| learning_rate | 0.0003 | -| loss | 0.000912 | -| n_updates | 86900 | -| policy_gradient_loss | -0.00154 | -| std | 0.0773 | -| value_loss | 7.59e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8692 | -| time_elapsed | 52640 | -| total_timesteps | 1112576 | -| train/ | | -| approx_kl | 0.00061174063 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.000553 | -| n_updates | 86910 | -| policy_gradient_loss | -0.000455 | -| std | 0.0772 | -| value_loss | 2.65e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8693 | -| time_elapsed | 52643 | -| total_timesteps | 1112704 | -| train/ | | -| approx_kl | 0.000980346 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.14 | -| explained_variance | -0.0837 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 86920 | -| policy_gradient_loss | 0.00134 | -| std | 0.0771 | -| value_loss | 2.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8694 | -| time_elapsed | 52646 | -| total_timesteps | 1112832 | -| train/ | | -| approx_kl | 0.0010394515 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -0.0076 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 86930 | -| policy_gradient_loss | 0.00428 | -| std | 0.0769 | -| value_loss | 6.41e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 8695 | -| time_elapsed | 52649 | -| total_timesteps | 1112960 | -| train/ | | -| approx_kl | 0.0012825695 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 86940 | -| policy_gradient_loss | -0.00313 | -| std | 0.0766 | -| value_loss | 1.08e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8696 | -| time_elapsed | 52651 | -| total_timesteps | 1113088 | -| train/ | | -| approx_kl | 0.020476924 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.00025 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 86950 | -| policy_gradient_loss | -0.0051 | -| std | 0.0765 | -| value_loss | 5.91e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8697 | -| time_elapsed | 52658 | -| total_timesteps | 1113216 | -| train/ | | -| approx_kl | 0.016470175 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0262 | -| n_updates | 86960 | -| policy_gradient_loss | -0.0189 | -| std | 0.0765 | -| value_loss | 9.04e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8698 | -| time_elapsed | 52663 | -| total_timesteps | 1113344 | -| train/ | | -| approx_kl | 0.0029713144 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 86970 | -| policy_gradient_loss | 0.000793 | -| std | 0.0763 | -| value_loss | 1.04e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8699 | -| time_elapsed | 52668 | -| total_timesteps | 1113472 | -| train/ | | -| approx_kl | 0.0067329863 | -| clip_fraction | 0.0125 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -0.454 | -| learning_rate | 0.0003 | -| loss | -0.000135 | -| n_updates | 86980 | -| policy_gradient_loss | -0.00131 | -| std | 0.0763 | -| value_loss | 1.97e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8700 | -| time_elapsed | 52671 | -| total_timesteps | 1113600 | -| train/ | | -| approx_kl | 0.0103362575 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 86990 | -| policy_gradient_loss | -0.00762 | -| std | 0.0763 | -| value_loss | 1.58e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8701 | -| time_elapsed | 52675 | -| total_timesteps | 1113728 | -| train/ | | -| approx_kl | 0.0111019 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.00243 | -| learning_rate | 0.0003 | -| loss | -0.00615 | -| n_updates | 87000 | -| policy_gradient_loss | -0.0054 | -| std | 0.0763 | -| value_loss | 9.89e-05 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8702 | -| time_elapsed | 52678 | -| total_timesteps | 1113856 | -| train/ | | -| approx_kl | 0.00023358269 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -0.915 | -| learning_rate | 0.0003 | -| loss | -0.000194 | -| n_updates | 87010 | -| policy_gradient_loss | 0.000595 | -| std | 0.0763 | -| value_loss | 1.02e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 8703 | -| time_elapsed | 52681 | -| total_timesteps | 1113984 | -| train/ | | -| approx_kl | 0.0008654725 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 87020 | -| policy_gradient_loss | 0.00125 | -| std | 0.0762 | -| value_loss | 2.99e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8704 | -| time_elapsed | 52684 | -| total_timesteps | 1114112 | -| train/ | | -| approx_kl | 0.0054435753 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 87030 | -| policy_gradient_loss | -0.00625 | -| std | 0.0762 | -| value_loss | 2.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8705 | -| time_elapsed | 52691 | -| total_timesteps | 1114240 | -| train/ | | -| approx_kl | 0.022421286 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 87040 | -| policy_gradient_loss | -0.0161 | -| std | 0.0762 | -| value_loss | 0.000786 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8706 | -| time_elapsed | 52695 | -| total_timesteps | 1114368 | -| train/ | | -| approx_kl | 0.017887097 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -195 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 87050 | -| policy_gradient_loss | -0.0121 | -| std | 0.0762 | -| value_loss | 1.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8707 | -| time_elapsed | 52698 | -| total_timesteps | 1114496 | -| train/ | | -| approx_kl | 0.005731895 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -118 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 87060 | -| policy_gradient_loss | 0.00062 | -| std | 0.0763 | -| value_loss | 7.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8708 | -| time_elapsed | 52701 | -| total_timesteps | 1114624 | -| train/ | | -| approx_kl | 0.016636416 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 87070 | -| policy_gradient_loss | -0.00368 | -| std | 0.0763 | -| value_loss | 5.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8709 | -| time_elapsed | 52703 | -| total_timesteps | 1114752 | -| train/ | | -| approx_kl | 0.003470031 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -3.77 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 87080 | -| policy_gradient_loss | 0.00129 | -| std | 0.0764 | -| value_loss | 6.77e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 8710 | -| time_elapsed | 52707 | -| total_timesteps | 1114880 | -| train/ | | -| approx_kl | 0.0037380029 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.00214 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 87090 | -| policy_gradient_loss | -0.00855 | -| std | 0.0764 | -| value_loss | 2.38e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8711 | -| time_elapsed | 52710 | -| total_timesteps | 1115008 | -| train/ | | -| approx_kl | 0.0028804233 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 87100 | -| policy_gradient_loss | -0.00897 | -| std | 0.0764 | -| value_loss | 2.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8712 | -| time_elapsed | 52720 | -| total_timesteps | 1115136 | -| train/ | | -| approx_kl | 0.019052517 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 87110 | -| policy_gradient_loss | -0.0114 | -| std | 0.0765 | -| value_loss | 3.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8713 | -| time_elapsed | 52724 | -| total_timesteps | 1115264 | -| train/ | | -| approx_kl | 0.011190118 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -1.78 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 87120 | -| policy_gradient_loss | -0.00184 | -| std | 0.0765 | -| value_loss | 7.25e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8714 | -| time_elapsed | 52728 | -| total_timesteps | 1115392 | -| train/ | | -| approx_kl | 0.00018010009 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 1.15 | -| explained_variance | -4.68 | -| learning_rate | 0.0003 | -| loss | -0.000527 | -| n_updates | 87130 | -| policy_gradient_loss | 8.98e-05 | -| std | 0.0762 | -| value_loss | 7.03e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8715 | -| time_elapsed | 52732 | -| total_timesteps | 1115520 | -| train/ | | -| approx_kl | 0.00023395568 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | 0.000873 | -| n_updates | 87140 | -| policy_gradient_loss | 0.00146 | -| std | 0.076 | -| value_loss | 4.14e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8716 | -| time_elapsed | 52735 | -| total_timesteps | 1115648 | -| train/ | | -| approx_kl | 0.010751329 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -6.55 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 87150 | -| policy_gradient_loss | -0.0107 | -| std | 0.0759 | -| value_loss | 1.6e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8717 | -| time_elapsed | 52740 | -| total_timesteps | 1115776 | -| train/ | | -| approx_kl | 0.0026195613 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | -0.391 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 87160 | -| policy_gradient_loss | -0.000561 | -| std | 0.0758 | -| value_loss | 5.05e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8718 | -| time_elapsed | 52744 | -| total_timesteps | 1115904 | -| train/ | | -| approx_kl | 0.0011901362 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | 0.00432 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 87170 | -| policy_gradient_loss | 0.000358 | -| std | 0.0758 | -| value_loss | 8.11e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8719 | -| time_elapsed | 52748 | -| total_timesteps | 1116032 | -| train/ | | -| approx_kl | 0.000273515 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | 0.00339 | -| learning_rate | 0.0003 | -| loss | -0.000985 | -| n_updates | 87180 | -| policy_gradient_loss | 0.000364 | -| std | 0.0757 | -| value_loss | 2.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8720 | -| time_elapsed | 52756 | -| total_timesteps | 1116160 | -| train/ | | -| approx_kl | 0.01220304 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 1.16 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.00863 | -| n_updates | 87190 | -| policy_gradient_loss | -0.00645 | -| std | 0.0755 | -| value_loss | 0.000165 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8721 | -| time_elapsed | 52760 | -| total_timesteps | 1116288 | -| train/ | | -| approx_kl | 0.008624433 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | -0.00982 | -| n_updates | 87200 | -| policy_gradient_loss | -0.00525 | -| std | 0.0753 | -| value_loss | 1.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8722 | -| time_elapsed | 52763 | -| total_timesteps | 1116416 | -| train/ | | -| approx_kl | 0.008582091 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -3.12 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 87210 | -| policy_gradient_loss | -0.00066 | -| std | 0.0752 | -| value_loss | 9.95e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8723 | -| time_elapsed | 52766 | -| total_timesteps | 1116544 | -| train/ | | -| approx_kl | 1.5133526e-05 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | -0.000174 | -| n_updates | 87220 | -| policy_gradient_loss | 0.000762 | -| std | 0.0753 | -| value_loss | 0.000239 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8724 | -| time_elapsed | 52770 | -| total_timesteps | 1116672 | -| train/ | | -| approx_kl | 0.00034469645 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | -0.000272 | -| n_updates | 87230 | -| policy_gradient_loss | -0.000728 | -| std | 0.0754 | -| value_loss | 0.000309 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8725 | -| time_elapsed | 52772 | -| total_timesteps | 1116800 | -| train/ | | -| approx_kl | 0.0013329401 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.00262 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 87240 | -| policy_gradient_loss | -0.00376 | -| std | 0.0754 | -| value_loss | 0.000934 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 8726 | -| time_elapsed | 52776 | -| total_timesteps | 1116928 | -| train/ | | -| approx_kl | 0.0027217367 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 87250 | -| policy_gradient_loss | -0.00998 | -| std | 0.0754 | -| value_loss | 0.000984 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8727 | -| time_elapsed | 52780 | -| total_timesteps | 1117056 | -| train/ | | -| approx_kl | 0.0003096969 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.00299 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 87260 | -| policy_gradient_loss | -0.00355 | -| std | 0.0754 | -| value_loss | 0.000181 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8728 | -| time_elapsed | 52786 | -| total_timesteps | 1117184 | -| train/ | | -| approx_kl | 0.024629753 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.624 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 87270 | -| policy_gradient_loss | -0.0124 | -| std | 0.0754 | -| value_loss | 0.00188 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8729 | -| time_elapsed | 52789 | -| total_timesteps | 1117312 | -| train/ | | -| approx_kl | 0.00031142868 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 87280 | -| policy_gradient_loss | 0.00178 | -| std | 0.0752 | -| value_loss | 0.00172 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8730 | -| time_elapsed | 52792 | -| total_timesteps | 1117440 | -| train/ | | -| approx_kl | 0.0020042928 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.0039 | -| learning_rate | 0.0003 | -| loss | -0.000873 | -| n_updates | 87290 | -| policy_gradient_loss | -0.00617 | -| std | 0.075 | -| value_loss | 0.0239 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8731 | -| time_elapsed | 52795 | -| total_timesteps | 1117568 | -| train/ | | -| approx_kl | 0.002975542 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.000159 | -| learning_rate | 0.0003 | -| loss | -0.00028 | -| n_updates | 87300 | -| policy_gradient_loss | -0.00561 | -| std | 0.0749 | -| value_loss | 0.00412 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8732 | -| time_elapsed | 52798 | -| total_timesteps | 1117696 | -| train/ | | -| approx_kl | 0.00038063806 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 87310 | -| policy_gradient_loss | 0.00542 | -| std | 0.0749 | -| value_loss | 0.00468 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8733 | -| time_elapsed | 52801 | -| total_timesteps | 1117824 | -| train/ | | -| approx_kl | 0.008737159 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.00809 | -| n_updates | 87320 | -| policy_gradient_loss | -0.00546 | -| std | 0.0749 | -| value_loss | 0.0356 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8734 | -| time_elapsed | 52804 | -| total_timesteps | 1117952 | -| train/ | | -| approx_kl | 0.037115462 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.00276 | -| learning_rate | 0.0003 | -| loss | 0.0041 | -| n_updates | 87330 | -| policy_gradient_loss | -0.00653 | -| std | 0.0749 | -| value_loss | 0.0187 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8735 | -| time_elapsed | 52808 | -| total_timesteps | 1118080 | -| train/ | | -| approx_kl | 3.3038203e-05 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.65 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 87340 | -| policy_gradient_loss | -0.00154 | -| std | 0.0749 | -| value_loss | 0.00411 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8736 | -| time_elapsed | 52814 | -| total_timesteps | 1118208 | -| train/ | | -| approx_kl | 0.0076247384 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 87350 | -| policy_gradient_loss | -0.00692 | -| std | 0.0749 | -| value_loss | 0.00251 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8737 | -| time_elapsed | 52816 | -| total_timesteps | 1118336 | -| train/ | | -| approx_kl | 0.0012763953 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 87360 | -| policy_gradient_loss | -0.000612 | -| std | 0.0751 | -| value_loss | 0.000268 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8738 | -| time_elapsed | 52818 | -| total_timesteps | 1118464 | -| train/ | | -| approx_kl | 0.0012268052 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 87370 | -| policy_gradient_loss | -0.00619 | -| std | 0.0752 | -| value_loss | 0.000639 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8739 | -| time_elapsed | 52821 | -| total_timesteps | 1118592 | -| train/ | | -| approx_kl | 8.009374e-07 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.00309 | -| learning_rate | 0.0003 | -| loss | -3.72e-06 | -| n_updates | 87380 | -| policy_gradient_loss | -0.00132 | -| std | 0.0752 | -| value_loss | 8.84e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8740 | -| time_elapsed | 52824 | -| total_timesteps | 1118720 | -| train/ | | -| approx_kl | 0.0045799464 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 87390 | -| policy_gradient_loss | -0.0111 | -| std | 0.0752 | -| value_loss | 6.61e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8741 | -| time_elapsed | 52826 | -| total_timesteps | 1118848 | -| train/ | | -| approx_kl | 0.013784808 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 87400 | -| policy_gradient_loss | -0.00951 | -| std | 0.0752 | -| value_loss | 4.02e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 8742 | -| time_elapsed | 52829 | -| total_timesteps | 1118976 | -| train/ | | -| approx_kl | 0.0030667656 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 87410 | -| policy_gradient_loss | -0.00192 | -| std | 0.0752 | -| value_loss | 2.55e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8743 | -| time_elapsed | 52832 | -| total_timesteps | 1119104 | -| train/ | | -| approx_kl | 2.3690052e-05 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.000193 | -| n_updates | 87420 | -| policy_gradient_loss | 0.00101 | -| std | 0.0752 | -| value_loss | 1.62e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8744 | -| time_elapsed | 52839 | -| total_timesteps | 1119232 | -| train/ | | -| approx_kl | 0.03843382 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -4.13 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 87430 | -| policy_gradient_loss | -0.0143 | -| std | 0.0752 | -| value_loss | 0.00383 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8745 | -| time_elapsed | 52843 | -| total_timesteps | 1119360 | -| train/ | | -| approx_kl | 0.0021657627 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.72 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 87440 | -| policy_gradient_loss | -0.00386 | -| std | 0.0751 | -| value_loss | 2.08e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8746 | -| time_elapsed | 52846 | -| total_timesteps | 1119488 | -| train/ | | -| approx_kl | 0.01644386 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | -0.00746 | -| n_updates | 87450 | -| policy_gradient_loss | 0.00175 | -| std | 0.0751 | -| value_loss | 7.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8747 | -| time_elapsed | 52849 | -| total_timesteps | 1119616 | -| train/ | | -| approx_kl | 0.039437518 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.412 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 87460 | -| policy_gradient_loss | 0.00477 | -| std | 0.0751 | -| value_loss | 3e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8748 | -| time_elapsed | 52853 | -| total_timesteps | 1119744 | -| train/ | | -| approx_kl | 0.0012061326 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 87470 | -| policy_gradient_loss | -0.00156 | -| std | 0.0751 | -| value_loss | 1.39e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 8749 | -| time_elapsed | 52857 | -| total_timesteps | 1119872 | -| train/ | | -| approx_kl | 4.4349115e-05 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0679 | -| learning_rate | 0.0003 | -| loss | -2.7e-05 | -| n_updates | 87480 | -| policy_gradient_loss | 0.000489 | -| std | 0.0751 | -| value_loss | 1.83e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8750 | -| time_elapsed | 52861 | -| total_timesteps | 1120000 | -| train/ | | -| approx_kl | 0.051350955 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 87490 | -| policy_gradient_loss | -0.015 | -| std | 0.0751 | -| value_loss | 1.59e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8751 | -| time_elapsed | 52864 | -| total_timesteps | 1120128 | -| train/ | | -| approx_kl | 0.010009079 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.00282 | -| learning_rate | 0.0003 | -| loss | -0.000971 | -| n_updates | 87500 | -| policy_gradient_loss | 0.000526 | -| std | 0.0751 | -| value_loss | 1.02e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8752 | -| time_elapsed | 52871 | -| total_timesteps | 1120256 | -| train/ | | -| approx_kl | 0.024950145 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -4.68 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 87510 | -| policy_gradient_loss | -0.0101 | -| std | 0.0751 | -| value_loss | 0.00312 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8753 | -| time_elapsed | 52876 | -| total_timesteps | 1120384 | -| train/ | | -| approx_kl | 0.0017714174 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 87520 | -| policy_gradient_loss | -0.000863 | -| std | 0.0751 | -| value_loss | 1.53e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8754 | -| time_elapsed | 52879 | -| total_timesteps | 1120512 | -| train/ | | -| approx_kl | 5.669892e-05 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -8.79 | -| learning_rate | 0.0003 | -| loss | -0.000156 | -| n_updates | 87530 | -| policy_gradient_loss | 1.68e-05 | -| std | 0.075 | -| value_loss | 7.31e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8755 | -| time_elapsed | 52884 | -| total_timesteps | 1120640 | -| train/ | | -| approx_kl | 0.00022293162 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.621 | -| learning_rate | 0.0003 | -| loss | -0.000276 | -| n_updates | 87540 | -| policy_gradient_loss | 0.000577 | -| std | 0.0748 | -| value_loss | 2.8e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8756 | -| time_elapsed | 52887 | -| total_timesteps | 1120768 | -| train/ | | -| approx_kl | 0.0032053431 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 87550 | -| policy_gradient_loss | -0.00202 | -| std | 0.0748 | -| value_loss | 5.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8757 | -| time_elapsed | 52890 | -| total_timesteps | 1120896 | -| train/ | | -| approx_kl | 0.001432064 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.00737 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 87560 | -| policy_gradient_loss | 4.51e-05 | -| std | 0.0747 | -| value_loss | 9.7e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8758 | -| time_elapsed | 52894 | -| total_timesteps | 1121024 | -| train/ | | -| approx_kl | 0.0038955351 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 87570 | -| policy_gradient_loss | -0.00181 | -| std | 0.0748 | -| value_loss | 4.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8759 | -| time_elapsed | 52903 | -| total_timesteps | 1121152 | -| train/ | | -| approx_kl | 0.030400906 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.953 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 87580 | -| policy_gradient_loss | -0.0152 | -| std | 0.0749 | -| value_loss | 0.000443 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8760 | -| time_elapsed | 52907 | -| total_timesteps | 1121280 | -| train/ | | -| approx_kl | 0.010582071 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 87590 | -| policy_gradient_loss | -0.0173 | -| std | 0.0749 | -| value_loss | 1.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8761 | -| time_elapsed | 52910 | -| total_timesteps | 1121408 | -| train/ | | -| approx_kl | 0.07473961 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -1.69e+03 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 87600 | -| policy_gradient_loss | -0.00913 | -| std | 0.0749 | -| value_loss | 1.26e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8762 | -| time_elapsed | 52913 | -| total_timesteps | 1121536 | -| train/ | | -| approx_kl | 0.0019484009 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -8.12 | -| learning_rate | 0.0003 | -| loss | -0.00909 | -| n_updates | 87610 | -| policy_gradient_loss | -0.0116 | -| std | 0.075 | -| value_loss | 2.13e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8763 | -| time_elapsed | 52915 | -| total_timesteps | 1121664 | -| train/ | | -| approx_kl | 0.085146256 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -19.9 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 87620 | -| policy_gradient_loss | -0.0021 | -| std | 0.075 | -| value_loss | 1.15e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8764 | -| time_elapsed | 52918 | -| total_timesteps | 1121792 | -| train/ | | -| approx_kl | 0.00045414641 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -15 | -| learning_rate | 0.0003 | -| loss | 0.000122 | -| n_updates | 87630 | -| policy_gradient_loss | 0.000203 | -| std | 0.0749 | -| value_loss | 1.37e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8765 | -| time_elapsed | 52921 | -| total_timesteps | 1121920 | -| train/ | | -| approx_kl | 0.00038421992 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.502 | -| learning_rate | 0.0003 | -| loss | -0.000784 | -| n_updates | 87640 | -| policy_gradient_loss | 0.00153 | -| std | 0.0749 | -| value_loss | 2.54e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8766 | -| time_elapsed | 52925 | -| total_timesteps | 1122048 | -| train/ | | -| approx_kl | 0.00013260683 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0734 | -| learning_rate | 0.0003 | -| loss | -0.00088 | -| n_updates | 87650 | -| policy_gradient_loss | -0.000683 | -| std | 0.0749 | -| value_loss | 8.12e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8767 | -| time_elapsed | 52932 | -| total_timesteps | 1122176 | -| train/ | | -| approx_kl | 0.048203114 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 87660 | -| policy_gradient_loss | -0.0158 | -| std | 0.0748 | -| value_loss | 0.000312 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8768 | -| time_elapsed | 52935 | -| total_timesteps | 1122304 | -| train/ | | -| approx_kl | 0.05975151 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -24.8 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 87670 | -| policy_gradient_loss | -0.0101 | -| std | 0.0748 | -| value_loss | 7.43e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8769 | -| time_elapsed | 52937 | -| total_timesteps | 1122432 | -| train/ | | -| approx_kl | 0.00858939 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -67 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 87680 | -| policy_gradient_loss | -0.0116 | -| std | 0.0748 | -| value_loss | 5.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8770 | -| time_elapsed | 52940 | -| total_timesteps | 1122560 | -| train/ | | -| approx_kl | 0.003338568 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 87690 | -| policy_gradient_loss | -0.0111 | -| std | 0.0749 | -| value_loss | 8.1e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8771 | -| time_elapsed | 52943 | -| total_timesteps | 1122688 | -| train/ | | -| approx_kl | 0.0021708813 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -3.25 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 87700 | -| policy_gradient_loss | -0.00347 | -| std | 0.0749 | -| value_loss | 1.68e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8772 | -| time_elapsed | 52946 | -| total_timesteps | 1122816 | -| train/ | | -| approx_kl | 0.013457632 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.649 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 87710 | -| policy_gradient_loss | 0.000747 | -| std | 0.0749 | -| value_loss | 6.76e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8773 | -| time_elapsed | 52949 | -| total_timesteps | 1122944 | -| train/ | | -| approx_kl | 0.00072348956 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.000834 | -| n_updates | 87720 | -| policy_gradient_loss | 0.00759 | -| std | 0.0748 | -| value_loss | 3.06e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8774 | -| time_elapsed | 52951 | -| total_timesteps | 1123072 | -| train/ | | -| approx_kl | 0.0073526227 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.17 | -| explained_variance | -0.0716 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 87730 | -| policy_gradient_loss | -0.00638 | -| std | 0.0747 | -| value_loss | 3.02e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8775 | -| time_elapsed | 52957 | -| total_timesteps | 1123200 | -| train/ | | -| approx_kl | 0.20264697 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 87740 | -| policy_gradient_loss | -0.0149 | -| std | 0.0747 | -| value_loss | 2.7e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8776 | -| time_elapsed | 52961 | -| total_timesteps | 1123328 | -| train/ | | -| approx_kl | 6.4174645e-05 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | -1.88 | -| learning_rate | 0.0003 | -| loss | -0.000238 | -| n_updates | 87750 | -| policy_gradient_loss | 7.34e-05 | -| std | 0.0747 | -| value_loss | 8.8e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8777 | -| time_elapsed | 52965 | -| total_timesteps | 1123456 | -| train/ | | -| approx_kl | 0.006620277 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | -9.9 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 87760 | -| policy_gradient_loss | -0.014 | -| std | 0.0746 | -| value_loss | 6.25e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8778 | -| time_elapsed | 52967 | -| total_timesteps | 1123584 | -| train/ | | -| approx_kl | 0.0041258126 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | -2.98 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 87770 | -| policy_gradient_loss | -0.00223 | -| std | 0.0746 | -| value_loss | 1.2e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8779 | -| time_elapsed | 52968 | -| total_timesteps | 1123712 | -| train/ | | -| approx_kl | 2.106186e-06 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | -0.555 | -| learning_rate | 0.0003 | -| loss | 1.5e-05 | -| n_updates | 87780 | -| policy_gradient_loss | 0.00467 | -| std | 0.0746 | -| value_loss | 6.31e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8780 | -| time_elapsed | 52970 | -| total_timesteps | 1123840 | -| train/ | | -| approx_kl | 0.0022291183 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 87790 | -| policy_gradient_loss | -0.00314 | -| std | 0.0746 | -| value_loss | 6.71e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 8781 | -| time_elapsed | 52972 | -| total_timesteps | 1123968 | -| train/ | | -| approx_kl | 0.00010458194 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.18 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 87800 | -| policy_gradient_loss | -0.000993 | -| std | 0.0738 | -| value_loss | 2.83e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8782 | -| time_elapsed | 52976 | -| total_timesteps | 1124096 | -| train/ | | -| approx_kl | 0.0011999505 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.19 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00289 | -| n_updates | 87810 | -| policy_gradient_loss | -0.00189 | -| std | 0.0732 | -| value_loss | 6.03e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8783 | -| time_elapsed | 52983 | -| total_timesteps | 1124224 | -| train/ | | -| approx_kl | 0.02088827 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 1.2 | -| explained_variance | -4.63 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 87820 | -| policy_gradient_loss | -0.0131 | -| std | 0.073 | -| value_loss | 0.00288 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8784 | -| time_elapsed | 52987 | -| total_timesteps | 1124352 | -| train/ | | -| approx_kl | 0.018847004 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 1.2 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 87830 | -| policy_gradient_loss | -0.0118 | -| std | 0.0729 | -| value_loss | 3.18e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8785 | -| time_elapsed | 52990 | -| total_timesteps | 1124480 | -| train/ | | -| approx_kl | 0.02983303 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 1.2 | -| explained_variance | -2.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 87840 | -| policy_gradient_loss | -0.003 | -| std | 0.0729 | -| value_loss | 1.54e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8786 | -| time_elapsed | 52994 | -| total_timesteps | 1124608 | -| train/ | | -| approx_kl | 0.04615152 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 1.2 | -| explained_variance | -490 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 87850 | -| policy_gradient_loss | -0.00973 | -| std | 0.0728 | -| value_loss | 3.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8787 | -| time_elapsed | 52998 | -| total_timesteps | 1124736 | -| train/ | | -| approx_kl | 0.005285583 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 1.2 | -| explained_variance | -5.43e+03 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 87860 | -| policy_gradient_loss | -0.00127 | -| std | 0.0728 | -| value_loss | 8.69e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8788 | -| time_elapsed | 53001 | -| total_timesteps | 1124864 | -| train/ | | -| approx_kl | 0.0006766771 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.2 | -| explained_variance | -25 | -| learning_rate | 0.0003 | -| loss | -0.000464 | -| n_updates | 87870 | -| policy_gradient_loss | -0.000207 | -| std | 0.0724 | -| value_loss | 6.47e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8789 | -| time_elapsed | 53005 | -| total_timesteps | 1124992 | -| train/ | | -| approx_kl | 0.00079124235 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -0.802 | -| learning_rate | 0.0003 | -| loss | -0.000717 | -| n_updates | 87880 | -| policy_gradient_loss | -0.000191 | -| std | 0.0721 | -| value_loss | 5.44e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8790 | -| time_elapsed | 53009 | -| total_timesteps | 1125120 | -| train/ | | -| approx_kl | 0.0026384527 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | 0.000373 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 87890 | -| policy_gradient_loss | 0.00247 | -| std | 0.072 | -| value_loss | 7.39e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8791 | -| time_elapsed | 53018 | -| total_timesteps | 1125248 | -| train/ | | -| approx_kl | 0.027060747 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 87900 | -| policy_gradient_loss | -0.0128 | -| std | 0.072 | -| value_loss | 0.000592 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8792 | -| time_elapsed | 53021 | -| total_timesteps | 1125376 | -| train/ | | -| approx_kl | 0.003310151 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -3.02 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 87910 | -| policy_gradient_loss | -0.0146 | -| std | 0.072 | -| value_loss | 3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8793 | -| time_elapsed | 53024 | -| total_timesteps | 1125504 | -| train/ | | -| approx_kl | 0.009667618 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 87920 | -| policy_gradient_loss | -0.0143 | -| std | 0.0719 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8794 | -| time_elapsed | 53031 | -| total_timesteps | 1125632 | -| train/ | | -| approx_kl | 0.0032575256 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -2.08 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 87930 | -| policy_gradient_loss | -0.00121 | -| std | 0.0719 | -| value_loss | 1.95e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8795 | -| time_elapsed | 53035 | -| total_timesteps | 1125760 | -| train/ | | -| approx_kl | 8.028094e-05 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 87940 | -| policy_gradient_loss | -0.00343 | -| std | 0.0719 | -| value_loss | 7.21e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8796 | -| time_elapsed | 53037 | -| total_timesteps | 1125888 | -| train/ | | -| approx_kl | 0.005572222 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -0.439 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 87950 | -| policy_gradient_loss | 0.00248 | -| std | 0.0719 | -| value_loss | 5.03e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8797 | -| time_elapsed | 53040 | -| total_timesteps | 1126016 | -| train/ | | -| approx_kl | 0.0010104426 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | -0.00592 | -| n_updates | 87960 | -| policy_gradient_loss | -0.00935 | -| std | 0.0719 | -| value_loss | 5.31e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8798 | -| time_elapsed | 53049 | -| total_timesteps | 1126144 | -| train/ | | -| approx_kl | 0.04882185 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 87970 | -| policy_gradient_loss | -0.00757 | -| std | 0.0718 | -| value_loss | 0.00105 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8799 | -| time_elapsed | 53053 | -| total_timesteps | 1126272 | -| train/ | | -| approx_kl | 0.008033493 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | 0.298 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 87980 | -| policy_gradient_loss | -0.0133 | -| std | 0.0718 | -| value_loss | 5.41e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8800 | -| time_elapsed | 53056 | -| total_timesteps | 1126400 | -| train/ | | -| approx_kl | 0.0073154806 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -7.82 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 87990 | -| policy_gradient_loss | -0.000449 | -| std | 0.0718 | -| value_loss | 2.01e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8801 | -| time_elapsed | 53060 | -| total_timesteps | 1126528 | -| train/ | | -| approx_kl | 0.07111344 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -2.93 | -| learning_rate | 0.0003 | -| loss | -0.00763 | -| n_updates | 88000 | -| policy_gradient_loss | -0.0079 | -| std | 0.0718 | -| value_loss | 8.11e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8802 | -| time_elapsed | 53063 | -| total_timesteps | 1126656 | -| train/ | | -| approx_kl | 0.004563932 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -1.52 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 88010 | -| policy_gradient_loss | -0.00488 | -| std | 0.0717 | -| value_loss | 1.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8803 | -| time_elapsed | 53067 | -| total_timesteps | 1126784 | -| train/ | | -| approx_kl | 0.025098322 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.358 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 88020 | -| policy_gradient_loss | -0.00871 | -| std | 0.0717 | -| value_loss | 1.12e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8804 | -| time_elapsed | 53071 | -| total_timesteps | 1126912 | -| train/ | | -| approx_kl | 0.00051882677 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | 0.00206 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 88030 | -| policy_gradient_loss | 0.00418 | -| std | 0.0717 | -| value_loss | 6.82e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8805 | -| time_elapsed | 53075 | -| total_timesteps | 1127040 | -| train/ | | -| approx_kl | 4.9625058e-05 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | -0.000209 | -| n_updates | 88040 | -| policy_gradient_loss | 0.00207 | -| std | 0.0718 | -| value_loss | 1.83e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8806 | -| time_elapsed | 53082 | -| total_timesteps | 1127168 | -| train/ | | -| approx_kl | 0.0047060275 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | 0.405 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 88050 | -| policy_gradient_loss | -0.0144 | -| std | 0.0719 | -| value_loss | 0.000984 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8807 | -| time_elapsed | 53084 | -| total_timesteps | 1127296 | -| train/ | | -| approx_kl | 0.009609629 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -2.26e+03 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 88060 | -| policy_gradient_loss | -0.0123 | -| std | 0.072 | -| value_loss | 2.02e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8808 | -| time_elapsed | 53089 | -| total_timesteps | 1127424 | -| train/ | | -| approx_kl | 0.0036866693 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -634 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 88070 | -| policy_gradient_loss | -0.00114 | -| std | 0.0719 | -| value_loss | 5.13e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8809 | -| time_elapsed | 53091 | -| total_timesteps | 1127552 | -| train/ | | -| approx_kl | 0.004159816 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.21 | -| explained_variance | -34.5 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 88080 | -| policy_gradient_loss | -0.000154 | -| std | 0.0718 | -| value_loss | 4.73e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8810 | -| time_elapsed | 53095 | -| total_timesteps | 1127680 | -| train/ | | -| approx_kl | 0.0013115066 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -3.46 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 88090 | -| policy_gradient_loss | 0.000532 | -| std | 0.0716 | -| value_loss | 1.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8811 | -| time_elapsed | 53098 | -| total_timesteps | 1127808 | -| train/ | | -| approx_kl | 0.037059713 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.407 | -| learning_rate | 0.0003 | -| loss | -0.00377 | -| n_updates | 88100 | -| policy_gradient_loss | -0.00363 | -| std | 0.0715 | -| value_loss | 5.06e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8812 | -| time_elapsed | 53101 | -| total_timesteps | 1127936 | -| train/ | | -| approx_kl | 0.0047176555 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.000586 | -| n_updates | 88110 | -| policy_gradient_loss | 0.00085 | -| std | 0.0713 | -| value_loss | 9.07e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8813 | -| time_elapsed | 53104 | -| total_timesteps | 1128064 | -| train/ | | -| approx_kl | 0.003109851 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | 0.000713 | -| learning_rate | 0.0003 | -| loss | -0.000522 | -| n_updates | 88120 | -| policy_gradient_loss | 0.00204 | -| std | 0.0714 | -| value_loss | 1.73e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8814 | -| time_elapsed | 53110 | -| total_timesteps | 1128192 | -| train/ | | -| approx_kl | 0.020861695 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 88130 | -| policy_gradient_loss | -0.0163 | -| std | 0.0714 | -| value_loss | 0.000166 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8815 | -| time_elapsed | 53112 | -| total_timesteps | 1128320 | -| train/ | | -| approx_kl | 0.12524894 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -52.1 | -| learning_rate | 0.0003 | -| loss | -0.00866 | -| n_updates | 88140 | -| policy_gradient_loss | -0.00713 | -| std | 0.0714 | -| value_loss | 1.97e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8816 | -| time_elapsed | 53116 | -| total_timesteps | 1128448 | -| train/ | | -| approx_kl | 0.11726337 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -206 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 88150 | -| policy_gradient_loss | -0.00396 | -| std | 0.0713 | -| value_loss | 1.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8817 | -| time_elapsed | 53119 | -| total_timesteps | 1128576 | -| train/ | | -| approx_kl | 0.007993853 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -47.3 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 88160 | -| policy_gradient_loss | -0.000832 | -| std | 0.0712 | -| value_loss | 1.17e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8818 | -| time_elapsed | 53122 | -| total_timesteps | 1128704 | -| train/ | | -| approx_kl | 0.048231952 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -6.16 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 88170 | -| policy_gradient_loss | -0.00288 | -| std | 0.0711 | -| value_loss | 4.14e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8819 | -| time_elapsed | 53124 | -| total_timesteps | 1128832 | -| train/ | | -| approx_kl | 0.019955404 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -2.61 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 88180 | -| policy_gradient_loss | -0.0139 | -| std | 0.0711 | -| value_loss | 1.9e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8820 | -| time_elapsed | 53127 | -| total_timesteps | 1128960 | -| train/ | | -| approx_kl | 0.040611707 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.23 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | 0.0074 | -| n_updates | 88190 | -| policy_gradient_loss | 0.00193 | -| std | 0.0711 | -| value_loss | 3.86e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8821 | -| time_elapsed | 53131 | -| total_timesteps | 1129088 | -| train/ | | -| approx_kl | 0.0009976304 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.23 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.000918 | -| n_updates | 88200 | -| policy_gradient_loss | -0.000308 | -| std | 0.0711 | -| value_loss | 1.85e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8822 | -| time_elapsed | 53139 | -| total_timesteps | 1129216 | -| train/ | | -| approx_kl | 0.007586943 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 88210 | -| policy_gradient_loss | -0.0168 | -| std | 0.0711 | -| value_loss | 0.00019 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8823 | -| time_elapsed | 53144 | -| total_timesteps | 1129344 | -| train/ | | -| approx_kl | 5.7308935e-06 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -23.4 | -| learning_rate | 0.0003 | -| loss | -0.000276 | -| n_updates | 88220 | -| policy_gradient_loss | -0.000172 | -| std | 0.0713 | -| value_loss | 2.2e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8824 | -| time_elapsed | 53147 | -| total_timesteps | 1129472 | -| train/ | | -| approx_kl | 0.010360368 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -21.8 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 88230 | -| policy_gradient_loss | -0.00653 | -| std | 0.0715 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8825 | -| time_elapsed | 53150 | -| total_timesteps | 1129600 | -| train/ | | -| approx_kl | 0.0013189334 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 88240 | -| policy_gradient_loss | -0.00272 | -| std | 0.0715 | -| value_loss | 3.46e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8826 | -| time_elapsed | 53153 | -| total_timesteps | 1129728 | -| train/ | | -| approx_kl | 0.00022792723 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.958 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 88250 | -| policy_gradient_loss | -0.00334 | -| std | 0.0715 | -| value_loss | 1.53e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8827 | -| time_elapsed | 53156 | -| total_timesteps | 1129856 | -| train/ | | -| approx_kl | 0.006232579 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 88260 | -| policy_gradient_loss | -0.0096 | -| std | 0.0714 | -| value_loss | 3.95e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8828 | -| time_elapsed | 53159 | -| total_timesteps | 1129984 | -| train/ | | -| approx_kl | 0.002212138 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.0728 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 88270 | -| policy_gradient_loss | -0.000581 | -| std | 0.0714 | -| value_loss | 3.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8829 | -| time_elapsed | 53163 | -| total_timesteps | 1130112 | -| train/ | | -| approx_kl | 0.004807889 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | -0.00361 | -| n_updates | 88280 | -| policy_gradient_loss | -0.00283 | -| std | 0.0713 | -| value_loss | 1.98e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8830 | -| time_elapsed | 53172 | -| total_timesteps | 1130240 | -| train/ | | -| approx_kl | 0.0025561778 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 88290 | -| policy_gradient_loss | -0.0141 | -| std | 0.0713 | -| value_loss | 0.000126 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8831 | -| time_elapsed | 53175 | -| total_timesteps | 1130368 | -| train/ | | -| approx_kl | 0.011355188 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -192 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 88300 | -| policy_gradient_loss | -0.0038 | -| std | 0.0713 | -| value_loss | 2.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8832 | -| time_elapsed | 53179 | -| total_timesteps | 1130496 | -| train/ | | -| approx_kl | 0.011913359 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -508 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 88310 | -| policy_gradient_loss | -0.0112 | -| std | 0.0712 | -| value_loss | 1.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8833 | -| time_elapsed | 53183 | -| total_timesteps | 1130624 | -| train/ | | -| approx_kl | 0.031737722 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -52.8 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 88320 | -| policy_gradient_loss | -0.00262 | -| std | 0.0712 | -| value_loss | 1.29e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8834 | -| time_elapsed | 53186 | -| total_timesteps | 1130752 | -| train/ | | -| approx_kl | 0.022160238 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 1.22 | -| explained_variance | -5.4 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 88330 | -| policy_gradient_loss | -0.000778 | -| std | 0.0711 | -| value_loss | 3.17e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8835 | -| time_elapsed | 53189 | -| total_timesteps | 1130880 | -| train/ | | -| approx_kl | 0.0005739294 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 1.23 | -| explained_variance | -0.651 | -| learning_rate | 0.0003 | -| loss | -0.000585 | -| n_updates | 88340 | -| policy_gradient_loss | -0.000135 | -| std | 0.0708 | -| value_loss | 1.14e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8836 | -| time_elapsed | 53191 | -| total_timesteps | 1131008 | -| train/ | | -| approx_kl | 9.6620526e-05 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.23 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 88350 | -| policy_gradient_loss | -0.00272 | -| std | 0.0705 | -| value_loss | 1.75e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8837 | -| time_elapsed | 53201 | -| total_timesteps | 1131136 | -| train/ | | -| approx_kl | 0.008601484 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 1.23 | -| explained_variance | 0.588 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 88360 | -| policy_gradient_loss | -0.0153 | -| std | 0.0703 | -| value_loss | 0.00067 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8838 | -| time_elapsed | 53205 | -| total_timesteps | 1131264 | -| train/ | | -| approx_kl | 0.0015135803 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | -0.00289 | -| n_updates | 88370 | -| policy_gradient_loss | -0.00257 | -| std | 0.0703 | -| value_loss | 4.42e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8839 | -| time_elapsed | 53208 | -| total_timesteps | 1131392 | -| train/ | | -| approx_kl | 0.0385341 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -680 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 88380 | -| policy_gradient_loss | -0.00855 | -| std | 0.0703 | -| value_loss | 2.34e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8840 | -| time_elapsed | 53212 | -| total_timesteps | 1131520 | -| train/ | | -| approx_kl | 0.0017041238 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -119 | -| learning_rate | 0.0003 | -| loss | -0.00567 | -| n_updates | 88390 | -| policy_gradient_loss | -0.00947 | -| std | 0.0703 | -| value_loss | 7.12e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8841 | -| time_elapsed | 53215 | -| total_timesteps | 1131648 | -| train/ | | -| approx_kl | 0.0037749037 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -6.66 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 88400 | -| policy_gradient_loss | -0.00266 | -| std | 0.0703 | -| value_loss | 9.36e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8842 | -| time_elapsed | 53218 | -| total_timesteps | 1131776 | -| train/ | | -| approx_kl | 0.00016413676 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.837 | -| learning_rate | 0.0003 | -| loss | -0.000132 | -| n_updates | 88410 | -| policy_gradient_loss | 0.000637 | -| std | 0.0702 | -| value_loss | 3.52e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8843 | -| time_elapsed | 53222 | -| total_timesteps | 1131904 | -| train/ | | -| approx_kl | 0.0008251178 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0781 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 88420 | -| policy_gradient_loss | -0.00348 | -| std | 0.0701 | -| value_loss | 4.75e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8844 | -| time_elapsed | 53226 | -| total_timesteps | 1132032 | -| train/ | | -| approx_kl | 0.00068102824 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.000178 | -| n_updates | 88430 | -| policy_gradient_loss | 0.00142 | -| std | 0.0702 | -| value_loss | 1.15e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8845 | -| time_elapsed | 53234 | -| total_timesteps | 1132160 | -| train/ | | -| approx_kl | 0.0003466569 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | 0.000665 | -| n_updates | 88440 | -| policy_gradient_loss | -0.000437 | -| std | 0.0702 | -| value_loss | 0.00313 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8846 | -| time_elapsed | 53237 | -| total_timesteps | 1132288 | -| train/ | | -| approx_kl | 0.24853553 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -2.91e+03 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 88450 | -| policy_gradient_loss | -0.00246 | -| std | 0.0701 | -| value_loss | 6.67e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8847 | -| time_elapsed | 53241 | -| total_timesteps | 1132416 | -| train/ | | -| approx_kl | 0.09478494 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -17.3 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 88460 | -| policy_gradient_loss | -0.00674 | -| std | 0.0701 | -| value_loss | 6.69e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8848 | -| time_elapsed | 53243 | -| total_timesteps | 1132544 | -| train/ | | -| approx_kl | 0.0030745962 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -56.6 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 88470 | -| policy_gradient_loss | -0.00279 | -| std | 0.0702 | -| value_loss | 5.92e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8849 | -| time_elapsed | 53247 | -| total_timesteps | 1132672 | -| train/ | | -| approx_kl | 0.0032923426 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 88480 | -| policy_gradient_loss | -0.00391 | -| std | 0.0702 | -| value_loss | 1.02e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8850 | -| time_elapsed | 53250 | -| total_timesteps | 1132800 | -| train/ | | -| approx_kl | 0.0006058188 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.656 | -| learning_rate | 0.0003 | -| loss | -0.000781 | -| n_updates | 88490 | -| policy_gradient_loss | 0.00208 | -| std | 0.0702 | -| value_loss | 2.92e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8851 | -| time_elapsed | 53253 | -| total_timesteps | 1132928 | -| train/ | | -| approx_kl | 0.0013411869 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.00162 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 88500 | -| policy_gradient_loss | -0.0115 | -| std | 0.0702 | -| value_loss | 5.92e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8852 | -| time_elapsed | 53256 | -| total_timesteps | 1133056 | -| train/ | | -| approx_kl | 0.0012469268 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.00403 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 88510 | -| policy_gradient_loss | -0.00916 | -| std | 0.0702 | -| value_loss | 1.44e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8853 | -| time_elapsed | 53261 | -| total_timesteps | 1133184 | -| train/ | | -| approx_kl | 0.004886079 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 88520 | -| policy_gradient_loss | -0.0141 | -| std | 0.0701 | -| value_loss | 0.00025 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8854 | -| time_elapsed | 53264 | -| total_timesteps | 1133312 | -| train/ | | -| approx_kl | 0.0001590657 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 88530 | -| policy_gradient_loss | -0.00242 | -| std | 0.0701 | -| value_loss | 2.5e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8855 | -| time_elapsed | 53266 | -| total_timesteps | 1133440 | -| train/ | | -| approx_kl | 0.0022518756 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 88540 | -| policy_gradient_loss | 8.29e-05 | -| std | 0.0702 | -| value_loss | 6.26e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8856 | -| time_elapsed | 53269 | -| total_timesteps | 1133568 | -| train/ | | -| approx_kl | 0.00018214202 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.095 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 88550 | -| policy_gradient_loss | 0.00183 | -| std | 0.0702 | -| value_loss | 2.5e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8857 | -| time_elapsed | 53272 | -| total_timesteps | 1133696 | -| train/ | | -| approx_kl | 0.0041655446 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.000546 | -| learning_rate | 0.0003 | -| loss | 0.000166 | -| n_updates | 88560 | -| policy_gradient_loss | 0.000109 | -| std | 0.0702 | -| value_loss | 1.46e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8858 | -| time_elapsed | 53276 | -| total_timesteps | 1133824 | -| train/ | | -| approx_kl | 0.0008418462 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.000862 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 88570 | -| policy_gradient_loss | -0.00145 | -| std | 0.0702 | -| value_loss | 4.6e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8859 | -| time_elapsed | 53278 | -| total_timesteps | 1133952 | -| train/ | | -| approx_kl | 0.0064315954 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 88580 | -| policy_gradient_loss | -0.00488 | -| std | 0.0702 | -| value_loss | 1.8e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8860 | -| time_elapsed | 53281 | -| total_timesteps | 1134080 | -| train/ | | -| approx_kl | 9.4056595e-05 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.000167 | -| n_updates | 88590 | -| policy_gradient_loss | 0.000589 | -| std | 0.0702 | -| value_loss | 3.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8861 | -| time_elapsed | 53287 | -| total_timesteps | 1134208 | -| train/ | | -| approx_kl | 0.019513968 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 88600 | -| policy_gradient_loss | -0.0146 | -| std | 0.0702 | -| value_loss | 0.000483 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8862 | -| time_elapsed | 53291 | -| total_timesteps | 1134336 | -| train/ | | -| approx_kl | 0.0041761524 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 88610 | -| policy_gradient_loss | -0.0049 | -| std | 0.0702 | -| value_loss | 7.88e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8863 | -| time_elapsed | 53294 | -| total_timesteps | 1134464 | -| train/ | | -| approx_kl | 0.04022944 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -24.3 | -| learning_rate | 0.0003 | -| loss | -0.00989 | -| n_updates | 88620 | -| policy_gradient_loss | -0.00741 | -| std | 0.0702 | -| value_loss | 2.36e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8864 | -| time_elapsed | 53297 | -| total_timesteps | 1134592 | -| train/ | | -| approx_kl | 0.04030434 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -4.1 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 88630 | -| policy_gradient_loss | 0.00582 | -| std | 0.0701 | -| value_loss | 6.85e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8865 | -| time_elapsed | 53301 | -| total_timesteps | 1134720 | -| train/ | | -| approx_kl | 0.04425541 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -1.78 | -| learning_rate | 0.0003 | -| loss | 0.00784 | -| n_updates | 88640 | -| policy_gradient_loss | 0.00153 | -| std | 0.0701 | -| value_loss | 1.21e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8866 | -| time_elapsed | 53305 | -| total_timesteps | 1134848 | -| train/ | | -| approx_kl | 0.00067455694 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.000889 | -| n_updates | 88650 | -| policy_gradient_loss | 0.00076 | -| std | 0.0702 | -| value_loss | 1.12e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 8867 | -| time_elapsed | 53308 | -| total_timesteps | 1134976 | -| train/ | | -| approx_kl | 0.00013463758 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0663 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 88660 | -| policy_gradient_loss | -0.00361 | -| std | 0.0702 | -| value_loss | 4.42e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8868 | -| time_elapsed | 53312 | -| total_timesteps | 1135104 | -| train/ | | -| approx_kl | 0.0016860855 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 88670 | -| policy_gradient_loss | 0.00475 | -| std | 0.0703 | -| value_loss | 6.43e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8869 | -| time_elapsed | 53319 | -| total_timesteps | 1135232 | -| train/ | | -| approx_kl | 0.018437456 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.281 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 88680 | -| policy_gradient_loss | -0.0138 | -| std | 0.0703 | -| value_loss | 0.00117 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8870 | -| time_elapsed | 53323 | -| total_timesteps | 1135360 | -| train/ | | -| approx_kl | 0.0017029634 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -79.2 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 88690 | -| policy_gradient_loss | -0.000654 | -| std | 0.0702 | -| value_loss | 4.9e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8871 | -| time_elapsed | 53326 | -| total_timesteps | 1135488 | -| train/ | | -| approx_kl | 0.0006401115 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -73.7 | -| learning_rate | 0.0003 | -| loss | -0.00047 | -| n_updates | 88700 | -| policy_gradient_loss | -0.000174 | -| std | 0.07 | -| value_loss | 2.32e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8872 | -| time_elapsed | 53330 | -| total_timesteps | 1135616 | -| train/ | | -| approx_kl | 0.0017845929 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -5.76 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 88710 | -| policy_gradient_loss | -0.000334 | -| std | 0.0698 | -| value_loss | 3.47e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8873 | -| time_elapsed | 53333 | -| total_timesteps | 1135744 | -| train/ | | -| approx_kl | 0.0018053297 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 88720 | -| policy_gradient_loss | -0.00327 | -| std | 0.0697 | -| value_loss | 1.68e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8874 | -| time_elapsed | 53337 | -| total_timesteps | 1135872 | -| train/ | | -| approx_kl | 0.014322579 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 88730 | -| policy_gradient_loss | -0.00342 | -| std | 0.0697 | -| value_loss | 2.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8875 | -| time_elapsed | 53340 | -| total_timesteps | 1136000 | -| train/ | | -| approx_kl | 0.016967393 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -9.63e-06 | -| n_updates | 88740 | -| policy_gradient_loss | 0.0192 | -| std | 0.0697 | -| value_loss | 6.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8876 | -| time_elapsed | 53344 | -| total_timesteps | 1136128 | -| train/ | | -| approx_kl | 0.024718994 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.00194 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 88750 | -| policy_gradient_loss | 0.000974 | -| std | 0.0697 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8877 | -| time_elapsed | 53351 | -| total_timesteps | 1136256 | -| train/ | | -| approx_kl | 0.022480302 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 1.24 | -| explained_variance | 0.857 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 88760 | -| policy_gradient_loss | -0.00979 | -| std | 0.0697 | -| value_loss | 0.00187 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8878 | -| time_elapsed | 53355 | -| total_timesteps | 1136384 | -| train/ | | -| approx_kl | 0.036830734 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.00633 | -| n_updates | 88770 | -| policy_gradient_loss | -0.0052 | -| std | 0.0696 | -| value_loss | 8.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8879 | -| time_elapsed | 53359 | -| total_timesteps | 1136512 | -| train/ | | -| approx_kl | 0.049291693 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -3.22 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 88780 | -| policy_gradient_loss | -0.000497 | -| std | 0.0696 | -| value_loss | 3.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8880 | -| time_elapsed | 53362 | -| total_timesteps | 1136640 | -| train/ | | -| approx_kl | 0.0025917287 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.802 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 88790 | -| policy_gradient_loss | 0.000589 | -| std | 0.0697 | -| value_loss | 1.69e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8881 | -| time_elapsed | 53365 | -| total_timesteps | 1136768 | -| train/ | | -| approx_kl | 0.000965897 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 88800 | -| policy_gradient_loss | -0.0124 | -| std | 0.0696 | -| value_loss | 8.17e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8882 | -| time_elapsed | 53368 | -| total_timesteps | 1136896 | -| train/ | | -| approx_kl | 5.569309e-07 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.000159 | -| n_updates | 88810 | -| policy_gradient_loss | -0.00629 | -| std | 0.0696 | -| value_loss | 4.25e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8883 | -| time_elapsed | 53371 | -| total_timesteps | 1137024 | -| train/ | | -| approx_kl | 0.00011232309 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.000122 | -| n_updates | 88820 | -| policy_gradient_loss | 0.00101 | -| std | 0.0696 | -| value_loss | 1.02e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8884 | -| time_elapsed | 53380 | -| total_timesteps | 1137152 | -| train/ | | -| approx_kl | 0.013646507 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 88830 | -| policy_gradient_loss | -0.0118 | -| std | 0.0696 | -| value_loss | 0.000325 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8885 | -| time_elapsed | 53385 | -| total_timesteps | 1137280 | -| train/ | | -| approx_kl | 0.00027888594 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | 0.0329 | -| learning_rate | 0.0003 | -| loss | 7.5e-05 | -| n_updates | 88840 | -| policy_gradient_loss | 0.00127 | -| std | 0.0695 | -| value_loss | 5.16e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8886 | -| time_elapsed | 53387 | -| total_timesteps | 1137408 | -| train/ | | -| approx_kl | 0.07821116 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -4.02e+03 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 88850 | -| policy_gradient_loss | -0.00905 | -| std | 0.0694 | -| value_loss | 6.58e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8887 | -| time_elapsed | 53390 | -| total_timesteps | 1137536 | -| train/ | | -| approx_kl | 0.028086256 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 88860 | -| policy_gradient_loss | -0.011 | -| std | 0.0694 | -| value_loss | 2.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8888 | -| time_elapsed | 53394 | -| total_timesteps | 1137664 | -| train/ | | -| approx_kl | 0.021748772 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -16.4 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 88870 | -| policy_gradient_loss | -0.00716 | -| std | 0.0694 | -| value_loss | 4.24e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8889 | -| time_elapsed | 53397 | -| total_timesteps | 1137792 | -| train/ | | -| approx_kl | 2.8917566e-07 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.54 | -| learning_rate | 0.0003 | -| loss | -6.76e-05 | -| n_updates | 88880 | -| policy_gradient_loss | 0.00542 | -| std | 0.0693 | -| value_loss | 1.64e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8890 | -| time_elapsed | 53400 | -| total_timesteps | 1137920 | -| train/ | | -| approx_kl | 0.005340373 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 88890 | -| policy_gradient_loss | -0.00282 | -| std | 0.0693 | -| value_loss | 8.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8891 | -| time_elapsed | 53403 | -| total_timesteps | 1138048 | -| train/ | | -| approx_kl | 0.006586433 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.0725 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 88900 | -| policy_gradient_loss | -0.0142 | -| std | 0.0693 | -| value_loss | 8.37e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8892 | -| time_elapsed | 53409 | -| total_timesteps | 1138176 | -| train/ | | -| approx_kl | 0.011825403 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 88910 | -| policy_gradient_loss | -0.0148 | -| std | 0.0693 | -| value_loss | 0.00229 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8893 | -| time_elapsed | 53412 | -| total_timesteps | 1138304 | -| train/ | | -| approx_kl | 0.0015463992 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -170 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 88920 | -| policy_gradient_loss | -0.0122 | -| std | 0.0693 | -| value_loss | 6.18e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8894 | -| time_elapsed | 53415 | -| total_timesteps | 1138432 | -| train/ | | -| approx_kl | 0.007738041 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -293 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 88930 | -| policy_gradient_loss | -0.000364 | -| std | 0.0695 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8895 | -| time_elapsed | 53418 | -| total_timesteps | 1138560 | -| train/ | | -| approx_kl | 0.049130555 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -24.9 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 88940 | -| policy_gradient_loss | -0.0117 | -| std | 0.0696 | -| value_loss | 3.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8896 | -| time_elapsed | 53421 | -| total_timesteps | 1138688 | -| train/ | | -| approx_kl | 0.05395411 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 88950 | -| policy_gradient_loss | -0.00222 | -| std | 0.0697 | -| value_loss | 3.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8897 | -| time_elapsed | 53423 | -| total_timesteps | 1138816 | -| train/ | | -| approx_kl | 0.0031697033 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.000658 | -| n_updates | 88960 | -| policy_gradient_loss | -0.000327 | -| std | 0.0694 | -| value_loss | 4.97e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 8898 | -| time_elapsed | 53426 | -| total_timesteps | 1138944 | -| train/ | | -| approx_kl | 0.00019401498 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 88970 | -| policy_gradient_loss | -0.0065 | -| std | 0.0692 | -| value_loss | 1.69e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8899 | -| time_elapsed | 53429 | -| total_timesteps | 1139072 | -| train/ | | -| approx_kl | 0.00596523 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 1.25 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 88980 | -| policy_gradient_loss | -0.00215 | -| std | 0.069 | -| value_loss | 1.84e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8900 | -| time_elapsed | 53435 | -| total_timesteps | 1139200 | -| train/ | | -| approx_kl | 0.03701445 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | 0.917 | -| learning_rate | 0.0003 | -| loss | -0.00641 | -| n_updates | 88990 | -| policy_gradient_loss | -0.00486 | -| std | 0.0687 | -| value_loss | 0.00104 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8901 | -| time_elapsed | 53438 | -| total_timesteps | 1139328 | -| train/ | | -| approx_kl | 0.15308417 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -1.16e+03 | -| learning_rate | 0.0003 | -| loss | -0.00489 | -| n_updates | 89000 | -| policy_gradient_loss | -0.00496 | -| std | 0.0686 | -| value_loss | 1.2e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8902 | -| time_elapsed | 53442 | -| total_timesteps | 1139456 | -| train/ | | -| approx_kl | 0.10947335 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -1.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 89010 | -| policy_gradient_loss | -0.00423 | -| std | 0.0686 | -| value_loss | 6.81e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8903 | -| time_elapsed | 53445 | -| total_timesteps | 1139584 | -| train/ | | -| approx_kl | 0.006339587 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -421 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 89020 | -| policy_gradient_loss | -0.0106 | -| std | 0.0686 | -| value_loss | 8.46e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8904 | -| time_elapsed | 53448 | -| total_timesteps | 1139712 | -| train/ | | -| approx_kl | 0.23466921 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -32.9 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 89030 | -| policy_gradient_loss | -0.00381 | -| std | 0.0686 | -| value_loss | 3.42e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8905 | -| time_elapsed | 53451 | -| total_timesteps | 1139840 | -| train/ | | -| approx_kl | 0.029855719 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -99.7 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 89040 | -| policy_gradient_loss | -0.00266 | -| std | 0.0686 | -| value_loss | 9.66e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 8906 | -| time_elapsed | 53454 | -| total_timesteps | 1139968 | -| train/ | | -| approx_kl | 0.0005130125 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.000176 | -| n_updates | 89050 | -| policy_gradient_loss | 0.00101 | -| std | 0.0686 | -| value_loss | 2.89e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8907 | -| time_elapsed | 53459 | -| total_timesteps | 1140096 | -| train/ | | -| approx_kl | 0.00022902805 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -70.7 | -| learning_rate | 0.0003 | -| loss | -0.000278 | -| n_updates | 89060 | -| policy_gradient_loss | 0.000762 | -| std | 0.0686 | -| value_loss | 5.24e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8908 | -| time_elapsed | 53466 | -| total_timesteps | 1140224 | -| train/ | | -| approx_kl | 0.026456065 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0319 | -| n_updates | 89070 | -| policy_gradient_loss | -0.0214 | -| std | 0.0686 | -| value_loss | 1.6e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8909 | -| time_elapsed | 53468 | -| total_timesteps | 1140352 | -| train/ | | -| approx_kl | 0.0015911786 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 89080 | -| policy_gradient_loss | -0.000737 | -| std | 0.0687 | -| value_loss | 1.22e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8910 | -| time_elapsed | 53471 | -| total_timesteps | 1140480 | -| train/ | | -| approx_kl | 0.002951798 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.00631 | -| n_updates | 89090 | -| policy_gradient_loss | -0.00245 | -| std | 0.0687 | -| value_loss | 5.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8911 | -| time_elapsed | 53475 | -| total_timesteps | 1140608 | -| train/ | | -| approx_kl | 0.023253243 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 89100 | -| policy_gradient_loss | -0.0106 | -| std | 0.0686 | -| value_loss | 5.24e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8912 | -| time_elapsed | 53478 | -| total_timesteps | 1140736 | -| train/ | | -| approx_kl | 0.008713314 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.0697 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 89110 | -| policy_gradient_loss | -0.000304 | -| std | 0.0686 | -| value_loss | 1.18e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8913 | -| time_elapsed | 53482 | -| total_timesteps | 1140864 | -| train/ | | -| approx_kl | 0.0036907494 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 89120 | -| policy_gradient_loss | -0.00296 | -| std | 0.0686 | -| value_loss | 5.19e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 8914 | -| time_elapsed | 53486 | -| total_timesteps | 1140992 | -| train/ | | -| approx_kl | 0.0016945298 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.00231 | -| n_updates | 89130 | -| policy_gradient_loss | 0.00314 | -| std | 0.0687 | -| value_loss | 9.98e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8915 | -| time_elapsed | 53489 | -| total_timesteps | 1141120 | -| train/ | | -| approx_kl | 3.518164e-05 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.000401 | -| n_updates | 89140 | -| policy_gradient_loss | 0.00573 | -| std | 0.0687 | -| value_loss | 1.81e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8916 | -| time_elapsed | 53498 | -| total_timesteps | 1141248 | -| train/ | | -| approx_kl | 0.029171454 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 89150 | -| policy_gradient_loss | -0.0119 | -| std | 0.0687 | -| value_loss | 0.000148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8917 | -| time_elapsed | 53501 | -| total_timesteps | 1141376 | -| train/ | | -| approx_kl | 0.053151775 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -735 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 89160 | -| policy_gradient_loss | -0.0103 | -| std | 0.0687 | -| value_loss | 1.73e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8918 | -| time_elapsed | 53505 | -| total_timesteps | 1141504 | -| train/ | | -| approx_kl | 0.0041716946 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -5.73e+03 | -| learning_rate | 0.0003 | -| loss | -0.000425 | -| n_updates | 89170 | -| policy_gradient_loss | 7.51e-05 | -| std | 0.0686 | -| value_loss | 6.7e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8919 | -| time_elapsed | 53508 | -| total_timesteps | 1141632 | -| train/ | | -| approx_kl | 0.042778045 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -2.4e+03 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 89180 | -| policy_gradient_loss | -0.00547 | -| std | 0.0686 | -| value_loss | 2.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8920 | -| time_elapsed | 53511 | -| total_timesteps | 1141760 | -| train/ | | -| approx_kl | 0.040601075 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -6.43 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 89190 | -| policy_gradient_loss | -0.00236 | -| std | 0.0686 | -| value_loss | 5.99e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 8921 | -| time_elapsed | 53515 | -| total_timesteps | 1141888 | -| train/ | | -| approx_kl | 4.583504e-06 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 1.26 | -| explained_variance | -0.00339 | -| learning_rate | 0.0003 | -| loss | -0.000354 | -| n_updates | 89200 | -| policy_gradient_loss | -8.16e-05 | -| std | 0.0684 | -| value_loss | 7.28e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8922 | -| time_elapsed | 53518 | -| total_timesteps | 1142016 | -| train/ | | -| approx_kl | 0.0054534003 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | 0.00143 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 89210 | -| policy_gradient_loss | -0.000509 | -| std | 0.0681 | -| value_loss | 2.48e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8923 | -| time_elapsed | 53527 | -| total_timesteps | 1142144 | -| train/ | | -| approx_kl | 0.01224823 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 89220 | -| policy_gradient_loss | -0.0141 | -| std | 0.068 | -| value_loss | 0.000867 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8924 | -| time_elapsed | 53532 | -| total_timesteps | 1142272 | -| train/ | | -| approx_kl | 0.0007285238 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.000456 | -| n_updates | 89230 | -| policy_gradient_loss | -0.00015 | -| std | 0.0679 | -| value_loss | 1.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8925 | -| time_elapsed | 53535 | -| total_timesteps | 1142400 | -| train/ | | -| approx_kl | 0.0074064624 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | -3.25e+03 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 89240 | -| policy_gradient_loss | -0.0144 | -| std | 0.0678 | -| value_loss | 1.29e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8926 | -| time_elapsed | 53538 | -| total_timesteps | 1142528 | -| train/ | | -| approx_kl | 0.0021519712 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | -5.67 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 89250 | -| policy_gradient_loss | -0.0039 | -| std | 0.0678 | -| value_loss | 5.84e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8927 | -| time_elapsed | 53542 | -| total_timesteps | 1142656 | -| train/ | | -| approx_kl | 0.002253375 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | -0.385 | -| learning_rate | 0.0003 | -| loss | -0.00476 | -| n_updates | 89260 | -| policy_gradient_loss | -0.00199 | -| std | 0.0677 | -| value_loss | 2.35e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8928 | -| time_elapsed | 53546 | -| total_timesteps | 1142784 | -| train/ | | -| approx_kl | 0.00037651835 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 89270 | -| policy_gradient_loss | -0.000827 | -| std | 0.0677 | -| value_loss | 9.16e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 8929 | -| time_elapsed | 53549 | -| total_timesteps | 1142912 | -| train/ | | -| approx_kl | 0.0013509518 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | 1.27 | -| explained_variance | -0.248 | -| learning_rate | 0.0003 | -| loss | -0.000802 | -| n_updates | 89280 | -| policy_gradient_loss | -0.000566 | -| std | 0.0676 | -| value_loss | 8.4e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8930 | -| time_elapsed | 53552 | -| total_timesteps | 1143040 | -| train/ | | -| approx_kl | 0.0089545725 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.0035 | -| learning_rate | 0.0003 | -| loss | -0.000516 | -| n_updates | 89290 | -| policy_gradient_loss | -0.00213 | -| std | 0.0674 | -| value_loss | 7.26e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8931 | -| time_elapsed | 53559 | -| total_timesteps | 1143168 | -| train/ | | -| approx_kl | 0.03955631 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 89300 | -| policy_gradient_loss | -0.0141 | -| std | 0.0672 | -| value_loss | 0.000349 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8932 | -| time_elapsed | 53564 | -| total_timesteps | 1143296 | -| train/ | | -| approx_kl | 0.20018536 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -66.8 | -| learning_rate | 0.0003 | -| loss | 0.00426 | -| n_updates | 89310 | -| policy_gradient_loss | -0.00142 | -| std | 0.0672 | -| value_loss | 8.41e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8933 | -| time_elapsed | 53567 | -| total_timesteps | 1143424 | -| train/ | | -| approx_kl | 0.03432438 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -17.6 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 89320 | -| policy_gradient_loss | -0.00715 | -| std | 0.0672 | -| value_loss | 3.55e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8934 | -| time_elapsed | 53570 | -| total_timesteps | 1143552 | -| train/ | | -| approx_kl | 0.04869328 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -3.49 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 89330 | -| policy_gradient_loss | -0.00568 | -| std | 0.0672 | -| value_loss | 6.58e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8935 | -| time_elapsed | 53574 | -| total_timesteps | 1143680 | -| train/ | | -| approx_kl | 0.009271404 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.478 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 89340 | -| policy_gradient_loss | -0.0114 | -| std | 0.0673 | -| value_loss | 1.05e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8936 | -| time_elapsed | 53577 | -| total_timesteps | 1143808 | -| train/ | | -| approx_kl | 0.0017711078 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 89350 | -| policy_gradient_loss | -0.000154 | -| std | 0.0674 | -| value_loss | 4.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 21 | -| iterations | 8937 | -| time_elapsed | 53580 | -| total_timesteps | 1143936 | -| train/ | | -| approx_kl | 0.034166194 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.000316 | -| n_updates | 89360 | -| policy_gradient_loss | -0.000459 | -| std | 0.0674 | -| value_loss | 3.89e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8938 | -| time_elapsed | 53584 | -| total_timesteps | 1144064 | -| train/ | | -| approx_kl | 0.00012645358 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 89370 | -| policy_gradient_loss | -0.000533 | -| std | 0.0674 | -| value_loss | 8.38e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8939 | -| time_elapsed | 53590 | -| total_timesteps | 1144192 | -| train/ | | -| approx_kl | 0.0039337142 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | 0.864 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 89380 | -| policy_gradient_loss | -0.0122 | -| std | 0.0674 | -| value_loss | 0.00245 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8940 | -| time_elapsed | 53594 | -| total_timesteps | 1144320 | -| train/ | | -| approx_kl | 0.0019291374 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | 0.0633 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 89390 | -| policy_gradient_loss | -0.00749 | -| std | 0.0674 | -| value_loss | 3.61e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8941 | -| time_elapsed | 53598 | -| total_timesteps | 1144448 | -| train/ | | -| approx_kl | 0.0018136334 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.719 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 89400 | -| policy_gradient_loss | -0.00295 | -| std | 0.0674 | -| value_loss | 1.94e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8942 | -| time_elapsed | 53601 | -| total_timesteps | 1144576 | -| train/ | | -| approx_kl | 0.0012636199 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.075 | -| learning_rate | 0.0003 | -| loss | -0.000674 | -| n_updates | 89410 | -| policy_gradient_loss | 0.000384 | -| std | 0.0672 | -| value_loss | 9.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8943 | -| time_elapsed | 53604 | -| total_timesteps | 1144704 | -| train/ | | -| approx_kl | 0.0015914394 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | 0.00344 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 89420 | -| policy_gradient_loss | 0.00182 | -| std | 0.0671 | -| value_loss | 4.37e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8944 | -| time_elapsed | 53606 | -| total_timesteps | 1144832 | -| train/ | | -| approx_kl | 0.0012398842 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 89430 | -| policy_gradient_loss | 7.25e-05 | -| std | 0.067 | -| value_loss | 1.49e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 8945 | -| time_elapsed | 53609 | -| total_timesteps | 1144960 | -| train/ | | -| approx_kl | 0.0012038853 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.28 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 89440 | -| policy_gradient_loss | -0.00239 | -| std | 0.067 | -| value_loss | 7.3e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8946 | -| time_elapsed | 53613 | -| total_timesteps | 1145088 | -| train/ | | -| approx_kl | 2.9718503e-06 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.000193 | -| n_updates | 89450 | -| policy_gradient_loss | -0.00344 | -| std | 0.0669 | -| value_loss | 5.8e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8947 | -| time_elapsed | 53622 | -| total_timesteps | 1145216 | -| train/ | | -| approx_kl | 0.03791523 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 89460 | -| policy_gradient_loss | -0.014 | -| std | 0.0669 | -| value_loss | 0.00198 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8948 | -| time_elapsed | 53626 | -| total_timesteps | 1145344 | -| train/ | | -| approx_kl | 0.06285669 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -20.6 | -| learning_rate | 0.0003 | -| loss | 0.00523 | -| n_updates | 89470 | -| policy_gradient_loss | 0.00106 | -| std | 0.0669 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8949 | -| time_elapsed | 53630 | -| total_timesteps | 1145472 | -| train/ | | -| approx_kl | 0.0012232582 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -129 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 89480 | -| policy_gradient_loss | -0.000679 | -| std | 0.0668 | -| value_loss | 4.95e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8950 | -| time_elapsed | 53634 | -| total_timesteps | 1145600 | -| train/ | | -| approx_kl | 0.0003988142 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | 0.000424 | -| n_updates | 89490 | -| policy_gradient_loss | -0.00012 | -| std | 0.0667 | -| value_loss | 7.3e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8951 | -| time_elapsed | 53637 | -| total_timesteps | 1145728 | -| train/ | | -| approx_kl | 0.0054696603 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.879 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 89500 | -| policy_gradient_loss | -0.00156 | -| std | 0.0667 | -| value_loss | 5.55e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8952 | -| time_elapsed | 53641 | -| total_timesteps | 1145856 | -| train/ | | -| approx_kl | 0.00092126103 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 89510 | -| policy_gradient_loss | 0.00261 | -| std | 0.0667 | -| value_loss | 4.49e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 8953 | -| time_elapsed | 53646 | -| total_timesteps | 1145984 | -| train/ | | -| approx_kl | 0.0041116523 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.00927 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 89520 | -| policy_gradient_loss | -0.0023 | -| std | 0.0668 | -| value_loss | 1.63e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8954 | -| time_elapsed | 53649 | -| total_timesteps | 1146112 | -| train/ | | -| approx_kl | 0.008562606 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.00848 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 89530 | -| policy_gradient_loss | -0.00143 | -| std | 0.0668 | -| value_loss | 4.41e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8955 | -| time_elapsed | 53658 | -| total_timesteps | 1146240 | -| train/ | | -| approx_kl | 0.012477264 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 89540 | -| policy_gradient_loss | -0.0141 | -| std | 0.0668 | -| value_loss | 7.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8956 | -| time_elapsed | 53661 | -| total_timesteps | 1146368 | -| train/ | | -| approx_kl | 0.008300103 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -9.21 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 89550 | -| policy_gradient_loss | -0.00522 | -| std | 0.0668 | -| value_loss | 9.06e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8957 | -| time_elapsed | 53664 | -| total_timesteps | 1146496 | -| train/ | | -| approx_kl | 0.046698872 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -47.2 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 89560 | -| policy_gradient_loss | -0.0013 | -| std | 0.0668 | -| value_loss | 6.39e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8958 | -| time_elapsed | 53668 | -| total_timesteps | 1146624 | -| train/ | | -| approx_kl | 0.0008305744 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -7.12 | -| learning_rate | 0.0003 | -| loss | -0.000779 | -| n_updates | 89570 | -| policy_gradient_loss | 0.000624 | -| std | 0.0667 | -| value_loss | 1.08e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8959 | -| time_elapsed | 53671 | -| total_timesteps | 1146752 | -| train/ | | -| approx_kl | 1.0004267e-05 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.592 | -| learning_rate | 0.0003 | -| loss | 0.00058 | -| n_updates | 89580 | -| policy_gradient_loss | -0.00322 | -| std | 0.0666 | -| value_loss | 3.05e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8960 | -| time_elapsed | 53675 | -| total_timesteps | 1146880 | -| train/ | | -| approx_kl | 0.055447157 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 89590 | -| policy_gradient_loss | -0.0116 | -| std | 0.0666 | -| value_loss | 3.33e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8961 | -| time_elapsed | 53678 | -| total_timesteps | 1147008 | -| train/ | | -| approx_kl | 0.013800383 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.00801 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 89600 | -| policy_gradient_loss | -0.00248 | -| std | 0.0666 | -| value_loss | 2.37e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8962 | -| time_elapsed | 53688 | -| total_timesteps | 1147136 | -| train/ | | -| approx_kl | 0.010451105 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 89610 | -| policy_gradient_loss | -0.015 | -| std | 0.0666 | -| value_loss | 0.000101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8963 | -| time_elapsed | 53693 | -| total_timesteps | 1147264 | -| train/ | | -| approx_kl | 0.008844887 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.0988 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 89620 | -| policy_gradient_loss | -0.00338 | -| std | 0.0665 | -| value_loss | 4.36e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8964 | -| time_elapsed | 53696 | -| total_timesteps | 1147392 | -| train/ | | -| approx_kl | 0.0037049307 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 89630 | -| policy_gradient_loss | -0.0031 | -| std | 0.0665 | -| value_loss | 1.99e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8965 | -| time_elapsed | 53700 | -| total_timesteps | 1147520 | -| train/ | | -| approx_kl | 0.034737717 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.681 | -| learning_rate | 0.0003 | -| loss | 0.000433 | -| n_updates | 89640 | -| policy_gradient_loss | -0.000264 | -| std | 0.0665 | -| value_loss | 3.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8966 | -| time_elapsed | 53703 | -| total_timesteps | 1147648 | -| train/ | | -| approx_kl | 0.010428427 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | -0.00997 | -| n_updates | 89650 | -| policy_gradient_loss | -0.00353 | -| std | 0.0665 | -| value_loss | 8.14e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8967 | -| time_elapsed | 53707 | -| total_timesteps | 1147776 | -| train/ | | -| approx_kl | 0.0019643055 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.00544 | -| n_updates | 89660 | -| policy_gradient_loss | 0.004 | -| std | 0.0665 | -| value_loss | 3.61e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8968 | -| time_elapsed | 53711 | -| total_timesteps | 1147904 | -| train/ | | -| approx_kl | 0.0015893425 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.00519 | -| n_updates | 89670 | -| policy_gradient_loss | -0.00065 | -| std | 0.0665 | -| value_loss | 2.4e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8969 | -| time_elapsed | 53715 | -| total_timesteps | 1148032 | -| train/ | | -| approx_kl | 0.0040531345 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | -0.00903 | -| n_updates | 89680 | -| policy_gradient_loss | -0.00658 | -| std | 0.0664 | -| value_loss | 1.79e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8970 | -| time_elapsed | 53723 | -| total_timesteps | 1148160 | -| train/ | | -| approx_kl | 0.014180345 | -| clip_fraction | 0.025 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -0.253 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 89690 | -| policy_gradient_loss | -0.0145 | -| std | 0.0664 | -| value_loss | 0.00181 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8971 | -| time_elapsed | 53727 | -| total_timesteps | 1148288 | -| train/ | | -| approx_kl | 0.0034234868 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 1.29 | -| explained_variance | -1.54e+04 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 89700 | -| policy_gradient_loss | -0.00178 | -| std | 0.0663 | -| value_loss | 4.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8972 | -| time_elapsed | 53730 | -| total_timesteps | 1148416 | -| train/ | | -| approx_kl | 0.056316067 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -2.67e+03 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 89710 | -| policy_gradient_loss | -0.00638 | -| std | 0.0662 | -| value_loss | 2.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8973 | -| time_elapsed | 53733 | -| total_timesteps | 1148544 | -| train/ | | -| approx_kl | 0.054329067 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -240 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 89720 | -| policy_gradient_loss | -0.00366 | -| std | 0.0661 | -| value_loss | 2.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8974 | -| time_elapsed | 53736 | -| total_timesteps | 1148672 | -| train/ | | -| approx_kl | 0.022967998 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -29 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 89730 | -| policy_gradient_loss | -0.00591 | -| std | 0.0661 | -| value_loss | 3.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8975 | -| time_elapsed | 53739 | -| total_timesteps | 1148800 | -| train/ | | -| approx_kl | 0.016520733 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -4.71 | -| learning_rate | 0.0003 | -| loss | 0.000256 | -| n_updates | 89740 | -| policy_gradient_loss | 0.000709 | -| std | 0.0661 | -| value_loss | 1.01e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 8976 | -| time_elapsed | 53742 | -| total_timesteps | 1148928 | -| train/ | | -| approx_kl | 0.0053949296 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.612 | -| learning_rate | 0.0003 | -| loss | 0.000171 | -| n_updates | 89750 | -| policy_gradient_loss | 0.000596 | -| std | 0.066 | -| value_loss | 1.03e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8977 | -| time_elapsed | 53745 | -| total_timesteps | 1149056 | -| train/ | | -| approx_kl | 0.00054439437 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 89760 | -| policy_gradient_loss | -0.001 | -| std | 0.066 | -| value_loss | 2.11e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8978 | -| time_elapsed | 53749 | -| total_timesteps | 1149184 | -| train/ | | -| approx_kl | 0.061592728 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 89770 | -| policy_gradient_loss | -0.0161 | -| std | 0.066 | -| value_loss | 5.87e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8979 | -| time_elapsed | 53751 | -| total_timesteps | 1149312 | -| train/ | | -| approx_kl | 0.00012476789 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -24 | -| learning_rate | 0.0003 | -| loss | -3.31e-05 | -| n_updates | 89780 | -| policy_gradient_loss | -8.13e-06 | -| std | 0.0659 | -| value_loss | 9.73e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8980 | -| time_elapsed | 53755 | -| total_timesteps | 1149440 | -| train/ | | -| approx_kl | 0.024571698 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -32.2 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 89790 | -| policy_gradient_loss | -0.0145 | -| std | 0.0658 | -| value_loss | 2.13e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8981 | -| time_elapsed | 53758 | -| total_timesteps | 1149568 | -| train/ | | -| approx_kl | 0.06928581 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -4.22 | -| learning_rate | 0.0003 | -| loss | -8.37e-05 | -| n_updates | 89800 | -| policy_gradient_loss | -0.00209 | -| std | 0.0658 | -| value_loss | 1.01e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8982 | -| time_elapsed | 53762 | -| total_timesteps | 1149696 | -| train/ | | -| approx_kl | 0.0012614792 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 89810 | -| policy_gradient_loss | 0.00267 | -| std | 0.0658 | -| value_loss | 3.31e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8983 | -| time_elapsed | 53765 | -| total_timesteps | 1149824 | -| train/ | | -| approx_kl | 0.0007048906 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.00711 | -| learning_rate | 0.0003 | -| loss | -0.000357 | -| n_updates | 89820 | -| policy_gradient_loss | 0.00212 | -| std | 0.066 | -| value_loss | 5.34e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 8984 | -| time_elapsed | 53769 | -| total_timesteps | 1149952 | -| train/ | | -| approx_kl | 0.0018558418 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 89830 | -| policy_gradient_loss | -0.00847 | -| std | 0.0662 | -| value_loss | 9.02e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8985 | -| time_elapsed | 53772 | -| total_timesteps | 1150080 | -| train/ | | -| approx_kl | 0.0043642223 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 89840 | -| policy_gradient_loss | -0.00773 | -| std | 0.0663 | -| value_loss | 6.72e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8986 | -| time_elapsed | 53777 | -| total_timesteps | 1150208 | -| train/ | | -| approx_kl | 0.060233165 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | 0.855 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 89850 | -| policy_gradient_loss | -0.0175 | -| std | 0.0662 | -| value_loss | 0.000329 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8987 | -| time_elapsed | 53780 | -| total_timesteps | 1150336 | -| train/ | | -| approx_kl | 0.022915093 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -251 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 89860 | -| policy_gradient_loss | -0.0014 | -| std | 0.0662 | -| value_loss | 6.33e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8988 | -| time_elapsed | 53783 | -| total_timesteps | 1150464 | -| train/ | | -| approx_kl | 0.0039311284 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -290 | -| learning_rate | 0.0003 | -| loss | -0.000493 | -| n_updates | 89870 | -| policy_gradient_loss | -5.49e-05 | -| std | 0.0661 | -| value_loss | 2.2e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8989 | -| time_elapsed | 53785 | -| total_timesteps | 1150592 | -| train/ | | -| approx_kl | 0.04293702 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -37.3 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 89880 | -| policy_gradient_loss | -0.00497 | -| std | 0.0659 | -| value_loss | 2.49e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8990 | -| time_elapsed | 53789 | -| total_timesteps | 1150720 | -| train/ | | -| approx_kl | 0.00029380666 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -9.45 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 89890 | -| policy_gradient_loss | -0.00108 | -| std | 0.0659 | -| value_loss | 6.32e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8991 | -| time_elapsed | 53792 | -| total_timesteps | 1150848 | -| train/ | | -| approx_kl | 0.012168005 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 89900 | -| policy_gradient_loss | -0.0033 | -| std | 0.0658 | -| value_loss | 9.52e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 21 | -| iterations | 8992 | -| time_elapsed | 53795 | -| total_timesteps | 1150976 | -| train/ | | -| approx_kl | 0.0005687983 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | 0.00697 | -| learning_rate | 0.0003 | -| loss | -0.000866 | -| n_updates | 89910 | -| policy_gradient_loss | 0.000203 | -| std | 0.0657 | -| value_loss | 3.22e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8993 | -| time_elapsed | 53797 | -| total_timesteps | 1151104 | -| train/ | | -| approx_kl | 0.0040610153 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | 0.00563 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 89920 | -| policy_gradient_loss | -0.00611 | -| std | 0.0657 | -| value_loss | 2.19e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8994 | -| time_elapsed | 53804 | -| total_timesteps | 1151232 | -| train/ | | -| approx_kl | 0.0093434965 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 89930 | -| policy_gradient_loss | -0.0172 | -| std | 0.0657 | -| value_loss | 3.69e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8995 | -| time_elapsed | 53808 | -| total_timesteps | 1151360 | -| train/ | | -| approx_kl | 0.001809557 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.3 | -| explained_variance | -0.413 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 89940 | -| policy_gradient_loss | -8.68e-05 | -| std | 0.0658 | -| value_loss | 2.55e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8996 | -| time_elapsed | 53811 | -| total_timesteps | 1151488 | -| train/ | | -| approx_kl | 4.687626e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.31 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 89950 | -| policy_gradient_loss | -0.000613 | -| std | 0.0652 | -| value_loss | 1.27e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8997 | -| time_elapsed | 53815 | -| total_timesteps | 1151616 | -| train/ | | -| approx_kl | 0.0023417375 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 1.31 | -| explained_variance | -0.00168 | -| learning_rate | 0.0003 | -| loss | -0.000418 | -| n_updates | 89960 | -| policy_gradient_loss | 0.000524 | -| std | 0.0648 | -| value_loss | 2.54e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8998 | -| time_elapsed | 53818 | -| total_timesteps | 1151744 | -| train/ | | -| approx_kl | 9.3219336e-05 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.000248 | -| n_updates | 89970 | -| policy_gradient_loss | 0.0076 | -| std | 0.0647 | -| value_loss | 3.89e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 8999 | -| time_elapsed | 53822 | -| total_timesteps | 1151872 | -| train/ | | -| approx_kl | 0.011517551 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.00437 | -| n_updates | 89980 | -| policy_gradient_loss | -0.000408 | -| std | 0.0646 | -| value_loss | 3.46e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9000 | -| time_elapsed | 53827 | -| total_timesteps | 1152000 | -| train/ | | -| approx_kl | 0.0024166103 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | 0.0018 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 89990 | -| policy_gradient_loss | 0.0109 | -| std | 0.0646 | -| value_loss | 1.51e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9001 | -| time_elapsed | 53830 | -| total_timesteps | 1152128 | -| train/ | | -| approx_kl | 0.01552796 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | 0.00207 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 90000 | -| policy_gradient_loss | 0.000501 | -| std | 0.0646 | -| value_loss | 3.02e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9002 | -| time_elapsed | 53837 | -| total_timesteps | 1152256 | -| train/ | | -| approx_kl | 0.048552625 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | 0.00167 | -| n_updates | 90010 | -| policy_gradient_loss | 0.000827 | -| std | 0.0645 | -| value_loss | 0.00319 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9003 | -| time_elapsed | 53842 | -| total_timesteps | 1152384 | -| train/ | | -| approx_kl | 0.0006780061 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -2.61e+03 | -| learning_rate | 0.0003 | -| loss | -0.000835 | -| n_updates | 90020 | -| policy_gradient_loss | -0.00122 | -| std | 0.0644 | -| value_loss | 6.9e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9004 | -| time_elapsed | 53845 | -| total_timesteps | 1152512 | -| train/ | | -| approx_kl | 0.01672573 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -124 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 90030 | -| policy_gradient_loss | -0.00944 | -| std | 0.0644 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9005 | -| time_elapsed | 53849 | -| total_timesteps | 1152640 | -| train/ | | -| approx_kl | 0.0070084487 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -17.5 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 90040 | -| policy_gradient_loss | -0.00164 | -| std | 0.0645 | -| value_loss | 2.42e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9006 | -| time_elapsed | 53852 | -| total_timesteps | 1152768 | -| train/ | | -| approx_kl | 0.004881984 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.928 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 90050 | -| policy_gradient_loss | -0.0198 | -| std | 0.0645 | -| value_loss | 3.14e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9007 | -| time_elapsed | 53855 | -| total_timesteps | 1152896 | -| train/ | | -| approx_kl | 0.0030625039 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 90060 | -| policy_gradient_loss | 0.00147 | -| std | 0.0645 | -| value_loss | 1.99e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9008 | -| time_elapsed | 53860 | -| total_timesteps | 1153024 | -| train/ | | -| approx_kl | 0.006798796 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 90070 | -| policy_gradient_loss | -0.0106 | -| std | 0.0645 | -| value_loss | 9.09e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9009 | -| time_elapsed | 53868 | -| total_timesteps | 1153152 | -| train/ | | -| approx_kl | 0.010887566 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 90080 | -| policy_gradient_loss | -0.015 | -| std | 0.0645 | -| value_loss | 0.000253 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9010 | -| time_elapsed | 53872 | -| total_timesteps | 1153280 | -| train/ | | -| approx_kl | 0.0024552234 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.68 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 90090 | -| policy_gradient_loss | 0.00198 | -| std | 0.0645 | -| value_loss | 1.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9011 | -| time_elapsed | 53875 | -| total_timesteps | 1153408 | -| train/ | | -| approx_kl | 0.032702617 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 90100 | -| policy_gradient_loss | -0.00759 | -| std | 0.0644 | -| value_loss | 5.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9012 | -| time_elapsed | 53879 | -| total_timesteps | 1153536 | -| train/ | | -| approx_kl | 0.022472555 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | 0.0053 | -| n_updates | 90110 | -| policy_gradient_loss | 0.00172 | -| std | 0.0644 | -| value_loss | 9.31e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9013 | -| time_elapsed | 53883 | -| total_timesteps | 1153664 | -| train/ | | -| approx_kl | 0.0017167395 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.089 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 90120 | -| policy_gradient_loss | -0.00198 | -| std | 0.0644 | -| value_loss | 4.33e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9014 | -| time_elapsed | 53886 | -| total_timesteps | 1153792 | -| train/ | | -| approx_kl | 9.736512e-06 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.00597 | -| learning_rate | 0.0003 | -| loss | -0.000657 | -| n_updates | 90130 | -| policy_gradient_loss | -0.00721 | -| std | 0.0644 | -| value_loss | 2.89e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9015 | -| time_elapsed | 53889 | -| total_timesteps | 1153920 | -| train/ | | -| approx_kl | 4.2796135e-05 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 1.32 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 90140 | -| policy_gradient_loss | 0.000273 | -| std | 0.0642 | -| value_loss | 2.4e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9016 | -| time_elapsed | 53894 | -| total_timesteps | 1154048 | -| train/ | | -| approx_kl | 0.005557875 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | 0.00353 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 90150 | -| policy_gradient_loss | -0.0017 | -| std | 0.0641 | -| value_loss | 8.39e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9017 | -| time_elapsed | 53902 | -| total_timesteps | 1154176 | -| train/ | | -| approx_kl | 0.0014335057 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 90160 | -| policy_gradient_loss | -0.00527 | -| std | 0.064 | -| value_loss | 0.000104 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9018 | -| time_elapsed | 53905 | -| total_timesteps | 1154304 | -| train/ | | -| approx_kl | 0.00020145159 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | -0.000625 | -| n_updates | 90170 | -| policy_gradient_loss | 0.000394 | -| std | 0.0639 | -| value_loss | 1.42e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9019 | -| time_elapsed | 53908 | -| total_timesteps | 1154432 | -| train/ | | -| approx_kl | 0.005732719 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 90180 | -| policy_gradient_loss | -0.000438 | -| std | 0.0639 | -| value_loss | 1.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9020 | -| time_elapsed | 53911 | -| total_timesteps | 1154560 | -| train/ | | -| approx_kl | 0.0005474435 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 90190 | -| policy_gradient_loss | -0.00354 | -| std | 0.0639 | -| value_loss | 4.82e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9021 | -| time_elapsed | 53914 | -| total_timesteps | 1154688 | -| train/ | | -| approx_kl | 0.0041629365 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 90200 | -| policy_gradient_loss | -0.00239 | -| std | 0.064 | -| value_loss | 9.41e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9022 | -| time_elapsed | 53917 | -| total_timesteps | 1154816 | -| train/ | | -| approx_kl | 0.014869658 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 90210 | -| policy_gradient_loss | -0.00345 | -| std | 0.064 | -| value_loss | 4.17e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9023 | -| time_elapsed | 53921 | -| total_timesteps | 1154944 | -| train/ | | -| approx_kl | 0.00094457064 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.00415 | -| n_updates | 90220 | -| policy_gradient_loss | 0.000964 | -| std | 0.0639 | -| value_loss | 4.06e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9024 | -| time_elapsed | 53923 | -| total_timesteps | 1155072 | -| train/ | | -| approx_kl | 0.006902947 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 90230 | -| policy_gradient_loss | -0.00449 | -| std | 0.0639 | -| value_loss | 1.81e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9025 | -| time_elapsed | 53930 | -| total_timesteps | 1155200 | -| train/ | | -| approx_kl | 0.024553884 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 90240 | -| policy_gradient_loss | -0.0163 | -| std | 0.064 | -| value_loss | 0.0016 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9026 | -| time_elapsed | 53933 | -| total_timesteps | 1155328 | -| train/ | | -| approx_kl | 0.006922567 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -956 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 90250 | -| policy_gradient_loss | -0.00922 | -| std | 0.064 | -| value_loss | 1.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9027 | -| time_elapsed | 53937 | -| total_timesteps | 1155456 | -| train/ | | -| approx_kl | 0.011507401 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -420 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 90260 | -| policy_gradient_loss | -0.0005 | -| std | 0.0639 | -| value_loss | 6.83e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9028 | -| time_elapsed | 53940 | -| total_timesteps | 1155584 | -| train/ | | -| approx_kl | 0.07663474 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -33.8 | -| learning_rate | 0.0003 | -| loss | -0.00853 | -| n_updates | 90270 | -| policy_gradient_loss | -0.00445 | -| std | 0.0638 | -| value_loss | 5.11e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9029 | -| time_elapsed | 53943 | -| total_timesteps | 1155712 | -| train/ | | -| approx_kl | 0.001517206 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | 1.33 | -| explained_variance | -0.448 | -| learning_rate | 0.0003 | -| loss | -0.000353 | -| n_updates | 90280 | -| policy_gradient_loss | -0.000161 | -| std | 0.0636 | -| value_loss | 3.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9030 | -| time_elapsed | 53948 | -| total_timesteps | 1155840 | -| train/ | | -| approx_kl | 0.007894568 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 90290 | -| policy_gradient_loss | -0.000481 | -| std | 0.0634 | -| value_loss | 8.66e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9031 | -| time_elapsed | 53951 | -| total_timesteps | 1155968 | -| train/ | | -| approx_kl | 0.0022373693 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00666 | -| n_updates | 90300 | -| policy_gradient_loss | -0.00344 | -| std | 0.0634 | -| value_loss | 1.34e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9032 | -| time_elapsed | 53955 | -| total_timesteps | 1156096 | -| train/ | | -| approx_kl | 0.0018432289 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | 0.00103 | -| learning_rate | 0.0003 | -| loss | -0.00666 | -| n_updates | 90310 | -| policy_gradient_loss | -0.00613 | -| std | 0.0633 | -| value_loss | 1.17e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9033 | -| time_elapsed | 53962 | -| total_timesteps | 1156224 | -| train/ | | -| approx_kl | 0.027174301 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 90320 | -| policy_gradient_loss | -0.0191 | -| std | 0.0633 | -| value_loss | 2.04e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9034 | -| time_elapsed | 53965 | -| total_timesteps | 1156352 | -| train/ | | -| approx_kl | 0.00114652 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 90330 | -| policy_gradient_loss | -0.00488 | -| std | 0.0632 | -| value_loss | 8.17e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9035 | -| time_elapsed | 53969 | -| total_timesteps | 1156480 | -| train/ | | -| approx_kl | 0.04444076 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 90340 | -| policy_gradient_loss | -0.00873 | -| std | 0.0632 | -| value_loss | 3.96e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9036 | -| time_elapsed | 53972 | -| total_timesteps | 1156608 | -| train/ | | -| approx_kl | 0.0120824855 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 90350 | -| policy_gradient_loss | 0.000477 | -| std | 0.0632 | -| value_loss | 5.71e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9037 | -| time_elapsed | 53975 | -| total_timesteps | 1156736 | -| train/ | | -| approx_kl | 0.0055136443 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.061 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 90360 | -| policy_gradient_loss | -0.00102 | -| std | 0.0631 | -| value_loss | 2.58e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9038 | -| time_elapsed | 53978 | -| total_timesteps | 1156864 | -| train/ | | -| approx_kl | 0.0051295757 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 90370 | -| policy_gradient_loss | -0.00807 | -| std | 0.0631 | -| value_loss | 1.16e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9039 | -| time_elapsed | 53982 | -| total_timesteps | 1156992 | -| train/ | | -| approx_kl | 0.0010932074 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.000845 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 90380 | -| policy_gradient_loss | -0.00146 | -| std | 0.0631 | -| value_loss | 1.01e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9040 | -| time_elapsed | 53985 | -| total_timesteps | 1157120 | -| train/ | | -| approx_kl | 0.0033704056 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -4.7 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 90390 | -| policy_gradient_loss | -0.000612 | -| std | 0.0631 | -| value_loss | 6.66e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9041 | -| time_elapsed | 53995 | -| total_timesteps | 1157248 | -| train/ | | -| approx_kl | 0.019752666 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 90400 | -| policy_gradient_loss | -0.0156 | -| std | 0.0632 | -| value_loss | 0.00116 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9042 | -| time_elapsed | 53997 | -| total_timesteps | 1157376 | -| train/ | | -| approx_kl | 0.032074425 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -233 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 90410 | -| policy_gradient_loss | -0.00199 | -| std | 0.0632 | -| value_loss | 4.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9043 | -| time_elapsed | 54002 | -| total_timesteps | 1157504 | -| train/ | | -| approx_kl | 0.06785672 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -756 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 90420 | -| policy_gradient_loss | -0.00047 | -| std | 0.0633 | -| value_loss | 7.59e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9044 | -| time_elapsed | 54003 | -| total_timesteps | 1157632 | -| train/ | | -| approx_kl | 0.12099515 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -195 | -| learning_rate | 0.0003 | -| loss | 0.00294 | -| n_updates | 90430 | -| policy_gradient_loss | -0.000677 | -| std | 0.0633 | -| value_loss | 6.29e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9045 | -| time_elapsed | 54006 | -| total_timesteps | 1157760 | -| train/ | | -| approx_kl | 0.03169607 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -24.9 | -| learning_rate | 0.0003 | -| loss | -0.00953 | -| n_updates | 90440 | -| policy_gradient_loss | -0.00564 | -| std | 0.0633 | -| value_loss | 7.72e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9046 | -| time_elapsed | 54008 | -| total_timesteps | 1157888 | -| train/ | | -| approx_kl | 0.058277793 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -3.23 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 90450 | -| policy_gradient_loss | -0.0044 | -| std | 0.0634 | -| value_loss | 1.77e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9047 | -| time_elapsed | 54010 | -| total_timesteps | 1158016 | -| train/ | | -| approx_kl | 0.00048598275 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.323 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 90460 | -| policy_gradient_loss | -0.00545 | -| std | 0.0634 | -| value_loss | 5.67e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9048 | -| time_elapsed | 54016 | -| total_timesteps | 1158144 | -| train/ | | -| approx_kl | 0.082841575 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 90470 | -| policy_gradient_loss | -0.0159 | -| std | 0.0634 | -| value_loss | 0.00205 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9049 | -| time_elapsed | 54019 | -| total_timesteps | 1158272 | -| train/ | | -| approx_kl | 0.08543029 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -21.3 | -| learning_rate | 0.0003 | -| loss | -0.00925 | -| n_updates | 90480 | -| policy_gradient_loss | -0.00724 | -| std | 0.0634 | -| value_loss | 6.63e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9050 | -| time_elapsed | 54021 | -| total_timesteps | 1158400 | -| train/ | | -| approx_kl | 0.004760035 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -126 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 90490 | -| policy_gradient_loss | -0.0136 | -| std | 0.0634 | -| value_loss | 2.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9051 | -| time_elapsed | 54025 | -| total_timesteps | 1158528 | -| train/ | | -| approx_kl | 0.052673884 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -21.3 | -| learning_rate | 0.0003 | -| loss | -0.00813 | -| n_updates | 90500 | -| policy_gradient_loss | -0.00379 | -| std | 0.0634 | -| value_loss | 4.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9052 | -| time_elapsed | 54028 | -| total_timesteps | 1158656 | -| train/ | | -| approx_kl | 0.05700426 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -4.98 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 90510 | -| policy_gradient_loss | -0.00459 | -| std | 0.0634 | -| value_loss | 7.74e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9053 | -| time_elapsed | 54031 | -| total_timesteps | 1158784 | -| train/ | | -| approx_kl | 0.0062440457 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.863 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 90520 | -| policy_gradient_loss | -0.0101 | -| std | 0.0634 | -| value_loss | 3.58e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9054 | -| time_elapsed | 54034 | -| total_timesteps | 1158912 | -| train/ | | -| approx_kl | 4.622247e-05 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.000653 | -| n_updates | 90530 | -| policy_gradient_loss | 0.000703 | -| std | 0.0634 | -| value_loss | 1.5e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9055 | -| time_elapsed | 54037 | -| total_timesteps | 1159040 | -| train/ | | -| approx_kl | 0.0058625983 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.000455 | -| n_updates | 90540 | -| policy_gradient_loss | -4.6e-05 | -| std | 0.0634 | -| value_loss | 7.08e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9056 | -| time_elapsed | 54044 | -| total_timesteps | 1159168 | -| train/ | | -| approx_kl | 0.030963702 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 90550 | -| policy_gradient_loss | -0.0164 | -| std | 0.0633 | -| value_loss | 0.000446 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9057 | -| time_elapsed | 54046 | -| total_timesteps | 1159296 | -| train/ | | -| approx_kl | 0.0058373613 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -4.19e+03 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 90560 | -| policy_gradient_loss | -0.00181 | -| std | 0.0633 | -| value_loss | 9.6e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9058 | -| time_elapsed | 54050 | -| total_timesteps | 1159424 | -| train/ | | -| approx_kl | 0.0022073518 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -1.78e+03 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 90570 | -| policy_gradient_loss | -0.00127 | -| std | 0.0632 | -| value_loss | 5.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9059 | -| time_elapsed | 54052 | -| total_timesteps | 1159552 | -| train/ | | -| approx_kl | 0.016384166 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -212 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 90580 | -| policy_gradient_loss | -0.0157 | -| std | 0.0632 | -| value_loss | 4.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9060 | -| time_elapsed | 54057 | -| total_timesteps | 1159680 | -| train/ | | -| approx_kl | 0.004024678 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 90590 | -| policy_gradient_loss | -0.00306 | -| std | 0.0632 | -| value_loss | 4.63e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9061 | -| time_elapsed | 54060 | -| total_timesteps | 1159808 | -| train/ | | -| approx_kl | 0.0038752016 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.00984 | -| n_updates | 90600 | -| policy_gradient_loss | -0.00733 | -| std | 0.0631 | -| value_loss | 2.56e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 21 | -| iterations | 9062 | -| time_elapsed | 54064 | -| total_timesteps | 1159936 | -| train/ | | -| approx_kl | 0.0010094051 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 1.34 | -| explained_variance | -0.0922 | -| learning_rate | 0.0003 | -| loss | -0.000182 | -| n_updates | 90610 | -| policy_gradient_loss | 3.61e-05 | -| std | 0.063 | -| value_loss | 8.62e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9063 | -| time_elapsed | 54068 | -| total_timesteps | 1160064 | -| train/ | | -| approx_kl | 0.00061435765 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.00516 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 90620 | -| policy_gradient_loss | 0.0028 | -| std | 0.0629 | -| value_loss | 8.75e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9064 | -| time_elapsed | 54074 | -| total_timesteps | 1160192 | -| train/ | | -| approx_kl | 0.03730889 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -19 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 90630 | -| policy_gradient_loss | -0.0157 | -| std | 0.0629 | -| value_loss | 0.00414 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9065 | -| time_elapsed | 54078 | -| total_timesteps | 1160320 | -| train/ | | -| approx_kl | 0.015649904 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -178 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 90640 | -| policy_gradient_loss | -0.0132 | -| std | 0.0628 | -| value_loss | 1.21e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9066 | -| time_elapsed | 54083 | -| total_timesteps | 1160448 | -| train/ | | -| approx_kl | 0.03638209 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -551 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 90650 | -| policy_gradient_loss | -0.000511 | -| std | 0.0628 | -| value_loss | 4.53e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9067 | -| time_elapsed | 54086 | -| total_timesteps | 1160576 | -| train/ | | -| approx_kl | 0.09078648 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -134 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 90660 | -| policy_gradient_loss | -0.00169 | -| std | 0.0627 | -| value_loss | 6.46e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9068 | -| time_elapsed | 54090 | -| total_timesteps | 1160704 | -| train/ | | -| approx_kl | 0.07270993 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -31.9 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 90670 | -| policy_gradient_loss | -0.00649 | -| std | 0.0627 | -| value_loss | 9.33e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9069 | -| time_elapsed | 54093 | -| total_timesteps | 1160832 | -| train/ | | -| approx_kl | 0.05579312 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -3.23 | -| learning_rate | 0.0003 | -| loss | -0.000994 | -| n_updates | 90680 | -| policy_gradient_loss | -0.000987 | -| std | 0.0626 | -| value_loss | 6.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 21 | -| iterations | 9070 | -| time_elapsed | 54097 | -| total_timesteps | 1160960 | -| train/ | | -| approx_kl | 0.005063826 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.000953 | -| n_updates | 90690 | -| policy_gradient_loss | -0.000777 | -| std | 0.0627 | -| value_loss | 4.98e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9071 | -| time_elapsed | 54100 | -| total_timesteps | 1161088 | -| train/ | | -| approx_kl | 0.0042900816 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 90700 | -| policy_gradient_loss | -0.00286 | -| std | 0.0628 | -| value_loss | 4.6e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9072 | -| time_elapsed | 54107 | -| total_timesteps | 1161216 | -| train/ | | -| approx_kl | 0.004724741 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | 0.738 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 90710 | -| policy_gradient_loss | -0.0149 | -| std | 0.0628 | -| value_loss | 0.00363 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9073 | -| time_elapsed | 54112 | -| total_timesteps | 1161344 | -| train/ | | -| approx_kl | 0.008450594 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -80.7 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 90720 | -| policy_gradient_loss | -0.000481 | -| std | 0.0628 | -| value_loss | 8.67e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9074 | -| time_elapsed | 54115 | -| total_timesteps | 1161472 | -| train/ | | -| approx_kl | 0.038474306 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -109 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 90730 | -| policy_gradient_loss | -0.0115 | -| std | 0.0628 | -| value_loss | 1.28e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9075 | -| time_elapsed | 54117 | -| total_timesteps | 1161600 | -| train/ | | -| approx_kl | 0.2043188 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -89.3 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 90740 | -| policy_gradient_loss | -0.00406 | -| std | 0.0628 | -| value_loss | 3.35e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9076 | -| time_elapsed | 54121 | -| total_timesteps | 1161728 | -| train/ | | -| approx_kl | 0.03264302 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | -0.000237 | -| n_updates | 90750 | -| policy_gradient_loss | 0.00178 | -| std | 0.0628 | -| value_loss | 1.03e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9077 | -| time_elapsed | 54124 | -| total_timesteps | 1161856 | -| train/ | | -| approx_kl | 5.4906122e-06 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.000202 | -| n_updates | 90760 | -| policy_gradient_loss | 0.000929 | -| std | 0.0627 | -| value_loss | 3.93e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9078 | -| time_elapsed | 54126 | -| total_timesteps | 1161984 | -| train/ | | -| approx_kl | 1.0988675e-05 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00021 | -| n_updates | 90770 | -| policy_gradient_loss | -0.000598 | -| std | 0.0627 | -| value_loss | 1.55e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9079 | -| time_elapsed | 54129 | -| total_timesteps | 1162112 | -| train/ | | -| approx_kl | 0.0019548652 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.074 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 90780 | -| policy_gradient_loss | -0.00329 | -| std | 0.0627 | -| value_loss | 3.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9080 | -| time_elapsed | 54138 | -| total_timesteps | 1162240 | -| train/ | | -| approx_kl | 0.052093614 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -7.81 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 90790 | -| policy_gradient_loss | -0.0136 | -| std | 0.0627 | -| value_loss | 0.00332 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9081 | -| time_elapsed | 54140 | -| total_timesteps | 1162368 | -| train/ | | -| approx_kl | 0.04165858 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -1.85e+03 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 90800 | -| policy_gradient_loss | -0.00773 | -| std | 0.0627 | -| value_loss | 3.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9082 | -| time_elapsed | 54143 | -| total_timesteps | 1162496 | -| train/ | | -| approx_kl | 0.011106741 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -6.91e+03 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 90810 | -| policy_gradient_loss | 0.000655 | -| std | 0.0626 | -| value_loss | 1.94e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9083 | -| time_elapsed | 54145 | -| total_timesteps | 1162624 | -| train/ | | -| approx_kl | 0.00795487 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -1.98e+03 | -| learning_rate | 0.0003 | -| loss | -0.00697 | -| n_updates | 90820 | -| policy_gradient_loss | -0.00443 | -| std | 0.0626 | -| value_loss | 1.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9084 | -| time_elapsed | 54147 | -| total_timesteps | 1162752 | -| train/ | | -| approx_kl | 0.002087708 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -159 | -| learning_rate | 0.0003 | -| loss | 5.94e-05 | -| n_updates | 90830 | -| policy_gradient_loss | 0.00015 | -| std | 0.0625 | -| value_loss | 1.48e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9085 | -| time_elapsed | 54149 | -| total_timesteps | 1162880 | -| train/ | | -| approx_kl | 1.3895333e-06 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | 8.72e-05 | -| n_updates | 90840 | -| policy_gradient_loss | -0.00854 | -| std | 0.0625 | -| value_loss | 2.88e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9086 | -| time_elapsed | 54151 | -| total_timesteps | 1163008 | -| train/ | | -| approx_kl | 6.241724e-06 | -| clip_fraction | 0.0187 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.442 | -| learning_rate | 0.0003 | -| loss | -0.000204 | -| n_updates | 90850 | -| policy_gradient_loss | -0.00207 | -| std | 0.0624 | -| value_loss | 3.88e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9087 | -| time_elapsed | 54160 | -| total_timesteps | 1163136 | -| train/ | | -| approx_kl | 0.030697307 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | 0.634 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 90860 | -| policy_gradient_loss | -0.00883 | -| std | 0.0625 | -| value_loss | 0.000581 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9088 | -| time_elapsed | 54163 | -| total_timesteps | 1163264 | -| train/ | | -| approx_kl | 0.0071075466 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.35 | -| explained_variance | -0.331 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 90870 | -| policy_gradient_loss | -0.00217 | -| std | 0.0624 | -| value_loss | 5.38e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9089 | -| time_elapsed | 54166 | -| total_timesteps | 1163392 | -| train/ | | -| approx_kl | 0.07980156 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -3.42e+03 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 90880 | -| policy_gradient_loss | -0.00526 | -| std | 0.0623 | -| value_loss | 9.98e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9090 | -| time_elapsed | 54169 | -| total_timesteps | 1163520 | -| train/ | | -| approx_kl | 0.0437138 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 90890 | -| policy_gradient_loss | -0.00429 | -| std | 0.0623 | -| value_loss | 1.18e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9091 | -| time_elapsed | 54172 | -| total_timesteps | 1163648 | -| train/ | | -| approx_kl | 0.0026321984 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -0.434 | -| learning_rate | 0.0003 | -| loss | 0.000497 | -| n_updates | 90900 | -| policy_gradient_loss | 0.00489 | -| std | 0.0623 | -| value_loss | 5.21e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9092 | -| time_elapsed | 54175 | -| total_timesteps | 1163776 | -| train/ | | -| approx_kl | 0.014184006 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | 0.00362 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 90910 | -| policy_gradient_loss | -0.0104 | -| std | 0.0622 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9093 | -| time_elapsed | 54178 | -| total_timesteps | 1163904 | -| train/ | | -| approx_kl | 0.036057033 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -0.000974 | -| learning_rate | 0.0003 | -| loss | 0.000986 | -| n_updates | 90920 | -| policy_gradient_loss | 0.000242 | -| std | 0.0622 | -| value_loss | 9.48e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9094 | -| time_elapsed | 54182 | -| total_timesteps | 1164032 | -| train/ | | -| approx_kl | 0.0026173657 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.000381 | -| n_updates | 90930 | -| policy_gradient_loss | 0.000261 | -| std | 0.062 | -| value_loss | 1.66e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9095 | -| time_elapsed | 54190 | -| total_timesteps | 1164160 | -| train/ | | -| approx_kl | 0.030775364 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0261 | -| n_updates | 90940 | -| policy_gradient_loss | -0.0183 | -| std | 0.0619 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9096 | -| time_elapsed | 54193 | -| total_timesteps | 1164288 | -| train/ | | -| approx_kl | 0.0074101095 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 90950 | -| policy_gradient_loss | -0.00278 | -| std | 0.0618 | -| value_loss | 2.24e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9097 | -| time_elapsed | 54196 | -| total_timesteps | 1164416 | -| train/ | | -| approx_kl | 0.0026086378 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 90960 | -| policy_gradient_loss | -0.00124 | -| std | 0.0618 | -| value_loss | 1.93e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9098 | -| time_elapsed | 54199 | -| total_timesteps | 1164544 | -| train/ | | -| approx_kl | 0.01801518 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 90970 | -| policy_gradient_loss | -0.00106 | -| std | 0.0618 | -| value_loss | 9.72e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9099 | -| time_elapsed | 54202 | -| total_timesteps | 1164672 | -| train/ | | -| approx_kl | 0.0017060009 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | 0.00107 | -| learning_rate | 0.0003 | -| loss | -0.00465 | -| n_updates | 90980 | -| policy_gradient_loss | 0.00995 | -| std | 0.0618 | -| value_loss | 4.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9100 | -| time_elapsed | 54205 | -| total_timesteps | 1164800 | -| train/ | | -| approx_kl | 0.0023154346 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | -3.03 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 90990 | -| policy_gradient_loss | -0.00304 | -| std | 0.0618 | -| value_loss | 2.06e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 21 | -| iterations | 9101 | -| time_elapsed | 54209 | -| total_timesteps | 1164928 | -| train/ | | -| approx_kl | 0.0039205123 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | 0.00181 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 91000 | -| policy_gradient_loss | -0.0116 | -| std | 0.0618 | -| value_loss | 1.88e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9102 | -| time_elapsed | 54212 | -| total_timesteps | 1165056 | -| train/ | | -| approx_kl | 0.0011925497 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.36 | -| explained_variance | 0.00179 | -| learning_rate | 0.0003 | -| loss | 0.00336 | -| n_updates | 91010 | -| policy_gradient_loss | 0.00458 | -| std | 0.0618 | -| value_loss | 2.13e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9103 | -| time_elapsed | 54218 | -| total_timesteps | 1165184 | -| train/ | | -| approx_kl | 0.00053031 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | 0.809 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 91020 | -| policy_gradient_loss | -0.0114 | -| std | 0.0618 | -| value_loss | 0.00227 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9104 | -| time_elapsed | 54221 | -| total_timesteps | 1165312 | -| train/ | | -| approx_kl | 0.0039772484 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -4.56 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 91030 | -| policy_gradient_loss | -0.00827 | -| std | 0.0618 | -| value_loss | 3.01e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9105 | -| time_elapsed | 54224 | -| total_timesteps | 1165440 | -| train/ | | -| approx_kl | 0.0010464643 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 91040 | -| policy_gradient_loss | -8.66e-05 | -| std | 0.0618 | -| value_loss | 4.27e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9106 | -| time_elapsed | 54227 | -| total_timesteps | 1165568 | -| train/ | | -| approx_kl | 0.0007789745 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 91050 | -| policy_gradient_loss | -0.000892 | -| std | 0.0617 | -| value_loss | 2.32e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9107 | -| time_elapsed | 54230 | -| total_timesteps | 1165696 | -| train/ | | -| approx_kl | 0.0010675043 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.00356 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 91060 | -| policy_gradient_loss | 0.000667 | -| std | 0.0617 | -| value_loss | 2.09e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9108 | -| time_elapsed | 54234 | -| total_timesteps | 1165824 | -| train/ | | -| approx_kl | 0.010763523 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 91070 | -| policy_gradient_loss | -0.00513 | -| std | 0.0617 | -| value_loss | 1.42e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9109 | -| time_elapsed | 54238 | -| total_timesteps | 1165952 | -| train/ | | -| approx_kl | 0.013393937 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | 0.00397 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 91080 | -| policy_gradient_loss | -8.41e-05 | -| std | 0.0618 | -| value_loss | 0.000228 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9110 | -| time_elapsed | 54243 | -| total_timesteps | 1166080 | -| train/ | | -| approx_kl | 0.0013550809 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.00094 | -| n_updates | 91090 | -| policy_gradient_loss | 0.00172 | -| std | 0.0617 | -| value_loss | 4.13e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9111 | -| time_elapsed | 54250 | -| total_timesteps | 1166208 | -| train/ | | -| approx_kl | 0.04822115 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | 0.934 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 91100 | -| policy_gradient_loss | -0.0152 | -| std | 0.0617 | -| value_loss | 0.000628 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9112 | -| time_elapsed | 54254 | -| total_timesteps | 1166336 | -| train/ | | -| approx_kl | 0.0036251233 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 91110 | -| policy_gradient_loss | -0.00575 | -| std | 0.0616 | -| value_loss | 2.53e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9113 | -| time_elapsed | 54258 | -| total_timesteps | 1166464 | -| train/ | | -| approx_kl | 0.0038232794 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 91120 | -| policy_gradient_loss | -0.00546 | -| std | 0.0616 | -| value_loss | 8.36e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9114 | -| time_elapsed | 54262 | -| total_timesteps | 1166592 | -| train/ | | -| approx_kl | 0.010192975 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 91130 | -| policy_gradient_loss | -0.000749 | -| std | 0.0615 | -| value_loss | 2.39e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9115 | -| time_elapsed | 54265 | -| total_timesteps | 1166720 | -| train/ | | -| approx_kl | 0.0012541064 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.00246 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 91140 | -| policy_gradient_loss | -0.00208 | -| std | 0.0615 | -| value_loss | 3.23e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9116 | -| time_elapsed | 54268 | -| total_timesteps | 1166848 | -| train/ | | -| approx_kl | 0.0038507883 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 91150 | -| policy_gradient_loss | -0.00116 | -| std | 0.0616 | -| value_loss | 5.44e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9117 | -| time_elapsed | 54270 | -| total_timesteps | 1166976 | -| train/ | | -| approx_kl | 0.0061417106 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | 0.00331 | -| learning_rate | 0.0003 | -| loss | -0.00075 | -| n_updates | 91160 | -| policy_gradient_loss | -0.000822 | -| std | 0.0618 | -| value_loss | 5.96e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9118 | -| time_elapsed | 54272 | -| total_timesteps | 1167104 | -| train/ | | -| approx_kl | 0.0006604353 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.00214 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 91170 | -| policy_gradient_loss | -9.2e-06 | -| std | 0.0616 | -| value_loss | 5.88e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9119 | -| time_elapsed | 54280 | -| total_timesteps | 1167232 | -| train/ | | -| approx_kl | 0.31330806 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 91180 | -| policy_gradient_loss | -0.0169 | -| std | 0.0615 | -| value_loss | 0.000915 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9120 | -| time_elapsed | 54284 | -| total_timesteps | 1167360 | -| train/ | | -| approx_kl | 0.07005525 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -26.1 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 91190 | -| policy_gradient_loss | -0.00966 | -| std | 0.0614 | -| value_loss | 3.82e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9121 | -| time_elapsed | 54288 | -| total_timesteps | 1167488 | -| train/ | | -| approx_kl | 0.19617897 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -39.7 | -| learning_rate | 0.0003 | -| loss | 0.00767 | -| n_updates | 91200 | -| policy_gradient_loss | 4.92e-05 | -| std | 0.0614 | -| value_loss | 1.78e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9122 | -| time_elapsed | 54292 | -| total_timesteps | 1167616 | -| train/ | | -| approx_kl | 0.0027645077 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -3.99 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 91210 | -| policy_gradient_loss | -0.00336 | -| std | 0.0615 | -| value_loss | 4.81e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9123 | -| time_elapsed | 54295 | -| total_timesteps | 1167744 | -| train/ | | -| approx_kl | 0.0010010032 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 91220 | -| policy_gradient_loss | -0.00112 | -| std | 0.0615 | -| value_loss | 1.43e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9124 | -| time_elapsed | 54298 | -| total_timesteps | 1167872 | -| train/ | | -| approx_kl | 0.0015661144 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.00568 | -| n_updates | 91230 | -| policy_gradient_loss | 0.00206 | -| std | 0.0615 | -| value_loss | 5.14e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9125 | -| time_elapsed | 54301 | -| total_timesteps | 1168000 | -| train/ | | -| approx_kl | 0.0015820148 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 91240 | -| policy_gradient_loss | -0.00343 | -| std | 0.0615 | -| value_loss | 3.65e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9126 | -| time_elapsed | 54304 | -| total_timesteps | 1168128 | -| train/ | | -| approx_kl | 0.0017528352 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | 0.0029 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 91250 | -| policy_gradient_loss | -0.00364 | -| std | 0.0615 | -| value_loss | 1.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9127 | -| time_elapsed | 54312 | -| total_timesteps | 1168256 | -| train/ | | -| approx_kl | 0.028398111 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -0.786 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 91260 | -| policy_gradient_loss | -0.013 | -| std | 0.0614 | -| value_loss | 0.00225 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9128 | -| time_elapsed | 54316 | -| total_timesteps | 1168384 | -| train/ | | -| approx_kl | 0.010482492 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -327 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 91270 | -| policy_gradient_loss | -0.00231 | -| std | 0.0614 | -| value_loss | 3.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9129 | -| time_elapsed | 54321 | -| total_timesteps | 1168512 | -| train/ | | -| approx_kl | 0.008313965 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -421 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 91280 | -| policy_gradient_loss | -0.00106 | -| std | 0.0613 | -| value_loss | 2.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9130 | -| time_elapsed | 54324 | -| total_timesteps | 1168640 | -| train/ | | -| approx_kl | 0.051178128 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 1.37 | -| explained_variance | -28.1 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 91290 | -| policy_gradient_loss | -0.000667 | -| std | 0.0612 | -| value_loss | 4.88e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9131 | -| time_elapsed | 54328 | -| total_timesteps | 1168768 | -| train/ | | -| approx_kl | 0.08023213 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -16.1 | -| learning_rate | 0.0003 | -| loss | -0.00669 | -| n_updates | 91300 | -| policy_gradient_loss | -0.00539 | -| std | 0.0611 | -| value_loss | 4.49e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 21 | -| iterations | 9132 | -| time_elapsed | 54332 | -| total_timesteps | 1168896 | -| train/ | | -| approx_kl | 0.013461152 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -2.72 | -| learning_rate | 0.0003 | -| loss | -0.00865 | -| n_updates | 91310 | -| policy_gradient_loss | -0.000217 | -| std | 0.0611 | -| value_loss | 5.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9133 | -| time_elapsed | 54337 | -| total_timesteps | 1169024 | -| train/ | | -| approx_kl | 0.013241105 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 91320 | -| policy_gradient_loss | 0.00139 | -| std | 0.061 | -| value_loss | 8.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9134 | -| time_elapsed | 54345 | -| total_timesteps | 1169152 | -| train/ | | -| approx_kl | 0.014306808 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 91330 | -| policy_gradient_loss | -0.00758 | -| std | 0.0609 | -| value_loss | 0.00069 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9135 | -| time_elapsed | 54347 | -| total_timesteps | 1169280 | -| train/ | | -| approx_kl | 0.03616482 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | 0.191 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 91340 | -| policy_gradient_loss | 0.00076 | -| std | 0.0609 | -| value_loss | 1.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9136 | -| time_elapsed | 54350 | -| total_timesteps | 1169408 | -| train/ | | -| approx_kl | 0.19309962 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -126 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 91350 | -| policy_gradient_loss | -0.00256 | -| std | 0.0609 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9137 | -| time_elapsed | 54353 | -| total_timesteps | 1169536 | -| train/ | | -| approx_kl | 0.017025374 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -17.6 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 91360 | -| policy_gradient_loss | -0.00379 | -| std | 0.0609 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9138 | -| time_elapsed | 54356 | -| total_timesteps | 1169664 | -| train/ | | -| approx_kl | 0.063541465 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | 0.00433 | -| n_updates | 91370 | -| policy_gradient_loss | 0.0154 | -| std | 0.0609 | -| value_loss | 3.08e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9139 | -| time_elapsed | 54360 | -| total_timesteps | 1169792 | -| train/ | | -| approx_kl | 0.048256997 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -0.651 | -| learning_rate | 0.0003 | -| loss | 0.00322 | -| n_updates | 91380 | -| policy_gradient_loss | 0.00176 | -| std | 0.0609 | -| value_loss | 9.42e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9140 | -| time_elapsed | 54362 | -| total_timesteps | 1169920 | -| train/ | | -| approx_kl | 0.00040107686 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 91390 | -| policy_gradient_loss | -0.000742 | -| std | 0.0609 | -| value_loss | 3.99e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9141 | -| time_elapsed | 54365 | -| total_timesteps | 1170048 | -| train/ | | -| approx_kl | 0.00015842775 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.000197 | -| n_updates | 91400 | -| policy_gradient_loss | 0.000107 | -| std | 0.0608 | -| value_loss | 3.29e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9142 | -| time_elapsed | 54371 | -| total_timesteps | 1170176 | -| train/ | | -| approx_kl | 0.006655373 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 91410 | -| policy_gradient_loss | -0.0156 | -| std | 0.0607 | -| value_loss | 0.0016 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9143 | -| time_elapsed | 54375 | -| total_timesteps | 1170304 | -| train/ | | -| approx_kl | 0.0053568296 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 91420 | -| policy_gradient_loss | -0.00817 | -| std | 0.0606 | -| value_loss | 3.68e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9144 | -| time_elapsed | 54378 | -| total_timesteps | 1170432 | -| train/ | | -| approx_kl | 0.00073625194 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -0.683 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 91430 | -| policy_gradient_loss | 0.000815 | -| std | 0.0606 | -| value_loss | 2.76e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9145 | -| time_elapsed | 54381 | -| total_timesteps | 1170560 | -| train/ | | -| approx_kl | 0.009410644 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 91440 | -| policy_gradient_loss | -0.0013 | -| std | 0.0606 | -| value_loss | 7.99e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9146 | -| time_elapsed | 54385 | -| total_timesteps | 1170688 | -| train/ | | -| approx_kl | 0.0019056457 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 91450 | -| policy_gradient_loss | -0.00248 | -| std | 0.0605 | -| value_loss | 3.91e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9147 | -| time_elapsed | 54389 | -| total_timesteps | 1170816 | -| train/ | | -| approx_kl | 8.092029e-05 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | -0.000118 | -| n_updates | 91460 | -| policy_gradient_loss | 0.000898 | -| std | 0.0606 | -| value_loss | 2.74e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9148 | -| time_elapsed | 54394 | -| total_timesteps | 1170944 | -| train/ | | -| approx_kl | 0.0001319861 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | 0.00357 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 91470 | -| policy_gradient_loss | -0.00161 | -| std | 0.0607 | -| value_loss | 3.48e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9149 | -| time_elapsed | 54398 | -| total_timesteps | 1171072 | -| train/ | | -| approx_kl | 0.0072577125 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 1.38 | -| explained_variance | -0.643 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 91480 | -| policy_gradient_loss | -0.00284 | -| std | 0.0606 | -| value_loss | 6.37e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9150 | -| time_elapsed | 54404 | -| total_timesteps | 1171200 | -| train/ | | -| approx_kl | 0.022821825 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -8.85 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 91490 | -| policy_gradient_loss | -0.0137 | -| std | 0.0605 | -| value_loss | 0.0032 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9151 | -| time_elapsed | 54407 | -| total_timesteps | 1171328 | -| train/ | | -| approx_kl | 0.002280532 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -278 | -| learning_rate | 0.0003 | -| loss | -0.00031 | -| n_updates | 91500 | -| policy_gradient_loss | -0.000115 | -| std | 0.0603 | -| value_loss | 6.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9152 | -| time_elapsed | 54410 | -| total_timesteps | 1171456 | -| train/ | | -| approx_kl | 0.011550081 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -326 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 91510 | -| policy_gradient_loss | -0.0135 | -| std | 0.0601 | -| value_loss | 2.92e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9153 | -| time_elapsed | 54413 | -| total_timesteps | 1171584 | -| train/ | | -| approx_kl | 0.00066198036 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 1.39 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | -0.00035 | -| n_updates | 91520 | -| policy_gradient_loss | -0.000119 | -| std | 0.0599 | -| value_loss | 1.94e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9154 | -| time_elapsed | 54416 | -| total_timesteps | 1171712 | -| train/ | | -| approx_kl | 0.017836792 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 1.4 | -| explained_variance | -2.01 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 91530 | -| policy_gradient_loss | -0.00331 | -| std | 0.0598 | -| value_loss | 5.37e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9155 | -| time_elapsed | 54419 | -| total_timesteps | 1171840 | -| train/ | | -| approx_kl | 0.004785419 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.4 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 91540 | -| policy_gradient_loss | -0.00243 | -| std | 0.0597 | -| value_loss | 2.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 21 | -| iterations | 9156 | -| time_elapsed | 54422 | -| total_timesteps | 1171968 | -| train/ | | -| approx_kl | 0.0055621383 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 1.4 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 91550 | -| policy_gradient_loss | 0.000376 | -| std | 0.0597 | -| value_loss | 9.83e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9157 | -| time_elapsed | 54425 | -| total_timesteps | 1172096 | -| train/ | | -| approx_kl | 0.007015401 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 1.4 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 91560 | -| policy_gradient_loss | 0.000928 | -| std | 0.0596 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9158 | -| time_elapsed | 54432 | -| total_timesteps | 1172224 | -| train/ | | -| approx_kl | 0.008621238 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 1.4 | -| explained_variance | 0.721 | -| learning_rate | 0.0003 | -| loss | 0.000467 | -| n_updates | 91570 | -| policy_gradient_loss | -0.000817 | -| std | 0.0595 | -| value_loss | 0.00385 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9159 | -| time_elapsed | 54435 | -| total_timesteps | 1172352 | -| train/ | | -| approx_kl | 0.100244 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 1.4 | -| explained_variance | -9.23 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 91580 | -| policy_gradient_loss | -0.0123 | -| std | 0.0593 | -| value_loss | 0.00026 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9160 | -| time_elapsed | 54437 | -| total_timesteps | 1172480 | -| train/ | | -| approx_kl | 0.005576054 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -2.68e+03 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 91590 | -| policy_gradient_loss | -0.00912 | -| std | 0.0593 | -| value_loss | 6.56e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9161 | -| time_elapsed | 54441 | -| total_timesteps | 1172608 | -| train/ | | -| approx_kl | 0.021022031 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 91600 | -| policy_gradient_loss | -0.00489 | -| std | 0.0592 | -| value_loss | 3.19e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9162 | -| time_elapsed | 54444 | -| total_timesteps | 1172736 | -| train/ | | -| approx_kl | 0.0062037334 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -4.18 | -| learning_rate | 0.0003 | -| loss | -0.00359 | -| n_updates | 91610 | -| policy_gradient_loss | -0.00157 | -| std | 0.0592 | -| value_loss | 6.89e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9163 | -| time_elapsed | 54448 | -| total_timesteps | 1172864 | -| train/ | | -| approx_kl | 0.0014524958 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 91620 | -| policy_gradient_loss | 0.00152 | -| std | 0.0592 | -| value_loss | 8.34e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 21 | -| iterations | 9164 | -| time_elapsed | 54451 | -| total_timesteps | 1172992 | -| train/ | | -| approx_kl | 0.0071287393 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | -0.000585 | -| n_updates | 91630 | -| policy_gradient_loss | -0.000808 | -| std | 0.059 | -| value_loss | 2.29e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9165 | -| time_elapsed | 54455 | -| total_timesteps | 1173120 | -| train/ | | -| approx_kl | 0.0055653662 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | 0.00411 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 91640 | -| policy_gradient_loss | -0.00225 | -| std | 0.0589 | -| value_loss | 2.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9166 | -| time_elapsed | 54464 | -| total_timesteps | 1173248 | -| train/ | | -| approx_kl | 0.028718924 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | 0.52 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 91650 | -| policy_gradient_loss | -0.0147 | -| std | 0.0589 | -| value_loss | 0.000838 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9167 | -| time_elapsed | 54468 | -| total_timesteps | 1173376 | -| train/ | | -| approx_kl | 0.026270345 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -59.8 | -| learning_rate | 0.0003 | -| loss | -0.00609 | -| n_updates | 91660 | -| policy_gradient_loss | -0.00321 | -| std | 0.0588 | -| value_loss | 1.83e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9168 | -| time_elapsed | 54471 | -| total_timesteps | 1173504 | -| train/ | | -| approx_kl | 0.14196438 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 1.41 | -| explained_variance | -52.4 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 91670 | -| policy_gradient_loss | -0.0017 | -| std | 0.0588 | -| value_loss | 8.99e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9169 | -| time_elapsed | 54475 | -| total_timesteps | 1173632 | -| train/ | | -| approx_kl | 0.036751077 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | -0.0097 | -| n_updates | 91680 | -| policy_gradient_loss | -0.00342 | -| std | 0.0588 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9170 | -| time_elapsed | 54479 | -| total_timesteps | 1173760 | -| train/ | | -| approx_kl | 0.0037621362 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 91690 | -| policy_gradient_loss | -0.0034 | -| std | 0.0588 | -| value_loss | 2.95e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9171 | -| time_elapsed | 54483 | -| total_timesteps | 1173888 | -| train/ | | -| approx_kl | 0.004358479 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 91700 | -| policy_gradient_loss | -0.0106 | -| std | 0.0588 | -| value_loss | 5.57e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9172 | -| time_elapsed | 54486 | -| total_timesteps | 1174016 | -| train/ | | -| approx_kl | 0.0057617896 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.000981 | -| learning_rate | 0.0003 | -| loss | -0.00701 | -| n_updates | 91710 | -| policy_gradient_loss | -0.00189 | -| std | 0.0588 | -| value_loss | 2.12e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9173 | -| time_elapsed | 54494 | -| total_timesteps | 1174144 | -| train/ | | -| approx_kl | 0.052941002 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 91720 | -| policy_gradient_loss | -0.00644 | -| std | 0.0588 | -| value_loss | 0.000884 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9174 | -| time_elapsed | 54499 | -| total_timesteps | 1174272 | -| train/ | | -| approx_kl | 8.8092405e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | 0.0722 | -| learning_rate | 0.0003 | -| loss | -8.37e-05 | -| n_updates | 91730 | -| policy_gradient_loss | -3.11e-05 | -| std | 0.0586 | -| value_loss | 1.93e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9175 | -| time_elapsed | 54501 | -| total_timesteps | 1174400 | -| train/ | | -| approx_kl | 0.21540019 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 91740 | -| policy_gradient_loss | -0.00539 | -| std | 0.0585 | -| value_loss | 2.02e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9176 | -| time_elapsed | 54505 | -| total_timesteps | 1174528 | -| train/ | | -| approx_kl | 0.0002443199 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.987 | -| learning_rate | 0.0003 | -| loss | 0.00066 | -| n_updates | 91750 | -| policy_gradient_loss | 0.00283 | -| std | 0.0585 | -| value_loss | 4.26e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9177 | -| time_elapsed | 54508 | -| total_timesteps | 1174656 | -| train/ | | -| approx_kl | 0.005147931 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.302 | -| learning_rate | 0.0003 | -| loss | -0.00692 | -| n_updates | 91760 | -| policy_gradient_loss | -0.00501 | -| std | 0.0585 | -| value_loss | 2.67e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9178 | -| time_elapsed | 54511 | -| total_timesteps | 1174784 | -| train/ | | -| approx_kl | 0.00037427386 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.099 | -| learning_rate | 0.0003 | -| loss | -0.0008 | -| n_updates | 91770 | -| policy_gradient_loss | 0.00963 | -| std | 0.0584 | -| value_loss | 1.58e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9179 | -| time_elapsed | 54514 | -| total_timesteps | 1174912 | -| train/ | | -| approx_kl | 0.00010472676 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.000555 | -| n_updates | 91780 | -| policy_gradient_loss | 0.00826 | -| std | 0.0584 | -| value_loss | 1.6e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9180 | -| time_elapsed | 54516 | -| total_timesteps | 1175040 | -| train/ | | -| approx_kl | 0.017564591 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.0652 | -| learning_rate | 0.0003 | -| loss | -0.000579 | -| n_updates | 91790 | -| policy_gradient_loss | 0.00319 | -| std | 0.0584 | -| value_loss | 7.18e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9181 | -| time_elapsed | 54524 | -| total_timesteps | 1175168 | -| train/ | | -| approx_kl | 0.05095213 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 91800 | -| policy_gradient_loss | -0.0122 | -| std | 0.0584 | -| value_loss | 0.000467 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9182 | -| time_elapsed | 54526 | -| total_timesteps | 1175296 | -| train/ | | -| approx_kl | 0.0036867345 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.793 | -| learning_rate | 0.0003 | -| loss | -0.00888 | -| n_updates | 91810 | -| policy_gradient_loss | -0.00651 | -| std | 0.0584 | -| value_loss | 1.64e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9183 | -| time_elapsed | 54529 | -| total_timesteps | 1175424 | -| train/ | | -| approx_kl | 0.0021231356 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.396 | -| learning_rate | 0.0003 | -| loss | 0.00128 | -| n_updates | 91820 | -| policy_gradient_loss | 0.00602 | -| std | 0.0584 | -| value_loss | 4.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9184 | -| time_elapsed | 54531 | -| total_timesteps | 1175552 | -| train/ | | -| approx_kl | 0.0014800592 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 91830 | -| policy_gradient_loss | -0.000192 | -| std | 0.0583 | -| value_loss | 4.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9185 | -| time_elapsed | 54534 | -| total_timesteps | 1175680 | -| train/ | | -| approx_kl | 3.5664532e-05 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.42 | -| explained_variance | 0.00216 | -| learning_rate | 0.0003 | -| loss | -0.000532 | -| n_updates | 91840 | -| policy_gradient_loss | 0.00458 | -| std | 0.0582 | -| value_loss | 5.67e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9186 | -| time_elapsed | 54537 | -| total_timesteps | 1175808 | -| train/ | | -| approx_kl | 0.0052125477 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 91850 | -| policy_gradient_loss | -0.00183 | -| std | 0.058 | -| value_loss | 8.35e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9187 | -| time_elapsed | 54541 | -| total_timesteps | 1175936 | -| train/ | | -| approx_kl | 0.0032777996 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 91860 | -| policy_gradient_loss | 0.000723 | -| std | 0.058 | -| value_loss | 3.9e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9188 | -| time_elapsed | 54545 | -| total_timesteps | 1176064 | -| train/ | | -| approx_kl | 0.0017066137 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.00949 | -| n_updates | 91870 | -| policy_gradient_loss | -0.00977 | -| std | 0.0579 | -| value_loss | 3.67e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9189 | -| time_elapsed | 54552 | -| total_timesteps | 1176192 | -| train/ | | -| approx_kl | 0.0026919986 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.00914 | -| n_updates | 91880 | -| policy_gradient_loss | -0.00548 | -| std | 0.0579 | -| value_loss | 8.65e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9190 | -| time_elapsed | 54557 | -| total_timesteps | 1176320 | -| train/ | | -| approx_kl | 0.0013696006 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 91890 | -| policy_gradient_loss | -0.019 | -| std | 0.0579 | -| value_loss | 4.44e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9191 | -| time_elapsed | 54561 | -| total_timesteps | 1176448 | -| train/ | | -| approx_kl | 0.000186841 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.00558 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 91900 | -| policy_gradient_loss | 0.000511 | -| std | 0.0579 | -| value_loss | 2.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9192 | -| time_elapsed | 54564 | -| total_timesteps | 1176576 | -| train/ | | -| approx_kl | 0.007336623 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00442 | -| n_updates | 91910 | -| policy_gradient_loss | -0.00293 | -| std | 0.0579 | -| value_loss | 6.81e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9193 | -| time_elapsed | 54566 | -| total_timesteps | 1176704 | -| train/ | | -| approx_kl | 0.0047023334 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.443 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 91920 | -| policy_gradient_loss | -0.000442 | -| std | 0.0578 | -| value_loss | 1.41e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9194 | -| time_elapsed | 54570 | -| total_timesteps | 1176832 | -| train/ | | -| approx_kl | 0.014943564 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | 0.00316 | -| learning_rate | 0.0003 | -| loss | 0.00421 | -| n_updates | 91930 | -| policy_gradient_loss | 0.00553 | -| std | 0.0578 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9195 | -| time_elapsed | 54574 | -| total_timesteps | 1176960 | -| train/ | | -| approx_kl | 0.0033867955 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 91940 | -| policy_gradient_loss | -0.00413 | -| std | 0.0578 | -| value_loss | 2.39e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9196 | -| time_elapsed | 54576 | -| total_timesteps | 1177088 | -| train/ | | -| approx_kl | 0.019092323 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 91950 | -| policy_gradient_loss | 3.88e-05 | -| std | 0.0578 | -| value_loss | 3.38e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9197 | -| time_elapsed | 54584 | -| total_timesteps | 1177216 | -| train/ | | -| approx_kl | 0.001767362 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | 0.777 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 91960 | -| policy_gradient_loss | -0.0149 | -| std | 0.0578 | -| value_loss | 0.00344 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9198 | -| time_elapsed | 54588 | -| total_timesteps | 1177344 | -| train/ | | -| approx_kl | 0.0056198128 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -9.95 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 91970 | -| policy_gradient_loss | 0.000278 | -| std | 0.0579 | -| value_loss | 5.36e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9199 | -| time_elapsed | 54592 | -| total_timesteps | 1177472 | -| train/ | | -| approx_kl | 0.020552076 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -21.4 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 91980 | -| policy_gradient_loss | -0.0166 | -| std | 0.0579 | -| value_loss | 0.000208 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9200 | -| time_elapsed | 54596 | -| total_timesteps | 1177600 | -| train/ | | -| approx_kl | 0.039521173 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 91990 | -| policy_gradient_loss | 0.00732 | -| std | 0.0579 | -| value_loss | 0.0027 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9201 | -| time_elapsed | 54600 | -| total_timesteps | 1177728 | -| train/ | | -| approx_kl | 0.0031475592 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 92000 | -| policy_gradient_loss | -0.00524 | -| std | 0.0579 | -| value_loss | 0.000396 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9202 | -| time_elapsed | 54604 | -| total_timesteps | 1177856 | -| train/ | | -| approx_kl | 0.004227898 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.41 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 92010 | -| policy_gradient_loss | -0.0111 | -| std | 0.0579 | -| value_loss | 7.3e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 21 | -| iterations | 9203 | -| time_elapsed | 54606 | -| total_timesteps | 1177984 | -| train/ | | -| approx_kl | 0.0003069858 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | -0.000461 | -| n_updates | 92020 | -| policy_gradient_loss | 0.00252 | -| std | 0.0579 | -| value_loss | 7.87e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9204 | -| time_elapsed | 54610 | -| total_timesteps | 1178112 | -| train/ | | -| approx_kl | 0.0006219712 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 92030 | -| policy_gradient_loss | -0.0063 | -| std | 0.0579 | -| value_loss | 0.00028 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9205 | -| time_elapsed | 54618 | -| total_timesteps | 1178240 | -| train/ | | -| approx_kl | 0.056025825 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | 0.433 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 92040 | -| policy_gradient_loss | -0.016 | -| std | 0.0578 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9206 | -| time_elapsed | 54622 | -| total_timesteps | 1178368 | -| train/ | | -| approx_kl | 0.010073077 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.535 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 92050 | -| policy_gradient_loss | -0.002 | -| std | 0.0578 | -| value_loss | 3.07e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9207 | -| time_elapsed | 54626 | -| total_timesteps | 1178496 | -| train/ | | -| approx_kl | 0.0022880472 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 92060 | -| policy_gradient_loss | -0.00331 | -| std | 0.0578 | -| value_loss | 4.21e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9208 | -| time_elapsed | 54630 | -| total_timesteps | 1178624 | -| train/ | | -| approx_kl | 0.0010971464 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 92070 | -| policy_gradient_loss | 0.00399 | -| std | 0.0578 | -| value_loss | 4.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9209 | -| time_elapsed | 54634 | -| total_timesteps | 1178752 | -| train/ | | -| approx_kl | 0.0023531471 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.000458 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 92080 | -| policy_gradient_loss | -0.00351 | -| std | 0.0578 | -| value_loss | 5.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 21 | -| iterations | 9210 | -| time_elapsed | 54638 | -| total_timesteps | 1178880 | -| train/ | | -| approx_kl | 0.017252252 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | 0.00272 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 92090 | -| policy_gradient_loss | -0.012 | -| std | 0.0578 | -| value_loss | 8.9e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9211 | -| time_elapsed | 54641 | -| total_timesteps | 1179008 | -| train/ | | -| approx_kl | 0.0021390673 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.00662 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 92100 | -| policy_gradient_loss | 0.000396 | -| std | 0.0578 | -| value_loss | 8.2e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9212 | -| time_elapsed | 54650 | -| total_timesteps | 1179136 | -| train/ | | -| approx_kl | 0.073729426 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 92110 | -| policy_gradient_loss | -0.0149 | -| std | 0.0578 | -| value_loss | 0.00167 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9213 | -| time_elapsed | 54653 | -| total_timesteps | 1179264 | -| train/ | | -| approx_kl | 0.0012369626 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.777 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 92120 | -| policy_gradient_loss | -0.00148 | -| std | 0.0577 | -| value_loss | 5.09e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9214 | -| time_elapsed | 54657 | -| total_timesteps | 1179392 | -| train/ | | -| approx_kl | 0.0016530128 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -5 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 92130 | -| policy_gradient_loss | -0.00276 | -| std | 0.0577 | -| value_loss | 1.42e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9215 | -| time_elapsed | 54659 | -| total_timesteps | 1179520 | -| train/ | | -| approx_kl | 0.0020227619 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 1.43 | -| explained_variance | -0.583 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 92140 | -| policy_gradient_loss | 0.0034 | -| std | 0.0576 | -| value_loss | 8.85e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9216 | -| time_elapsed | 54663 | -| total_timesteps | 1179648 | -| train/ | | -| approx_kl | 0.0069626844 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 92150 | -| policy_gradient_loss | -0.00354 | -| std | 0.0575 | -| value_loss | 8.66e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9217 | -| time_elapsed | 54667 | -| total_timesteps | 1179776 | -| train/ | | -| approx_kl | 0.0028242068 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 92160 | -| policy_gradient_loss | -0.00333 | -| std | 0.0574 | -| value_loss | 0.000162 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9218 | -| time_elapsed | 54670 | -| total_timesteps | 1179904 | -| train/ | | -| approx_kl | 0.00019962247 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | -0.000742 | -| n_updates | 92170 | -| policy_gradient_loss | 0.00288 | -| std | 0.0573 | -| value_loss | 3.31e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9219 | -| time_elapsed | 54675 | -| total_timesteps | 1180032 | -| train/ | | -| approx_kl | 0.00936481 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 92180 | -| policy_gradient_loss | -0.00951 | -| std | 0.0573 | -| value_loss | 1.75e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9220 | -| time_elapsed | 54683 | -| total_timesteps | 1180160 | -| train/ | | -| approx_kl | 0.07803475 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 92190 | -| policy_gradient_loss | -0.0183 | -| std | 0.0573 | -| value_loss | 0.000127 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9221 | -| time_elapsed | 54687 | -| total_timesteps | 1180288 | -| train/ | | -| approx_kl | 0.08632079 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -6.73 | -| learning_rate | 0.0003 | -| loss | -0.00696 | -| n_updates | 92200 | -| policy_gradient_loss | -0.00697 | -| std | 0.0572 | -| value_loss | 2.84e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9222 | -| time_elapsed | 54691 | -| total_timesteps | 1180416 | -| train/ | | -| approx_kl | 0.00088339485 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 92210 | -| policy_gradient_loss | -0.00139 | -| std | 0.0572 | -| value_loss | 1.3e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9223 | -| time_elapsed | 54695 | -| total_timesteps | 1180544 | -| train/ | | -| approx_kl | 0.002949013 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 92220 | -| policy_gradient_loss | 0.000233 | -| std | 0.0572 | -| value_loss | 1.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9224 | -| time_elapsed | 54699 | -| total_timesteps | 1180672 | -| train/ | | -| approx_kl | 0.003877107 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 92230 | -| policy_gradient_loss | -0.00334 | -| std | 0.0571 | -| value_loss | 3.8e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9225 | -| time_elapsed | 54704 | -| total_timesteps | 1180800 | -| train/ | | -| approx_kl | 0.00033652643 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 92240 | -| policy_gradient_loss | -0.00192 | -| std | 0.0571 | -| value_loss | 6.88e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9226 | -| time_elapsed | 54707 | -| total_timesteps | 1180928 | -| train/ | | -| approx_kl | 0.0032604132 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 92250 | -| policy_gradient_loss | -0.0118 | -| std | 0.0572 | -| value_loss | 1.74e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9227 | -| time_elapsed | 54711 | -| total_timesteps | 1181056 | -| train/ | | -| approx_kl | 0.0051050773 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 92260 | -| policy_gradient_loss | 0.000125 | -| std | 0.0573 | -| value_loss | 9.02e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9228 | -| time_elapsed | 54717 | -| total_timesteps | 1181184 | -| train/ | | -| approx_kl | 0.022256829 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | 0.655 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 92270 | -| policy_gradient_loss | -0.0167 | -| std | 0.0574 | -| value_loss | 0.000508 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9229 | -| time_elapsed | 54720 | -| total_timesteps | 1181312 | -| train/ | | -| approx_kl | 0.007815496 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -72 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 92280 | -| policy_gradient_loss | -0.00342 | -| std | 0.0574 | -| value_loss | 4.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9230 | -| time_elapsed | 54724 | -| total_timesteps | 1181440 | -| train/ | | -| approx_kl | 0.048087794 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -139 | -| learning_rate | 0.0003 | -| loss | -0.00544 | -| n_updates | 92290 | -| policy_gradient_loss | -0.0022 | -| std | 0.0574 | -| value_loss | 2.2e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9231 | -| time_elapsed | 54728 | -| total_timesteps | 1181568 | -| train/ | | -| approx_kl | 0.0084780045 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -75.6 | -| learning_rate | 0.0003 | -| loss | -0.000658 | -| n_updates | 92300 | -| policy_gradient_loss | 0.000291 | -| std | 0.0573 | -| value_loss | 4.19e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9232 | -| time_elapsed | 54731 | -| total_timesteps | 1181696 | -| train/ | | -| approx_kl | 0.012991712 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -2.95 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 92310 | -| policy_gradient_loss | 0.00328 | -| std | 0.0571 | -| value_loss | 1.8e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9233 | -| time_elapsed | 54734 | -| total_timesteps | 1181824 | -| train/ | | -| approx_kl | 0.00015236763 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00024 | -| n_updates | 92320 | -| policy_gradient_loss | 0.000299 | -| std | 0.0569 | -| value_loss | 1.59e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9234 | -| time_elapsed | 54737 | -| total_timesteps | 1181952 | -| train/ | | -| approx_kl | 0.0026159422 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | -0.00669 | -| n_updates | 92330 | -| policy_gradient_loss | -0.00596 | -| std | 0.0568 | -| value_loss | 9.16e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9235 | -| time_elapsed | 54740 | -| total_timesteps | 1182080 | -| train/ | | -| approx_kl | 0.0033740327 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.0029 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 92340 | -| policy_gradient_loss | -0.00272 | -| std | 0.0567 | -| value_loss | 3.95e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9236 | -| time_elapsed | 54747 | -| total_timesteps | 1182208 | -| train/ | | -| approx_kl | 0.007954769 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.742 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 92350 | -| policy_gradient_loss | -0.016 | -| std | 0.0567 | -| value_loss | 0.00347 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9237 | -| time_elapsed | 54750 | -| total_timesteps | 1182336 | -| train/ | | -| approx_kl | 0.0044663777 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -65.3 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 92360 | -| policy_gradient_loss | -0.013 | -| std | 0.0568 | -| value_loss | 1.95e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9238 | -| time_elapsed | 54753 | -| total_timesteps | 1182464 | -| train/ | | -| approx_kl | 0.18309279 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -22.2 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 92370 | -| policy_gradient_loss | -0.00292 | -| std | 0.0568 | -| value_loss | 1.1e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9239 | -| time_elapsed | 54756 | -| total_timesteps | 1182592 | -| train/ | | -| approx_kl | 0.03730391 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -24.8 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 92380 | -| policy_gradient_loss | -0.00712 | -| std | 0.0568 | -| value_loss | 8.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9240 | -| time_elapsed | 54759 | -| total_timesteps | 1182720 | -| train/ | | -| approx_kl | 0.017161507 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -4.57 | -| learning_rate | 0.0003 | -| loss | -0.0008 | -| n_updates | 92390 | -| policy_gradient_loss | 0.000462 | -| std | 0.0568 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9241 | -| time_elapsed | 54764 | -| total_timesteps | 1182848 | -| train/ | | -| approx_kl | 0.0022612778 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.596 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 92400 | -| policy_gradient_loss | 0.00044 | -| std | 0.0567 | -| value_loss | 6.36e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9242 | -| time_elapsed | 54767 | -| total_timesteps | 1182976 | -| train/ | | -| approx_kl | 0.08073237 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.00579 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 92410 | -| policy_gradient_loss | 6.18e-05 | -| std | 0.0566 | -| value_loss | 1.27e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9243 | -| time_elapsed | 54770 | -| total_timesteps | 1183104 | -| train/ | | -| approx_kl | 0.00018401956 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.000825 | -| n_updates | 92420 | -| policy_gradient_loss | 0.000236 | -| std | 0.0566 | -| value_loss | 8.85e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9244 | -| time_elapsed | 54778 | -| total_timesteps | 1183232 | -| train/ | | -| approx_kl | 0.02471838 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 92430 | -| policy_gradient_loss | -0.0161 | -| std | 0.0565 | -| value_loss | 0.00371 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9245 | -| time_elapsed | 54780 | -| total_timesteps | 1183360 | -| train/ | | -| approx_kl | 0.0019821269 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -26.3 | -| learning_rate | 0.0003 | -| loss | -0.00954 | -| n_updates | 92440 | -| policy_gradient_loss | -0.0136 | -| std | 0.0565 | -| value_loss | 6.99e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9246 | -| time_elapsed | 54783 | -| total_timesteps | 1183488 | -| train/ | | -| approx_kl | 0.1901154 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -817 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 92450 | -| policy_gradient_loss | -0.00613 | -| std | 0.0565 | -| value_loss | 2.52e-06 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9247 | -| time_elapsed | 54785 | -| total_timesteps | 1183616 | -| train/ | | -| approx_kl | 9.0454705e-06 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -300 | -| learning_rate | 0.0003 | -| loss | 0.000371 | -| n_updates | 92460 | -| policy_gradient_loss | -0.00513 | -| std | 0.0565 | -| value_loss | 2.59e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9248 | -| time_elapsed | 54788 | -| total_timesteps | 1183744 | -| train/ | | -| approx_kl | 0.0034668501 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -76.8 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 92470 | -| policy_gradient_loss | -0.00112 | -| std | 0.0566 | -| value_loss | 3.13e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9249 | -| time_elapsed | 54792 | -| total_timesteps | 1183872 | -| train/ | | -| approx_kl | 0.1067182 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -13.5 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 92480 | -| policy_gradient_loss | -0.00455 | -| std | 0.0567 | -| value_loss | 1.51e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9250 | -| time_elapsed | 54795 | -| total_timesteps | 1184000 | -| train/ | | -| approx_kl | 0.00049918005 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.898 | -| learning_rate | 0.0003 | -| loss | 0.000148 | -| n_updates | 92490 | -| policy_gradient_loss | 0.000538 | -| std | 0.0568 | -| value_loss | 1.6e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9251 | -| time_elapsed | 54798 | -| total_timesteps | 1184128 | -| train/ | | -| approx_kl | 0.00086013833 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.00425 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 92500 | -| policy_gradient_loss | 0.000379 | -| std | 0.0569 | -| value_loss | 4.24e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9252 | -| time_elapsed | 54805 | -| total_timesteps | 1184256 | -| train/ | | -| approx_kl | 0.035423566 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 92510 | -| policy_gradient_loss | -0.0166 | -| std | 0.057 | -| value_loss | 0.00209 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9253 | -| time_elapsed | 54809 | -| total_timesteps | 1184384 | -| train/ | | -| approx_kl | 0.001694432 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -391 | -| learning_rate | 0.0003 | -| loss | -0.000499 | -| n_updates | 92520 | -| policy_gradient_loss | -1.68e-05 | -| std | 0.0568 | -| value_loss | 4.92e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9254 | -| time_elapsed | 54813 | -| total_timesteps | 1184512 | -| train/ | | -| approx_kl | 0.0006265668 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -5.01e+03 | -| learning_rate | 0.0003 | -| loss | -0.000733 | -| n_updates | 92530 | -| policy_gradient_loss | -7.81e-05 | -| std | 0.0566 | -| value_loss | 1.77e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9255 | -| time_elapsed | 54817 | -| total_timesteps | 1184640 | -| train/ | | -| approx_kl | 0.0005247956 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.00791 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 92540 | -| policy_gradient_loss | -0.000359 | -| std | 0.0564 | -| value_loss | 2.19e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9256 | -| time_elapsed | 54821 | -| total_timesteps | 1184768 | -| train/ | | -| approx_kl | 0.029351907 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.00595 | -| n_updates | 92550 | -| policy_gradient_loss | -0.00309 | -| std | 0.0564 | -| value_loss | 1.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 21 | -| iterations | 9257 | -| time_elapsed | 54824 | -| total_timesteps | 1184896 | -| train/ | | -| approx_kl | 0.00216498 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.244 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 92560 | -| policy_gradient_loss | -0.00506 | -| std | 0.0564 | -| value_loss | 2.12e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9258 | -| time_elapsed | 54828 | -| total_timesteps | 1185024 | -| train/ | | -| approx_kl | 9.3670096e-05 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | 4.42e-05 | -| n_updates | 92570 | -| policy_gradient_loss | -0.000342 | -| std | 0.0564 | -| value_loss | 1.1e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9259 | -| time_elapsed | 54835 | -| total_timesteps | 1185152 | -| train/ | | -| approx_kl | 0.007897573 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 92580 | -| policy_gradient_loss | -0.00176 | -| std | 0.0564 | -| value_loss | 0.000364 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9260 | -| time_elapsed | 54839 | -| total_timesteps | 1185280 | -| train/ | | -| approx_kl | 0.008438308 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -21.8 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 92590 | -| policy_gradient_loss | -0.00389 | -| std | 0.0564 | -| value_loss | 2.19e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9261 | -| time_elapsed | 54843 | -| total_timesteps | 1185408 | -| train/ | | -| approx_kl | 0.03475669 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -18.6 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 92600 | -| policy_gradient_loss | -0.00733 | -| std | 0.0564 | -| value_loss | 6.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9262 | -| time_elapsed | 54846 | -| total_timesteps | 1185536 | -| train/ | | -| approx_kl | 0.012884274 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | 0.000853 | -| n_updates | 92610 | -| policy_gradient_loss | 0.00233 | -| std | 0.0565 | -| value_loss | 2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9263 | -| time_elapsed | 54850 | -| total_timesteps | 1185664 | -| train/ | | -| approx_kl | 0.021864785 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 92620 | -| policy_gradient_loss | 0.000599 | -| std | 0.0567 | -| value_loss | 9.28e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9264 | -| time_elapsed | 54853 | -| total_timesteps | 1185792 | -| train/ | | -| approx_kl | 0.0004206081 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 92630 | -| policy_gradient_loss | -0.0102 | -| std | 0.0569 | -| value_loss | 1.21e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 21 | -| iterations | 9265 | -| time_elapsed | 54855 | -| total_timesteps | 1185920 | -| train/ | | -| approx_kl | 0.0119169075 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.000879 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 92640 | -| policy_gradient_loss | -0.00344 | -| std | 0.0571 | -| value_loss | 2.33e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9266 | -| time_elapsed | 54858 | -| total_timesteps | 1186048 | -| train/ | | -| approx_kl | 0.0024034753 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 92650 | -| policy_gradient_loss | -0.00127 | -| std | 0.0571 | -| value_loss | 5.56e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9267 | -| time_elapsed | 54864 | -| total_timesteps | 1186176 | -| train/ | | -| approx_kl | 0.057774253 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 92660 | -| policy_gradient_loss | -0.0158 | -| std | 0.0571 | -| value_loss | 0.000412 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9268 | -| time_elapsed | 54868 | -| total_timesteps | 1186304 | -| train/ | | -| approx_kl | 0.10992699 | -| clip_fraction | 0.564 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -2.59e+03 | -| learning_rate | 0.0003 | -| loss | -0.00635 | -| n_updates | 92670 | -| policy_gradient_loss | -0.00349 | -| std | 0.0571 | -| value_loss | 2.62e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9269 | -| time_elapsed | 54871 | -| total_timesteps | 1186432 | -| train/ | | -| approx_kl | 0.03051728 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 1.44 | -| explained_variance | -4.33e+03 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 92680 | -| policy_gradient_loss | -0.00233 | -| std | 0.0571 | -| value_loss | 1.36e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9270 | -| time_elapsed | 54874 | -| total_timesteps | 1186560 | -| train/ | | -| approx_kl | 0.00027657673 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -642 | -| learning_rate | 0.0003 | -| loss | 0.000491 | -| n_updates | 92690 | -| policy_gradient_loss | 0.000215 | -| std | 0.057 | -| value_loss | 1.49e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9271 | -| time_elapsed | 54877 | -| total_timesteps | 1186688 | -| train/ | | -| approx_kl | 0.034586363 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -44 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 92700 | -| policy_gradient_loss | -0.0111 | -| std | 0.057 | -| value_loss | 1.63e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9272 | -| time_elapsed | 54880 | -| total_timesteps | 1186816 | -| train/ | | -| approx_kl | 0.00016445806 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -4.4 | -| learning_rate | 0.0003 | -| loss | 0.000551 | -| n_updates | 92710 | -| policy_gradient_loss | 0.00223 | -| std | 0.0569 | -| value_loss | 2.22e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 21 | -| iterations | 9273 | -| time_elapsed | 54883 | -| total_timesteps | 1186944 | -| train/ | | -| approx_kl | 0.010799002 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.494 | -| learning_rate | 0.0003 | -| loss | -0.00809 | -| n_updates | 92720 | -| policy_gradient_loss | -0.00637 | -| std | 0.0569 | -| value_loss | 2.18e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9274 | -| time_elapsed | 54886 | -| total_timesteps | 1187072 | -| train/ | | -| approx_kl | 0.0039030304 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 92730 | -| policy_gradient_loss | -0.00463 | -| std | 0.0569 | -| value_loss | 2.97e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9275 | -| time_elapsed | 54892 | -| total_timesteps | 1187200 | -| train/ | | -| approx_kl | 0.008128502 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | 7.67e-05 | -| n_updates | 92740 | -| policy_gradient_loss | -0.00088 | -| std | 0.0567 | -| value_loss | 0.00337 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9276 | -| time_elapsed | 54896 | -| total_timesteps | 1187328 | -| train/ | | -| approx_kl | 0.00392109 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -7.34 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 92750 | -| policy_gradient_loss | -0.00117 | -| std | 0.0566 | -| value_loss | 1.39e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9277 | -| time_elapsed | 54899 | -| total_timesteps | 1187456 | -| train/ | | -| approx_kl | 0.0043093176 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 92760 | -| policy_gradient_loss | -0.0134 | -| std | 0.0566 | -| value_loss | 1.54e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9278 | -| time_elapsed | 54902 | -| total_timesteps | 1187584 | -| train/ | | -| approx_kl | 0.032842238 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 92770 | -| policy_gradient_loss | -0.0129 | -| std | 0.0567 | -| value_loss | 1.12e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9279 | -| time_elapsed | 54906 | -| total_timesteps | 1187712 | -| train/ | | -| approx_kl | 0.0086180605 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 92780 | -| policy_gradient_loss | -0.000578 | -| std | 0.0567 | -| value_loss | 2.8e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9280 | -| time_elapsed | 54910 | -| total_timesteps | 1187840 | -| train/ | | -| approx_kl | 0.0021823193 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | 7.41e-05 | -| n_updates | 92790 | -| policy_gradient_loss | 0.0097 | -| std | 0.0567 | -| value_loss | 1.96e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9281 | -| time_elapsed | 54914 | -| total_timesteps | 1187968 | -| train/ | | -| approx_kl | 0.0018737358 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.000301 | -| learning_rate | 0.0003 | -| loss | 0.0042 | -| n_updates | 92800 | -| policy_gradient_loss | 0.00594 | -| std | 0.0568 | -| value_loss | 2.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9282 | -| time_elapsed | 54918 | -| total_timesteps | 1188096 | -| train/ | | -| approx_kl | 0.0013739006 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0937 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 92810 | -| policy_gradient_loss | -0.00322 | -| std | 0.0568 | -| value_loss | 4.12e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9283 | -| time_elapsed | 54924 | -| total_timesteps | 1188224 | -| train/ | | -| approx_kl | 0.038885135 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 92820 | -| policy_gradient_loss | -0.0172 | -| std | 0.0568 | -| value_loss | 0.000511 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9284 | -| time_elapsed | 54927 | -| total_timesteps | 1188352 | -| train/ | | -| approx_kl | 0.0152316075 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -36.6 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 92830 | -| policy_gradient_loss | -0.00377 | -| std | 0.0567 | -| value_loss | 1.07e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9285 | -| time_elapsed | 54930 | -| total_timesteps | 1188480 | -| train/ | | -| approx_kl | 0.0017760526 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -17.7 | -| learning_rate | 0.0003 | -| loss | -0.00931 | -| n_updates | 92840 | -| policy_gradient_loss | -0.00778 | -| std | 0.0566 | -| value_loss | 2.06e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9286 | -| time_elapsed | 54933 | -| total_timesteps | 1188608 | -| train/ | | -| approx_kl | 0.016878335 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 92850 | -| policy_gradient_loss | -0.00451 | -| std | 0.0566 | -| value_loss | 8.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9287 | -| time_elapsed | 54936 | -| total_timesteps | 1188736 | -| train/ | | -| approx_kl | 0.002238141 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 92860 | -| policy_gradient_loss | -0.00394 | -| std | 0.0566 | -| value_loss | 4.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9288 | -| time_elapsed | 54939 | -| total_timesteps | 1188864 | -| train/ | | -| approx_kl | 0.008598477 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.00179 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 92870 | -| policy_gradient_loss | -0.00572 | -| std | 0.0567 | -| value_loss | 2.25e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9289 | -| time_elapsed | 54943 | -| total_timesteps | 1188992 | -| train/ | | -| approx_kl | 0.00020604022 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.00288 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 92880 | -| policy_gradient_loss | -0.00301 | -| std | 0.0567 | -| value_loss | 9.27e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9290 | -| time_elapsed | 54947 | -| total_timesteps | 1189120 | -| train/ | | -| approx_kl | 0.0018506087 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.0029 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 92890 | -| policy_gradient_loss | -0.00194 | -| std | 0.0567 | -| value_loss | 2.08e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9291 | -| time_elapsed | 54956 | -| total_timesteps | 1189248 | -| train/ | | -| approx_kl | 0.0017035035 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.0063 | -| n_updates | 92900 | -| policy_gradient_loss | -0.00783 | -| std | 0.0567 | -| value_loss | 0.000174 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9292 | -| time_elapsed | 54960 | -| total_timesteps | 1189376 | -| train/ | | -| approx_kl | 0.0024537612 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.00854 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 92910 | -| policy_gradient_loss | -0.00131 | -| std | 0.0567 | -| value_loss | 1.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9293 | -| time_elapsed | 54962 | -| total_timesteps | 1189504 | -| train/ | | -| approx_kl | 0.010038534 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 92920 | -| policy_gradient_loss | -0.00653 | -| std | 0.0568 | -| value_loss | 7.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9294 | -| time_elapsed | 54965 | -| total_timesteps | 1189632 | -| train/ | | -| approx_kl | 8.725794e-05 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | 0.000283 | -| n_updates | 92930 | -| policy_gradient_loss | 0.000376 | -| std | 0.0567 | -| value_loss | 1.4e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9295 | -| time_elapsed | 54968 | -| total_timesteps | 1189760 | -| train/ | | -| approx_kl | 0.0010276306 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.00183 | -| learning_rate | 0.0003 | -| loss | 0.00215 | -| n_updates | 92940 | -| policy_gradient_loss | -4.22e-05 | -| std | 0.0566 | -| value_loss | 7.67e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9296 | -| time_elapsed | 54971 | -| total_timesteps | 1189888 | -| train/ | | -| approx_kl | 0.010359471 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.00468 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 92950 | -| policy_gradient_loss | -0.0111 | -| std | 0.0566 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9297 | -| time_elapsed | 54975 | -| total_timesteps | 1190016 | -| train/ | | -| approx_kl | 0.0037786872 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 1.45 | -| explained_variance | -0.00855 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 92960 | -| policy_gradient_loss | -0.00451 | -| std | 0.0565 | -| value_loss | 4.61e-07 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9298 | -| time_elapsed | 54983 | -| total_timesteps | 1190144 | -| train/ | | -| approx_kl | 0.011122 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -8.93 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 92970 | -| policy_gradient_loss | -0.0148 | -| std | 0.0563 | -| value_loss | 0.00358 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9299 | -| time_elapsed | 54986 | -| total_timesteps | 1190272 | -| train/ | | -| approx_kl | 0.0036539803 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -77.5 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 92980 | -| policy_gradient_loss | -0.0119 | -| std | 0.0563 | -| value_loss | 5.75e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9300 | -| time_elapsed | 54990 | -| total_timesteps | 1190400 | -| train/ | | -| approx_kl | 0.006647987 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -48 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 92990 | -| policy_gradient_loss | -0.00517 | -| std | 0.0563 | -| value_loss | 1.41e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9301 | -| time_elapsed | 54993 | -| total_timesteps | 1190528 | -| train/ | | -| approx_kl | 0.0023214598 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 93000 | -| policy_gradient_loss | -0.00747 | -| std | 0.0563 | -| value_loss | 2.85e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9302 | -| time_elapsed | 54997 | -| total_timesteps | 1190656 | -| train/ | | -| approx_kl | 0.0060511413 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.000615 | -| n_updates | 93010 | -| policy_gradient_loss | 0.0024 | -| std | 0.0564 | -| value_loss | 4.44e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9303 | -| time_elapsed | 55000 | -| total_timesteps | 1190784 | -| train/ | | -| approx_kl | 0.011630476 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 93020 | -| policy_gradient_loss | 0.000452 | -| std | 0.0564 | -| value_loss | 1.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 21 | -| iterations | 9304 | -| time_elapsed | 55003 | -| total_timesteps | 1190912 | -| train/ | | -| approx_kl | 0.005131999 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.000626 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 93030 | -| policy_gradient_loss | 4.99e-05 | -| std | 0.0564 | -| value_loss | 1.82e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9305 | -| time_elapsed | 55006 | -| total_timesteps | 1191040 | -| train/ | | -| approx_kl | 2.690684e-05 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.0847 | -| learning_rate | 0.0003 | -| loss | -0.000916 | -| n_updates | 93040 | -| policy_gradient_loss | -0.00455 | -| std | 0.0564 | -| value_loss | 4.65e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9306 | -| time_elapsed | 55014 | -| total_timesteps | 1191168 | -| train/ | | -| approx_kl | 0.011107368 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | 0.694 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 93050 | -| policy_gradient_loss | -0.0114 | -| std | 0.0564 | -| value_loss | 0.00041 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9307 | -| time_elapsed | 55017 | -| total_timesteps | 1191296 | -| train/ | | -| approx_kl | 0.0010365387 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -6.59 | -| learning_rate | 0.0003 | -| loss | 0.00075 | -| n_updates | 93060 | -| policy_gradient_loss | 0.000353 | -| std | 0.0563 | -| value_loss | 6.16e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9308 | -| time_elapsed | 55021 | -| total_timesteps | 1191424 | -| train/ | | -| approx_kl | 0.00843501 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -3.1 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 93070 | -| policy_gradient_loss | -0.0104 | -| std | 0.0563 | -| value_loss | 8.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9309 | -| time_elapsed | 55025 | -| total_timesteps | 1191552 | -| train/ | | -| approx_kl | 0.0013001156 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.907 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 93080 | -| policy_gradient_loss | 0.00222 | -| std | 0.0563 | -| value_loss | 4.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9310 | -| time_elapsed | 55029 | -| total_timesteps | 1191680 | -| train/ | | -| approx_kl | 0.010882547 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 93090 | -| policy_gradient_loss | -0.00845 | -| std | 0.0564 | -| value_loss | 5.25e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9311 | -| time_elapsed | 55033 | -| total_timesteps | 1191808 | -| train/ | | -| approx_kl | 0.0032770368 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -502 | -| learning_rate | 0.0003 | -| loss | -0.000293 | -| n_updates | 93100 | -| policy_gradient_loss | -6.81e-05 | -| std | 0.0562 | -| value_loss | 8.56e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9312 | -| time_elapsed | 55035 | -| total_timesteps | 1191936 | -| train/ | | -| approx_kl | 3.7868507e-05 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00016 | -| n_updates | 93110 | -| policy_gradient_loss | 0.00231 | -| std | 0.0561 | -| value_loss | 2.71e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9313 | -| time_elapsed | 55037 | -| total_timesteps | 1192064 | -| train/ | | -| approx_kl | 0.0033101635 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.00772 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 93120 | -| policy_gradient_loss | -0.00298 | -| std | 0.0561 | -| value_loss | 1.59e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9314 | -| time_elapsed | 55043 | -| total_timesteps | 1192192 | -| train/ | | -| approx_kl | 0.024006521 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | 0.699 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 93130 | -| policy_gradient_loss | -0.0157 | -| std | 0.0562 | -| value_loss | 0.00437 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9315 | -| time_elapsed | 55046 | -| total_timesteps | 1192320 | -| train/ | | -| approx_kl | 0.00031501148 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 93140 | -| policy_gradient_loss | 6.46e-05 | -| std | 0.056 | -| value_loss | 5.23e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9316 | -| time_elapsed | 55049 | -| total_timesteps | 1192448 | -| train/ | | -| approx_kl | 0.011606832 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 1.46 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 93150 | -| policy_gradient_loss | -0.00744 | -| std | 0.0559 | -| value_loss | 1.3e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9317 | -| time_elapsed | 55053 | -| total_timesteps | 1192576 | -| train/ | | -| approx_kl | 0.0015665204 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 93160 | -| policy_gradient_loss | -0.000242 | -| std | 0.0558 | -| value_loss | 3.82e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9318 | -| time_elapsed | 55056 | -| total_timesteps | 1192704 | -| train/ | | -| approx_kl | 0.0054527894 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 93170 | -| policy_gradient_loss | -0.00388 | -| std | 0.0558 | -| value_loss | 2.7e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9319 | -| time_elapsed | 55059 | -| total_timesteps | 1192832 | -| train/ | | -| approx_kl | 0.00061195577 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.000722 | -| n_updates | 93180 | -| policy_gradient_loss | 0.0021 | -| std | 0.0558 | -| value_loss | 1.54e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9320 | -| time_elapsed | 55064 | -| total_timesteps | 1192960 | -| train/ | | -| approx_kl | 0.0008683349 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 93190 | -| policy_gradient_loss | 0.00118 | -| std | 0.0558 | -| value_loss | 1.52e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9321 | -| time_elapsed | 55067 | -| total_timesteps | 1193088 | -| train/ | | -| approx_kl | 0.0045625158 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 93200 | -| policy_gradient_loss | -0.00223 | -| std | 0.0559 | -| value_loss | 2.33e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9322 | -| time_elapsed | 55074 | -| total_timesteps | 1193216 | -| train/ | | -| approx_kl | 0.005151932 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 93210 | -| policy_gradient_loss | -0.00711 | -| std | 0.0559 | -| value_loss | 0.000149 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9323 | -| time_elapsed | 55078 | -| total_timesteps | 1193344 | -| train/ | | -| approx_kl | 0.0102487765 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.818 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 93220 | -| policy_gradient_loss | -0.00306 | -| std | 0.0559 | -| value_loss | 1.83e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9324 | -| time_elapsed | 55080 | -| total_timesteps | 1193472 | -| train/ | | -| approx_kl | 0.00044635963 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.945 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 93230 | -| policy_gradient_loss | -0.00818 | -| std | 0.0559 | -| value_loss | 1.75e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9325 | -| time_elapsed | 55084 | -| total_timesteps | 1193600 | -| train/ | | -| approx_kl | 1.992425e-05 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.452 | -| learning_rate | 0.0003 | -| loss | 0.00108 | -| n_updates | 93240 | -| policy_gradient_loss | -0.00436 | -| std | 0.0559 | -| value_loss | 3.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9326 | -| time_elapsed | 55087 | -| total_timesteps | 1193728 | -| train/ | | -| approx_kl | 0.011954901 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 93250 | -| policy_gradient_loss | -0.00365 | -| std | 0.0559 | -| value_loss | 2.45e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9327 | -| time_elapsed | 55090 | -| total_timesteps | 1193856 | -| train/ | | -| approx_kl | 0.00037436327 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | -0.000352 | -| n_updates | 93260 | -| policy_gradient_loss | 0.00152 | -| std | 0.0558 | -| value_loss | 3.39e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9328 | -| time_elapsed | 55093 | -| total_timesteps | 1193984 | -| train/ | | -| approx_kl | 0.0005613719 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.00413 | -| learning_rate | 0.0003 | -| loss | 0.000314 | -| n_updates | 93270 | -| policy_gradient_loss | 0.00449 | -| std | 0.0558 | -| value_loss | 8.61e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9329 | -| time_elapsed | 55095 | -| total_timesteps | 1194112 | -| train/ | | -| approx_kl | 0.0004940396 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.00407 | -| learning_rate | 0.0003 | -| loss | 0.00266 | -| n_updates | 93280 | -| policy_gradient_loss | -0.00123 | -| std | 0.0559 | -| value_loss | 4.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9330 | -| time_elapsed | 55104 | -| total_timesteps | 1194240 | -| train/ | | -| approx_kl | 0.0132817235 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.00943 | -| n_updates | 93290 | -| policy_gradient_loss | -0.00682 | -| std | 0.0558 | -| value_loss | 0.000791 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9331 | -| time_elapsed | 55107 | -| total_timesteps | 1194368 | -| train/ | | -| approx_kl | 0.0020281188 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.00402 | -| learning_rate | 0.0003 | -| loss | -0.00645 | -| n_updates | 93300 | -| policy_gradient_loss | 0.00287 | -| std | 0.0558 | -| value_loss | 2.27e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9332 | -| time_elapsed | 55111 | -| total_timesteps | 1194496 | -| train/ | | -| approx_kl | 0.001589891 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.778 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 93310 | -| policy_gradient_loss | -0.00102 | -| std | 0.0558 | -| value_loss | 1.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9333 | -| time_elapsed | 55114 | -| total_timesteps | 1194624 | -| train/ | | -| approx_kl | 0.013726974 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 93320 | -| policy_gradient_loss | -0.00277 | -| std | 0.0558 | -| value_loss | 8.58e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9334 | -| time_elapsed | 55117 | -| total_timesteps | 1194752 | -| train/ | | -| approx_kl | 0.00016402779 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 93330 | -| policy_gradient_loss | -0.0126 | -| std | 0.0558 | -| value_loss | 9.74e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9335 | -| time_elapsed | 55119 | -| total_timesteps | 1194880 | -| train/ | | -| approx_kl | 0.023318775 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.238 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 93340 | -| policy_gradient_loss | -0.0082 | -| std | 0.0558 | -| value_loss | 0.000188 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9336 | -| time_elapsed | 55122 | -| total_timesteps | 1195008 | -| train/ | | -| approx_kl | 0.023208957 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.00417 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 93350 | -| policy_gradient_loss | 0.00366 | -| std | 0.0559 | -| value_loss | 2.41e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9337 | -| time_elapsed | 55130 | -| total_timesteps | 1195136 | -| train/ | | -| approx_kl | 0.08158613 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 93360 | -| policy_gradient_loss | -0.0027 | -| std | 0.0558 | -| value_loss | 2.1e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9338 | -| time_elapsed | 55134 | -| total_timesteps | 1195264 | -| train/ | | -| approx_kl | 0.0127880275 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | -0.000745 | -| n_updates | 93370 | -| policy_gradient_loss | -0.0024 | -| std | 0.0557 | -| value_loss | 7.32e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9339 | -| time_elapsed | 55137 | -| total_timesteps | 1195392 | -| train/ | | -| approx_kl | 0.0032051592 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.595 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 93380 | -| policy_gradient_loss | -0.00651 | -| std | 0.0557 | -| value_loss | 8.16e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9340 | -| time_elapsed | 55141 | -| total_timesteps | 1195520 | -| train/ | | -| approx_kl | 0.0019062487 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.00318 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 93390 | -| policy_gradient_loss | 0.000415 | -| std | 0.0556 | -| value_loss | 2.39e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9341 | -| time_elapsed | 55145 | -| total_timesteps | 1195648 | -| train/ | | -| approx_kl | 2.944842e-06 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.00307 | -| learning_rate | 0.0003 | -| loss | -0.000514 | -| n_updates | 93400 | -| policy_gradient_loss | 0.00274 | -| std | 0.0556 | -| value_loss | 1.98e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9342 | -| time_elapsed | 55148 | -| total_timesteps | 1195776 | -| train/ | | -| approx_kl | 0.00020077033 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.00253 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 93410 | -| policy_gradient_loss | 0.000177 | -| std | 0.0555 | -| value_loss | 6.88e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9343 | -| time_elapsed | 55152 | -| total_timesteps | 1195904 | -| train/ | | -| approx_kl | 0.0084283035 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 93420 | -| policy_gradient_loss | -0.00219 | -| std | 0.0555 | -| value_loss | 4.23e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9344 | -| time_elapsed | 55155 | -| total_timesteps | 1196032 | -| train/ | | -| approx_kl | 0.00022132276 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 93430 | -| policy_gradient_loss | 0.00359 | -| std | 0.0555 | -| value_loss | 1.53e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9345 | -| time_elapsed | 55164 | -| total_timesteps | 1196160 | -| train/ | | -| approx_kl | 0.014595492 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | 0.791 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 93440 | -| policy_gradient_loss | -0.0172 | -| std | 0.0554 | -| value_loss | 0.000376 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9346 | -| time_elapsed | 55168 | -| total_timesteps | 1196288 | -| train/ | | -| approx_kl | 0.004284748 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 1.47 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.00923 | -| n_updates | 93450 | -| policy_gradient_loss | -0.00756 | -| std | 0.0554 | -| value_loss | 9.71e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9347 | -| time_elapsed | 55171 | -| total_timesteps | 1196416 | -| train/ | | -| approx_kl | 0.0021361322 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -39.8 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 93460 | -| policy_gradient_loss | -0.00189 | -| std | 0.0553 | -| value_loss | 2.28e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9348 | -| time_elapsed | 55174 | -| total_timesteps | 1196544 | -| train/ | | -| approx_kl | 0.075565174 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -6.57e+03 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 93470 | -| policy_gradient_loss | -0.00268 | -| std | 0.0552 | -| value_loss | 8.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9349 | -| time_elapsed | 55177 | -| total_timesteps | 1196672 | -| train/ | | -| approx_kl | 0.008705644 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -1.8 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 93480 | -| policy_gradient_loss | 0.000588 | -| std | 0.0552 | -| value_loss | 3.35e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9350 | -| time_elapsed | 55179 | -| total_timesteps | 1196800 | -| train/ | | -| approx_kl | 0.00033743912 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -0.889 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 93490 | -| policy_gradient_loss | -0.00232 | -| std | 0.0551 | -| value_loss | 9.48e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 21 | -| iterations | 9351 | -| time_elapsed | 55183 | -| total_timesteps | 1196928 | -| train/ | | -| approx_kl | 0.00040880917 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | -0.000536 | -| n_updates | 93500 | -| policy_gradient_loss | -0.000127 | -| std | 0.055 | -| value_loss | 5.41e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9352 | -| time_elapsed | 55187 | -| total_timesteps | 1197056 | -| train/ | | -| approx_kl | 0.017283699 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 93510 | -| policy_gradient_loss | -0.00534 | -| std | 0.055 | -| value_loss | 1.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9353 | -| time_elapsed | 55194 | -| total_timesteps | 1197184 | -| train/ | | -| approx_kl | 0.031337187 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 93520 | -| policy_gradient_loss | -0.00677 | -| std | 0.055 | -| value_loss | 9.01e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9354 | -| time_elapsed | 55197 | -| total_timesteps | 1197312 | -| train/ | | -| approx_kl | 0.0037192763 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -322 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 93530 | -| policy_gradient_loss | -0.00124 | -| std | 0.0549 | -| value_loss | 2.19e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9355 | -| time_elapsed | 55200 | -| total_timesteps | 1197440 | -| train/ | | -| approx_kl | 0.0079130735 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -319 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 93540 | -| policy_gradient_loss | -0.00285 | -| std | 0.0548 | -| value_loss | 1.57e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9356 | -| time_elapsed | 55203 | -| total_timesteps | 1197568 | -| train/ | | -| approx_kl | 0.012068718 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -4.32 | -| learning_rate | 0.0003 | -| loss | -0.000503 | -| n_updates | 93550 | -| policy_gradient_loss | -0.00148 | -| std | 0.0547 | -| value_loss | 1.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9357 | -| time_elapsed | 55206 | -| total_timesteps | 1197696 | -| train/ | | -| approx_kl | 0.021466509 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -8.37 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 93560 | -| policy_gradient_loss | -0.00301 | -| std | 0.0547 | -| value_loss | 3.6e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9358 | -| time_elapsed | 55209 | -| total_timesteps | 1197824 | -| train/ | | -| approx_kl | 5.060807e-06 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | 0.000218 | -| n_updates | 93570 | -| policy_gradient_loss | -0.00189 | -| std | 0.0546 | -| value_loss | 5.85e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9359 | -| time_elapsed | 55212 | -| total_timesteps | 1197952 | -| train/ | | -| approx_kl | 0.012751605 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 93580 | -| policy_gradient_loss | -0.00234 | -| std | 0.0546 | -| value_loss | 1.38e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9360 | -| time_elapsed | 55215 | -| total_timesteps | 1198080 | -| train/ | | -| approx_kl | 0.03156905 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | 0.00438 | -| n_updates | 93590 | -| policy_gradient_loss | 0.00286 | -| std | 0.0546 | -| value_loss | 7.43e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9361 | -| time_elapsed | 55223 | -| total_timesteps | 1198208 | -| train/ | | -| approx_kl | 0.0043412223 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | 0.638 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 93600 | -| policy_gradient_loss | -0.0101 | -| std | 0.0547 | -| value_loss | 0.00451 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9362 | -| time_elapsed | 55227 | -| total_timesteps | 1198336 | -| train/ | | -| approx_kl | 0.00049544685 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0811 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 93610 | -| policy_gradient_loss | 0.00117 | -| std | 0.0547 | -| value_loss | 0.000137 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9363 | -| time_elapsed | 55230 | -| total_timesteps | 1198464 | -| train/ | | -| approx_kl | 0.0095905885 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.00785 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 93620 | -| policy_gradient_loss | -0.00402 | -| std | 0.0547 | -| value_loss | 3.88e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9364 | -| time_elapsed | 55234 | -| total_timesteps | 1198592 | -| train/ | | -| approx_kl | 0.011430986 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 93630 | -| policy_gradient_loss | -0.00364 | -| std | 0.0547 | -| value_loss | 1.28e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9365 | -| time_elapsed | 55238 | -| total_timesteps | 1198720 | -| train/ | | -| approx_kl | 0.00433149 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 93640 | -| policy_gradient_loss | -0.000868 | -| std | 0.0547 | -| value_loss | 1.02e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9366 | -| time_elapsed | 55240 | -| total_timesteps | 1198848 | -| train/ | | -| approx_kl | 0.010398721 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.00788 | -| n_updates | 93650 | -| policy_gradient_loss | 0.0061 | -| std | 0.0548 | -| value_loss | 8.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9367 | -| time_elapsed | 55243 | -| total_timesteps | 1198976 | -| train/ | | -| approx_kl | 3.64203e-05 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.000308 | -| n_updates | 93660 | -| policy_gradient_loss | 0.00382 | -| std | 0.0548 | -| value_loss | 0.00146 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9368 | -| time_elapsed | 55247 | -| total_timesteps | 1199104 | -| train/ | | -| approx_kl | 0.0036227573 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -0.00406 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 93670 | -| policy_gradient_loss | -0.000849 | -| std | 0.055 | -| value_loss | 0.000172 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9369 | -| time_elapsed | 55255 | -| total_timesteps | 1199232 | -| train/ | | -| approx_kl | 0.013483344 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | 0.733 | -| learning_rate | 0.0003 | -| loss | -0.00756 | -| n_updates | 93680 | -| policy_gradient_loss | -0.00673 | -| std | 0.055 | -| value_loss | 0.00386 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9370 | -| time_elapsed | 55259 | -| total_timesteps | 1199360 | -| train/ | | -| approx_kl | 0.001448825 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.000252 | -| n_updates | 93690 | -| policy_gradient_loss | -2.79e-06 | -| std | 0.0549 | -| value_loss | 0.00065 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9371 | -| time_elapsed | 55262 | -| total_timesteps | 1199488 | -| train/ | | -| approx_kl | 0.0020253328 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 1.48 | -| explained_variance | -0.0754 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 93700 | -| policy_gradient_loss | 0.00925 | -| std | 0.0548 | -| value_loss | 0.0058 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9372 | -| time_elapsed | 55265 | -| total_timesteps | 1199616 | -| train/ | | -| approx_kl | 0.003917468 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 93710 | -| policy_gradient_loss | -0.00302 | -| std | 0.0547 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9373 | -| time_elapsed | 55267 | -| total_timesteps | 1199744 | -| train/ | | -| approx_kl | 0.037049238 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -33.8 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 93720 | -| policy_gradient_loss | -0.00356 | -| std | 0.0547 | -| value_loss | 6.95e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 21 | -| iterations | 9374 | -| time_elapsed | 55271 | -| total_timesteps | 1199872 | -| train/ | | -| approx_kl | 0.0009721769 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 93730 | -| policy_gradient_loss | 0.00809 | -| std | 0.0547 | -| value_loss | 8.22e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9375 | -| time_elapsed | 55274 | -| total_timesteps | 1200000 | -| train/ | | -| approx_kl | 0.00027275085 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 93740 | -| policy_gradient_loss | -7.16e-05 | -| std | 0.0546 | -| value_loss | 7.28e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9376 | -| time_elapsed | 55277 | -| total_timesteps | 1200128 | -| train/ | | -| approx_kl | 0.027523601 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.00277 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 93750 | -| policy_gradient_loss | -0.00584 | -| std | 0.0545 | -| value_loss | 5.08e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9377 | -| time_elapsed | 55285 | -| total_timesteps | 1200256 | -| train/ | | -| approx_kl | 0.04448916 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 93760 | -| policy_gradient_loss | -0.0137 | -| std | 0.0545 | -| value_loss | 0.00112 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9378 | -| time_elapsed | 55288 | -| total_timesteps | 1200384 | -| train/ | | -| approx_kl | 0.013776401 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.0258 | -| n_updates | 93770 | -| policy_gradient_loss | -0.0158 | -| std | 0.0545 | -| value_loss | 8.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9379 | -| time_elapsed | 55291 | -| total_timesteps | 1200512 | -| train/ | | -| approx_kl | 0.0001945938 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.366 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 93780 | -| policy_gradient_loss | -0.00504 | -| std | 0.0544 | -| value_loss | 5.85e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9380 | -| time_elapsed | 55293 | -| total_timesteps | 1200640 | -| train/ | | -| approx_kl | 0.0071867243 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.00377 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 93790 | -| policy_gradient_loss | -0.00961 | -| std | 0.0544 | -| value_loss | 1.35e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9381 | -| time_elapsed | 55295 | -| total_timesteps | 1200768 | -| train/ | | -| approx_kl | 0.0005791071 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | 0.00231 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 93800 | -| policy_gradient_loss | 0.0029 | -| std | 0.0544 | -| value_loss | 1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 21 | -| iterations | 9382 | -| time_elapsed | 55298 | -| total_timesteps | 1200896 | -| train/ | | -| approx_kl | 0.014711559 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0072 | -| learning_rate | 0.0003 | -| loss | -0.00566 | -| n_updates | 93810 | -| policy_gradient_loss | -0.00475 | -| std | 0.0543 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9383 | -| time_elapsed | 55300 | -| total_timesteps | 1201024 | -| train/ | | -| approx_kl | 0.0024988144 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00358 | -| n_updates | 93820 | -| policy_gradient_loss | -0.000727 | -| std | 0.0543 | -| value_loss | 4.19e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9384 | -| time_elapsed | 55309 | -| total_timesteps | 1201152 | -| train/ | | -| approx_kl | 0.0026030974 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 1.49 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | -0.000759 | -| n_updates | 93830 | -| policy_gradient_loss | -0.000642 | -| std | 0.0543 | -| value_loss | 0.00107 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9385 | -| time_elapsed | 55311 | -| total_timesteps | 1201280 | -| train/ | | -| approx_kl | 0.00060740765 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | 0.164 | -| learning_rate | 0.0003 | -| loss | 0.000302 | -| n_updates | 93840 | -| policy_gradient_loss | 0.000317 | -| std | 0.0542 | -| value_loss | 9.85e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9386 | -| time_elapsed | 55314 | -| total_timesteps | 1201408 | -| train/ | | -| approx_kl | 0.00032830797 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -2.81 | -| learning_rate | 0.0003 | -| loss | -0.000677 | -| n_updates | 93850 | -| policy_gradient_loss | -0.000101 | -| std | 0.0541 | -| value_loss | 1.12e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9387 | -| time_elapsed | 55317 | -| total_timesteps | 1201536 | -| train/ | | -| approx_kl | 0.007627294 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.488 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 93860 | -| policy_gradient_loss | -0.00117 | -| std | 0.0542 | -| value_loss | 5.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9388 | -| time_elapsed | 55321 | -| total_timesteps | 1201664 | -| train/ | | -| approx_kl | 0.0029224483 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.468 | -| learning_rate | 0.0003 | -| loss | -0.0057 | -| n_updates | 93870 | -| policy_gradient_loss | -0.00162 | -| std | 0.0542 | -| value_loss | 1.13e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9389 | -| time_elapsed | 55324 | -| total_timesteps | 1201792 | -| train/ | | -| approx_kl | 0.0016266992 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 93880 | -| policy_gradient_loss | -0.000231 | -| std | 0.0542 | -| value_loss | 2.98e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9390 | -| time_elapsed | 55328 | -| total_timesteps | 1201920 | -| train/ | | -| approx_kl | 0.002864197 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.0558 | -| learning_rate | 0.0003 | -| loss | 0.00191 | -| n_updates | 93890 | -| policy_gradient_loss | 0.00596 | -| std | 0.0542 | -| value_loss | 2.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9391 | -| time_elapsed | 55332 | -| total_timesteps | 1202048 | -| train/ | | -| approx_kl | 0.001561346 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 93900 | -| policy_gradient_loss | -0.000759 | -| std | 0.0543 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9392 | -| time_elapsed | 55339 | -| total_timesteps | 1202176 | -| train/ | | -| approx_kl | 0.008124446 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 93910 | -| policy_gradient_loss | -0.014 | -| std | 0.0543 | -| value_loss | 0.000955 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9393 | -| time_elapsed | 55342 | -| total_timesteps | 1202304 | -| train/ | | -| approx_kl | 0.0007298584 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -8.88e+03 | -| learning_rate | 0.0003 | -| loss | -0.000446 | -| n_updates | 93920 | -| policy_gradient_loss | -6.29e-05 | -| std | 0.0541 | -| value_loss | 4.64e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9394 | -| time_elapsed | 55346 | -| total_timesteps | 1202432 | -| train/ | | -| approx_kl | 0.0863584 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -6.38e+03 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 93930 | -| policy_gradient_loss | -0.00896 | -| std | 0.0539 | -| value_loss | 4.34e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9395 | -| time_elapsed | 55349 | -| total_timesteps | 1202560 | -| train/ | | -| approx_kl | 0.021267615 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -3.42e+03 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 93940 | -| policy_gradient_loss | -0.00217 | -| std | 0.0538 | -| value_loss | 9.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9396 | -| time_elapsed | 55352 | -| total_timesteps | 1202688 | -| train/ | | -| approx_kl | 0.039439972 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -104 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 93950 | -| policy_gradient_loss | 0.000897 | -| std | 0.0538 | -| value_loss | 1.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9397 | -| time_elapsed | 55354 | -| total_timesteps | 1202816 | -| train/ | | -| approx_kl | 0.003762701 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -4.28 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 93960 | -| policy_gradient_loss | -0.0163 | -| std | 0.0537 | -| value_loss | 3.05e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9398 | -| time_elapsed | 55357 | -| total_timesteps | 1202944 | -| train/ | | -| approx_kl | 0.0010210471 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.33 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 93970 | -| policy_gradient_loss | -0.00717 | -| std | 0.0537 | -| value_loss | 7.22e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9399 | -| time_elapsed | 55360 | -| total_timesteps | 1203072 | -| train/ | | -| approx_kl | 0.0033829869 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 93980 | -| policy_gradient_loss | -0.000537 | -| std | 0.0537 | -| value_loss | 5.48e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9400 | -| time_elapsed | 55367 | -| total_timesteps | 1203200 | -| train/ | | -| approx_kl | 0.03890703 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 93990 | -| policy_gradient_loss | -0.0177 | -| std | 0.0537 | -| value_loss | 0.000461 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9401 | -| time_elapsed | 55371 | -| total_timesteps | 1203328 | -| train/ | | -| approx_kl | 0.0019493 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -7.43 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 94000 | -| policy_gradient_loss | -0.00117 | -| std | 0.0537 | -| value_loss | 6.08e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9402 | -| time_elapsed | 55374 | -| total_timesteps | 1203456 | -| train/ | | -| approx_kl | 0.03830304 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -14.5 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 94010 | -| policy_gradient_loss | -0.00107 | -| std | 0.0538 | -| value_loss | 2.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9403 | -| time_elapsed | 55378 | -| total_timesteps | 1203584 | -| train/ | | -| approx_kl | 0.012021801 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -13.1 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 94020 | -| policy_gradient_loss | -0.00185 | -| std | 0.0539 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9404 | -| time_elapsed | 55380 | -| total_timesteps | 1203712 | -| train/ | | -| approx_kl | 0.009533355 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -2.52 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 94030 | -| policy_gradient_loss | -0.00246 | -| std | 0.0539 | -| value_loss | 3.33e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9405 | -| time_elapsed | 55383 | -| total_timesteps | 1203840 | -| train/ | | -| approx_kl | 7.139519e-06 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.397 | -| learning_rate | 0.0003 | -| loss | 2.95e-05 | -| n_updates | 94040 | -| policy_gradient_loss | -0.00123 | -| std | 0.054 | -| value_loss | 1.82e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9406 | -| time_elapsed | 55385 | -| total_timesteps | 1203968 | -| train/ | | -| approx_kl | 6.4042397e-06 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.00513 | -| learning_rate | 0.0003 | -| loss | -0.000256 | -| n_updates | 94050 | -| policy_gradient_loss | -0.00195 | -| std | 0.054 | -| value_loss | 1.65e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9407 | -| time_elapsed | 55388 | -| total_timesteps | 1204096 | -| train/ | | -| approx_kl | 1.5920028e-05 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | -0.000967 | -| n_updates | 94060 | -| policy_gradient_loss | -0.00898 | -| std | 0.054 | -| value_loss | 2.16e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9408 | -| time_elapsed | 55394 | -| total_timesteps | 1204224 | -| train/ | | -| approx_kl | 0.02087603 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | 0.734 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 94070 | -| policy_gradient_loss | -0.0139 | -| std | 0.054 | -| value_loss | 0.00382 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9409 | -| time_elapsed | 55396 | -| total_timesteps | 1204352 | -| train/ | | -| approx_kl | 0.003759854 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -97.5 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 94080 | -| policy_gradient_loss | -0.0136 | -| std | 0.0539 | -| value_loss | 7.12e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9410 | -| time_elapsed | 55399 | -| total_timesteps | 1204480 | -| train/ | | -| approx_kl | 0.0013424791 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -766 | -| learning_rate | 0.0003 | -| loss | -0.00667 | -| n_updates | 94090 | -| policy_gradient_loss | -0.0114 | -| std | 0.0539 | -| value_loss | 4.07e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9411 | -| time_elapsed | 55403 | -| total_timesteps | 1204608 | -| train/ | | -| approx_kl | 0.020089192 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -142 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 94100 | -| policy_gradient_loss | -0.00133 | -| std | 0.054 | -| value_loss | 5.17e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9412 | -| time_elapsed | 55406 | -| total_timesteps | 1204736 | -| train/ | | -| approx_kl | 0.0051036766 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 94110 | -| policy_gradient_loss | -0.0013 | -| std | 0.054 | -| value_loss | 1.26e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9413 | -| time_elapsed | 55411 | -| total_timesteps | 1204864 | -| train/ | | -| approx_kl | 0.00021262467 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -1.83 | -| learning_rate | 0.0003 | -| loss | 0.000833 | -| n_updates | 94120 | -| policy_gradient_loss | -0.000679 | -| std | 0.0541 | -| value_loss | 3.75e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9414 | -| time_elapsed | 55414 | -| total_timesteps | 1204992 | -| train/ | | -| approx_kl | 0.0039928947 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.00569 | -| n_updates | 94130 | -| policy_gradient_loss | -0.00509 | -| std | 0.054 | -| value_loss | 1.39e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9415 | -| time_elapsed | 55417 | -| total_timesteps | 1205120 | -| train/ | | -| approx_kl | 0.0011345707 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 94140 | -| policy_gradient_loss | 0.00453 | -| std | 0.054 | -| value_loss | 2.52e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9416 | -| time_elapsed | 55427 | -| total_timesteps | 1205248 | -| train/ | | -| approx_kl | 0.007842438 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 94150 | -| policy_gradient_loss | -0.0127 | -| std | 0.054 | -| value_loss | 0.0014 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9417 | -| time_elapsed | 55431 | -| total_timesteps | 1205376 | -| train/ | | -| approx_kl | 0.0045540994 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -280 | -| learning_rate | 0.0003 | -| loss | -0.000462 | -| n_updates | 94160 | -| policy_gradient_loss | -0.000176 | -| std | 0.0538 | -| value_loss | 8.79e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9418 | -| time_elapsed | 55435 | -| total_timesteps | 1205504 | -| train/ | | -| approx_kl | 0.035782095 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -3.25e+03 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 94170 | -| policy_gradient_loss | -0.00135 | -| std | 0.0536 | -| value_loss | 8.04e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9419 | -| time_elapsed | 55438 | -| total_timesteps | 1205632 | -| train/ | | -| approx_kl | 0.00016015861 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -1.4e+03 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 94180 | -| policy_gradient_loss | -0.00704 | -| std | 0.0536 | -| value_loss | 8.52e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9420 | -| time_elapsed | 55443 | -| total_timesteps | 1205760 | -| train/ | | -| approx_kl | 0.00091102906 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -1.08e+03 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 94190 | -| policy_gradient_loss | -0.00948 | -| std | 0.0536 | -| value_loss | 1.06e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9421 | -| time_elapsed | 55446 | -| total_timesteps | 1205888 | -| train/ | | -| approx_kl | 0.0018721591 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -91.8 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 94200 | -| policy_gradient_loss | -0.0124 | -| std | 0.0536 | -| value_loss | 1.17e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9422 | -| time_elapsed | 55449 | -| total_timesteps | 1206016 | -| train/ | | -| approx_kl | 0.0020805113 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -6.72 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 94210 | -| policy_gradient_loss | -0.00284 | -| std | 0.0536 | -| value_loss | 2.2e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9423 | -| time_elapsed | 55459 | -| total_timesteps | 1206144 | -| train/ | | -| approx_kl | 0.035138004 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 94220 | -| policy_gradient_loss | -0.0153 | -| std | 0.0536 | -| value_loss | 0.00103 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9424 | -| time_elapsed | 55463 | -| total_timesteps | 1206272 | -| train/ | | -| approx_kl | 0.0031712078 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -0.927 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 94230 | -| policy_gradient_loss | -0.000598 | -| std | 0.0537 | -| value_loss | 5.97e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9425 | -| time_elapsed | 55466 | -| total_timesteps | 1206400 | -| train/ | | -| approx_kl | 0.073915504 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -297 | -| learning_rate | 0.0003 | -| loss | -0.00748 | -| n_updates | 94240 | -| policy_gradient_loss | -0.00555 | -| std | 0.0537 | -| value_loss | 3.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9426 | -| time_elapsed | 55469 | -| total_timesteps | 1206528 | -| train/ | | -| approx_kl | 0.004582747 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -8.53e+03 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 94250 | -| policy_gradient_loss | -0.00846 | -| std | 0.0537 | -| value_loss | 9.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9427 | -| time_elapsed | 55473 | -| total_timesteps | 1206656 | -| train/ | | -| approx_kl | 0.074363105 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -1.04e+03 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 94260 | -| policy_gradient_loss | -0.00413 | -| std | 0.0537 | -| value_loss | 1.69e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9428 | -| time_elapsed | 55476 | -| total_timesteps | 1206784 | -| train/ | | -| approx_kl | 8.1838574e-05 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -5.55 | -| learning_rate | 0.0003 | -| loss | -0.000386 | -| n_updates | 94270 | -| policy_gradient_loss | -0.000469 | -| std | 0.0538 | -| value_loss | 9.15e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 21 | -| iterations | 9429 | -| time_elapsed | 55480 | -| total_timesteps | 1206912 | -| train/ | | -| approx_kl | 0.00069588376 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -179 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 94280 | -| policy_gradient_loss | -0.00959 | -| std | 0.0538 | -| value_loss | 1.34e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9430 | -| time_elapsed | 55484 | -| total_timesteps | 1207040 | -| train/ | | -| approx_kl | 4.752772e-05 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -3.45 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 94290 | -| policy_gradient_loss | -0.00776 | -| std | 0.0538 | -| value_loss | 3.04e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9431 | -| time_elapsed | 55492 | -| total_timesteps | 1207168 | -| train/ | | -| approx_kl | 0.023306815 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 94300 | -| policy_gradient_loss | -0.0154 | -| std | 0.0538 | -| value_loss | 0.000696 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9432 | -| time_elapsed | 55496 | -| total_timesteps | 1207296 | -| train/ | | -| approx_kl | 0.06964184 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -25.3 | -| learning_rate | 0.0003 | -| loss | -0.000947 | -| n_updates | 94310 | -| policy_gradient_loss | -0.0012 | -| std | 0.0538 | -| value_loss | 5.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9433 | -| time_elapsed | 55499 | -| total_timesteps | 1207424 | -| train/ | | -| approx_kl | 0.10354468 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -298 | -| learning_rate | 0.0003 | -| loss | -0.000791 | -| n_updates | 94320 | -| policy_gradient_loss | -0.00232 | -| std | 0.0538 | -| value_loss | 4.94e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9434 | -| time_elapsed | 55503 | -| total_timesteps | 1207552 | -| train/ | | -| approx_kl | 0.18692018 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -74.2 | -| learning_rate | 0.0003 | -| loss | 7.29e-05 | -| n_updates | 94330 | -| policy_gradient_loss | -0.000352 | -| std | 0.0538 | -| value_loss | 5.56e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9435 | -| time_elapsed | 55506 | -| total_timesteps | 1207680 | -| train/ | | -| approx_kl | 0.08146942 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -9.85 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 94340 | -| policy_gradient_loss | -0.00304 | -| std | 0.0538 | -| value_loss | 1.46e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9436 | -| time_elapsed | 55510 | -| total_timesteps | 1207808 | -| train/ | | -| approx_kl | 0.010273529 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 94350 | -| policy_gradient_loss | -0.00868 | -| std | 0.0538 | -| value_loss | 2.68e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9437 | -| time_elapsed | 55513 | -| total_timesteps | 1207936 | -| train/ | | -| approx_kl | 0.0022787298 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.545 | -| learning_rate | 0.0003 | -| loss | 0.00345 | -| n_updates | 94360 | -| policy_gradient_loss | 0.00209 | -| std | 0.0538 | -| value_loss | 1.09e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9438 | -| time_elapsed | 55514 | -| total_timesteps | 1208064 | -| train/ | | -| approx_kl | 0.00017986726 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 1.5 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.000884 | -| n_updates | 94370 | -| policy_gradient_loss | 0.00242 | -| std | 0.0537 | -| value_loss | 6.21e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9439 | -| time_elapsed | 55520 | -| total_timesteps | 1208192 | -| train/ | | -| approx_kl | 0.035156175 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 94380 | -| policy_gradient_loss | -0.0179 | -| std | 0.0537 | -| value_loss | 0.000169 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9440 | -| time_elapsed | 55523 | -| total_timesteps | 1208320 | -| train/ | | -| approx_kl | 0.005662358 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -57.8 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 94390 | -| policy_gradient_loss | -0.0032 | -| std | 0.0536 | -| value_loss | 4.44e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9441 | -| time_elapsed | 55527 | -| total_timesteps | 1208448 | -| train/ | | -| approx_kl | 0.0025238646 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 94400 | -| policy_gradient_loss | -0.00416 | -| std | 0.0536 | -| value_loss | 3.19e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9442 | -| time_elapsed | 55531 | -| total_timesteps | 1208576 | -| train/ | | -| approx_kl | 0.020672118 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 94410 | -| policy_gradient_loss | -0.00214 | -| std | 0.0536 | -| value_loss | 3.2e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9443 | -| time_elapsed | 55535 | -| total_timesteps | 1208704 | -| train/ | | -| approx_kl | 0.00010523852 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | 0.000751 | -| n_updates | 94420 | -| policy_gradient_loss | 0.00041 | -| std | 0.0535 | -| value_loss | 2.49e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9444 | -| time_elapsed | 55538 | -| total_timesteps | 1208832 | -| train/ | | -| approx_kl | 0.012907559 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 94430 | -| policy_gradient_loss | 0.000456 | -| std | 0.0535 | -| value_loss | 5.04e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9445 | -| time_elapsed | 55543 | -| total_timesteps | 1208960 | -| train/ | | -| approx_kl | 0.02900792 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | -7.31e-05 | -| n_updates | 94440 | -| policy_gradient_loss | 0.0024 | -| std | 0.0534 | -| value_loss | 2.31e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9446 | -| time_elapsed | 55547 | -| total_timesteps | 1209088 | -| train/ | | -| approx_kl | 0.0043038037 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 94450 | -| policy_gradient_loss | -0.00435 | -| std | 0.0534 | -| value_loss | 8.73e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9447 | -| time_elapsed | 55556 | -| total_timesteps | 1209216 | -| train/ | | -| approx_kl | 0.10162986 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -0.862 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 94460 | -| policy_gradient_loss | -0.014 | -| std | 0.0534 | -| value_loss | 0.00181 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9448 | -| time_elapsed | 55560 | -| total_timesteps | 1209344 | -| train/ | | -| approx_kl | 0.0004210039 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -304 | -| learning_rate | 0.0003 | -| loss | -0.000862 | -| n_updates | 94470 | -| policy_gradient_loss | 0.000946 | -| std | 0.0533 | -| value_loss | 2.57e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9449 | -| time_elapsed | 55564 | -| total_timesteps | 1209472 | -| train/ | | -| approx_kl | 0.014057092 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -261 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 94480 | -| policy_gradient_loss | -0.0137 | -| std | 0.0532 | -| value_loss | 2.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9450 | -| time_elapsed | 55567 | -| total_timesteps | 1209600 | -| train/ | | -| approx_kl | 0.00682221 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -1.93e+03 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 94490 | -| policy_gradient_loss | -0.0147 | -| std | 0.0532 | -| value_loss | 4.33e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9451 | -| time_elapsed | 55570 | -| total_timesteps | 1209728 | -| train/ | | -| approx_kl | 0.004422992 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -80.7 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 94500 | -| policy_gradient_loss | -0.00772 | -| std | 0.0532 | -| value_loss | 2.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9452 | -| time_elapsed | 55573 | -| total_timesteps | 1209856 | -| train/ | | -| approx_kl | 0.0023244293 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.51 | -| explained_variance | -2.63 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 94510 | -| policy_gradient_loss | 0.000423 | -| std | 0.0532 | -| value_loss | 1.7e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 21 | -| iterations | 9453 | -| time_elapsed | 55576 | -| total_timesteps | 1209984 | -| train/ | | -| approx_kl | 0.002806189 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 94520 | -| policy_gradient_loss | 0.00252 | -| std | 0.0532 | -| value_loss | 4.67e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9454 | -| time_elapsed | 55579 | -| total_timesteps | 1210112 | -| train/ | | -| approx_kl | 0.001396005 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 94530 | -| policy_gradient_loss | 0.000658 | -| std | 0.0532 | -| value_loss | 3.93e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9455 | -| time_elapsed | 55587 | -| total_timesteps | 1210240 | -| train/ | | -| approx_kl | 0.02409621 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | 0.925 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 94540 | -| policy_gradient_loss | -0.00485 | -| std | 0.0531 | -| value_loss | 0.000613 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9456 | -| time_elapsed | 55589 | -| total_timesteps | 1210368 | -| train/ | | -| approx_kl | 0.0018908218 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -19.3 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 94550 | -| policy_gradient_loss | -0.0178 | -| std | 0.053 | -| value_loss | 3.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9457 | -| time_elapsed | 55592 | -| total_timesteps | 1210496 | -| train/ | | -| approx_kl | 0.048954263 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -23.2 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 94560 | -| policy_gradient_loss | -0.00803 | -| std | 0.053 | -| value_loss | 2.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9458 | -| time_elapsed | 55595 | -| total_timesteps | 1210624 | -| train/ | | -| approx_kl | 0.03759084 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -7.23 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 94570 | -| policy_gradient_loss | 0.00239 | -| std | 0.053 | -| value_loss | 3.62e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9459 | -| time_elapsed | 55598 | -| total_timesteps | 1210752 | -| train/ | | -| approx_kl | 0.0036819498 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.801 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 94580 | -| policy_gradient_loss | -0.00211 | -| std | 0.053 | -| value_loss | 3.89e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9460 | -| time_elapsed | 55601 | -| total_timesteps | 1210880 | -| train/ | | -| approx_kl | 0.0024271095 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.434 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 94590 | -| policy_gradient_loss | -0.00201 | -| std | 0.0529 | -| value_loss | 7.8e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9461 | -| time_elapsed | 55605 | -| total_timesteps | 1211008 | -| train/ | | -| approx_kl | 0.00041000778 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 94600 | -| policy_gradient_loss | 0.00161 | -| std | 0.0529 | -| value_loss | 2.84e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9462 | -| time_elapsed | 55614 | -| total_timesteps | 1211136 | -| train/ | | -| approx_kl | 0.039699163 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 94610 | -| policy_gradient_loss | -0.0168 | -| std | 0.053 | -| value_loss | 7.8e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9463 | -| time_elapsed | 55618 | -| total_timesteps | 1211264 | -| train/ | | -| approx_kl | 0.0013346672 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 94620 | -| policy_gradient_loss | -0.0116 | -| std | 0.053 | -| value_loss | 8.6e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9464 | -| time_elapsed | 55622 | -| total_timesteps | 1211392 | -| train/ | | -| approx_kl | 0.02043055 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -29 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 94630 | -| policy_gradient_loss | -0.00507 | -| std | 0.053 | -| value_loss | 1.82e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9465 | -| time_elapsed | 55624 | -| total_timesteps | 1211520 | -| train/ | | -| approx_kl | 0.012034637 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -13.3 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 94640 | -| policy_gradient_loss | -0.0112 | -| std | 0.053 | -| value_loss | 4.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9466 | -| time_elapsed | 55627 | -| total_timesteps | 1211648 | -| train/ | | -| approx_kl | 0.011057656 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -2.78 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 94650 | -| policy_gradient_loss | -0.00174 | -| std | 0.053 | -| value_loss | 3.93e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9467 | -| time_elapsed | 55632 | -| total_timesteps | 1211776 | -| train/ | | -| approx_kl | 0.0027652686 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.41 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 94660 | -| policy_gradient_loss | -0.00439 | -| std | 0.0529 | -| value_loss | 3.18e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 21 | -| iterations | 9468 | -| time_elapsed | 55636 | -| total_timesteps | 1211904 | -| train/ | | -| approx_kl | 0.00027544703 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.000932 | -| n_updates | 94670 | -| policy_gradient_loss | -0.00222 | -| std | 0.053 | -| value_loss | 1.49e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9469 | -| time_elapsed | 55639 | -| total_timesteps | 1212032 | -| train/ | | -| approx_kl | 0.0038669938 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 94680 | -| policy_gradient_loss | 0.0015 | -| std | 0.053 | -| value_loss | 1.04e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9470 | -| time_elapsed | 55647 | -| total_timesteps | 1212160 | -| train/ | | -| approx_kl | 0.012686651 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | 0.807 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 94690 | -| policy_gradient_loss | -0.0103 | -| std | 0.053 | -| value_loss | 0.00292 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9471 | -| time_elapsed | 55651 | -| total_timesteps | 1212288 | -| train/ | | -| approx_kl | 0.0022117961 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -2.36 | -| learning_rate | 0.0003 | -| loss | -7.09e-05 | -| n_updates | 94700 | -| policy_gradient_loss | 9.61e-07 | -| std | 0.0529 | -| value_loss | 5.29e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9472 | -| time_elapsed | 55653 | -| total_timesteps | 1212416 | -| train/ | | -| approx_kl | 0.009130543 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -2.96 | -| learning_rate | 0.0003 | -| loss | -0.00519 | -| n_updates | 94710 | -| policy_gradient_loss | -0.00404 | -| std | 0.0528 | -| value_loss | 3.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9473 | -| time_elapsed | 55657 | -| total_timesteps | 1212544 | -| train/ | | -| approx_kl | 0.010418408 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.52 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.0284 | -| n_updates | 94720 | -| policy_gradient_loss | -0.0214 | -| std | 0.0527 | -| value_loss | 2.08e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9474 | -| time_elapsed | 55660 | -| total_timesteps | 1212672 | -| train/ | | -| approx_kl | 0.00072376244 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 1.53 | -| explained_variance | 0.00617 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 94730 | -| policy_gradient_loss | -0.00672 | -| std | 0.0526 | -| value_loss | 1.99e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9475 | -| time_elapsed | 55664 | -| total_timesteps | 1212800 | -| train/ | | -| approx_kl | 0.012590963 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.53 | -| explained_variance | 0.000133 | -| learning_rate | 0.0003 | -| loss | -0.0371 | -| n_updates | 94740 | -| policy_gradient_loss | -0.0303 | -| std | 0.0526 | -| value_loss | 3.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9476 | -| time_elapsed | 55667 | -| total_timesteps | 1212928 | -| train/ | | -| approx_kl | 0.008742083 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.53 | -| explained_variance | -0.00552 | -| learning_rate | 0.0003 | -| loss | 0.000565 | -| n_updates | 94750 | -| policy_gradient_loss | -9.77e-05 | -| std | 0.0524 | -| value_loss | 1.94e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9477 | -| time_elapsed | 55672 | -| total_timesteps | 1213056 | -| train/ | | -| approx_kl | 0.007817228 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.53 | -| explained_variance | -0.00465 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 94760 | -| policy_gradient_loss | -0.00647 | -| std | 0.0522 | -| value_loss | 7.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9478 | -| time_elapsed | 55678 | -| total_timesteps | 1213184 | -| train/ | | -| approx_kl | 0.021320043 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 1.53 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 94770 | -| policy_gradient_loss | -0.0151 | -| std | 0.0522 | -| value_loss | 0.000966 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9479 | -| time_elapsed | 55682 | -| total_timesteps | 1213312 | -| train/ | | -| approx_kl | 0.024605695 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 1.53 | -| explained_variance | -11.7 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 94780 | -| policy_gradient_loss | -0.00246 | -| std | 0.0521 | -| value_loss | 3.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9480 | -| time_elapsed | 55686 | -| total_timesteps | 1213440 | -| train/ | | -| approx_kl | 0.01012099 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -13.5 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 94790 | -| policy_gradient_loss | -0.0118 | -| std | 0.0521 | -| value_loss | 4.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9481 | -| time_elapsed | 55688 | -| total_timesteps | 1213568 | -| train/ | | -| approx_kl | 0.009078417 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 94800 | -| policy_gradient_loss | -0.00122 | -| std | 0.0521 | -| value_loss | 2.66e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9482 | -| time_elapsed | 55692 | -| total_timesteps | 1213696 | -| train/ | | -| approx_kl | 0.0062198886 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -3.19 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 94810 | -| policy_gradient_loss | -0.00252 | -| std | 0.0521 | -| value_loss | 2.47e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9483 | -| time_elapsed | 55696 | -| total_timesteps | 1213824 | -| train/ | | -| approx_kl | 0.017402219 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.69 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 94820 | -| policy_gradient_loss | -0.00512 | -| std | 0.0521 | -| value_loss | 7.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9484 | -| time_elapsed | 55699 | -| total_timesteps | 1213952 | -| train/ | | -| approx_kl | 0.009870977 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.00611 | -| n_updates | 94830 | -| policy_gradient_loss | 0.000261 | -| std | 0.0521 | -| value_loss | 3.67e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9485 | -| time_elapsed | 55702 | -| total_timesteps | 1214080 | -| train/ | | -| approx_kl | 0.0042444514 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.00509 | -| n_updates | 94840 | -| policy_gradient_loss | 0.000845 | -| std | 0.052 | -| value_loss | 3.53e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9486 | -| time_elapsed | 55708 | -| total_timesteps | 1214208 | -| train/ | | -| approx_kl | 0.04557962 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 94850 | -| policy_gradient_loss | -0.0157 | -| std | 0.052 | -| value_loss | 0.00102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9487 | -| time_elapsed | 55711 | -| total_timesteps | 1214336 | -| train/ | | -| approx_kl | 0.055296883 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -1.97e+03 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 94860 | -| policy_gradient_loss | -0.0032 | -| std | 0.052 | -| value_loss | 2.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9488 | -| time_elapsed | 55714 | -| total_timesteps | 1214464 | -| train/ | | -| approx_kl | 0.006365695 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -1.05e+04 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 94870 | -| policy_gradient_loss | -0.0094 | -| std | 0.052 | -| value_loss | 9.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9489 | -| time_elapsed | 55717 | -| total_timesteps | 1214592 | -| train/ | | -| approx_kl | 0.0001757429 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -1.74e+03 | -| learning_rate | 0.0003 | -| loss | 0.00311 | -| n_updates | 94880 | -| policy_gradient_loss | -0.00632 | -| std | 0.052 | -| value_loss | 1.9e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9490 | -| time_elapsed | 55721 | -| total_timesteps | 1214720 | -| train/ | | -| approx_kl | 0.24171972 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -369 | -| learning_rate | 0.0003 | -| loss | -0.000548 | -| n_updates | 94890 | -| policy_gradient_loss | -0.00256 | -| std | 0.052 | -| value_loss | 2.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9491 | -| time_elapsed | 55725 | -| total_timesteps | 1214848 | -| train/ | | -| approx_kl | 0.009617675 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -6.81 | -| learning_rate | 0.0003 | -| loss | -0.00914 | -| n_updates | 94900 | -| policy_gradient_loss | -0.00658 | -| std | 0.052 | -| value_loss | 2.27e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9492 | -| time_elapsed | 55727 | -| total_timesteps | 1214976 | -| train/ | | -| approx_kl | 0.011743387 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 94910 | -| policy_gradient_loss | -0.000322 | -| std | 0.052 | -| value_loss | 8.22e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9493 | -| time_elapsed | 55730 | -| total_timesteps | 1215104 | -| train/ | | -| approx_kl | 0.008098378 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.000331 | -| n_updates | 94920 | -| policy_gradient_loss | 0.00162 | -| std | 0.052 | -| value_loss | 5.91e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9494 | -| time_elapsed | 55737 | -| total_timesteps | 1215232 | -| train/ | | -| approx_kl | 0.015817685 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.57 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 94930 | -| policy_gradient_loss | -0.0153 | -| std | 0.0521 | -| value_loss | 0.00228 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9495 | -| time_elapsed | 55740 | -| total_timesteps | 1215360 | -| train/ | | -| approx_kl | 0.0053430395 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -9.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 94940 | -| policy_gradient_loss | -0.00183 | -| std | 0.0521 | -| value_loss | 2.08e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9496 | -| time_elapsed | 55743 | -| total_timesteps | 1215488 | -| train/ | | -| approx_kl | 0.00021922914 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -61.4 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 94950 | -| policy_gradient_loss | -0.00788 | -| std | 0.0521 | -| value_loss | 0.000104 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9497 | -| time_elapsed | 55746 | -| total_timesteps | 1215616 | -| train/ | | -| approx_kl | 5.2347314e-05 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 94960 | -| policy_gradient_loss | -0.00557 | -| std | 0.0521 | -| value_loss | 2.62e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9498 | -| time_elapsed | 55749 | -| total_timesteps | 1215744 | -| train/ | | -| approx_kl | 0.00072423834 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 94970 | -| policy_gradient_loss | -0.00252 | -| std | 0.0521 | -| value_loss | 1.22e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9499 | -| time_elapsed | 55751 | -| total_timesteps | 1215872 | -| train/ | | -| approx_kl | 0.006608827 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 94980 | -| policy_gradient_loss | -0.000237 | -| std | 0.052 | -| value_loss | 6.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9500 | -| time_elapsed | 55755 | -| total_timesteps | 1216000 | -| train/ | | -| approx_kl | 0.003891874 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 94990 | -| policy_gradient_loss | -0.000642 | -| std | 0.052 | -| value_loss | 7.98e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9501 | -| time_elapsed | 55758 | -| total_timesteps | 1216128 | -| train/ | | -| approx_kl | 0.0005475916 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.00197 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 95000 | -| policy_gradient_loss | -0.00112 | -| std | 0.052 | -| value_loss | 4.99e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9502 | -| time_elapsed | 55765 | -| total_timesteps | 1216256 | -| train/ | | -| approx_kl | 0.01674409 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 95010 | -| policy_gradient_loss | -0.00533 | -| std | 0.052 | -| value_loss | 0.000592 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9503 | -| time_elapsed | 55770 | -| total_timesteps | 1216384 | -| train/ | | -| approx_kl | 0.0011707926 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.443 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 95020 | -| policy_gradient_loss | 0.00831 | -| std | 0.0519 | -| value_loss | 5.83e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9504 | -| time_elapsed | 55773 | -| total_timesteps | 1216512 | -| train/ | | -| approx_kl | 0.008024614 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -3.99 | -| learning_rate | 0.0003 | -| loss | -0.00477 | -| n_updates | 95030 | -| policy_gradient_loss | -0.00296 | -| std | 0.0519 | -| value_loss | 1.1e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9505 | -| time_elapsed | 55777 | -| total_timesteps | 1216640 | -| train/ | | -| approx_kl | 0.0026061367 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.85 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 95040 | -| policy_gradient_loss | 0.0136 | -| std | 0.0519 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9506 | -| time_elapsed | 55779 | -| total_timesteps | 1216768 | -| train/ | | -| approx_kl | 0.0005716523 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.533 | -| learning_rate | 0.0003 | -| loss | -0.000155 | -| n_updates | 95050 | -| policy_gradient_loss | 0.00108 | -| std | 0.0518 | -| value_loss | 8.01e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9507 | -| time_elapsed | 55783 | -| total_timesteps | 1216896 | -| train/ | | -| approx_kl | 0.00070590666 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 95060 | -| policy_gradient_loss | -0.00355 | -| std | 0.0517 | -| value_loss | 1.84e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9508 | -| time_elapsed | 55786 | -| total_timesteps | 1217024 | -| train/ | | -| approx_kl | 0.0010429267 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.54 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | 0.000563 | -| n_updates | 95070 | -| policy_gradient_loss | 0.00364 | -| std | 0.0516 | -| value_loss | 2.47e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9509 | -| time_elapsed | 55794 | -| total_timesteps | 1217152 | -| train/ | | -| approx_kl | 0.006165533 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 1.55 | -| explained_variance | 0.024 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 95080 | -| policy_gradient_loss | -0.012 | -| std | 0.0516 | -| value_loss | 0.00112 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9510 | -| time_elapsed | 55797 | -| total_timesteps | 1217280 | -| train/ | | -| approx_kl | 0.0018038554 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 1.55 | -| explained_variance | -46.2 | -| learning_rate | 0.0003 | -| loss | -0.000596 | -| n_updates | 95090 | -| policy_gradient_loss | -0.00035 | -| std | 0.0514 | -| value_loss | 7.89e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9511 | -| time_elapsed | 55802 | -| total_timesteps | 1217408 | -| train/ | | -| approx_kl | 0.004189711 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 1.55 | -| explained_variance | -275 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 95100 | -| policy_gradient_loss | -0.000694 | -| std | 0.0511 | -| value_loss | 4.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9512 | -| time_elapsed | 55806 | -| total_timesteps | 1217536 | -| train/ | | -| approx_kl | 0.002007564 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -46.3 | -| learning_rate | 0.0003 | -| loss | -0.000943 | -| n_updates | 95110 | -| policy_gradient_loss | -0.000604 | -| std | 0.0509 | -| value_loss | 3.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9513 | -| time_elapsed | 55809 | -| total_timesteps | 1217664 | -| train/ | | -| approx_kl | 0.008146532 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 95120 | -| policy_gradient_loss | -0.00209 | -| std | 0.0508 | -| value_loss | 6.57e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9514 | -| time_elapsed | 55813 | -| total_timesteps | 1217792 | -| train/ | | -| approx_kl | 0.002867904 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 95130 | -| policy_gradient_loss | -0.00265 | -| std | 0.0507 | -| value_loss | 2.06e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 21 | -| iterations | 9515 | -| time_elapsed | 55815 | -| total_timesteps | 1217920 | -| train/ | | -| approx_kl | 0.0121846525 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.083 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 95140 | -| policy_gradient_loss | 0.000398 | -| std | 0.0507 | -| value_loss | 4.92e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9516 | -| time_elapsed | 55819 | -| total_timesteps | 1218048 | -| train/ | | -| approx_kl | 0.00010714913 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 95150 | -| policy_gradient_loss | 0.000837 | -| std | 0.0507 | -| value_loss | 1.13e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9517 | -| time_elapsed | 55826 | -| total_timesteps | 1218176 | -| train/ | | -| approx_kl | 0.0050944686 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 95160 | -| policy_gradient_loss | -0.0142 | -| std | 0.0506 | -| value_loss | 0.00135 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9518 | -| time_elapsed | 55829 | -| total_timesteps | 1218304 | -| train/ | | -| approx_kl | 0.0005414551 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 95170 | -| policy_gradient_loss | -0.00471 | -| std | 0.0506 | -| value_loss | 2.25e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9519 | -| time_elapsed | 55832 | -| total_timesteps | 1218432 | -| train/ | | -| approx_kl | 0.005962524 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -222 | -| learning_rate | 0.0003 | -| loss | -0.00624 | -| n_updates | 95180 | -| policy_gradient_loss | -0.00554 | -| std | 0.0506 | -| value_loss | 9.49e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9520 | -| time_elapsed | 55836 | -| total_timesteps | 1218560 | -| train/ | | -| approx_kl | 0.0013395092 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -27 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 95190 | -| policy_gradient_loss | -0.000456 | -| std | 0.0505 | -| value_loss | 2.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9521 | -| time_elapsed | 55839 | -| total_timesteps | 1218688 | -| train/ | | -| approx_kl | 0.011806088 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -3.86 | -| learning_rate | 0.0003 | -| loss | 0.000331 | -| n_updates | 95200 | -| policy_gradient_loss | -0.000368 | -| std | 0.0504 | -| value_loss | 5.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9522 | -| time_elapsed | 55841 | -| total_timesteps | 1218816 | -| train/ | | -| approx_kl | 0.006568054 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 95210 | -| policy_gradient_loss | -0.000795 | -| std | 0.0503 | -| value_loss | 7.58e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9523 | -| time_elapsed | 55845 | -| total_timesteps | 1218944 | -| train/ | | -| approx_kl | 2.6997644e-05 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.000648 | -| n_updates | 95220 | -| policy_gradient_loss | -0.0044 | -| std | 0.0503 | -| value_loss | 4.28e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9524 | -| time_elapsed | 55849 | -| total_timesteps | 1219072 | -| train/ | | -| approx_kl | 0.004088574 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.0901 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 95230 | -| policy_gradient_loss | -0.0239 | -| std | 0.0503 | -| value_loss | 1.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9525 | -| time_elapsed | 55855 | -| total_timesteps | 1219200 | -| train/ | | -| approx_kl | 0.003903178 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 95240 | -| policy_gradient_loss | -0.0143 | -| std | 0.0504 | -| value_loss | 0.000591 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9526 | -| time_elapsed | 55858 | -| total_timesteps | 1219328 | -| train/ | | -| approx_kl | 0.26429462 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -213 | -| learning_rate | 0.0003 | -| loss | 0.00607 | -| n_updates | 95250 | -| policy_gradient_loss | -0.00108 | -| std | 0.0504 | -| value_loss | 6.97e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9527 | -| time_elapsed | 55862 | -| total_timesteps | 1219456 | -| train/ | | -| approx_kl | 0.12389368 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -441 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 95260 | -| policy_gradient_loss | -0.00328 | -| std | 0.0504 | -| value_loss | 2.86e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9528 | -| time_elapsed | 55865 | -| total_timesteps | 1219584 | -| train/ | | -| approx_kl | 2.4532434e-05 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -86.8 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 95270 | -| policy_gradient_loss | -0.00688 | -| std | 0.0504 | -| value_loss | 3.23e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9529 | -| time_elapsed | 55867 | -| total_timesteps | 1219712 | -| train/ | | -| approx_kl | 0.0060283653 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -12.3 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 95280 | -| policy_gradient_loss | -0.00968 | -| std | 0.0504 | -| value_loss | 9.67e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9530 | -| time_elapsed | 55870 | -| total_timesteps | 1219840 | -| train/ | | -| approx_kl | 0.00117512 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 95290 | -| policy_gradient_loss | -0.00476 | -| std | 0.0504 | -| value_loss | 1.94e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 21 | -| iterations | 9531 | -| time_elapsed | 55872 | -| total_timesteps | 1219968 | -| train/ | | -| approx_kl | 0.01607618 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.00502 | -| n_updates | 95300 | -| policy_gradient_loss | 0.000213 | -| std | 0.0505 | -| value_loss | 7.43e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9532 | -| time_elapsed | 55876 | -| total_timesteps | 1220096 | -| train/ | | -| approx_kl | 0.0031560245 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.00786 | -| learning_rate | 0.0003 | -| loss | -0.00798 | -| n_updates | 95310 | -| policy_gradient_loss | -0.00639 | -| std | 0.0505 | -| value_loss | 1.4e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9533 | -| time_elapsed | 55884 | -| total_timesteps | 1220224 | -| train/ | | -| approx_kl | 0.020079376 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 95320 | -| policy_gradient_loss | -0.0144 | -| std | 0.0505 | -| value_loss | 3.59e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9534 | -| time_elapsed | 55887 | -| total_timesteps | 1220352 | -| train/ | | -| approx_kl | 0.00054587563 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | -0.000893 | -| n_updates | 95330 | -| policy_gradient_loss | -0.000144 | -| std | 0.0505 | -| value_loss | 8.8e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9535 | -| time_elapsed | 55890 | -| total_timesteps | 1220480 | -| train/ | | -| approx_kl | 0.0025203344 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.00931 | -| n_updates | 95340 | -| policy_gradient_loss | -0.0107 | -| std | 0.0504 | -| value_loss | 3.03e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9536 | -| time_elapsed | 55893 | -| total_timesteps | 1220608 | -| train/ | | -| approx_kl | 0.00043308223 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -27.5 | -| learning_rate | 0.0003 | -| loss | -0.000271 | -| n_updates | 95350 | -| policy_gradient_loss | 0.000974 | -| std | 0.0505 | -| value_loss | 1.28e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9537 | -| time_elapsed | 55897 | -| total_timesteps | 1220736 | -| train/ | | -| approx_kl | 6.212853e-06 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | 4.05e-05 | -| n_updates | 95360 | -| policy_gradient_loss | 0.000221 | -| std | 0.0505 | -| value_loss | 4.29e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9538 | -| time_elapsed | 55901 | -| total_timesteps | 1220864 | -| train/ | | -| approx_kl | 0.002648082 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | 0.000541 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 95370 | -| policy_gradient_loss | -0.001 | -| std | 0.0505 | -| value_loss | 1.45e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9539 | -| time_elapsed | 55904 | -| total_timesteps | 1220992 | -| train/ | | -| approx_kl | 0.0061615924 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | 0.00207 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 95380 | -| policy_gradient_loss | 0.00306 | -| std | 0.0506 | -| value_loss | 3.45e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9540 | -| time_elapsed | 55907 | -| total_timesteps | 1221120 | -| train/ | | -| approx_kl | 0.0015473599 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 95390 | -| policy_gradient_loss | -0.00283 | -| std | 0.0507 | -| value_loss | 1.26e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9541 | -| time_elapsed | 55916 | -| total_timesteps | 1221248 | -| train/ | | -| approx_kl | 0.12605396 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | 0.668 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 95400 | -| policy_gradient_loss | -0.0137 | -| std | 0.0507 | -| value_loss | 0.00621 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9542 | -| time_elapsed | 55918 | -| total_timesteps | 1221376 | -| train/ | | -| approx_kl | 0.37582213 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -590 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 95410 | -| policy_gradient_loss | -0.0025 | -| std | 0.0508 | -| value_loss | 1.32e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9543 | -| time_elapsed | 55922 | -| total_timesteps | 1221504 | -| train/ | | -| approx_kl | 0.0027327542 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -35.5 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 95420 | -| policy_gradient_loss | -0.000551 | -| std | 0.0509 | -| value_loss | 3.38e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9544 | -| time_elapsed | 55926 | -| total_timesteps | 1221632 | -| train/ | | -| approx_kl | 0.015977418 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | -0.00888 | -| n_updates | 95430 | -| policy_gradient_loss | -0.000651 | -| std | 0.051 | -| value_loss | 2.07e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9545 | -| time_elapsed | 55931 | -| total_timesteps | 1221760 | -| train/ | | -| approx_kl | 0.002707194 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.00116 | -| n_updates | 95440 | -| policy_gradient_loss | 0.00743 | -| std | 0.0511 | -| value_loss | 3.91e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 21 | -| iterations | 9546 | -| time_elapsed | 55935 | -| total_timesteps | 1221888 | -| train/ | | -| approx_kl | 0.010599724 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 95450 | -| policy_gradient_loss | -0.0008 | -| std | 0.0511 | -| value_loss | 4.89e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9547 | -| time_elapsed | 55939 | -| total_timesteps | 1222016 | -| train/ | | -| approx_kl | 0.009872245 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -6.58 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 95460 | -| policy_gradient_loss | -0.0102 | -| std | 0.0511 | -| value_loss | 2.69e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9548 | -| time_elapsed | 55947 | -| total_timesteps | 1222144 | -| train/ | | -| approx_kl | 0.07579386 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 95470 | -| policy_gradient_loss | -0.0161 | -| std | 0.0511 | -| value_loss | 9.77e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9549 | -| time_elapsed | 55951 | -| total_timesteps | 1222272 | -| train/ | | -| approx_kl | 0.011144189 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 95480 | -| policy_gradient_loss | -0.00904 | -| std | 0.051 | -| value_loss | 1.79e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9550 | -| time_elapsed | 55953 | -| total_timesteps | 1222400 | -| train/ | | -| approx_kl | 0.0013750205 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0957 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 95490 | -| policy_gradient_loss | 0.00831 | -| std | 0.051 | -| value_loss | 1.56e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9551 | -| time_elapsed | 55957 | -| total_timesteps | 1222528 | -| train/ | | -| approx_kl | 0.0094767455 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | 0.00317 | -| n_updates | 95500 | -| policy_gradient_loss | 1.04e-05 | -| std | 0.0509 | -| value_loss | 3.61e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9552 | -| time_elapsed | 55959 | -| total_timesteps | 1222656 | -| train/ | | -| approx_kl | 0.00087971706 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.00038 | -| n_updates | 95510 | -| policy_gradient_loss | 1.78e-05 | -| std | 0.0508 | -| value_loss | 4.71e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9553 | -| time_elapsed | 55963 | -| total_timesteps | 1222784 | -| train/ | | -| approx_kl | 0.003803072 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | 0.00458 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 95520 | -| policy_gradient_loss | -0.00269 | -| std | 0.0507 | -| value_loss | 3.44e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9554 | -| time_elapsed | 55967 | -| total_timesteps | 1222912 | -| train/ | | -| approx_kl | 0.0021710242 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 95530 | -| policy_gradient_loss | -0.00043 | -| std | 0.0508 | -| value_loss | 2.04e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9555 | -| time_elapsed | 55970 | -| total_timesteps | 1223040 | -| train/ | | -| approx_kl | 0.00018960703 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0093 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 95540 | -| policy_gradient_loss | -0.00189 | -| std | 0.0509 | -| value_loss | 2.98e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9556 | -| time_elapsed | 55977 | -| total_timesteps | 1223168 | -| train/ | | -| approx_kl | 0.015177623 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 95550 | -| policy_gradient_loss | -0.0141 | -| std | 0.0509 | -| value_loss | 0.000233 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9557 | -| time_elapsed | 55980 | -| total_timesteps | 1223296 | -| train/ | | -| approx_kl | 0.0010021445 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.433 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 95560 | -| policy_gradient_loss | -0.00219 | -| std | 0.0509 | -| value_loss | 4.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9558 | -| time_elapsed | 55984 | -| total_timesteps | 1223424 | -| train/ | | -| approx_kl | 0.009378957 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -1.77 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 95570 | -| policy_gradient_loss | -0.00931 | -| std | 0.0508 | -| value_loss | 3.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9559 | -| time_elapsed | 55986 | -| total_timesteps | 1223552 | -| train/ | | -| approx_kl | 0.0008864333 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.389 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 95580 | -| policy_gradient_loss | -0.0008 | -| std | 0.0508 | -| value_loss | 2.6e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9560 | -| time_elapsed | 55990 | -| total_timesteps | 1223680 | -| train/ | | -| approx_kl | 0.00016590487 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0842 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 95590 | -| policy_gradient_loss | -0.00728 | -| std | 0.0508 | -| value_loss | 7.32e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9561 | -| time_elapsed | 55994 | -| total_timesteps | 1223808 | -| train/ | | -| approx_kl | 0.015620371 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.00468 | -| n_updates | 95600 | -| policy_gradient_loss | 3.68e-05 | -| std | 0.0508 | -| value_loss | 4.15e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 21 | -| iterations | 9562 | -| time_elapsed | 55998 | -| total_timesteps | 1223936 | -| train/ | | -| approx_kl | 0.0027746707 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | -0.00853 | -| n_updates | 95610 | -| policy_gradient_loss | -0.00726 | -| std | 0.0508 | -| value_loss | 5.95e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9563 | -| time_elapsed | 56002 | -| total_timesteps | 1224064 | -| train/ | | -| approx_kl | 0.002240003 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 95620 | -| policy_gradient_loss | 0.00438 | -| std | 0.0508 | -| value_loss | 1.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9564 | -| time_elapsed | 56007 | -| total_timesteps | 1224192 | -| train/ | | -| approx_kl | 0.01112867 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 95630 | -| policy_gradient_loss | -0.0143 | -| std | 0.0508 | -| value_loss | 0.0022 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9565 | -| time_elapsed | 56011 | -| total_timesteps | 1224320 | -| train/ | | -| approx_kl | 0.0001901961 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | 0.000632 | -| n_updates | 95640 | -| policy_gradient_loss | -0.000189 | -| std | 0.0508 | -| value_loss | 1.12e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9566 | -| time_elapsed | 56015 | -| total_timesteps | 1224448 | -| train/ | | -| approx_kl | 3.879424e-06 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -165 | -| learning_rate | 0.0003 | -| loss | 0.000296 | -| n_updates | 95650 | -| policy_gradient_loss | -0.00696 | -| std | 0.0508 | -| value_loss | 7.04e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9567 | -| time_elapsed | 56019 | -| total_timesteps | 1224576 | -| train/ | | -| approx_kl | 0.01078736 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -67.1 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 95660 | -| policy_gradient_loss | -0.0117 | -| std | 0.0508 | -| value_loss | 1.12e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9568 | -| time_elapsed | 56022 | -| total_timesteps | 1224704 | -| train/ | | -| approx_kl | 0.0009658877 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.56 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.000972 | -| n_updates | 95670 | -| policy_gradient_loss | -0.000372 | -| std | 0.0504 | -| value_loss | 1.67e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9569 | -| time_elapsed | 56025 | -| total_timesteps | 1224832 | -| train/ | | -| approx_kl | 0.0046479 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 95680 | -| policy_gradient_loss | 0.000291 | -| std | 0.0501 | -| value_loss | 1.89e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9570 | -| time_elapsed | 56027 | -| total_timesteps | 1224960 | -| train/ | | -| approx_kl | 0.019713672 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 95690 | -| policy_gradient_loss | -0.00299 | -| std | 0.05 | -| value_loss | 5.18e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9571 | -| time_elapsed | 56031 | -| total_timesteps | 1225088 | -| train/ | | -| approx_kl | 0.0070115877 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.0478 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 95700 | -| policy_gradient_loss | -0.00143 | -| std | 0.0499 | -| value_loss | 3.14e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9572 | -| time_elapsed | 56038 | -| total_timesteps | 1225216 | -| train/ | | -| approx_kl | 0.026059879 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 95710 | -| policy_gradient_loss | -0.0107 | -| std | 0.0499 | -| value_loss | 0.00222 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9573 | -| time_elapsed | 56041 | -| total_timesteps | 1225344 | -| train/ | | -| approx_kl | 0.0010764846 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.000951 | -| n_updates | 95720 | -| policy_gradient_loss | -0.000268 | -| std | 0.0499 | -| value_loss | 3.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9574 | -| time_elapsed | 56045 | -| total_timesteps | 1225472 | -| train/ | | -| approx_kl | 0.0003738557 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -2.04 | -| learning_rate | 0.0003 | -| loss | 3.84e-05 | -| n_updates | 95730 | -| policy_gradient_loss | 8.23e-05 | -| std | 0.0499 | -| value_loss | 3.18e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9575 | -| time_elapsed | 56049 | -| total_timesteps | 1225600 | -| train/ | | -| approx_kl | 0.0006121411 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | -0.00345 | -| n_updates | 95740 | -| policy_gradient_loss | -0.00454 | -| std | 0.05 | -| value_loss | 2.94e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9576 | -| time_elapsed | 56052 | -| total_timesteps | 1225728 | -| train/ | | -| approx_kl | 0.007540947 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.00893 | -| n_updates | 95750 | -| policy_gradient_loss | -7.72e-05 | -| std | 0.05 | -| value_loss | 5.34e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9577 | -| time_elapsed | 56055 | -| total_timesteps | 1225856 | -| train/ | | -| approx_kl | 0.00045104045 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.00465 | -| n_updates | 95760 | -| policy_gradient_loss | -0.00775 | -| std | 0.0499 | -| value_loss | 1.09e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 21 | -| iterations | 9578 | -| time_elapsed | 56058 | -| total_timesteps | 1225984 | -| train/ | | -| approx_kl | 0.005913663 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.000228 | -| n_updates | 95770 | -| policy_gradient_loss | 8.48e-05 | -| std | 0.0501 | -| value_loss | 4.79e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9579 | -| time_elapsed | 56062 | -| total_timesteps | 1226112 | -| train/ | | -| approx_kl | 0.00018484425 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 95780 | -| policy_gradient_loss | -0.00962 | -| std | 0.0501 | -| value_loss | 2.99e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9580 | -| time_elapsed | 56072 | -| total_timesteps | 1226240 | -| train/ | | -| approx_kl | 0.012452174 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 95790 | -| policy_gradient_loss | -0.015 | -| std | 0.0501 | -| value_loss | 0.000506 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9581 | -| time_elapsed | 56075 | -| total_timesteps | 1226368 | -| train/ | | -| approx_kl | 0.012118842 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -6.2e+03 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 95800 | -| policy_gradient_loss | -0.0122 | -| std | 0.0501 | -| value_loss | 2.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9582 | -| time_elapsed | 56079 | -| total_timesteps | 1226496 | -| train/ | | -| approx_kl | 0.049519956 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -48 | -| learning_rate | 0.0003 | -| loss | -0.00944 | -| n_updates | 95810 | -| policy_gradient_loss | -0.00563 | -| std | 0.0501 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9583 | -| time_elapsed | 56083 | -| total_timesteps | 1226624 | -| train/ | | -| approx_kl | 0.012656427 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -78.9 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 95820 | -| policy_gradient_loss | -0.0112 | -| std | 0.0501 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9584 | -| time_elapsed | 56088 | -| total_timesteps | 1226752 | -| train/ | | -| approx_kl | 0.030797437 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | 0.00329 | -| n_updates | 95830 | -| policy_gradient_loss | 0.0016 | -| std | 0.0501 | -| value_loss | 9.33e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 21 | -| iterations | 9585 | -| time_elapsed | 56092 | -| total_timesteps | 1226880 | -| train/ | | -| approx_kl | 0.008121959 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 1.57 | -| explained_variance | -0.821 | -| learning_rate | 0.0003 | -| loss | 0.000191 | -| n_updates | 95840 | -| policy_gradient_loss | -0.000286 | -| std | 0.05 | -| value_loss | 2.37e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9586 | -| time_elapsed | 56095 | -| total_timesteps | 1227008 | -| train/ | | -| approx_kl | 0.0067902515 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.0977 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 95850 | -| policy_gradient_loss | -0.00118 | -| std | 0.05 | -| value_loss | 3.08e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9587 | -| time_elapsed | 56103 | -| total_timesteps | 1227136 | -| train/ | | -| approx_kl | 0.016837612 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 95860 | -| policy_gradient_loss | -0.0022 | -| std | 0.0499 | -| value_loss | 0.000525 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9588 | -| time_elapsed | 56107 | -| total_timesteps | 1227264 | -| train/ | | -| approx_kl | 0.010453844 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | 0.209 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 95870 | -| policy_gradient_loss | -0.0144 | -| std | 0.0497 | -| value_loss | 3.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9589 | -| time_elapsed | 56111 | -| total_timesteps | 1227392 | -| train/ | | -| approx_kl | 0.036765534 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -283 | -| learning_rate | 0.0003 | -| loss | -0.00948 | -| n_updates | 95880 | -| policy_gradient_loss | -0.00407 | -| std | 0.0497 | -| value_loss | 5.91e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9590 | -| time_elapsed | 56114 | -| total_timesteps | 1227520 | -| train/ | | -| approx_kl | 0.0048948973 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 95890 | -| policy_gradient_loss | -0.00923 | -| std | 0.0497 | -| value_loss | 7.44e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9591 | -| time_elapsed | 56117 | -| total_timesteps | 1227648 | -| train/ | | -| approx_kl | 0.0042826426 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -29.2 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 95900 | -| policy_gradient_loss | -0.0128 | -| std | 0.0497 | -| value_loss | 8.26e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9592 | -| time_elapsed | 56120 | -| total_timesteps | 1227776 | -| train/ | | -| approx_kl | 0.0071506505 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -3.76 | -| learning_rate | 0.0003 | -| loss | -0.000896 | -| n_updates | 95910 | -| policy_gradient_loss | -0.000563 | -| std | 0.0497 | -| value_loss | 2.45e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9593 | -| time_elapsed | 56124 | -| total_timesteps | 1227904 | -| train/ | | -| approx_kl | 0.0013144398 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 1.58 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.000352 | -| n_updates | 95920 | -| policy_gradient_loss | 0.000711 | -| std | 0.0496 | -| value_loss | 1.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9594 | -| time_elapsed | 56128 | -| total_timesteps | 1228032 | -| train/ | | -| approx_kl | 0.017418262 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | 0.00717 | -| n_updates | 95930 | -| policy_gradient_loss | 0.000267 | -| std | 0.0495 | -| value_loss | 7.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9595 | -| time_elapsed | 56136 | -| total_timesteps | 1228160 | -| train/ | | -| approx_kl | 0.010158557 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 95940 | -| policy_gradient_loss | -0.016 | -| std | 0.0495 | -| value_loss | 0.00243 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9596 | -| time_elapsed | 56140 | -| total_timesteps | 1228288 | -| train/ | | -| approx_kl | 0.011697209 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -53.4 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 95950 | -| policy_gradient_loss | -0.0111 | -| std | 0.0495 | -| value_loss | 2.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9597 | -| time_elapsed | 56143 | -| total_timesteps | 1228416 | -| train/ | | -| approx_kl | 0.03959624 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -80.8 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 95960 | -| policy_gradient_loss | -0.00686 | -| std | 0.0495 | -| value_loss | 9.46e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9598 | -| time_elapsed | 56146 | -| total_timesteps | 1228544 | -| train/ | | -| approx_kl | 0.042951524 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 95970 | -| policy_gradient_loss | -0.000589 | -| std | 0.0495 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9599 | -| time_elapsed | 56149 | -| total_timesteps | 1228672 | -| train/ | | -| approx_kl | 0.008607486 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -8.56e-05 | -| n_updates | 95980 | -| policy_gradient_loss | -0.000249 | -| std | 0.0494 | -| value_loss | 3.22e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9600 | -| time_elapsed | 56152 | -| total_timesteps | 1228800 | -| train/ | | -| approx_kl | 7.6130964e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.59 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | -0.000913 | -| n_updates | 95990 | -| policy_gradient_loss | -0.000385 | -| std | 0.049 | -| value_loss | 2.89e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 21 | -| iterations | 9601 | -| time_elapsed | 56154 | -| total_timesteps | 1228928 | -| train/ | | -| approx_kl | 0.0026697638 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 1.6 | -| explained_variance | -0.00323 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 96000 | -| policy_gradient_loss | -0.00272 | -| std | 0.0487 | -| value_loss | 3.14e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9602 | -| time_elapsed | 56157 | -| total_timesteps | 1229056 | -| train/ | | -| approx_kl | 0.00015727803 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 96010 | -| policy_gradient_loss | 0.0203 | -| std | 0.0485 | -| value_loss | 8.55e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9603 | -| time_elapsed | 56164 | -| total_timesteps | 1229184 | -| train/ | | -| approx_kl | 0.021027189 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 96020 | -| policy_gradient_loss | -0.0106 | -| std | 0.0485 | -| value_loss | 0.000271 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9604 | -| time_elapsed | 56168 | -| total_timesteps | 1229312 | -| train/ | | -| approx_kl | 0.029897455 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -65.7 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 96030 | -| policy_gradient_loss | -0.00593 | -| std | 0.0485 | -| value_loss | 1.17e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9605 | -| time_elapsed | 56172 | -| total_timesteps | 1229440 | -| train/ | | -| approx_kl | 0.0016934597 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -107 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 96040 | -| policy_gradient_loss | 0.00315 | -| std | 0.0485 | -| value_loss | 6.06e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9606 | -| time_elapsed | 56175 | -| total_timesteps | 1229568 | -| train/ | | -| approx_kl | 0.006899773 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 96050 | -| policy_gradient_loss | -0.0109 | -| std | 0.0484 | -| value_loss | 1.98e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9607 | -| time_elapsed | 56179 | -| total_timesteps | 1229696 | -| train/ | | -| approx_kl | 2.104789e-07 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -2.57e-05 | -| n_updates | 96060 | -| policy_gradient_loss | 0.01 | -| std | 0.0484 | -| value_loss | 1.29e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9608 | -| time_elapsed | 56183 | -| total_timesteps | 1229824 | -| train/ | | -| approx_kl | 0.0038887765 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 96070 | -| policy_gradient_loss | -0.00714 | -| std | 0.0484 | -| value_loss | 6.56e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 21 | -| iterations | 9609 | -| time_elapsed | 56186 | -| total_timesteps | 1229952 | -| train/ | | -| approx_kl | 0.0028425655 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 96080 | -| policy_gradient_loss | -0.00122 | -| std | 0.0484 | -| value_loss | 1.58e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9610 | -| time_elapsed | 56190 | -| total_timesteps | 1230080 | -| train/ | | -| approx_kl | 3.3610966e-05 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.00289 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 96090 | -| policy_gradient_loss | -0.00886 | -| std | 0.0484 | -| value_loss | 1.52e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9611 | -| time_elapsed | 56197 | -| total_timesteps | 1230208 | -| train/ | | -| approx_kl | 0.026616612 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 96100 | -| policy_gradient_loss | -0.014 | -| std | 0.0484 | -| value_loss | 0.00137 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9612 | -| time_elapsed | 56200 | -| total_timesteps | 1230336 | -| train/ | | -| approx_kl | 0.00024687592 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -433 | -| learning_rate | 0.0003 | -| loss | -0.00431 | -| n_updates | 96110 | -| policy_gradient_loss | -0.011 | -| std | 0.0484 | -| value_loss | 1.26e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9613 | -| time_elapsed | 56203 | -| total_timesteps | 1230464 | -| train/ | | -| approx_kl | 2.8352253e-05 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -1.22e+04 | -| learning_rate | 0.0003 | -| loss | -0.00015 | -| n_updates | 96120 | -| policy_gradient_loss | 0.00018 | -| std | 0.0484 | -| value_loss | 5.11e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9614 | -| time_elapsed | 56207 | -| total_timesteps | 1230592 | -| train/ | | -| approx_kl | 0.00017219502 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | 0.000511 | -| n_updates | 96130 | -| policy_gradient_loss | -0.000964 | -| std | 0.0483 | -| value_loss | 6.63e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9615 | -| time_elapsed | 56210 | -| total_timesteps | 1230720 | -| train/ | | -| approx_kl | 0.01511067 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -16 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 96140 | -| policy_gradient_loss | -0.0094 | -| std | 0.0482 | -| value_loss | 6.29e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9616 | -| time_elapsed | 56213 | -| total_timesteps | 1230848 | -| train/ | | -| approx_kl | 0.018479977 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.474 | -| learning_rate | 0.0003 | -| loss | 0.00217 | -| n_updates | 96150 | -| policy_gradient_loss | -0.00138 | -| std | 0.0482 | -| value_loss | 1.77e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9617 | -| time_elapsed | 56216 | -| total_timesteps | 1230976 | -| train/ | | -| approx_kl | 0.0033330135 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 96160 | -| policy_gradient_loss | -0.00776 | -| std | 0.0482 | -| value_loss | 5.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9618 | -| time_elapsed | 56219 | -| total_timesteps | 1231104 | -| train/ | | -| approx_kl | 0.003045944 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.0012 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 96170 | -| policy_gradient_loss | -0.00304 | -| std | 0.0482 | -| value_loss | 1.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9619 | -| time_elapsed | 56227 | -| total_timesteps | 1231232 | -| train/ | | -| approx_kl | 0.042917848 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 96180 | -| policy_gradient_loss | -0.0148 | -| std | 0.0482 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9620 | -| time_elapsed | 56230 | -| total_timesteps | 1231360 | -| train/ | | -| approx_kl | 0.0010330938 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 96190 | -| policy_gradient_loss | -0.00285 | -| std | 0.0482 | -| value_loss | 2.67e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9621 | -| time_elapsed | 56233 | -| total_timesteps | 1231488 | -| train/ | | -| approx_kl | 0.011959568 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 1.61 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | -0.00455 | -| n_updates | 96200 | -| policy_gradient_loss | -0.00356 | -| std | 0.0481 | -| value_loss | 2.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9622 | -| time_elapsed | 56236 | -| total_timesteps | 1231616 | -| train/ | | -| approx_kl | 0.015562322 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.00146 | -| learning_rate | 0.0003 | -| loss | -0.0076 | -| n_updates | 96210 | -| policy_gradient_loss | -0.0053 | -| std | 0.0481 | -| value_loss | 2.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9623 | -| time_elapsed | 56238 | -| total_timesteps | 1231744 | -| train/ | | -| approx_kl | 0.0020429245 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 96220 | -| policy_gradient_loss | 0.00179 | -| std | 0.048 | -| value_loss | 2.52e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 21 | -| iterations | 9624 | -| time_elapsed | 56242 | -| total_timesteps | 1231872 | -| train/ | | -| approx_kl | 1.2116507e-05 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | 0.0031 | -| learning_rate | 0.0003 | -| loss | -0.000295 | -| n_updates | 96230 | -| policy_gradient_loss | -0.000159 | -| std | 0.0481 | -| value_loss | 4.97e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9625 | -| time_elapsed | 56246 | -| total_timesteps | 1232000 | -| train/ | | -| approx_kl | 0.036719047 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.00499 | -| n_updates | 96240 | -| policy_gradient_loss | 0.00528 | -| std | 0.0481 | -| value_loss | 2.15e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9626 | -| time_elapsed | 56249 | -| total_timesteps | 1232128 | -| train/ | | -| approx_kl | 0.0136458315 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | 0.00383 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 96250 | -| policy_gradient_loss | 0.00939 | -| std | 0.048 | -| value_loss | 6.55e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9627 | -| time_elapsed | 56258 | -| total_timesteps | 1232256 | -| train/ | | -| approx_kl | 0.02373397 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | 0.743 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 96260 | -| policy_gradient_loss | -0.0154 | -| std | 0.048 | -| value_loss | 0.00455 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9628 | -| time_elapsed | 56261 | -| total_timesteps | 1232384 | -| train/ | | -| approx_kl | 0.00023651076 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.331 | -| learning_rate | 0.0003 | -| loss | 0.00184 | -| n_updates | 96270 | -| policy_gradient_loss | 0.00232 | -| std | 0.048 | -| value_loss | 2e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9629 | -| time_elapsed | 56264 | -| total_timesteps | 1232512 | -| train/ | | -| approx_kl | 0.00010349136 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -3.48 | -| learning_rate | 0.0003 | -| loss | -0.000521 | -| n_updates | 96280 | -| policy_gradient_loss | 0.000384 | -| std | 0.048 | -| value_loss | 9.19e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9630 | -| time_elapsed | 56267 | -| total_timesteps | 1232640 | -| train/ | | -| approx_kl | 0.0015124655 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.808 | -| learning_rate | 0.0003 | -| loss | -0.00586 | -| n_updates | 96290 | -| policy_gradient_loss | -0.0021 | -| std | 0.048 | -| value_loss | 3.79e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9631 | -| time_elapsed | 56271 | -| total_timesteps | 1232768 | -| train/ | | -| approx_kl | 1.704041e-05 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.000421 | -| n_updates | 96300 | -| policy_gradient_loss | 0.00404 | -| std | 0.048 | -| value_loss | 1.47e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 21 | -| iterations | 9632 | -| time_elapsed | 56275 | -| total_timesteps | 1232896 | -| train/ | | -| approx_kl | 0.014225396 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 96310 | -| policy_gradient_loss | -0.012 | -| std | 0.048 | -| value_loss | 9.88e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9633 | -| time_elapsed | 56280 | -| total_timesteps | 1233024 | -| train/ | | -| approx_kl | 0.00075906515 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 96320 | -| policy_gradient_loss | 0.00683 | -| std | 0.048 | -| value_loss | 7e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9634 | -| time_elapsed | 56288 | -| total_timesteps | 1233152 | -| train/ | | -| approx_kl | 0.007070519 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -0.00414 | -| n_updates | 96330 | -| policy_gradient_loss | -0.00297 | -| std | 0.0479 | -| value_loss | 0.00133 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9635 | -| time_elapsed | 56292 | -| total_timesteps | 1233280 | -| train/ | | -| approx_kl | 0.011106202 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -7.92 | -| learning_rate | 0.0003 | -| loss | -0.000988 | -| n_updates | 96340 | -| policy_gradient_loss | -0.000976 | -| std | 0.0479 | -| value_loss | 5.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9636 | -| time_elapsed | 56294 | -| total_timesteps | 1233408 | -| train/ | | -| approx_kl | 0.008276791 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -16.2 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 96350 | -| policy_gradient_loss | -0.0159 | -| std | 0.0479 | -| value_loss | 3.42e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9637 | -| time_elapsed | 56297 | -| total_timesteps | 1233536 | -| train/ | | -| approx_kl | 0.00068260403 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -2.05 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 96360 | -| policy_gradient_loss | 0.0111 | -| std | 0.0479 | -| value_loss | 1.12e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9638 | -| time_elapsed | 56300 | -| total_timesteps | 1233664 | -| train/ | | -| approx_kl | 0.0054791 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.000296 | -| n_updates | 96370 | -| policy_gradient_loss | -9.58e-05 | -| std | 0.0478 | -| value_loss | 8.34e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9639 | -| time_elapsed | 56303 | -| total_timesteps | 1233792 | -| train/ | | -| approx_kl | 0.014634192 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.235 | -| learning_rate | 0.0003 | -| loss | 0.00698 | -| n_updates | 96380 | -| policy_gradient_loss | 0.0016 | -| std | 0.0478 | -| value_loss | 4.4e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 21 | -| iterations | 9640 | -| time_elapsed | 56306 | -| total_timesteps | 1233920 | -| train/ | | -| approx_kl | 0.0030417861 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | 0.00619 | -| learning_rate | 0.0003 | -| loss | -0.0059 | -| n_updates | 96390 | -| policy_gradient_loss | -0.00579 | -| std | 0.0478 | -| value_loss | 1.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9641 | -| time_elapsed | 56308 | -| total_timesteps | 1234048 | -| train/ | | -| approx_kl | 0.0037353388 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.00741 | -| n_updates | 96400 | -| policy_gradient_loss | 0.00382 | -| std | 0.0478 | -| value_loss | 6.35e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9642 | -| time_elapsed | 56314 | -| total_timesteps | 1234176 | -| train/ | | -| approx_kl | 0.012266897 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -4.14 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 96410 | -| policy_gradient_loss | -0.0132 | -| std | 0.0478 | -| value_loss | 0.00265 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9643 | -| time_elapsed | 56317 | -| total_timesteps | 1234304 | -| train/ | | -| approx_kl | 0.0019130716 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -62.7 | -| learning_rate | 0.0003 | -| loss | -0.00633 | -| n_updates | 96420 | -| policy_gradient_loss | -0.0108 | -| std | 0.0478 | -| value_loss | 5e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9644 | -| time_elapsed | 56320 | -| total_timesteps | 1234432 | -| train/ | | -| approx_kl | 0.0021488913 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -2.53e+03 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 96430 | -| policy_gradient_loss | -0.000909 | -| std | 0.0478 | -| value_loss | 2.38e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9645 | -| time_elapsed | 56323 | -| total_timesteps | 1234560 | -| train/ | | -| approx_kl | 0.00023926329 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 1.62 | -| explained_variance | -60.3 | -| learning_rate | 0.0003 | -| loss | -0.000166 | -| n_updates | 96440 | -| policy_gradient_loss | 0.000135 | -| std | 0.0476 | -| value_loss | 1.68e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9646 | -| time_elapsed | 56327 | -| total_timesteps | 1234688 | -| train/ | | -| approx_kl | 0.014544828 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.63 | -| explained_variance | -2.64 | -| learning_rate | 0.0003 | -| loss | 0.00235 | -| n_updates | 96450 | -| policy_gradient_loss | 0.000737 | -| std | 0.0476 | -| value_loss | 9.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9647 | -| time_elapsed | 56331 | -| total_timesteps | 1234816 | -| train/ | | -| approx_kl | 0.013974519 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 1.63 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.00163 | -| n_updates | 96460 | -| policy_gradient_loss | -0.000192 | -| std | 0.0474 | -| value_loss | 2.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 21 | -| iterations | 9648 | -| time_elapsed | 56334 | -| total_timesteps | 1234944 | -| train/ | | -| approx_kl | 0.0044488437 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.63 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 96470 | -| policy_gradient_loss | -0.00124 | -| std | 0.0472 | -| value_loss | 7.36e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9649 | -| time_elapsed | 56338 | -| total_timesteps | 1235072 | -| train/ | | -| approx_kl | 0.0002971557 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 1.63 | -| explained_variance | 0.00104 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 96480 | -| policy_gradient_loss | 0.00448 | -| std | 0.0472 | -| value_loss | 1.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9650 | -| time_elapsed | 56342 | -| total_timesteps | 1235200 | -| train/ | | -| approx_kl | 0.006620981 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | 0.726 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 96490 | -| policy_gradient_loss | -0.0135 | -| std | 0.0471 | -| value_loss | 0.000447 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9651 | -| time_elapsed | 56346 | -| total_timesteps | 1235328 | -| train/ | | -| approx_kl | 0.023045732 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -10.3 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 96500 | -| policy_gradient_loss | -0.0104 | -| std | 0.0471 | -| value_loss | 6.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9652 | -| time_elapsed | 56349 | -| total_timesteps | 1235456 | -| train/ | | -| approx_kl | 0.001638907 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -75.4 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 96510 | -| policy_gradient_loss | -0.00113 | -| std | 0.047 | -| value_loss | 4.87e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9653 | -| time_elapsed | 56353 | -| total_timesteps | 1235584 | -| train/ | | -| approx_kl | 0.00035665464 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 96520 | -| policy_gradient_loss | 0.00029 | -| std | 0.0469 | -| value_loss | 0.000116 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9654 | -| time_elapsed | 56356 | -| total_timesteps | 1235712 | -| train/ | | -| approx_kl | 4.2606145e-05 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | -0.000321 | -| n_updates | 96530 | -| policy_gradient_loss | 0.00237 | -| std | 0.0468 | -| value_loss | 7.33e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9655 | -| time_elapsed | 56358 | -| total_timesteps | 1235840 | -| train/ | | -| approx_kl | 0.0003691758 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.000285 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 96540 | -| policy_gradient_loss | -0.000165 | -| std | 0.0468 | -| value_loss | 7.71e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9656 | -| time_elapsed | 56361 | -| total_timesteps | 1235968 | -| train/ | | -| approx_kl | 0.00033314805 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.000969 | -| n_updates | 96550 | -| policy_gradient_loss | 0.000145 | -| std | 0.0468 | -| value_loss | 1.32e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9657 | -| time_elapsed | 56365 | -| total_timesteps | 1236096 | -| train/ | | -| approx_kl | 0.0026245993 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 96560 | -| policy_gradient_loss | -3.61e-06 | -| std | 0.0467 | -| value_loss | 8.28e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9658 | -| time_elapsed | 56373 | -| total_timesteps | 1236224 | -| train/ | | -| approx_kl | 0.012542641 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | 0.809 | -| learning_rate | 0.0003 | -| loss | 0.000582 | -| n_updates | 96570 | -| policy_gradient_loss | -0.000105 | -| std | 0.0467 | -| value_loss | 0.000965 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9659 | -| time_elapsed | 56377 | -| total_timesteps | 1236352 | -| train/ | | -| approx_kl | 0.013405524 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 96580 | -| policy_gradient_loss | -0.000816 | -| std | 0.0467 | -| value_loss | 0.000271 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9660 | -| time_elapsed | 56380 | -| total_timesteps | 1236480 | -| train/ | | -| approx_kl | 6.175181e-05 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | 0.0002 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 96590 | -| policy_gradient_loss | -0.000906 | -| std | 0.0467 | -| value_loss | 0.000369 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9661 | -| time_elapsed | 56384 | -| total_timesteps | 1236608 | -| train/ | | -| approx_kl | 0.004357582 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | -0.00671 | -| n_updates | 96600 | -| policy_gradient_loss | -0.00414 | -| std | 0.0467 | -| value_loss | 5.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9662 | -| time_elapsed | 56387 | -| total_timesteps | 1236736 | -| train/ | | -| approx_kl | 0.013225449 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0074 | -| learning_rate | 0.0003 | -| loss | 0.00606 | -| n_updates | 96610 | -| policy_gradient_loss | 0.00695 | -| std | 0.0467 | -| value_loss | 5.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9663 | -| time_elapsed | 56391 | -| total_timesteps | 1236864 | -| train/ | | -| approx_kl | 0.004562391 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 96620 | -| policy_gradient_loss | 0.00236 | -| std | 0.0467 | -| value_loss | 4.3e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 21 | -| iterations | 9664 | -| time_elapsed | 56394 | -| total_timesteps | 1236992 | -| train/ | | -| approx_kl | 0.0073455223 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.64 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 96630 | -| policy_gradient_loss | -0.00686 | -| std | 0.0467 | -| value_loss | 1.42e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9665 | -| time_elapsed | 56397 | -| total_timesteps | 1237120 | -| train/ | | -| approx_kl | 0.006091059 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 96640 | -| policy_gradient_loss | 0.000706 | -| std | 0.0467 | -| value_loss | 1.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9666 | -| time_elapsed | 56406 | -| total_timesteps | 1237248 | -| train/ | | -| approx_kl | 0.015235808 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | 0.723 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 96650 | -| policy_gradient_loss | -0.0148 | -| std | 0.0467 | -| value_loss | 0.000417 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9667 | -| time_elapsed | 56410 | -| total_timesteps | 1237376 | -| train/ | | -| approx_kl | 0.00446876 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | 0.00552 | -| n_updates | 96660 | -| policy_gradient_loss | 0.0034 | -| std | 0.0466 | -| value_loss | 7.12e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9668 | -| time_elapsed | 56413 | -| total_timesteps | 1237504 | -| train/ | | -| approx_kl | 0.0024341391 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -0.00858 | -| n_updates | 96670 | -| policy_gradient_loss | -0.00727 | -| std | 0.0466 | -| value_loss | 0.000102 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9669 | -| time_elapsed | 56416 | -| total_timesteps | 1237632 | -| train/ | | -| approx_kl | 0.0039545805 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 96680 | -| policy_gradient_loss | 0.0039 | -| std | 0.0466 | -| value_loss | 7.48e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9670 | -| time_elapsed | 56419 | -| total_timesteps | 1237760 | -| train/ | | -| approx_kl | 0.009115736 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 96690 | -| policy_gradient_loss | -0.0155 | -| std | 0.0466 | -| value_loss | 7.83e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 21 | -| iterations | 9671 | -| time_elapsed | 56422 | -| total_timesteps | 1237888 | -| train/ | | -| approx_kl | 2.8352253e-05 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.000189 | -| n_updates | 96700 | -| policy_gradient_loss | 0.00616 | -| std | 0.0466 | -| value_loss | 3.52e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9672 | -| time_elapsed | 56424 | -| total_timesteps | 1238016 | -| train/ | | -| approx_kl | 0.002863333 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 96710 | -| policy_gradient_loss | -0.00615 | -| std | 0.0466 | -| value_loss | 4.44e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9673 | -| time_elapsed | 56433 | -| total_timesteps | 1238144 | -| train/ | | -| approx_kl | 0.022250462 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 96720 | -| policy_gradient_loss | -0.016 | -| std | 0.0465 | -| value_loss | 0.000332 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9674 | -| time_elapsed | 56436 | -| total_timesteps | 1238272 | -| train/ | | -| approx_kl | 0.0047019175 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 96730 | -| policy_gradient_loss | -0.00503 | -| std | 0.0465 | -| value_loss | 0.000124 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9675 | -| time_elapsed | 56440 | -| total_timesteps | 1238400 | -| train/ | | -| approx_kl | 0.007898231 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.258 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 96740 | -| policy_gradient_loss | -0.00449 | -| std | 0.0465 | -| value_loss | 2.77e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9676 | -| time_elapsed | 56443 | -| total_timesteps | 1238528 | -| train/ | | -| approx_kl | 0.0075533125 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 96750 | -| policy_gradient_loss | -0.000342 | -| std | 0.0465 | -| value_loss | 7.88e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9677 | -| time_elapsed | 56446 | -| total_timesteps | 1238656 | -| train/ | | -| approx_kl | 0.0002783467 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | -0.000562 | -| n_updates | 96760 | -| policy_gradient_loss | 0.00133 | -| std | 0.0465 | -| value_loss | 7.74e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9678 | -| time_elapsed | 56449 | -| total_timesteps | 1238784 | -| train/ | | -| approx_kl | 1.2286473e-05 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.00831 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 96770 | -| policy_gradient_loss | 0.00119 | -| std | 0.0465 | -| value_loss | 9.98e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 21 | -| iterations | 9679 | -| time_elapsed | 56452 | -| total_timesteps | 1238912 | -| train/ | | -| approx_kl | 0.00011160318 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | 0.00225 | -| learning_rate | 0.0003 | -| loss | 0.000834 | -| n_updates | 96780 | -| policy_gradient_loss | 0.00361 | -| std | 0.0464 | -| value_loss | 3.33e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9680 | -| time_elapsed | 56454 | -| total_timesteps | 1239040 | -| train/ | | -| approx_kl | 0.011743986 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 96790 | -| policy_gradient_loss | -0.000411 | -| std | 0.0465 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9681 | -| time_elapsed | 56460 | -| total_timesteps | 1239168 | -| train/ | | -| approx_kl | 0.007681193 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.000121 | -| n_updates | 96800 | -| policy_gradient_loss | -0.00154 | -| std | 0.0464 | -| value_loss | 0.00449 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9682 | -| time_elapsed | 56464 | -| total_timesteps | 1239296 | -| train/ | | -| approx_kl | 0.0016148891 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 96810 | -| policy_gradient_loss | -0.00255 | -| std | 0.0464 | -| value_loss | 2.14e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9683 | -| time_elapsed | 56467 | -| total_timesteps | 1239424 | -| train/ | | -| approx_kl | 0.080492824 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -82.8 | -| learning_rate | 0.0003 | -| loss | -0.00897 | -| n_updates | 96820 | -| policy_gradient_loss | -0.00665 | -| std | 0.0464 | -| value_loss | 1.09e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9684 | -| time_elapsed | 56471 | -| total_timesteps | 1239552 | -| train/ | | -| approx_kl | 0.1959174 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -184 | -| learning_rate | 0.0003 | -| loss | 0.000524 | -| n_updates | 96830 | -| policy_gradient_loss | -0.00328 | -| std | 0.0464 | -| value_loss | 6.03e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9685 | -| time_elapsed | 56474 | -| total_timesteps | 1239680 | -| train/ | | -| approx_kl | 0.0075973975 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 96840 | -| policy_gradient_loss | -0.016 | -| std | 0.0465 | -| value_loss | 2.73e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9686 | -| time_elapsed | 56478 | -| total_timesteps | 1239808 | -| train/ | | -| approx_kl | 0.0010207226 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.068 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 96850 | -| policy_gradient_loss | -0.00542 | -| std | 0.0465 | -| value_loss | 4.31e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 21 | -| iterations | 9687 | -| time_elapsed | 56482 | -| total_timesteps | 1239936 | -| train/ | | -| approx_kl | 0.0050228573 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | 0.00251 | -| learning_rate | 0.0003 | -| loss | -0.000282 | -| n_updates | 96860 | -| policy_gradient_loss | -0.000153 | -| std | 0.0465 | -| value_loss | 6.54e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9688 | -| time_elapsed | 56486 | -| total_timesteps | 1240064 | -| train/ | | -| approx_kl | 0.001046787 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.00764 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 96870 | -| policy_gradient_loss | -0.00982 | -| std | 0.0465 | -| value_loss | 8.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9689 | -| time_elapsed | 56492 | -| total_timesteps | 1240192 | -| train/ | | -| approx_kl | 0.03882136 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | 0.601 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 96880 | -| policy_gradient_loss | -0.0142 | -| std | 0.0465 | -| value_loss | 0.000723 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9690 | -| time_elapsed | 56494 | -| total_timesteps | 1240320 | -| train/ | | -| approx_kl | 0.0045520603 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -2.96 | -| learning_rate | 0.0003 | -| loss | -0.00623 | -| n_updates | 96890 | -| policy_gradient_loss | -0.00332 | -| std | 0.0465 | -| value_loss | 2.79e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9691 | -| time_elapsed | 56497 | -| total_timesteps | 1240448 | -| train/ | | -| approx_kl | 0.0069845663 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -4.54 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 96900 | -| policy_gradient_loss | -0.0127 | -| std | 0.0465 | -| value_loss | 2.49e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9692 | -| time_elapsed | 56500 | -| total_timesteps | 1240576 | -| train/ | | -| approx_kl | 0.006150837 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.808 | -| learning_rate | 0.0003 | -| loss | -0.000225 | -| n_updates | 96910 | -| policy_gradient_loss | -0.000257 | -| std | 0.0464 | -| value_loss | 1.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9693 | -| time_elapsed | 56502 | -| total_timesteps | 1240704 | -| train/ | | -| approx_kl | 0.006951053 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0888 | -| learning_rate | 0.0003 | -| loss | 0.000655 | -| n_updates | 96920 | -| policy_gradient_loss | 0.00404 | -| std | 0.0463 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9694 | -| time_elapsed | 56505 | -| total_timesteps | 1240832 | -| train/ | | -| approx_kl | 0.002444394 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 1.65 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 96930 | -| policy_gradient_loss | -0.00113 | -| std | 0.0463 | -| value_loss | 3.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 21 | -| iterations | 9695 | -| time_elapsed | 56509 | -| total_timesteps | 1240960 | -| train/ | | -| approx_kl | 0.025417225 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -54.8 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 96940 | -| policy_gradient_loss | -0.00247 | -| std | 0.0462 | -| value_loss | 8.64e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9696 | -| time_elapsed | 56512 | -| total_timesteps | 1241088 | -| train/ | | -| approx_kl | 0.00010313047 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -0.0966 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 96950 | -| policy_gradient_loss | -0.00112 | -| std | 0.0462 | -| value_loss | 7.22e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9697 | -| time_elapsed | 56518 | -| total_timesteps | 1241216 | -| train/ | | -| approx_kl | 0.023203325 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 96960 | -| policy_gradient_loss | -0.0161 | -| std | 0.0461 | -| value_loss | 0.00121 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9698 | -| time_elapsed | 56521 | -| total_timesteps | 1241344 | -| train/ | | -| approx_kl | 0.004127624 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -811 | -| learning_rate | 0.0003 | -| loss | -0.00627 | -| n_updates | 96970 | -| policy_gradient_loss | -0.00684 | -| std | 0.0461 | -| value_loss | 3.54e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9699 | -| time_elapsed | 56525 | -| total_timesteps | 1241472 | -| train/ | | -| approx_kl | 0.0028880136 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -1.03e+04 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 96980 | -| policy_gradient_loss | -0.000743 | -| std | 0.046 | -| value_loss | 3.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9700 | -| time_elapsed | 56528 | -| total_timesteps | 1241600 | -| train/ | | -| approx_kl | 0.009557441 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -7.73 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 96990 | -| policy_gradient_loss | -0.00854 | -| std | 0.0459 | -| value_loss | 2.12e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9701 | -| time_elapsed | 56531 | -| total_timesteps | 1241728 | -| train/ | | -| approx_kl | 0.00037218863 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 97000 | -| policy_gradient_loss | -0.00835 | -| std | 0.0459 | -| value_loss | 5.22e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9702 | -| time_elapsed | 56533 | -| total_timesteps | 1241856 | -| train/ | | -| approx_kl | 0.00010682177 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.00169 | -| n_updates | 97010 | -| policy_gradient_loss | -0.00476 | -| std | 0.0459 | -| value_loss | 1.87e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 21 | -| iterations | 9703 | -| time_elapsed | 56536 | -| total_timesteps | 1241984 | -| train/ | | -| approx_kl | 0.01206248 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -0.0092 | -| learning_rate | 0.0003 | -| loss | -0.00638 | -| n_updates | 97020 | -| policy_gradient_loss | -0.0047 | -| std | 0.0458 | -| value_loss | 1.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9704 | -| time_elapsed | 56540 | -| total_timesteps | 1242112 | -| train/ | | -| approx_kl | 0.000857871 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 97030 | -| policy_gradient_loss | -0.00527 | -| std | 0.0458 | -| value_loss | 1.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9705 | -| time_elapsed | 56548 | -| total_timesteps | 1242240 | -| train/ | | -| approx_kl | 0.021253217 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 97040 | -| policy_gradient_loss | -0.0159 | -| std | 0.0458 | -| value_loss | 0.00022 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9706 | -| time_elapsed | 56552 | -| total_timesteps | 1242368 | -| train/ | | -| approx_kl | 8.081412e-05 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.66 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | 0.000654 | -| n_updates | 97050 | -| policy_gradient_loss | -0.000554 | -| std | 0.0458 | -| value_loss | 1.3e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9707 | -| time_elapsed | 56555 | -| total_timesteps | 1242496 | -| train/ | | -| approx_kl | 3.0168798e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.67 | -| explained_variance | -2.62 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 97060 | -| policy_gradient_loss | -0.000188 | -| std | 0.0455 | -| value_loss | 7.55e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9708 | -| time_elapsed | 56559 | -| total_timesteps | 1242624 | -| train/ | | -| approx_kl | 0.014784739 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 1.67 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 97070 | -| policy_gradient_loss | -0.00737 | -| std | 0.0453 | -| value_loss | 2.27e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9709 | -| time_elapsed | 56563 | -| total_timesteps | 1242752 | -| train/ | | -| approx_kl | 0.0070446227 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 97080 | -| policy_gradient_loss | -0.00155 | -| std | 0.0452 | -| value_loss | 4.64e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 21 | -| iterations | 9710 | -| time_elapsed | 56566 | -| total_timesteps | 1242880 | -| train/ | | -| approx_kl | 0.003950285 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.00303 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 97090 | -| policy_gradient_loss | -0.00715 | -| std | 0.0452 | -| value_loss | 1.9e-08 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9711 | -| time_elapsed | 56570 | -| total_timesteps | 1243008 | -| train/ | | -| approx_kl | 0.000116376206 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.000659 | -| n_updates | 97100 | -| policy_gradient_loss | 0.000661 | -| std | 0.0452 | -| value_loss | 1.87e-08 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9712 | -| time_elapsed | 56579 | -| total_timesteps | 1243136 | -| train/ | | -| approx_kl | 0.11349402 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 97110 | -| policy_gradient_loss | -0.0154 | -| std | 0.0452 | -| value_loss | 3.52e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9713 | -| time_elapsed | 56582 | -| total_timesteps | 1243264 | -| train/ | | -| approx_kl | 0.0076171467 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0499 | -| learning_rate | 0.0003 | -| loss | -0.0279 | -| n_updates | 97120 | -| policy_gradient_loss | -0.0206 | -| std | 0.0452 | -| value_loss | 6.99e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9714 | -| time_elapsed | 56586 | -| total_timesteps | 1243392 | -| train/ | | -| approx_kl | 0.020773023 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 97130 | -| policy_gradient_loss | 0.00526 | -| std | 0.0453 | -| value_loss | 2.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9715 | -| time_elapsed | 56589 | -| total_timesteps | 1243520 | -| train/ | | -| approx_kl | 0.009485571 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.00182 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 97140 | -| policy_gradient_loss | 0.0021 | -| std | 0.0453 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9716 | -| time_elapsed | 56592 | -| total_timesteps | 1243648 | -| train/ | | -| approx_kl | 0.006517032 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.00322 | -| n_updates | 97150 | -| policy_gradient_loss | 0.00595 | -| std | 0.0452 | -| value_loss | 3.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9717 | -| time_elapsed | 56595 | -| total_timesteps | 1243776 | -| train/ | | -| approx_kl | 0.0078114695 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | 0.00102 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 97160 | -| policy_gradient_loss | -0.00931 | -| std | 0.0452 | -| value_loss | 8.97e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 21 | -| iterations | 9718 | -| time_elapsed | 56598 | -| total_timesteps | 1243904 | -| train/ | | -| approx_kl | 3.9748847e-06 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -6.62e-05 | -| n_updates | 97170 | -| policy_gradient_loss | 0.00272 | -| std | 0.0452 | -| value_loss | 3.37e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9719 | -| time_elapsed | 56602 | -| total_timesteps | 1244032 | -| train/ | | -| approx_kl | 0.0043759136 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 97180 | -| policy_gradient_loss | -0.00135 | -| std | 0.0451 | -| value_loss | 1.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9720 | -| time_elapsed | 56610 | -| total_timesteps | 1244160 | -| train/ | | -| approx_kl | 0.001438552 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | 0.694 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 97190 | -| policy_gradient_loss | 0.000566 | -| std | 0.0451 | -| value_loss | 0.0047 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9721 | -| time_elapsed | 56614 | -| total_timesteps | 1244288 | -| train/ | | -| approx_kl | 0.0077626845 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | 0.241 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 97200 | -| policy_gradient_loss | -0.00492 | -| std | 0.0451 | -| value_loss | 1.02e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9722 | -| time_elapsed | 56617 | -| total_timesteps | 1244416 | -| train/ | | -| approx_kl | 0.0022224654 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 97210 | -| policy_gradient_loss | 0.000393 | -| std | 0.045 | -| value_loss | 2.76e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9723 | -| time_elapsed | 56620 | -| total_timesteps | 1244544 | -| train/ | | -| approx_kl | 0.0011161868 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.405 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 97220 | -| policy_gradient_loss | 0.0004 | -| std | 0.045 | -| value_loss | 6.31e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9724 | -| time_elapsed | 56624 | -| total_timesteps | 1244672 | -| train/ | | -| approx_kl | 1.4498364e-05 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.000699 | -| n_updates | 97230 | -| policy_gradient_loss | 0.000796 | -| std | 0.045 | -| value_loss | 2.19e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9725 | -| time_elapsed | 56628 | -| total_timesteps | 1244800 | -| train/ | | -| approx_kl | 0.00019788928 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | -0.000971 | -| n_updates | 97240 | -| policy_gradient_loss | 0.00012 | -| std | 0.0449 | -| value_loss | 1.34e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.834 | -| time/ | | -| fps | 21 | -| iterations | 9726 | -| time_elapsed | 56631 | -| total_timesteps | 1244928 | -| train/ | | -| approx_kl | 0.0114632975 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 97250 | -| policy_gradient_loss | -0.00775 | -| std | 0.0449 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9727 | -| time_elapsed | 56636 | -| total_timesteps | 1245056 | -| train/ | | -| approx_kl | 0.015743382 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 97260 | -| policy_gradient_loss | -0.00434 | -| std | 0.0449 | -| value_loss | 8.82e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9728 | -| time_elapsed | 56642 | -| total_timesteps | 1245184 | -| train/ | | -| approx_kl | 0.0382618 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 97270 | -| policy_gradient_loss | -0.00857 | -| std | 0.0449 | -| value_loss | 0.0004 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9729 | -| time_elapsed | 56646 | -| total_timesteps | 1245312 | -| train/ | | -| approx_kl | 0.0015372043 | -| clip_fraction | 0.00625 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 97280 | -| policy_gradient_loss | -0.000903 | -| std | 0.0449 | -| value_loss | 3.66e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9730 | -| time_elapsed | 56649 | -| total_timesteps | 1245440 | -| train/ | | -| approx_kl | 0.005183007 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 97290 | -| policy_gradient_loss | -0.00617 | -| std | 0.0449 | -| value_loss | 4.06e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9731 | -| time_elapsed | 56651 | -| total_timesteps | 1245568 | -| train/ | | -| approx_kl | 6.5667555e-06 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 4.79e-05 | -| n_updates | 97300 | -| policy_gradient_loss | 0.000527 | -| std | 0.0448 | -| value_loss | 1.59e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9732 | -| time_elapsed | 56655 | -| total_timesteps | 1245696 | -| train/ | | -| approx_kl | 0.018251095 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.00571 | -| learning_rate | 0.0003 | -| loss | -7.07e-06 | -| n_updates | 97310 | -| policy_gradient_loss | -0.00174 | -| std | 0.0448 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9733 | -| time_elapsed | 56660 | -| total_timesteps | 1245824 | -| train/ | | -| approx_kl | 0.0022388268 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.00409 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 97320 | -| policy_gradient_loss | -0.000149 | -| std | 0.0447 | -| value_loss | 2.39e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 21 | -| iterations | 9734 | -| time_elapsed | 56663 | -| total_timesteps | 1245952 | -| train/ | | -| approx_kl | 0.0018838518 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.000922 | -| n_updates | 97330 | -| policy_gradient_loss | -0.000341 | -| std | 0.0448 | -| value_loss | 1.93e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9735 | -| time_elapsed | 56667 | -| total_timesteps | 1246080 | -| train/ | | -| approx_kl | 3.0859374e-06 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.000335 | -| learning_rate | 0.0003 | -| loss | -2.75e-05 | -| n_updates | 97340 | -| policy_gradient_loss | 0.00677 | -| std | 0.0448 | -| value_loss | 8.28e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9736 | -| time_elapsed | 56674 | -| total_timesteps | 1246208 | -| train/ | | -| approx_kl | 0.00051211845 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | 0.699 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 97350 | -| policy_gradient_loss | -0.00949 | -| std | 0.0448 | -| value_loss | 0.00504 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9737 | -| time_elapsed | 56679 | -| total_timesteps | 1246336 | -| train/ | | -| approx_kl | 0.004394777 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -3.65 | -| learning_rate | 0.0003 | -| loss | -0.00961 | -| n_updates | 97360 | -| policy_gradient_loss | -0.00741 | -| std | 0.0447 | -| value_loss | 0.000181 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9738 | -| time_elapsed | 56683 | -| total_timesteps | 1246464 | -| train/ | | -| approx_kl | 0.005913575 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -428 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 97370 | -| policy_gradient_loss | -0.00604 | -| std | 0.0447 | -| value_loss | 5.69e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9739 | -| time_elapsed | 56686 | -| total_timesteps | 1246592 | -| train/ | | -| approx_kl | 0.004538966 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -215 | -| learning_rate | 0.0003 | -| loss | -0.00808 | -| n_updates | 97380 | -| policy_gradient_loss | -0.00806 | -| std | 0.0447 | -| value_loss | 1.59e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9740 | -| time_elapsed | 56689 | -| total_timesteps | 1246720 | -| train/ | | -| approx_kl | 0.010922988 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -32 | -| learning_rate | 0.0003 | -| loss | 0.000604 | -| n_updates | 97390 | -| policy_gradient_loss | 7.55e-05 | -| std | 0.0448 | -| value_loss | 3.15e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9741 | -| time_elapsed | 56691 | -| total_timesteps | 1246848 | -| train/ | | -| approx_kl | 0.0012507187 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.425 | -| learning_rate | 0.0003 | -| loss | -0.000546 | -| n_updates | 97400 | -| policy_gradient_loss | -0.000524 | -| std | 0.0448 | -| value_loss | 1.78e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 21 | -| iterations | 9742 | -| time_elapsed | 56695 | -| total_timesteps | 1246976 | -| train/ | | -| approx_kl | 0.0062291254 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | 0.00229 | -| learning_rate | 0.0003 | -| loss | -0.000272 | -| n_updates | 97410 | -| policy_gradient_loss | 0.00223 | -| std | 0.0448 | -| value_loss | 8.84e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9743 | -| time_elapsed | 56698 | -| total_timesteps | 1247104 | -| train/ | | -| approx_kl | 0.014437029 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.00166 | -| learning_rate | 0.0003 | -| loss | 0.00743 | -| n_updates | 97420 | -| policy_gradient_loss | 0.00145 | -| std | 0.0448 | -| value_loss | 3.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9744 | -| time_elapsed | 56706 | -| total_timesteps | 1247232 | -| train/ | | -| approx_kl | 0.19796596 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 97430 | -| policy_gradient_loss | -0.0162 | -| std | 0.0447 | -| value_loss | 0.00275 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9745 | -| time_elapsed | 56709 | -| total_timesteps | 1247360 | -| train/ | | -| approx_kl | 0.003067019 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 97440 | -| policy_gradient_loss | -0.00498 | -| std | 0.0447 | -| value_loss | 9.87e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9746 | -| time_elapsed | 56712 | -| total_timesteps | 1247488 | -| train/ | | -| approx_kl | 0.07401426 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -24.8 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 97450 | -| policy_gradient_loss | -0.00947 | -| std | 0.0447 | -| value_loss | 2.54e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9747 | -| time_elapsed | 56716 | -| total_timesteps | 1247616 | -| train/ | | -| approx_kl | 0.05468869 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -2.62 | -| learning_rate | 0.0003 | -| loss | 0.0033 | -| n_updates | 97460 | -| policy_gradient_loss | 0.000874 | -| std | 0.0447 | -| value_loss | 2.7e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9748 | -| time_elapsed | 56719 | -| total_timesteps | 1247744 | -| train/ | | -| approx_kl | 0.009250148 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00289 | -| n_updates | 97470 | -| policy_gradient_loss | -0.00189 | -| std | 0.0447 | -| value_loss | 3.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 21 | -| iterations | 9749 | -| time_elapsed | 56723 | -| total_timesteps | 1247872 | -| train/ | | -| approx_kl | 0.004947562 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 97480 | -| policy_gradient_loss | -0.0102 | -| std | 0.0447 | -| value_loss | 2.3e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9750 | -| time_elapsed | 56726 | -| total_timesteps | 1248000 | -| train/ | | -| approx_kl | 0.0037034773 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.00844 | -| n_updates | 97490 | -| policy_gradient_loss | 0.00543 | -| std | 0.0447 | -| value_loss | 9.78e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9751 | -| time_elapsed | 56730 | -| total_timesteps | 1248128 | -| train/ | | -| approx_kl | 0.0024505062 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | 0.00238 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 97500 | -| policy_gradient_loss | -0.00927 | -| std | 0.0447 | -| value_loss | 3.25e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9752 | -| time_elapsed | 56737 | -| total_timesteps | 1248256 | -| train/ | | -| approx_kl | 0.016991306 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 97510 | -| policy_gradient_loss | -0.0125 | -| std | 0.0447 | -| value_loss | 0.000536 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9753 | -| time_elapsed | 56740 | -| total_timesteps | 1248384 | -| train/ | | -| approx_kl | 0.014986702 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -182 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 97520 | -| policy_gradient_loss | -0.011 | -| std | 0.0447 | -| value_loss | 6.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9754 | -| time_elapsed | 56743 | -| total_timesteps | 1248512 | -| train/ | | -| approx_kl | 0.053885344 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -5.74 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 97530 | -| policy_gradient_loss | 0.00552 | -| std | 0.0447 | -| value_loss | 1.37e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9755 | -| time_elapsed | 56747 | -| total_timesteps | 1248640 | -| train/ | | -| approx_kl | 0.0238842 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -13.3 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 97540 | -| policy_gradient_loss | 0.000929 | -| std | 0.0448 | -| value_loss | 8.71e-09 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9756 | -| time_elapsed | 56751 | -| total_timesteps | 1248768 | -| train/ | | -| approx_kl | 0.0043007242 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.345 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 97550 | -| policy_gradient_loss | -0.00262 | -| std | 0.0448 | -| value_loss | 2.08e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 22 | -| iterations | 9757 | -| time_elapsed | 56754 | -| total_timesteps | 1248896 | -| train/ | | -| approx_kl | 0.005907361 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.00173 | -| n_updates | 97560 | -| policy_gradient_loss | 0.000318 | -| std | 0.0449 | -| value_loss | 9.02e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9758 | -| time_elapsed | 56759 | -| total_timesteps | 1249024 | -| train/ | | -| approx_kl | 0.0025838488 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 97570 | -| policy_gradient_loss | -0.00174 | -| std | 0.0449 | -| value_loss | 2.09e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9759 | -| time_elapsed | 56768 | -| total_timesteps | 1249152 | -| train/ | | -| approx_kl | 0.08109435 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -11.7 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 97580 | -| policy_gradient_loss | -0.0156 | -| std | 0.0449 | -| value_loss | 0.00469 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9760 | -| time_elapsed | 56772 | -| total_timesteps | 1249280 | -| train/ | | -| approx_kl | 0.00026160432 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -24.2 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 97590 | -| policy_gradient_loss | -0.0105 | -| std | 0.0449 | -| value_loss | 8.77e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9761 | -| time_elapsed | 56776 | -| total_timesteps | 1249408 | -| train/ | | -| approx_kl | 0.006228685 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 1.68 | -| explained_variance | -535 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 97600 | -| policy_gradient_loss | -0.00375 | -| std | 0.0449 | -| value_loss | 5.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9762 | -| time_elapsed | 56779 | -| total_timesteps | 1249536 | -| train/ | | -| approx_kl | 0.013469527 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -100 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 97610 | -| policy_gradient_loss | -0.00215 | -| std | 0.0448 | -| value_loss | 1.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9763 | -| time_elapsed | 56783 | -| total_timesteps | 1249664 | -| train/ | | -| approx_kl | 0.006592118 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -51.6 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 97620 | -| policy_gradient_loss | -0.00941 | -| std | 0.0447 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9764 | -| time_elapsed | 56786 | -| total_timesteps | 1249792 | -| train/ | | -| approx_kl | 0.0046368404 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | 0.000303 | -| n_updates | 97630 | -| policy_gradient_loss | 0.00202 | -| std | 0.0447 | -| value_loss | 1.14e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9765 | -| time_elapsed | 56790 | -| total_timesteps | 1249920 | -| train/ | | -| approx_kl | 0.0007137903 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 97640 | -| policy_gradient_loss | -0.00202 | -| std | 0.0446 | -| value_loss | 2.04e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9766 | -| time_elapsed | 56793 | -| total_timesteps | 1250048 | -| train/ | | -| approx_kl | 0.00037916936 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 97650 | -| policy_gradient_loss | -0.000395 | -| std | 0.0445 | -| value_loss | 3.51e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9767 | -| time_elapsed | 56801 | -| total_timesteps | 1250176 | -| train/ | | -| approx_kl | 0.0033973642 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | 0.826 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 97660 | -| policy_gradient_loss | 0.000565 | -| std | 0.0444 | -| value_loss | 0.00263 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9768 | -| time_elapsed | 56805 | -| total_timesteps | 1250304 | -| train/ | | -| approx_kl | 0.016613536 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -1.96 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 97670 | -| policy_gradient_loss | 0.00459 | -| std | 0.0445 | -| value_loss | 1.28e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9769 | -| time_elapsed | 56808 | -| total_timesteps | 1250432 | -| train/ | | -| approx_kl | 0.01929184 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -6.69 | -| learning_rate | 0.0003 | -| loss | -0.000869 | -| n_updates | 97680 | -| policy_gradient_loss | 0.000828 | -| std | 0.0446 | -| value_loss | 4.42e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9770 | -| time_elapsed | 56812 | -| total_timesteps | 1250560 | -| train/ | | -| approx_kl | 0.012485171 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | 0.00653 | -| n_updates | 97690 | -| policy_gradient_loss | 0.00633 | -| std | 0.0445 | -| value_loss | 7.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9771 | -| time_elapsed | 56816 | -| total_timesteps | 1250688 | -| train/ | | -| approx_kl | 0.003482602 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -13.6 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 97700 | -| policy_gradient_loss | -0.0123 | -| std | 0.0445 | -| value_loss | 5.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9772 | -| time_elapsed | 56818 | -| total_timesteps | 1250816 | -| train/ | | -| approx_kl | 0.009257073 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 1.69 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | 0.000148 | -| n_updates | 97710 | -| policy_gradient_loss | -0.000794 | -| std | 0.0445 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9773 | -| time_elapsed | 56822 | -| total_timesteps | 1250944 | -| train/ | | -| approx_kl | 0.006771229 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0867 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 97720 | -| policy_gradient_loss | -0.00136 | -| std | 0.0444 | -| value_loss | 4.21e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9774 | -| time_elapsed | 56826 | -| total_timesteps | 1251072 | -| train/ | | -| approx_kl | 0.00079899654 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 97730 | -| policy_gradient_loss | -0.000508 | -| std | 0.0444 | -| value_loss | 3.17e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9775 | -| time_elapsed | 56832 | -| total_timesteps | 1251200 | -| train/ | | -| approx_kl | 0.028059835 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | 0.863 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 97740 | -| policy_gradient_loss | -0.00298 | -| std | 0.0444 | -| value_loss | 0.00197 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9776 | -| time_elapsed | 56835 | -| total_timesteps | 1251328 | -| train/ | | -| approx_kl | 4.6310946e-05 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 97750 | -| policy_gradient_loss | -0.00448 | -| std | 0.0444 | -| value_loss | 1.17e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9777 | -| time_elapsed | 56839 | -| total_timesteps | 1251456 | -| train/ | | -| approx_kl | 0.00816397 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | -0.0253 | -| n_updates | 97760 | -| policy_gradient_loss | -0.0178 | -| std | 0.0444 | -| value_loss | 0.000107 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9778 | -| time_elapsed | 56843 | -| total_timesteps | 1251584 | -| train/ | | -| approx_kl | 0.005472877 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0998 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 97770 | -| policy_gradient_loss | -0.00065 | -| std | 0.0443 | -| value_loss | 2.63e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9779 | -| time_elapsed | 56847 | -| total_timesteps | 1251712 | -| train/ | | -| approx_kl | 0.0057217185 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -9.15 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 97780 | -| policy_gradient_loss | -0.000732 | -| std | 0.0443 | -| value_loss | 0.00118 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9780 | -| time_elapsed | 56850 | -| total_timesteps | 1251840 | -| train/ | | -| approx_kl | 0.010412018 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 97790 | -| policy_gradient_loss | -0.000205 | -| std | 0.0443 | -| value_loss | 0.00351 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 22 | -| iterations | 9781 | -| time_elapsed | 56853 | -| total_timesteps | 1251968 | -| train/ | | -| approx_kl | 0.0052298973 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -7.02e-05 | -| n_updates | 97800 | -| policy_gradient_loss | 0.000337 | -| std | 0.0442 | -| value_loss | 0.000253 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9782 | -| time_elapsed | 56857 | -| total_timesteps | 1252096 | -| train/ | | -| approx_kl | 0.00048478087 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.00577 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 97810 | -| policy_gradient_loss | 0.00126 | -| std | 0.0442 | -| value_loss | 1.7e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9783 | -| time_elapsed | 56865 | -| total_timesteps | 1252224 | -| train/ | | -| approx_kl | 0.013719343 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | 0.804 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 97820 | -| policy_gradient_loss | -0.0121 | -| std | 0.0442 | -| value_loss | 0.000557 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9784 | -| time_elapsed | 56869 | -| total_timesteps | 1252352 | -| train/ | | -| approx_kl | 0.00014788099 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.00662 | -| learning_rate | 0.0003 | -| loss | 0.000122 | -| n_updates | 97830 | -| policy_gradient_loss | 0.00401 | -| std | 0.0442 | -| value_loss | 1.79e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9785 | -| time_elapsed | 56872 | -| total_timesteps | 1252480 | -| train/ | | -| approx_kl | 0.00019230787 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | 0.0029 | -| learning_rate | 0.0003 | -| loss | -0.000294 | -| n_updates | 97840 | -| policy_gradient_loss | 0.00072 | -| std | 0.0443 | -| value_loss | 2.39e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9786 | -| time_elapsed | 56876 | -| total_timesteps | 1252608 | -| train/ | | -| approx_kl | 0.0002250555 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.00419 | -| n_updates | 97850 | -| policy_gradient_loss | -0.00989 | -| std | 0.0443 | -| value_loss | 3.38e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9787 | -| time_elapsed | 56879 | -| total_timesteps | 1252736 | -| train/ | | -| approx_kl | 8.288771e-07 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | 0.00208 | -| learning_rate | 0.0003 | -| loss | 0.000188 | -| n_updates | 97860 | -| policy_gradient_loss | -0.00701 | -| std | 0.0443 | -| value_loss | 3.57e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9788 | -| time_elapsed | 56883 | -| total_timesteps | 1252864 | -| train/ | | -| approx_kl | 1.6852282e-05 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 97870 | -| policy_gradient_loss | -0.0116 | -| std | 0.0443 | -| value_loss | 2.88e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 22 | -| iterations | 9789 | -| time_elapsed | 56887 | -| total_timesteps | 1252992 | -| train/ | | -| approx_kl | 0.0010866057 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 97880 | -| policy_gradient_loss | -0.000222 | -| std | 0.0443 | -| value_loss | 1.5e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9790 | -| time_elapsed | 56892 | -| total_timesteps | 1253120 | -| train/ | | -| approx_kl | 0.00841593 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 97890 | -| policy_gradient_loss | -0.00432 | -| std | 0.0443 | -| value_loss | 1.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9791 | -| time_elapsed | 56899 | -| total_timesteps | 1253248 | -| train/ | | -| approx_kl | 0.073084645 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 97900 | -| policy_gradient_loss | -0.0131 | -| std | 0.0443 | -| value_loss | 0.000623 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9792 | -| time_elapsed | 56902 | -| total_timesteps | 1253376 | -| train/ | | -| approx_kl | 0.0003936314 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 1.7 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 97910 | -| policy_gradient_loss | -0.000859 | -| std | 0.044 | -| value_loss | 5.04e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9793 | -| time_elapsed | 56906 | -| total_timesteps | 1253504 | -| train/ | | -| approx_kl | 0.00035347044 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 1.71 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 97920 | -| policy_gradient_loss | -0.000349 | -| std | 0.0438 | -| value_loss | 1.52e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9794 | -| time_elapsed | 56909 | -| total_timesteps | 1253632 | -| train/ | | -| approx_kl | 0.0007052105 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 1.71 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.000449 | -| n_updates | 97930 | -| policy_gradient_loss | 0.00109 | -| std | 0.0437 | -| value_loss | 2.32e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9795 | -| time_elapsed | 56912 | -| total_timesteps | 1253760 | -| train/ | | -| approx_kl | 0.007903352 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.71 | -| explained_variance | 0.00369 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 97940 | -| policy_gradient_loss | -0.00424 | -| std | 0.0436 | -| value_loss | 8.76e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 22 | -| iterations | 9796 | -| time_elapsed | 56915 | -| total_timesteps | 1253888 | -| train/ | | -| approx_kl | 0.0040676366 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.71 | -| explained_variance | 0.00412 | -| learning_rate | 0.0003 | -| loss | -0.00667 | -| n_updates | 97950 | -| policy_gradient_loss | -0.00518 | -| std | 0.0436 | -| value_loss | 6.87e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9797 | -| time_elapsed | 56919 | -| total_timesteps | 1254016 | -| train/ | | -| approx_kl | 0.0032242206 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 97960 | -| policy_gradient_loss | -0.000467 | -| std | 0.0433 | -| value_loss | 7.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9798 | -| time_elapsed | 56927 | -| total_timesteps | 1254144 | -| train/ | | -| approx_kl | 0.029088948 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | 0.938 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 97970 | -| policy_gradient_loss | -0.0161 | -| std | 0.0431 | -| value_loss | 0.000201 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9799 | -| time_elapsed | 56931 | -| total_timesteps | 1254272 | -| train/ | | -| approx_kl | 0.0022829976 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -1.53 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 97980 | -| policy_gradient_loss | -0.000899 | -| std | 0.0431 | -| value_loss | 1.67e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9800 | -| time_elapsed | 56936 | -| total_timesteps | 1254400 | -| train/ | | -| approx_kl | 0.0031526433 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -319 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 97990 | -| policy_gradient_loss | -0.0109 | -| std | 0.043 | -| value_loss | 2.18e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9801 | -| time_elapsed | 56939 | -| total_timesteps | 1254528 | -| train/ | | -| approx_kl | 0.0032038935 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -72.6 | -| learning_rate | 0.0003 | -| loss | -0.00992 | -| n_updates | 98000 | -| policy_gradient_loss | -0.0132 | -| std | 0.043 | -| value_loss | 4.2e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9802 | -| time_elapsed | 56942 | -| total_timesteps | 1254656 | -| train/ | | -| approx_kl | 0.022293393 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -32.6 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 98010 | -| policy_gradient_loss | -0.0141 | -| std | 0.043 | -| value_loss | 2.9e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9803 | -| time_elapsed | 56946 | -| total_timesteps | 1254784 | -| train/ | | -| approx_kl | 1.0551885e-05 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -5.02 | -| learning_rate | 0.0003 | -| loss | 0.000439 | -| n_updates | 98020 | -| policy_gradient_loss | -0.00196 | -| std | 0.043 | -| value_loss | 4.55e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 22 | -| iterations | 9804 | -| time_elapsed | 56948 | -| total_timesteps | 1254912 | -| train/ | | -| approx_kl | 0.0076997727 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.677 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 98030 | -| policy_gradient_loss | -0.00246 | -| std | 0.0431 | -| value_loss | 1.92e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9805 | -| time_elapsed | 56951 | -| total_timesteps | 1255040 | -| train/ | | -| approx_kl | 0.0017796839 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 98040 | -| policy_gradient_loss | 0.0036 | -| std | 0.0431 | -| value_loss | 7.42e-12 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9806 | -| time_elapsed | 56958 | -| total_timesteps | 1255168 | -| train/ | | -| approx_kl | 0.0316108 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 98050 | -| policy_gradient_loss | -0.015 | -| std | 0.0431 | -| value_loss | 0.00205 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9807 | -| time_elapsed | 56963 | -| total_timesteps | 1255296 | -| train/ | | -| approx_kl | 0.0030388841 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 98060 | -| policy_gradient_loss | 3.85e-05 | -| std | 0.0431 | -| value_loss | 3.49e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9808 | -| time_elapsed | 56966 | -| total_timesteps | 1255424 | -| train/ | | -| approx_kl | 0.008215575 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -3.46 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 98070 | -| policy_gradient_loss | -0.00249 | -| std | 0.0431 | -| value_loss | 2.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9809 | -| time_elapsed | 56969 | -| total_timesteps | 1255552 | -| train/ | | -| approx_kl | 0.0009998581 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.947 | -| learning_rate | 0.0003 | -| loss | -0.000731 | -| n_updates | 98080 | -| policy_gradient_loss | 0.00294 | -| std | 0.0431 | -| value_loss | 1.38e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9810 | -| time_elapsed | 56972 | -| total_timesteps | 1255680 | -| train/ | | -| approx_kl | 0.003625888 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | -0.00765 | -| n_updates | 98090 | -| policy_gradient_loss | -0.00311 | -| std | 0.043 | -| value_loss | 7.37e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9811 | -| time_elapsed | 56975 | -| total_timesteps | 1255808 | -| train/ | | -| approx_kl | 0.00030991854 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0713 | -| learning_rate | 0.0003 | -| loss | 0.00038 | -| n_updates | 98100 | -| policy_gradient_loss | 0.000947 | -| std | 0.043 | -| value_loss | 5.23e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9812 | -| time_elapsed | 56977 | -| total_timesteps | 1255936 | -| train/ | | -| approx_kl | 0.0018926566 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | 0.00453 | -| n_updates | 98110 | -| policy_gradient_loss | -0.000108 | -| std | 0.0431 | -| value_loss | 1.3e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9813 | -| time_elapsed | 56980 | -| total_timesteps | 1256064 | -| train/ | | -| approx_kl | 0.0011465568 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.000164 | -| learning_rate | 0.0003 | -| loss | 0.000652 | -| n_updates | 98120 | -| policy_gradient_loss | 0.00127 | -| std | 0.0431 | -| value_loss | 3.94e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9814 | -| time_elapsed | 56986 | -| total_timesteps | 1256192 | -| train/ | | -| approx_kl | 0.041123748 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 98130 | -| policy_gradient_loss | -0.0045 | -| std | 0.0431 | -| value_loss | 0.00147 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9815 | -| time_elapsed | 56990 | -| total_timesteps | 1256320 | -| train/ | | -| approx_kl | 0.20434706 | -| clip_fraction | 0.581 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 98140 | -| policy_gradient_loss | -0.00527 | -| std | 0.0431 | -| value_loss | 4.49e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9816 | -| time_elapsed | 56994 | -| total_timesteps | 1256448 | -| train/ | | -| approx_kl | 0.0625564 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 98150 | -| policy_gradient_loss | -0.00192 | -| std | 0.0431 | -| value_loss | 3.29e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9817 | -| time_elapsed | 56997 | -| total_timesteps | 1256576 | -| train/ | | -| approx_kl | 0.011397477 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -2.9 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 98160 | -| policy_gradient_loss | -0.00671 | -| std | 0.0431 | -| value_loss | 5.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9818 | -| time_elapsed | 57000 | -| total_timesteps | 1256704 | -| train/ | | -| approx_kl | 0.008693287 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.969 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 98170 | -| policy_gradient_loss | -0.00775 | -| std | 0.0431 | -| value_loss | 1.89e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9819 | -| time_elapsed | 57003 | -| total_timesteps | 1256832 | -| train/ | | -| approx_kl | 0.00044803368 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 98180 | -| policy_gradient_loss | -0.000427 | -| std | 0.0431 | -| value_loss | 1.04e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9820 | -| time_elapsed | 57006 | -| total_timesteps | 1256960 | -| train/ | | -| approx_kl | 1.4151912e-05 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0709 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 98190 | -| policy_gradient_loss | -0.00262 | -| std | 0.0431 | -| value_loss | 6.51e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9821 | -| time_elapsed | 57010 | -| total_timesteps | 1257088 | -| train/ | | -| approx_kl | 0.015398292 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.000318 | -| n_updates | 98200 | -| policy_gradient_loss | -0.00417 | -| std | 0.0431 | -| value_loss | 2.62e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9822 | -| time_elapsed | 57016 | -| total_timesteps | 1257216 | -| train/ | | -| approx_kl | 0.041590128 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 98210 | -| policy_gradient_loss | -0.0149 | -| std | 0.0431 | -| value_loss | 0.00121 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9823 | -| time_elapsed | 57020 | -| total_timesteps | 1257344 | -| train/ | | -| approx_kl | 0.01004592 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.55 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 98220 | -| policy_gradient_loss | 0.00262 | -| std | 0.0431 | -| value_loss | 1.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9824 | -| time_elapsed | 57023 | -| total_timesteps | 1257472 | -| train/ | | -| approx_kl | 0.000792271 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 98230 | -| policy_gradient_loss | -0.00152 | -| std | 0.0431 | -| value_loss | 1.74e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9825 | -| time_elapsed | 57026 | -| total_timesteps | 1257600 | -| train/ | | -| approx_kl | 0.0118441135 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.614 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 98240 | -| policy_gradient_loss | -0.000731 | -| std | 0.0432 | -| value_loss | 7.1e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9826 | -| time_elapsed | 57030 | -| total_timesteps | 1257728 | -| train/ | | -| approx_kl | 0.0024314397 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.00997 | -| n_updates | 98250 | -| policy_gradient_loss | -0.00348 | -| std | 0.0432 | -| value_loss | 2.4e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9827 | -| time_elapsed | 57033 | -| total_timesteps | 1257856 | -| train/ | | -| approx_kl | 0.009997062 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.00753 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 98260 | -| policy_gradient_loss | 0.000189 | -| std | 0.0433 | -| value_loss | 1.85e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9828 | -| time_elapsed | 57037 | -| total_timesteps | 1257984 | -| train/ | | -| approx_kl | 0.0044831233 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | 0.00454 | -| learning_rate | 0.0003 | -| loss | 0.00451 | -| n_updates | 98270 | -| policy_gradient_loss | 0.00167 | -| std | 0.0433 | -| value_loss | 6.84e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9829 | -| time_elapsed | 57039 | -| total_timesteps | 1258112 | -| train/ | | -| approx_kl | 0.01119944 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 98280 | -| policy_gradient_loss | -0.000525 | -| std | 0.0433 | -| value_loss | 4.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9830 | -| time_elapsed | 57048 | -| total_timesteps | 1258240 | -| train/ | | -| approx_kl | 0.014528941 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | 0.777 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 98290 | -| policy_gradient_loss | -0.0182 | -| std | 0.0433 | -| value_loss | 0.00477 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9831 | -| time_elapsed | 57052 | -| total_timesteps | 1258368 | -| train/ | | -| approx_kl | 0.00033026747 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | 0.00227 | -| learning_rate | 0.0003 | -| loss | -0.00483 | -| n_updates | 98300 | -| policy_gradient_loss | -0.00786 | -| std | 0.0433 | -| value_loss | 7.52e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9832 | -| time_elapsed | 57057 | -| total_timesteps | 1258496 | -| train/ | | -| approx_kl | 0.00015292689 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.321 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 98310 | -| policy_gradient_loss | 0.00127 | -| std | 0.0433 | -| value_loss | 4.46e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9833 | -| time_elapsed | 57060 | -| total_timesteps | 1258624 | -| train/ | | -| approx_kl | 0.00043459516 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.00262 | -| n_updates | 98320 | -| policy_gradient_loss | -0.000833 | -| std | 0.0433 | -| value_loss | 2.87e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9834 | -| time_elapsed | 57063 | -| total_timesteps | 1258752 | -| train/ | | -| approx_kl | 0.0005140109 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.00263 | -| n_updates | 98330 | -| policy_gradient_loss | -0.000585 | -| std | 0.0433 | -| value_loss | 1.87e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9835 | -| time_elapsed | 57066 | -| total_timesteps | 1258880 | -| train/ | | -| approx_kl | 0.00070427265 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.00183 | -| n_updates | 98340 | -| policy_gradient_loss | 0.00466 | -| std | 0.0433 | -| value_loss | 1.16e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9836 | -| time_elapsed | 57070 | -| total_timesteps | 1259008 | -| train/ | | -| approx_kl | 0.0006952188 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.00077 | -| n_updates | 98350 | -| policy_gradient_loss | 0.00521 | -| std | 0.0434 | -| value_loss | 7.17e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9837 | -| time_elapsed | 57080 | -| total_timesteps | 1259136 | -| train/ | | -| approx_kl | 0.023480795 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -3.37 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 98360 | -| policy_gradient_loss | -0.0142 | -| std | 0.0434 | -| value_loss | 0.00298 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9838 | -| time_elapsed | 57085 | -| total_timesteps | 1259264 | -| train/ | | -| approx_kl | 1.3839919e-05 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -1.58 | -| learning_rate | 0.0003 | -| loss | 2.72e-05 | -| n_updates | 98370 | -| policy_gradient_loss | -0.000159 | -| std | 0.0434 | -| value_loss | 1.13e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9839 | -| time_elapsed | 57088 | -| total_timesteps | 1259392 | -| train/ | | -| approx_kl | 0.0071395272 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -201 | -| learning_rate | 0.0003 | -| loss | -0.000314 | -| n_updates | 98380 | -| policy_gradient_loss | -0.000169 | -| std | 0.0432 | -| value_loss | 1.97e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9840 | -| time_elapsed | 57091 | -| total_timesteps | 1259520 | -| train/ | | -| approx_kl | 0.056289192 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -28.5 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 98390 | -| policy_gradient_loss | -0.0165 | -| std | 0.0431 | -| value_loss | 4.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9841 | -| time_elapsed | 57095 | -| total_timesteps | 1259648 | -| train/ | | -| approx_kl | 0.057129215 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 98400 | -| policy_gradient_loss | 0.00541 | -| std | 0.0431 | -| value_loss | 8.63e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9842 | -| time_elapsed | 57098 | -| total_timesteps | 1259776 | -| train/ | | -| approx_kl | 0.002750732 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | 0.00907 | -| n_updates | 98410 | -| policy_gradient_loss | -0.00103 | -| std | 0.0431 | -| value_loss | 1.51e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 22 | -| iterations | 9843 | -| time_elapsed | 57102 | -| total_timesteps | 1259904 | -| train/ | | -| approx_kl | 0.0034359475 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | -0.00578 | -| n_updates | 98420 | -| policy_gradient_loss | 0.000564 | -| std | 0.0431 | -| value_loss | 1.14e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9844 | -| time_elapsed | 57105 | -| total_timesteps | 1260032 | -| train/ | | -| approx_kl | 0.0017615366 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 98430 | -| policy_gradient_loss | -0.00236 | -| std | 0.0432 | -| value_loss | 1.87e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9845 | -| time_elapsed | 57113 | -| total_timesteps | 1260160 | -| train/ | | -| approx_kl | 0.002556434 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.00099 | -| n_updates | 98440 | -| policy_gradient_loss | -0.00176 | -| std | 0.0432 | -| value_loss | 0.000947 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9846 | -| time_elapsed | 57116 | -| total_timesteps | 1260288 | -| train/ | | -| approx_kl | 0.0047841854 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -1.76 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 98450 | -| policy_gradient_loss | -0.0039 | -| std | 0.0431 | -| value_loss | 1.31e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9847 | -| time_elapsed | 57120 | -| total_timesteps | 1260416 | -| train/ | | -| approx_kl | 0.0076634213 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.72 | -| explained_variance | -4.29 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 98460 | -| policy_gradient_loss | -0.00938 | -| std | 0.0431 | -| value_loss | 2.28e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9848 | -| time_elapsed | 57122 | -| total_timesteps | 1260544 | -| train/ | | -| approx_kl | 0.00040259073 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | -0.000213 | -| n_updates | 98470 | -| policy_gradient_loss | 0.00107 | -| std | 0.0431 | -| value_loss | 5.35e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9849 | -| time_elapsed | 57124 | -| total_timesteps | 1260672 | -| train/ | | -| approx_kl | 0.014009789 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | -4.65e-05 | -| n_updates | 98480 | -| policy_gradient_loss | -0.00242 | -| std | 0.043 | -| value_loss | 2.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9850 | -| time_elapsed | 57127 | -| total_timesteps | 1260800 | -| train/ | | -| approx_kl | 0.011760969 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.00319 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 98490 | -| policy_gradient_loss | -0.00431 | -| std | 0.043 | -| value_loss | 2.84e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9851 | -| time_elapsed | 57130 | -| total_timesteps | 1260928 | -| train/ | | -| approx_kl | 0.00033986988 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 98500 | -| policy_gradient_loss | -0.00298 | -| std | 0.043 | -| value_loss | 1.58e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9852 | -| time_elapsed | 57134 | -| total_timesteps | 1261056 | -| train/ | | -| approx_kl | 0.0016443003 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 98510 | -| policy_gradient_loss | 0.00686 | -| std | 0.043 | -| value_loss | 7.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9853 | -| time_elapsed | 57140 | -| total_timesteps | 1261184 | -| train/ | | -| approx_kl | 0.019472923 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -5.59 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 98520 | -| policy_gradient_loss | -0.0117 | -| std | 0.043 | -| value_loss | 0.00327 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9854 | -| time_elapsed | 57144 | -| total_timesteps | 1261312 | -| train/ | | -| approx_kl | 0.0090589775 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -143 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 98530 | -| policy_gradient_loss | -0.00888 | -| std | 0.043 | -| value_loss | 1.41e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9855 | -| time_elapsed | 57147 | -| total_timesteps | 1261440 | -| train/ | | -| approx_kl | 0.015932653 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 98540 | -| policy_gradient_loss | -0.0118 | -| std | 0.043 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9856 | -| time_elapsed | 57152 | -| total_timesteps | 1261568 | -| train/ | | -| approx_kl | 0.0065705576 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 98550 | -| policy_gradient_loss | -0.004 | -| std | 0.043 | -| value_loss | 3.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9857 | -| time_elapsed | 57156 | -| total_timesteps | 1261696 | -| train/ | | -| approx_kl | 0.0062523033 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 98560 | -| policy_gradient_loss | -0.000423 | -| std | 0.0429 | -| value_loss | 5.68e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9858 | -| time_elapsed | 57159 | -| total_timesteps | 1261824 | -| train/ | | -| approx_kl | 0.0052667605 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.00923 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 98570 | -| policy_gradient_loss | -0.00325 | -| std | 0.0429 | -| value_loss | 1.78e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 9859 | -| time_elapsed | 57162 | -| total_timesteps | 1261952 | -| train/ | | -| approx_kl | 0.0087454915 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | 0.00279 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 98580 | -| policy_gradient_loss | -0.000573 | -| std | 0.0428 | -| value_loss | 6.01e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9860 | -| time_elapsed | 57165 | -| total_timesteps | 1262080 | -| train/ | | -| approx_kl | 7.767696e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.73 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.001 | -| n_updates | 98590 | -| policy_gradient_loss | -0.000415 | -| std | 0.0425 | -| value_loss | 3.73e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9861 | -| time_elapsed | 57172 | -| total_timesteps | 1262208 | -| train/ | | -| approx_kl | 0.01240875 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.74 | -| explained_variance | 0.1 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 98600 | -| policy_gradient_loss | -0.0153 | -| std | 0.0422 | -| value_loss | 0.00129 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9862 | -| time_elapsed | 57176 | -| total_timesteps | 1262336 | -| train/ | | -| approx_kl | 0.0608585 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -1.67e+03 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 98610 | -| policy_gradient_loss | -0.00732 | -| std | 0.0421 | -| value_loss | 2.92e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9863 | -| time_elapsed | 57179 | -| total_timesteps | 1262464 | -| train/ | | -| approx_kl | 0.0077590183 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -283 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 98620 | -| policy_gradient_loss | -0.00207 | -| std | 0.0419 | -| value_loss | 9.35e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9864 | -| time_elapsed | 57183 | -| total_timesteps | 1262592 | -| train/ | | -| approx_kl | 0.0012462912 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.00936 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 98630 | -| policy_gradient_loss | -0.00796 | -| std | 0.0419 | -| value_loss | 1.47e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9865 | -| time_elapsed | 57187 | -| total_timesteps | 1262720 | -| train/ | | -| approx_kl | 0.002749551 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.000116 | -| learning_rate | 0.0003 | -| loss | -0.00069 | -| n_updates | 98640 | -| policy_gradient_loss | 0.000887 | -| std | 0.0419 | -| value_loss | 3.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9866 | -| time_elapsed | 57191 | -| total_timesteps | 1262848 | -| train/ | | -| approx_kl | 0.0021499079 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.00274 | -| learning_rate | 0.0003 | -| loss | 0.00089 | -| n_updates | 98650 | -| policy_gradient_loss | 0.00221 | -| std | 0.0418 | -| value_loss | 3.44e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 22 | -| iterations | 9867 | -| time_elapsed | 57194 | -| total_timesteps | 1262976 | -| train/ | | -| approx_kl | 0.01897325 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 98660 | -| policy_gradient_loss | 0.000586 | -| std | 0.0417 | -| value_loss | 1.23e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9868 | -| time_elapsed | 57198 | -| total_timesteps | 1263104 | -| train/ | | -| approx_kl | 0.0044972324 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | -0.00865 | -| n_updates | 98670 | -| policy_gradient_loss | -0.00607 | -| std | 0.0417 | -| value_loss | 1.71e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9869 | -| time_elapsed | 57206 | -| total_timesteps | 1263232 | -| train/ | | -| approx_kl | 0.0058665904 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 98680 | -| policy_gradient_loss | -0.000688 | -| std | 0.0417 | -| value_loss | 0.000196 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9870 | -| time_elapsed | 57209 | -| total_timesteps | 1263360 | -| train/ | | -| approx_kl | 0.017354615 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.00828 | -| n_updates | 98690 | -| policy_gradient_loss | -0.00611 | -| std | 0.0417 | -| value_loss | 1.38e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9871 | -| time_elapsed | 57213 | -| total_timesteps | 1263488 | -| train/ | | -| approx_kl | 0.00012422027 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.775 | -| learning_rate | 0.0003 | -| loss | 0.000655 | -| n_updates | 98700 | -| policy_gradient_loss | -0.000602 | -| std | 0.0417 | -| value_loss | 6.97e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9872 | -| time_elapsed | 57216 | -| total_timesteps | 1263616 | -| train/ | | -| approx_kl | 0.010421736 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.00364 | -| n_updates | 98710 | -| policy_gradient_loss | 0.00153 | -| std | 0.0417 | -| value_loss | 1.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9873 | -| time_elapsed | 57219 | -| total_timesteps | 1263744 | -| train/ | | -| approx_kl | 0.013889028 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00545 | -| n_updates | 98720 | -| policy_gradient_loss | 0.00114 | -| std | 0.0417 | -| value_loss | 3.06e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 22 | -| iterations | 9874 | -| time_elapsed | 57223 | -| total_timesteps | 1263872 | -| train/ | | -| approx_kl | 0.0074409517 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.00128 | -| n_updates | 98730 | -| policy_gradient_loss | 0.00113 | -| std | 0.0417 | -| value_loss | 3.65e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9875 | -| time_elapsed | 57225 | -| total_timesteps | 1264000 | -| train/ | | -| approx_kl | 5.253125e-05 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.00703 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 98740 | -| policy_gradient_loss | 0.00866 | -| std | 0.0416 | -| value_loss | 1.32e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9876 | -| time_elapsed | 57229 | -| total_timesteps | 1264128 | -| train/ | | -| approx_kl | 0.0028313813 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.00311 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 98750 | -| policy_gradient_loss | -0.00476 | -| std | 0.0416 | -| value_loss | 2.83e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9877 | -| time_elapsed | 57236 | -| total_timesteps | 1264256 | -| train/ | | -| approx_kl | 0.013423337 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.016 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 98760 | -| policy_gradient_loss | -0.0104 | -| std | 0.0416 | -| value_loss | 0.00123 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9878 | -| time_elapsed | 57240 | -| total_timesteps | 1264384 | -| train/ | | -| approx_kl | 0.009453954 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -74.5 | -| learning_rate | 0.0003 | -| loss | -0.000192 | -| n_updates | 98770 | -| policy_gradient_loss | -0.000105 | -| std | 0.0416 | -| value_loss | 9.47e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9879 | -| time_elapsed | 57243 | -| total_timesteps | 1264512 | -| train/ | | -| approx_kl | 0.0037326845 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.34e+03 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 98780 | -| policy_gradient_loss | -0.0135 | -| std | 0.0416 | -| value_loss | 6.83e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9880 | -| time_elapsed | 57244 | -| total_timesteps | 1264640 | -| train/ | | -| approx_kl | 0.0023964583 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -322 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 98790 | -| policy_gradient_loss | -0.0107 | -| std | 0.0416 | -| value_loss | 3.32e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9881 | -| time_elapsed | 57247 | -| total_timesteps | 1264768 | -| train/ | | -| approx_kl | 0.013353719 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | 0.000832 | -| n_updates | 98800 | -| policy_gradient_loss | 0.000246 | -| std | 0.0415 | -| value_loss | 3.74e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 22 | -| iterations | 9882 | -| time_elapsed | 57250 | -| total_timesteps | 1264896 | -| train/ | | -| approx_kl | 0.00046282308 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | 0.00438 | -| n_updates | 98810 | -| policy_gradient_loss | -0.00436 | -| std | 0.0415 | -| value_loss | 8.28e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9883 | -| time_elapsed | 57255 | -| total_timesteps | 1265024 | -| train/ | | -| approx_kl | 0.000665403 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.00331 | -| n_updates | 98820 | -| policy_gradient_loss | -0.00201 | -| std | 0.0415 | -| value_loss | 3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9884 | -| time_elapsed | 57262 | -| total_timesteps | 1265152 | -| train/ | | -| approx_kl | 0.004870353 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -3.23 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 98830 | -| policy_gradient_loss | -0.0143 | -| std | 0.0415 | -| value_loss | 0.00198 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9885 | -| time_elapsed | 57266 | -| total_timesteps | 1265280 | -| train/ | | -| approx_kl | 0.0004075016 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 98840 | -| policy_gradient_loss | -0.000398 | -| std | 0.0415 | -| value_loss | 3.79e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9886 | -| time_elapsed | 57269 | -| total_timesteps | 1265408 | -| train/ | | -| approx_kl | 0.001353161 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -217 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 98850 | -| policy_gradient_loss | -0.00815 | -| std | 0.0416 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9887 | -| time_elapsed | 57273 | -| total_timesteps | 1265536 | -| train/ | | -| approx_kl | 9.509735e-06 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -36.1 | -| learning_rate | 0.0003 | -| loss | 0.000144 | -| n_updates | 98860 | -| policy_gradient_loss | -0.00107 | -| std | 0.0415 | -| value_loss | 1.48e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9888 | -| time_elapsed | 57276 | -| total_timesteps | 1265664 | -| train/ | | -| approx_kl | 0.011794478 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -5.58 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 98870 | -| policy_gradient_loss | -0.00481 | -| std | 0.0415 | -| value_loss | 2.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9889 | -| time_elapsed | 57281 | -| total_timesteps | 1265792 | -| train/ | | -| approx_kl | 0.005240234 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.781 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 98880 | -| policy_gradient_loss | -0.00377 | -| std | 0.0415 | -| value_loss | 8.87e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 22 | -| iterations | 9890 | -| time_elapsed | 57285 | -| total_timesteps | 1265920 | -| train/ | | -| approx_kl | 0.011394156 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | 0.000891 | -| n_updates | 98890 | -| policy_gradient_loss | -0.000578 | -| std | 0.0415 | -| value_loss | 5.78e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9891 | -| time_elapsed | 57289 | -| total_timesteps | 1266048 | -| train/ | | -| approx_kl | 0.0040458944 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.00225 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 98900 | -| policy_gradient_loss | -0.011 | -| std | 0.0415 | -| value_loss | 1.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9892 | -| time_elapsed | 57296 | -| total_timesteps | 1266176 | -| train/ | | -| approx_kl | 0.017410744 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.756 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 98910 | -| policy_gradient_loss | -0.0145 | -| std | 0.0415 | -| value_loss | 0.0031 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9893 | -| time_elapsed | 57299 | -| total_timesteps | 1266304 | -| train/ | | -| approx_kl | 0.0009254995 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.000973 | -| n_updates | 98920 | -| policy_gradient_loss | 0.000503 | -| std | 0.0416 | -| value_loss | 1.73e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9894 | -| time_elapsed | 57302 | -| total_timesteps | 1266432 | -| train/ | | -| approx_kl | 0.022364927 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -4.76 | -| learning_rate | 0.0003 | -| loss | 0.00216 | -| n_updates | 98930 | -| policy_gradient_loss | 0.0024 | -| std | 0.0416 | -| value_loss | 1.57e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9895 | -| time_elapsed | 57305 | -| total_timesteps | 1266560 | -| train/ | | -| approx_kl | 0.0032101208 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.92 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 98940 | -| policy_gradient_loss | 0.00127 | -| std | 0.0416 | -| value_loss | 4.13e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9896 | -| time_elapsed | 57307 | -| total_timesteps | 1266688 | -| train/ | | -| approx_kl | 0.04235741 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | 0.00385 | -| n_updates | 98950 | -| policy_gradient_loss | 0.00461 | -| std | 0.0416 | -| value_loss | 7.88e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9897 | -| time_elapsed | 57309 | -| total_timesteps | 1266816 | -| train/ | | -| approx_kl | 0.016378252 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.589 | -| learning_rate | 0.0003 | -| loss | 4.74e-05 | -| n_updates | 98960 | -| policy_gradient_loss | 0.00421 | -| std | 0.0417 | -| value_loss | 5.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9898 | -| time_elapsed | 57311 | -| total_timesteps | 1266944 | -| train/ | | -| approx_kl | 0.008081364 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 98970 | -| policy_gradient_loss | 0.00229 | -| std | 0.0417 | -| value_loss | 3.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9899 | -| time_elapsed | 57315 | -| total_timesteps | 1267072 | -| train/ | | -| approx_kl | 0.008062307 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | -0.00802 | -| n_updates | 98980 | -| policy_gradient_loss | -0.000138 | -| std | 0.0417 | -| value_loss | 1.33e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9900 | -| time_elapsed | 57320 | -| total_timesteps | 1267200 | -| train/ | | -| approx_kl | 0.010409944 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 98990 | -| policy_gradient_loss | -0.0129 | -| std | 0.0417 | -| value_loss | 0.000952 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9901 | -| time_elapsed | 57324 | -| total_timesteps | 1267328 | -| train/ | | -| approx_kl | 0.00036862725 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -3.61 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 99000 | -| policy_gradient_loss | 0.0052 | -| std | 0.0417 | -| value_loss | 7.88e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9902 | -| time_elapsed | 57327 | -| total_timesteps | 1267456 | -| train/ | | -| approx_kl | 0.007385894 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -382 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 99010 | -| policy_gradient_loss | -0.0127 | -| std | 0.0417 | -| value_loss | 2.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9903 | -| time_elapsed | 57331 | -| total_timesteps | 1267584 | -| train/ | | -| approx_kl | 0.023517706 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -579 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 99020 | -| policy_gradient_loss | -0.000699 | -| std | 0.0417 | -| value_loss | 2.44e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9904 | -| time_elapsed | 57333 | -| total_timesteps | 1267712 | -| train/ | | -| approx_kl | 0.15276428 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -50.8 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 99030 | -| policy_gradient_loss | -0.00595 | -| std | 0.0417 | -| value_loss | 6.07e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9905 | -| time_elapsed | 57337 | -| total_timesteps | 1267840 | -| train/ | | -| approx_kl | 0.0037554335 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -5.54 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 99040 | -| policy_gradient_loss | -0.00176 | -| std | 0.0417 | -| value_loss | 1.29e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9906 | -| time_elapsed | 57340 | -| total_timesteps | 1267968 | -| train/ | | -| approx_kl | 0.00046599144 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 99050 | -| policy_gradient_loss | 0.00417 | -| std | 0.0417 | -| value_loss | 6.91e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9907 | -| time_elapsed | 57342 | -| total_timesteps | 1268096 | -| train/ | | -| approx_kl | 0.00018204795 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.00177 | -| n_updates | 99060 | -| policy_gradient_loss | -4.34e-05 | -| std | 0.0417 | -| value_loss | 3.73e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9908 | -| time_elapsed | 57350 | -| total_timesteps | 1268224 | -| train/ | | -| approx_kl | 0.0039374516 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 99070 | -| policy_gradient_loss | -0.0106 | -| std | 0.0417 | -| value_loss | 0.000261 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9909 | -| time_elapsed | 57353 | -| total_timesteps | 1268352 | -| train/ | | -| approx_kl | 0.0585107 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -47.6 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 99080 | -| policy_gradient_loss | -0.011 | -| std | 0.0417 | -| value_loss | 3.24e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9910 | -| time_elapsed | 57356 | -| total_timesteps | 1268480 | -| train/ | | -| approx_kl | 0.06425868 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -165 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 99090 | -| policy_gradient_loss | -0.00411 | -| std | 0.0417 | -| value_loss | 2.07e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9911 | -| time_elapsed | 57358 | -| total_timesteps | 1268608 | -| train/ | | -| approx_kl | 0.00087339757 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -16 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 99100 | -| policy_gradient_loss | -0.00174 | -| std | 0.0417 | -| value_loss | 3.01e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9912 | -| time_elapsed | 57361 | -| total_timesteps | 1268736 | -| train/ | | -| approx_kl | 0.0071385275 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 99110 | -| policy_gradient_loss | -0.00652 | -| std | 0.0416 | -| value_loss | 1.47e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9913 | -| time_elapsed | 57364 | -| total_timesteps | 1268864 | -| train/ | | -| approx_kl | 0.007959973 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | 0.0011 | -| n_updates | 99120 | -| policy_gradient_loss | 0.00184 | -| std | 0.0417 | -| value_loss | 3.49e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 22 | -| iterations | 9914 | -| time_elapsed | 57367 | -| total_timesteps | 1268992 | -| train/ | | -| approx_kl | 0.025080843 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.000484 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 99130 | -| policy_gradient_loss | -0.00701 | -| std | 0.0418 | -| value_loss | 2.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9915 | -| time_elapsed | 57370 | -| total_timesteps | 1269120 | -| train/ | | -| approx_kl | 0.002352905 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.00899 | -| n_updates | 99140 | -| policy_gradient_loss | -0.00629 | -| std | 0.0418 | -| value_loss | 8.47e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9916 | -| time_elapsed | 57380 | -| total_timesteps | 1269248 | -| train/ | | -| approx_kl | 0.011506977 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 99150 | -| policy_gradient_loss | -0.0165 | -| std | 0.0418 | -| value_loss | 7.91e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9917 | -| time_elapsed | 57384 | -| total_timesteps | 1269376 | -| train/ | | -| approx_kl | 0.0004897439 | -| clip_fraction | 0.0297 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -173 | -| learning_rate | 0.0003 | -| loss | 0.00162 | -| n_updates | 99160 | -| policy_gradient_loss | -0.000543 | -| std | 0.0419 | -| value_loss | 2.97e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9918 | -| time_elapsed | 57388 | -| total_timesteps | 1269504 | -| train/ | | -| approx_kl | 0.046212405 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -138 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 99170 | -| policy_gradient_loss | -0.0103 | -| std | 0.0419 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9919 | -| time_elapsed | 57391 | -| total_timesteps | 1269632 | -| train/ | | -| approx_kl | 0.010059111 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -32.3 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 99180 | -| policy_gradient_loss | -0.00797 | -| std | 0.0419 | -| value_loss | 1.95e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9920 | -| time_elapsed | 57395 | -| total_timesteps | 1269760 | -| train/ | | -| approx_kl | 6.087683e-05 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -4.73 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 99190 | -| policy_gradient_loss | -0.00217 | -| std | 0.042 | -| value_loss | 3.24e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9921 | -| time_elapsed | 57398 | -| total_timesteps | 1269888 | -| train/ | | -| approx_kl | 0.0035026637 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.349 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 99200 | -| policy_gradient_loss | 6.67e-05 | -| std | 0.042 | -| value_loss | 6.21e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9922 | -| time_elapsed | 57401 | -| total_timesteps | 1270016 | -| train/ | | -| approx_kl | 0.0111666005 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 99210 | -| policy_gradient_loss | -0.0105 | -| std | 0.042 | -| value_loss | 1.91e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9923 | -| time_elapsed | 57411 | -| total_timesteps | 1270144 | -| train/ | | -| approx_kl | 0.020105459 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.196 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 99220 | -| policy_gradient_loss | -0.0119 | -| std | 0.042 | -| value_loss | 0.000945 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9924 | -| time_elapsed | 57414 | -| total_timesteps | 1270272 | -| train/ | | -| approx_kl | 0.0013529011 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.633 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 99230 | -| policy_gradient_loss | -0.00193 | -| std | 0.042 | -| value_loss | 2.07e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9925 | -| time_elapsed | 57416 | -| total_timesteps | 1270400 | -| train/ | | -| approx_kl | 0.09770184 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -41.6 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 99240 | -| policy_gradient_loss | -0.000771 | -| std | 0.0419 | -| value_loss | 1.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9926 | -| time_elapsed | 57421 | -| total_timesteps | 1270528 | -| train/ | | -| approx_kl | 0.026194766 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -81.4 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 99250 | -| policy_gradient_loss | -0.0181 | -| std | 0.0419 | -| value_loss | 5.96e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9927 | -| time_elapsed | 57425 | -| total_timesteps | 1270656 | -| train/ | | -| approx_kl | 0.05238893 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | 0.008 | -| n_updates | 99260 | -| policy_gradient_loss | 0.00471 | -| std | 0.0419 | -| value_loss | 3.47e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9928 | -| time_elapsed | 57429 | -| total_timesteps | 1270784 | -| train/ | | -| approx_kl | 0.0020349938 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.753 | -| learning_rate | 0.0003 | -| loss | -0.000396 | -| n_updates | 99270 | -| policy_gradient_loss | 0.00169 | -| std | 0.0419 | -| value_loss | 2.09e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9929 | -| time_elapsed | 57431 | -| total_timesteps | 1270912 | -| train/ | | -| approx_kl | 2.5298446e-05 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.000494 | -| n_updates | 99280 | -| policy_gradient_loss | 9.21e-05 | -| std | 0.042 | -| value_loss | 5.24e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9930 | -| time_elapsed | 57434 | -| total_timesteps | 1271040 | -| train/ | | -| approx_kl | 0.0013015149 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.00063 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 99290 | -| policy_gradient_loss | 0.00151 | -| std | 0.042 | -| value_loss | 6.59e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9931 | -| time_elapsed | 57441 | -| total_timesteps | 1271168 | -| train/ | | -| approx_kl | 0.01822214 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 99300 | -| policy_gradient_loss | -0.0133 | -| std | 0.042 | -| value_loss | 4.89e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9932 | -| time_elapsed | 57445 | -| total_timesteps | 1271296 | -| train/ | | -| approx_kl | 5.612988e-05 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | -0.000593 | -| n_updates | 99310 | -| policy_gradient_loss | 0.00704 | -| std | 0.042 | -| value_loss | 9.38e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9933 | -| time_elapsed | 57449 | -| total_timesteps | 1271424 | -| train/ | | -| approx_kl | 0.005320411 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 99320 | -| policy_gradient_loss | -0.00773 | -| std | 0.042 | -| value_loss | 7.14e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9934 | -| time_elapsed | 57452 | -| total_timesteps | 1271552 | -| train/ | | -| approx_kl | 0.0034348932 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.425 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 99330 | -| policy_gradient_loss | -0.00177 | -| std | 0.042 | -| value_loss | 3.09e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9935 | -| time_elapsed | 57455 | -| total_timesteps | 1271680 | -| train/ | | -| approx_kl | 0.00028321194 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.000353 | -| n_updates | 99340 | -| policy_gradient_loss | 0.00102 | -| std | 0.042 | -| value_loss | 3.25e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9936 | -| time_elapsed | 57458 | -| total_timesteps | 1271808 | -| train/ | | -| approx_kl | 0.018220186 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 99350 | -| policy_gradient_loss | -0.00342 | -| std | 0.042 | -| value_loss | 7.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 22 | -| iterations | 9937 | -| time_elapsed | 57462 | -| total_timesteps | 1271936 | -| train/ | | -| approx_kl | 0.004084047 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.00762 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 99360 | -| policy_gradient_loss | 0.0022 | -| std | 0.042 | -| value_loss | 2.38e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9938 | -| time_elapsed | 57465 | -| total_timesteps | 1272064 | -| train/ | | -| approx_kl | 0.007768851 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.00496 | -| learning_rate | 0.0003 | -| loss | -0.000752 | -| n_updates | 99370 | -| policy_gradient_loss | 0.000188 | -| std | 0.0419 | -| value_loss | 1.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9939 | -| time_elapsed | 57471 | -| total_timesteps | 1272192 | -| train/ | | -| approx_kl | 0.024813497 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.76 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 99380 | -| policy_gradient_loss | -0.0141 | -| std | 0.0419 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9940 | -| time_elapsed | 57475 | -| total_timesteps | 1272320 | -| train/ | | -| approx_kl | 3.128918e-05 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | -0.000109 | -| n_updates | 99390 | -| policy_gradient_loss | 0.000697 | -| std | 0.0419 | -| value_loss | 1.67e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9941 | -| time_elapsed | 57479 | -| total_timesteps | 1272448 | -| train/ | | -| approx_kl | 0.000122522 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -6.24 | -| learning_rate | 0.0003 | -| loss | 0.000215 | -| n_updates | 99400 | -| policy_gradient_loss | 0.00185 | -| std | 0.0418 | -| value_loss | 1.94e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9942 | -| time_elapsed | 57482 | -| total_timesteps | 1272576 | -| train/ | | -| approx_kl | 0.0017355094 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 99410 | -| policy_gradient_loss | -0.0081 | -| std | 0.0418 | -| value_loss | 6.26e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9943 | -| time_elapsed | 57486 | -| total_timesteps | 1272704 | -| train/ | | -| approx_kl | 4.1178428e-06 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | -0.000118 | -| n_updates | 99420 | -| policy_gradient_loss | 0.00142 | -| std | 0.0418 | -| value_loss | 1.71e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9944 | -| time_elapsed | 57490 | -| total_timesteps | 1272832 | -| train/ | | -| approx_kl | 0.0059237215 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 99430 | -| policy_gradient_loss | -0.000485 | -| std | 0.0418 | -| value_loss | 2e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 22 | -| iterations | 9945 | -| time_elapsed | 57493 | -| total_timesteps | 1272960 | -| train/ | | -| approx_kl | 0.0040429374 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.000374 | -| n_updates | 99440 | -| policy_gradient_loss | 0.00123 | -| std | 0.0417 | -| value_loss | 5.37e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9946 | -| time_elapsed | 57496 | -| total_timesteps | 1273088 | -| train/ | | -| approx_kl | 0.0045637833 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.00375 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 99450 | -| policy_gradient_loss | -0.00307 | -| std | 0.0416 | -| value_loss | 3.91e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9947 | -| time_elapsed | 57503 | -| total_timesteps | 1273216 | -| train/ | | -| approx_kl | 4.7068577e-05 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.000691 | -| n_updates | 99460 | -| policy_gradient_loss | -0.000258 | -| std | 0.0416 | -| value_loss | 0.000263 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9948 | -| time_elapsed | 57507 | -| total_timesteps | 1273344 | -| train/ | | -| approx_kl | 0.00029477244 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -188 | -| learning_rate | 0.0003 | -| loss | 0.000543 | -| n_updates | 99470 | -| policy_gradient_loss | -0.00104 | -| std | 0.0415 | -| value_loss | 1.89e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9949 | -| time_elapsed | 57510 | -| total_timesteps | 1273472 | -| train/ | | -| approx_kl | 0.0037965258 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -57 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 99480 | -| policy_gradient_loss | -0.00146 | -| std | 0.0416 | -| value_loss | 6.55e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9950 | -| time_elapsed | 57513 | -| total_timesteps | 1273600 | -| train/ | | -| approx_kl | 8.229166e-05 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -5.25 | -| learning_rate | 0.0003 | -| loss | 0.00297 | -| n_updates | 99490 | -| policy_gradient_loss | -0.00802 | -| std | 0.0416 | -| value_loss | 8.88e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9951 | -| time_elapsed | 57515 | -| total_timesteps | 1273728 | -| train/ | | -| approx_kl | 0.00065347366 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.12 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 99500 | -| policy_gradient_loss | -0.00174 | -| std | 0.0416 | -| value_loss | 9.3e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9952 | -| time_elapsed | 57519 | -| total_timesteps | 1273856 | -| train/ | | -| approx_kl | 0.00014882488 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 99510 | -| policy_gradient_loss | -0.00437 | -| std | 0.0416 | -| value_loss | 4.3e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 22 | -| iterations | 9953 | -| time_elapsed | 57523 | -| total_timesteps | 1273984 | -| train/ | | -| approx_kl | 0.016187489 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.000579 | -| n_updates | 99520 | -| policy_gradient_loss | -0.00191 | -| std | 0.0416 | -| value_loss | 1.78e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9954 | -| time_elapsed | 57527 | -| total_timesteps | 1274112 | -| train/ | | -| approx_kl | 0.013047811 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.00733 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 99530 | -| policy_gradient_loss | -0.00147 | -| std | 0.0416 | -| value_loss | 1.9e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9955 | -| time_elapsed | 57536 | -| total_timesteps | 1274240 | -| train/ | | -| approx_kl | 0.06315186 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 99540 | -| policy_gradient_loss | -0.014 | -| std | 0.0416 | -| value_loss | 0.00102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9956 | -| time_elapsed | 57540 | -| total_timesteps | 1274368 | -| train/ | | -| approx_kl | 0.010710044 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 99550 | -| policy_gradient_loss | -0.00172 | -| std | 0.0416 | -| value_loss | 1.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9957 | -| time_elapsed | 57543 | -| total_timesteps | 1274496 | -| train/ | | -| approx_kl | 0.023312256 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -8.24 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 99560 | -| policy_gradient_loss | -0.00867 | -| std | 0.0417 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9958 | -| time_elapsed | 57547 | -| total_timesteps | 1274624 | -| train/ | | -| approx_kl | 0.0026259231 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | -0.00729 | -| n_updates | 99570 | -| policy_gradient_loss | -0.00751 | -| std | 0.0417 | -| value_loss | 2.17e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9959 | -| time_elapsed | 57550 | -| total_timesteps | 1274752 | -| train/ | | -| approx_kl | 0.015576753 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 99580 | -| policy_gradient_loss | -0.00168 | -| std | 0.0416 | -| value_loss | 3.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9960 | -| time_elapsed | 57553 | -| total_timesteps | 1274880 | -| train/ | | -| approx_kl | 0.009400003 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 99590 | -| policy_gradient_loss | -0.00108 | -| std | 0.0416 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9961 | -| time_elapsed | 57556 | -| total_timesteps | 1275008 | -| train/ | | -| approx_kl | 0.001054368 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0523 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 99600 | -| policy_gradient_loss | -0.000807 | -| std | 0.0416 | -| value_loss | 2.9e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9962 | -| time_elapsed | 57566 | -| total_timesteps | 1275136 | -| train/ | | -| approx_kl | 0.0129659455 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.81 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 99610 | -| policy_gradient_loss | -0.0108 | -| std | 0.0416 | -| value_loss | 0.00267 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9963 | -| time_elapsed | 57569 | -| total_timesteps | 1275264 | -| train/ | | -| approx_kl | 0.0019521452 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.0542 | -| learning_rate | 0.0003 | -| loss | 0.00351 | -| n_updates | 99620 | -| policy_gradient_loss | 0.00222 | -| std | 0.0415 | -| value_loss | 2.42e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9964 | -| time_elapsed | 57573 | -| total_timesteps | 1275392 | -| train/ | | -| approx_kl | 0.011813816 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.961 | -| learning_rate | 0.0003 | -| loss | -0.00477 | -| n_updates | 99630 | -| policy_gradient_loss | -0.00302 | -| std | 0.0415 | -| value_loss | 2.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9965 | -| time_elapsed | 57577 | -| total_timesteps | 1275520 | -| train/ | | -| approx_kl | 0.012213965 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.461 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 99640 | -| policy_gradient_loss | -0.000432 | -| std | 0.0414 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9966 | -| time_elapsed | 57580 | -| total_timesteps | 1275648 | -| train/ | | -| approx_kl | 0.000521726 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 99650 | -| policy_gradient_loss | -0.00172 | -| std | 0.0414 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9967 | -| time_elapsed | 57582 | -| total_timesteps | 1275776 | -| train/ | | -| approx_kl | 0.002959209 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 99660 | -| policy_gradient_loss | -0.00126 | -| std | 0.0413 | -| value_loss | 6.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 22 | -| iterations | 9968 | -| time_elapsed | 57586 | -| total_timesteps | 1275904 | -| train/ | | -| approx_kl | 0.013517387 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 99670 | -| policy_gradient_loss | -0.0019 | -| std | 0.0412 | -| value_loss | 5.69e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9969 | -| time_elapsed | 57588 | -| total_timesteps | 1276032 | -| train/ | | -| approx_kl | 0.00459901 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | -0.00871 | -| n_updates | 99680 | -| policy_gradient_loss | -0.00341 | -| std | 0.0412 | -| value_loss | 2.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9970 | -| time_elapsed | 57596 | -| total_timesteps | 1276160 | -| train/ | | -| approx_kl | 0.054037914 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 99690 | -| policy_gradient_loss | -0.0144 | -| std | 0.0412 | -| value_loss | 0.000923 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9971 | -| time_elapsed | 57599 | -| total_timesteps | 1276288 | -| train/ | | -| approx_kl | 0.008823802 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 99700 | -| policy_gradient_loss | -0.00146 | -| std | 0.0412 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9972 | -| time_elapsed | 57603 | -| total_timesteps | 1276416 | -| train/ | | -| approx_kl | 0.013551645 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -97.6 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 99710 | -| policy_gradient_loss | -0.0152 | -| std | 0.0412 | -| value_loss | 1.52e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9973 | -| time_elapsed | 57607 | -| total_timesteps | 1276544 | -| train/ | | -| approx_kl | 0.0039568604 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -32.4 | -| learning_rate | 0.0003 | -| loss | -0.00939 | -| n_updates | 99720 | -| policy_gradient_loss | -0.00616 | -| std | 0.0412 | -| value_loss | 1.04e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9974 | -| time_elapsed | 57611 | -| total_timesteps | 1276672 | -| train/ | | -| approx_kl | 0.003204384 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.898 | -| learning_rate | 0.0003 | -| loss | -0.00941 | -| n_updates | 99730 | -| policy_gradient_loss | -0.00317 | -| std | 0.0412 | -| value_loss | 7.24e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9975 | -| time_elapsed | 57614 | -| total_timesteps | 1276800 | -| train/ | | -| approx_kl | 4.961621e-06 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.9 | -| learning_rate | 0.0003 | -| loss | -0.000161 | -| n_updates | 99740 | -| policy_gradient_loss | 0.00338 | -| std | 0.0412 | -| value_loss | 5.17e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 22 | -| iterations | 9976 | -| time_elapsed | 57618 | -| total_timesteps | 1276928 | -| train/ | | -| approx_kl | 1.3044104e-05 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | -0.000426 | -| n_updates | 99750 | -| policy_gradient_loss | -0.00239 | -| std | 0.0411 | -| value_loss | 3.05e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9977 | -| time_elapsed | 57622 | -| total_timesteps | 1277056 | -| train/ | | -| approx_kl | 0.0016087494 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.909 | -| learning_rate | 0.0003 | -| loss | -0.00939 | -| n_updates | 99760 | -| policy_gradient_loss | -0.0102 | -| std | 0.0411 | -| value_loss | 2.95e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9978 | -| time_elapsed | 57627 | -| total_timesteps | 1277184 | -| train/ | | -| approx_kl | 0.033239488 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 99770 | -| policy_gradient_loss | -0.0019 | -| std | 0.0411 | -| value_loss | 0.000672 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9979 | -| time_elapsed | 57630 | -| total_timesteps | 1277312 | -| train/ | | -| approx_kl | 0.25333777 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -2e+03 | -| learning_rate | 0.0003 | -| loss | 0.00614 | -| n_updates | 99780 | -| policy_gradient_loss | 0.00108 | -| std | 0.0411 | -| value_loss | 6.89e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9980 | -| time_elapsed | 57633 | -| total_timesteps | 1277440 | -| train/ | | -| approx_kl | 0.05058703 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -42.2 | -| learning_rate | 0.0003 | -| loss | 0.000811 | -| n_updates | 99790 | -| policy_gradient_loss | 0.00155 | -| std | 0.0411 | -| value_loss | 2.83e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9981 | -| time_elapsed | 57637 | -| total_timesteps | 1277568 | -| train/ | | -| approx_kl | 0.09097777 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -141 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 99800 | -| policy_gradient_loss | -0.0027 | -| std | 0.0411 | -| value_loss | 1.2e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9982 | -| time_elapsed | 57640 | -| total_timesteps | 1277696 | -| train/ | | -| approx_kl | 0.0143167805 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -20.1 | -| learning_rate | 0.0003 | -| loss | -0.000808 | -| n_updates | 99810 | -| policy_gradient_loss | -0.000993 | -| std | 0.0412 | -| value_loss | 2.04e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9983 | -| time_elapsed | 57643 | -| total_timesteps | 1277824 | -| train/ | | -| approx_kl | 0.0033590235 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -3.18 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 99820 | -| policy_gradient_loss | -5.91e-05 | -| std | 0.0412 | -| value_loss | 8.48e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 22 | -| iterations | 9984 | -| time_elapsed | 57645 | -| total_timesteps | 1277952 | -| train/ | | -| approx_kl | 0.009211316 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | -0.000887 | -| n_updates | 99830 | -| policy_gradient_loss | -0.000846 | -| std | 0.0413 | -| value_loss | 3.75e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9985 | -| time_elapsed | 57647 | -| total_timesteps | 1278080 | -| train/ | | -| approx_kl | 0.0037326855 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0874 | -| learning_rate | 0.0003 | -| loss | -0.000761 | -| n_updates | 99840 | -| policy_gradient_loss | -0.000523 | -| std | 0.0415 | -| value_loss | 3.91e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9986 | -| time_elapsed | 57652 | -| total_timesteps | 1278208 | -| train/ | | -| approx_kl | 0.048811067 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 99850 | -| policy_gradient_loss | -0.00203 | -| std | 0.0415 | -| value_loss | 0.000946 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9987 | -| time_elapsed | 57656 | -| total_timesteps | 1278336 | -| train/ | | -| approx_kl | 0.10552612 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -288 | -| learning_rate | 0.0003 | -| loss | -0.00839 | -| n_updates | 99860 | -| policy_gradient_loss | -0.00475 | -| std | 0.0414 | -| value_loss | 2.1e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9988 | -| time_elapsed | 57660 | -| total_timesteps | 1278464 | -| train/ | | -| approx_kl | 0.3164082 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -9.14e+03 | -| learning_rate | 0.0003 | -| loss | 0.00276 | -| n_updates | 99870 | -| policy_gradient_loss | -0.00275 | -| std | 0.0414 | -| value_loss | 7.61e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9989 | -| time_elapsed | 57664 | -| total_timesteps | 1278592 | -| train/ | | -| approx_kl | 0.17107627 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -216 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 99880 | -| policy_gradient_loss | -0.00335 | -| std | 0.0414 | -| value_loss | 6.99e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9990 | -| time_elapsed | 57668 | -| total_timesteps | 1278720 | -| train/ | | -| approx_kl | 0.09870897 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -57.8 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 99890 | -| policy_gradient_loss | -0.000419 | -| std | 0.0414 | -| value_loss | 7.59e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9991 | -| time_elapsed | 57671 | -| total_timesteps | 1278848 | -| train/ | | -| approx_kl | 0.034218047 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -12.1 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 99900 | -| policy_gradient_loss | 0.000936 | -| std | 0.0415 | -| value_loss | 9.41e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 22 | -| iterations | 9992 | -| time_elapsed | 57674 | -| total_timesteps | 1278976 | -| train/ | | -| approx_kl | 0.015247092 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.00301 | -| n_updates | 99910 | -| policy_gradient_loss | -0.000133 | -| std | 0.0415 | -| value_loss | 7.79e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9993 | -| time_elapsed | 57677 | -| total_timesteps | 1279104 | -| train/ | | -| approx_kl | 2.507586e-06 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 1.51e-05 | -| n_updates | 99920 | -| policy_gradient_loss | 0.00655 | -| std | 0.0415 | -| value_loss | 2.94e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9994 | -| time_elapsed | 57684 | -| total_timesteps | 1279232 | -| train/ | | -| approx_kl | 0.110677555 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 99930 | -| policy_gradient_loss | -0.0177 | -| std | 0.0416 | -| value_loss | 0.000882 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9995 | -| time_elapsed | 57687 | -| total_timesteps | 1279360 | -| train/ | | -| approx_kl | 0.00063042063 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -104 | -| learning_rate | 0.0003 | -| loss | 0.0044 | -| n_updates | 99940 | -| policy_gradient_loss | -0.00388 | -| std | 0.0416 | -| value_loss | 4.35e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9996 | -| time_elapsed | 57691 | -| total_timesteps | 1279488 | -| train/ | | -| approx_kl | 5.6308694e-05 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -219 | -| learning_rate | 0.0003 | -| loss | -0.00017 | -| n_updates | 99950 | -| policy_gradient_loss | -0.00022 | -| std | 0.0417 | -| value_loss | 1.19e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9997 | -| time_elapsed | 57694 | -| total_timesteps | 1279616 | -| train/ | | -| approx_kl | 0.05688951 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -17.7 | -| learning_rate | 0.0003 | -| loss | -0.00726 | -| n_updates | 99960 | -| policy_gradient_loss | -0.00212 | -| std | 0.0418 | -| value_loss | 2.85e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9998 | -| time_elapsed | 57697 | -| total_timesteps | 1279744 | -| train/ | | -| approx_kl | 0.029462317 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -155 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 99970 | -| policy_gradient_loss | -0.00198 | -| std | 0.0418 | -| value_loss | 5.31e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 22 | -| iterations | 9999 | -| time_elapsed | 57700 | -| total_timesteps | 1279872 | -| train/ | | -| approx_kl | 0.0008500037 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.861 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 99980 | -| policy_gradient_loss | 0.00578 | -| std | 0.0419 | -| value_loss | 4.89e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10000 | -| time_elapsed | 57703 | -| total_timesteps | 1280000 | -| train/ | | -| approx_kl | 0.004658863 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 99990 | -| policy_gradient_loss | -0.0015 | -| std | 0.0417 | -| value_loss | 1.46e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10001 | -| time_elapsed | 57706 | -| total_timesteps | 1280128 | -| train/ | | -| approx_kl | 0.00980259 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.00196 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 100000 | -| policy_gradient_loss | 0.00597 | -| std | 0.0416 | -| value_loss | 8.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10002 | -| time_elapsed | 57715 | -| total_timesteps | 1280256 | -| train/ | | -| approx_kl | 0.026626877 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -2.49 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 100010 | -| policy_gradient_loss | -0.0107 | -| std | 0.0415 | -| value_loss | 0.00361 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10003 | -| time_elapsed | 57718 | -| total_timesteps | 1280384 | -| train/ | | -| approx_kl | 0.027435612 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -202 | -| learning_rate | 0.0003 | -| loss | -0.00772 | -| n_updates | 100020 | -| policy_gradient_loss | -0.00333 | -| std | 0.0415 | -| value_loss | 1.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10004 | -| time_elapsed | 57722 | -| total_timesteps | 1280512 | -| train/ | | -| approx_kl | 0.015579131 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -256 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 100030 | -| policy_gradient_loss | -0.00533 | -| std | 0.0415 | -| value_loss | 9.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10005 | -| time_elapsed | 57726 | -| total_timesteps | 1280640 | -| train/ | | -| approx_kl | 0.026435971 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -27.4 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 100040 | -| policy_gradient_loss | -0.00677 | -| std | 0.0416 | -| value_loss | 2.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10006 | -| time_elapsed | 57729 | -| total_timesteps | 1280768 | -| train/ | | -| approx_kl | 0.0050454335 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.849 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 100050 | -| policy_gradient_loss | -0.0159 | -| std | 0.0416 | -| value_loss | 4.92e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 22 | -| iterations | 10007 | -| time_elapsed | 57731 | -| total_timesteps | 1280896 | -| train/ | | -| approx_kl | 0.015435971 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.577 | -| learning_rate | 0.0003 | -| loss | -0.000757 | -| n_updates | 100060 | -| policy_gradient_loss | -0.00116 | -| std | 0.0416 | -| value_loss | 3.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10008 | -| time_elapsed | 57735 | -| total_timesteps | 1281024 | -| train/ | | -| approx_kl | 0.0046548815 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 100070 | -| policy_gradient_loss | 8.73e-05 | -| std | 0.0416 | -| value_loss | 4.71e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10009 | -| time_elapsed | 57741 | -| total_timesteps | 1281152 | -| train/ | | -| approx_kl | 0.0029021762 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | 0.867 | -| learning_rate | 0.0003 | -| loss | -0.000343 | -| n_updates | 100080 | -| policy_gradient_loss | 0.000601 | -| std | 0.0416 | -| value_loss | 0.00228 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10010 | -| time_elapsed | 57745 | -| total_timesteps | 1281280 | -| train/ | | -| approx_kl | 0.009530335 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -60.4 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 100090 | -| policy_gradient_loss | -0.00888 | -| std | 0.0415 | -| value_loss | 2.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10011 | -| time_elapsed | 57749 | -| total_timesteps | 1281408 | -| train/ | | -| approx_kl | 0.0040015806 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -72.6 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 100100 | -| policy_gradient_loss | -0.001 | -| std | 0.0416 | -| value_loss | 1.53e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10012 | -| time_elapsed | 57753 | -| total_timesteps | 1281536 | -| train/ | | -| approx_kl | 0.0020206734 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | -0.000873 | -| n_updates | 100110 | -| policy_gradient_loss | -0.000486 | -| std | 0.0417 | -| value_loss | 4.75e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10013 | -| time_elapsed | 57756 | -| total_timesteps | 1281664 | -| train/ | | -| approx_kl | 5.174428e-06 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | -0.000305 | -| n_updates | 100120 | -| policy_gradient_loss | 0.0051 | -| std | 0.0418 | -| value_loss | 2.92e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10014 | -| time_elapsed | 57758 | -| total_timesteps | 1281792 | -| train/ | | -| approx_kl | 0.013873152 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -0.00052 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 100130 | -| policy_gradient_loss | -0.0104 | -| std | 0.0418 | -| value_loss | 6.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 22 | -| iterations | 10015 | -| time_elapsed | 57762 | -| total_timesteps | 1281920 | -| train/ | | -| approx_kl | 0.015856225 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.0968 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 100140 | -| policy_gradient_loss | -0.00287 | -| std | 0.0419 | -| value_loss | 2.41e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10016 | -| time_elapsed | 57766 | -| total_timesteps | 1282048 | -| train/ | | -| approx_kl | 0.0055328137 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 100150 | -| policy_gradient_loss | -0.00916 | -| std | 0.0419 | -| value_loss | 3.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10017 | -| time_elapsed | 57773 | -| total_timesteps | 1282176 | -| train/ | | -| approx_kl | 0.015142065 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 100160 | -| policy_gradient_loss | -0.019 | -| std | 0.0419 | -| value_loss | 0.000306 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10018 | -| time_elapsed | 57776 | -| total_timesteps | 1282304 | -| train/ | | -| approx_kl | 0.0009391047 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -32.9 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 100170 | -| policy_gradient_loss | -0.000949 | -| std | 0.042 | -| value_loss | 4.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10019 | -| time_elapsed | 57778 | -| total_timesteps | 1282432 | -| train/ | | -| approx_kl | 0.013375724 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -24.8 | -| learning_rate | 0.0003 | -| loss | -0.00288 | -| n_updates | 100180 | -| policy_gradient_loss | -0.00202 | -| std | 0.042 | -| value_loss | 1.51e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10020 | -| time_elapsed | 57782 | -| total_timesteps | 1282560 | -| train/ | | -| approx_kl | 0.0029112282 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 100190 | -| policy_gradient_loss | 0.00142 | -| std | 0.0421 | -| value_loss | 6.17e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10021 | -| time_elapsed | 57785 | -| total_timesteps | 1282688 | -| train/ | | -| approx_kl | 0.0024933806 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 100200 | -| policy_gradient_loss | -0.0076 | -| std | 0.0421 | -| value_loss | 3.29e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10022 | -| time_elapsed | 57789 | -| total_timesteps | 1282816 | -| train/ | | -| approx_kl | 0.006118368 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.00538 | -| learning_rate | 0.0003 | -| loss | 0.00967 | -| n_updates | 100210 | -| policy_gradient_loss | 0.0102 | -| std | 0.0421 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10023 | -| time_elapsed | 57792 | -| total_timesteps | 1282944 | -| train/ | | -| approx_kl | 0.011501211 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 100220 | -| policy_gradient_loss | -0.0042 | -| std | 0.0421 | -| value_loss | 4.02e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10024 | -| time_elapsed | 57796 | -| total_timesteps | 1283072 | -| train/ | | -| approx_kl | 0.0012584347 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 100230 | -| policy_gradient_loss | -0.00394 | -| std | 0.0421 | -| value_loss | 7.35e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10025 | -| time_elapsed | 57802 | -| total_timesteps | 1283200 | -| train/ | | -| approx_kl | 0.06822224 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 100240 | -| policy_gradient_loss | -0.0152 | -| std | 0.042 | -| value_loss | 0.00033 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10026 | -| time_elapsed | 57805 | -| total_timesteps | 1283328 | -| train/ | | -| approx_kl | 0.27065095 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -476 | -| learning_rate | 0.0003 | -| loss | 0.00754 | -| n_updates | 100250 | -| policy_gradient_loss | 0.00105 | -| std | 0.0421 | -| value_loss | 4.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10027 | -| time_elapsed | 57809 | -| total_timesteps | 1283456 | -| train/ | | -| approx_kl | 0.016108455 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -224 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 100260 | -| policy_gradient_loss | -0.0129 | -| std | 0.0421 | -| value_loss | 1.23e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10028 | -| time_elapsed | 57813 | -| total_timesteps | 1283584 | -| train/ | | -| approx_kl | 0.0007917206 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.000339 | -| n_updates | 100270 | -| policy_gradient_loss | 0.00106 | -| std | 0.0421 | -| value_loss | 7.32e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10029 | -| time_elapsed | 57815 | -| total_timesteps | 1283712 | -| train/ | | -| approx_kl | 3.416883e-05 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.442 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 100280 | -| policy_gradient_loss | -0.00452 | -| std | 0.0421 | -| value_loss | 2.72e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10030 | -| time_elapsed | 57818 | -| total_timesteps | 1283840 | -| train/ | | -| approx_kl | 0.015159983 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.000433 | -| n_updates | 100290 | -| policy_gradient_loss | -0.00193 | -| std | 0.0421 | -| value_loss | 1.44e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10031 | -| time_elapsed | 57820 | -| total_timesteps | 1283968 | -| train/ | | -| approx_kl | 0.0036799922 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | 0.00482 | -| n_updates | 100300 | -| policy_gradient_loss | 0.00291 | -| std | 0.0421 | -| value_loss | 3.38e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10032 | -| time_elapsed | 57824 | -| total_timesteps | 1284096 | -| train/ | | -| approx_kl | 0.0008574361 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.00392 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 100310 | -| policy_gradient_loss | -0.00321 | -| std | 0.0421 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10033 | -| time_elapsed | 57830 | -| total_timesteps | 1284224 | -| train/ | | -| approx_kl | 0.0044884123 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 100320 | -| policy_gradient_loss | -0.0101 | -| std | 0.0421 | -| value_loss | 0.000295 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10034 | -| time_elapsed | 57834 | -| total_timesteps | 1284352 | -| train/ | | -| approx_kl | 0.014321268 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -8.86 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 100330 | -| policy_gradient_loss | -0.0112 | -| std | 0.042 | -| value_loss | 3.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10035 | -| time_elapsed | 57837 | -| total_timesteps | 1284480 | -| train/ | | -| approx_kl | 0.0021531521 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -205 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 100340 | -| policy_gradient_loss | -0.00705 | -| std | 0.042 | -| value_loss | 9.27e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10036 | -| time_elapsed | 57841 | -| total_timesteps | 1284608 | -| train/ | | -| approx_kl | 0.00044285832 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -90.1 | -| learning_rate | 0.0003 | -| loss | -0.00362 | -| n_updates | 100350 | -| policy_gradient_loss | -0.0102 | -| std | 0.042 | -| value_loss | 3.36e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10037 | -| time_elapsed | 57845 | -| total_timesteps | 1284736 | -| train/ | | -| approx_kl | 0.009034667 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 100360 | -| policy_gradient_loss | -0.0023 | -| std | 0.042 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10038 | -| time_elapsed | 57849 | -| total_timesteps | 1284864 | -| train/ | | -| approx_kl | 0.0016010185 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | -0.000147 | -| n_updates | 100370 | -| policy_gradient_loss | 0.00287 | -| std | 0.0419 | -| value_loss | 2.28e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 22 | -| iterations | 10039 | -| time_elapsed | 57852 | -| total_timesteps | 1284992 | -| train/ | | -| approx_kl | 0.017611435 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.00351 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 100380 | -| policy_gradient_loss | -0.0031 | -| std | 0.0419 | -| value_loss | 1.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10040 | -| time_elapsed | 57855 | -| total_timesteps | 1285120 | -| train/ | | -| approx_kl | 0.001211741 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | -0.91 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 100390 | -| policy_gradient_loss | -0.000377 | -| std | 0.0419 | -| value_loss | 3.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10041 | -| time_elapsed | 57865 | -| total_timesteps | 1285248 | -| train/ | | -| approx_kl | 0.023307001 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.75 | -| explained_variance | 0.248 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 100400 | -| policy_gradient_loss | -0.0137 | -| std | 0.0419 | -| value_loss | 0.00193 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10042 | -| time_elapsed | 57868 | -| total_timesteps | 1285376 | -| train/ | | -| approx_kl | 0.00013655936 | -| clip_fraction | 0.000781 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -63.3 | -| learning_rate | 0.0003 | -| loss | -0.000386 | -| n_updates | 100410 | -| policy_gradient_loss | -0.000168 | -| std | 0.0417 | -| value_loss | 2.31e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10043 | -| time_elapsed | 57871 | -| total_timesteps | 1285504 | -| train/ | | -| approx_kl | 0.019974604 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.76 | -| explained_variance | -62.8 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 100420 | -| policy_gradient_loss | -0.00132 | -| std | 0.0415 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10044 | -| time_elapsed | 57874 | -| total_timesteps | 1285632 | -| train/ | | -| approx_kl | 0.000709136 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 100430 | -| policy_gradient_loss | 0.00583 | -| std | 0.0414 | -| value_loss | 4.1e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10045 | -| time_elapsed | 57877 | -| total_timesteps | 1285760 | -| train/ | | -| approx_kl | 0.00033910666 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.00632 | -| learning_rate | 0.0003 | -| loss | -1.38e-05 | -| n_updates | 100440 | -| policy_gradient_loss | 1.27e-05 | -| std | 0.0413 | -| value_loss | 3.03e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10046 | -| time_elapsed | 57879 | -| total_timesteps | 1285888 | -| train/ | | -| approx_kl | 0.016692003 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | 0.00566 | -| learning_rate | 0.0003 | -| loss | -0.00916 | -| n_updates | 100450 | -| policy_gradient_loss | -0.00721 | -| std | 0.0413 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10047 | -| time_elapsed | 57882 | -| total_timesteps | 1286016 | -| train/ | | -| approx_kl | 0.014864897 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -43 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 100460 | -| policy_gradient_loss | -0.00321 | -| std | 0.0413 | -| value_loss | 4.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10048 | -| time_elapsed | 57891 | -| total_timesteps | 1286144 | -| train/ | | -| approx_kl | 0.004099089 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 100470 | -| policy_gradient_loss | -0.0132 | -| std | 0.0412 | -| value_loss | 0.000417 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10049 | -| time_elapsed | 57893 | -| total_timesteps | 1286272 | -| train/ | | -| approx_kl | 3.8007274e-06 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -1.43 | -| learning_rate | 0.0003 | -| loss | -5.31e-05 | -| n_updates | 100480 | -| policy_gradient_loss | 0.0003 | -| std | 0.0412 | -| value_loss | 2.1e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10050 | -| time_elapsed | 57895 | -| total_timesteps | 1286400 | -| train/ | | -| approx_kl | 0.10256588 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -71.2 | -| learning_rate | 0.0003 | -| loss | -0.00749 | -| n_updates | 100490 | -| policy_gradient_loss | -0.00381 | -| std | 0.0412 | -| value_loss | 7.55e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10051 | -| time_elapsed | 57898 | -| total_timesteps | 1286528 | -| train/ | | -| approx_kl | 0.002124899 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -18.8 | -| learning_rate | 0.0003 | -| loss | 0.00926 | -| n_updates | 100500 | -| policy_gradient_loss | -0.00717 | -| std | 0.0412 | -| value_loss | 1.05e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10052 | -| time_elapsed | 57901 | -| total_timesteps | 1286656 | -| train/ | | -| approx_kl | 0.0037421682 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -3.96 | -| learning_rate | 0.0003 | -| loss | 0.00242 | -| n_updates | 100510 | -| policy_gradient_loss | 0.00046 | -| std | 0.0412 | -| value_loss | 2.04e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10053 | -| time_elapsed | 57906 | -| total_timesteps | 1286784 | -| train/ | | -| approx_kl | 0.0005796654 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.461 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 100520 | -| policy_gradient_loss | -0.0021 | -| std | 0.0412 | -| value_loss | 2.18e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 22 | -| iterations | 10054 | -| time_elapsed | 57910 | -| total_timesteps | 1286912 | -| train/ | | -| approx_kl | 0.014529351 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 100530 | -| policy_gradient_loss | -0.00472 | -| std | 0.0412 | -| value_loss | 3.21e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10055 | -| time_elapsed | 57914 | -| total_timesteps | 1287040 | -| train/ | | -| approx_kl | 0.00078226486 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | -0.000412 | -| n_updates | 100540 | -| policy_gradient_loss | -0.000163 | -| std | 0.0412 | -| value_loss | 3.15e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10056 | -| time_elapsed | 57920 | -| total_timesteps | 1287168 | -| train/ | | -| approx_kl | 0.025101777 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 100550 | -| policy_gradient_loss | -0.0175 | -| std | 0.0412 | -| value_loss | 1.46e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10057 | -| time_elapsed | 57924 | -| total_timesteps | 1287296 | -| train/ | | -| approx_kl | 0.005794181 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -892 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 100560 | -| policy_gradient_loss | -0.00996 | -| std | 0.0412 | -| value_loss | 7.88e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10058 | -| time_elapsed | 57928 | -| total_timesteps | 1287424 | -| train/ | | -| approx_kl | 0.0020463509 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -987 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 100570 | -| policy_gradient_loss | -0.0077 | -| std | 0.0412 | -| value_loss | 5.37e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10059 | -| time_elapsed | 57931 | -| total_timesteps | 1287552 | -| train/ | | -| approx_kl | 0.025202472 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -25.8 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 100580 | -| policy_gradient_loss | -0.00596 | -| std | 0.0412 | -| value_loss | 9.4e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10060 | -| time_elapsed | 57934 | -| total_timesteps | 1287680 | -| train/ | | -| approx_kl | 0.0075999573 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -1.67 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 100590 | -| policy_gradient_loss | -0.00544 | -| std | 0.0411 | -| value_loss | 1.11e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10061 | -| time_elapsed | 57937 | -| total_timesteps | 1287808 | -| train/ | | -| approx_kl | 0.0015355395 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 100600 | -| policy_gradient_loss | -0.0189 | -| std | 0.041 | -| value_loss | 6.46e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10062 | -| time_elapsed | 57940 | -| total_timesteps | 1287936 | -| train/ | | -| approx_kl | 0.00051577436 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 100610 | -| policy_gradient_loss | -0.00184 | -| std | 0.041 | -| value_loss | 3.06e-10 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10063 | -| time_elapsed | 57943 | -| total_timesteps | 1288064 | -| train/ | | -| approx_kl | 0.00018133037 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 100620 | -| policy_gradient_loss | -0.000914 | -| std | 0.041 | -| value_loss | 3.59e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10064 | -| time_elapsed | 57947 | -| total_timesteps | 1288192 | -| train/ | | -| approx_kl | 0.025127709 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | 0.861 | -| learning_rate | 0.0003 | -| loss | -0.00886 | -| n_updates | 100630 | -| policy_gradient_loss | -0.00718 | -| std | 0.0409 | -| value_loss | 0.00259 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10065 | -| time_elapsed | 57949 | -| total_timesteps | 1288320 | -| train/ | | -| approx_kl | 0.0057525435 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -85.3 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 100640 | -| policy_gradient_loss | -0.00886 | -| std | 0.0409 | -| value_loss | 1.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10066 | -| time_elapsed | 57951 | -| total_timesteps | 1288448 | -| train/ | | -| approx_kl | 0.031388175 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -91.9 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 100650 | -| policy_gradient_loss | -0.00518 | -| std | 0.0409 | -| value_loss | 7.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10067 | -| time_elapsed | 57953 | -| total_timesteps | 1288576 | -| train/ | | -| approx_kl | 0.09554474 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -57.6 | -| learning_rate | 0.0003 | -| loss | -0.00908 | -| n_updates | 100660 | -| policy_gradient_loss | -0.00583 | -| std | 0.0408 | -| value_loss | 6.15e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10068 | -| time_elapsed | 57955 | -| total_timesteps | 1288704 | -| train/ | | -| approx_kl | 0.00050420454 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -6.54 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 100670 | -| policy_gradient_loss | -0.0054 | -| std | 0.0408 | -| value_loss | 1.76e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10069 | -| time_elapsed | 57957 | -| total_timesteps | 1288832 | -| train/ | | -| approx_kl | 3.059907e-05 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.000226 | -| n_updates | 100680 | -| policy_gradient_loss | -9.81e-05 | -| std | 0.0409 | -| value_loss | 3.67e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 22 | -| iterations | 10070 | -| time_elapsed | 57959 | -| total_timesteps | 1288960 | -| train/ | | -| approx_kl | 0.000409937 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 100690 | -| policy_gradient_loss | 0.00317 | -| std | 0.041 | -| value_loss | 1.64e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10071 | -| time_elapsed | 57961 | -| total_timesteps | 1289088 | -| train/ | | -| approx_kl | 0.0018600053 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.77 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.00475 | -| n_updates | 100700 | -| policy_gradient_loss | 0.00146 | -| std | 0.041 | -| value_loss | 4.25e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10072 | -| time_elapsed | 57968 | -| total_timesteps | 1289216 | -| train/ | | -| approx_kl | 0.14283666 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 100710 | -| policy_gradient_loss | -0.0122 | -| std | 0.041 | -| value_loss | 6.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10073 | -| time_elapsed | 57972 | -| total_timesteps | 1289344 | -| train/ | | -| approx_kl | 0.004997073 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.63 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 100720 | -| policy_gradient_loss | -0.0018 | -| std | 0.041 | -| value_loss | 2.43e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10074 | -| time_elapsed | 57974 | -| total_timesteps | 1289472 | -| train/ | | -| approx_kl | 0.0036091753 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.812 | -| learning_rate | 0.0003 | -| loss | -0.007 | -| n_updates | 100730 | -| policy_gradient_loss | -0.00234 | -| std | 0.0409 | -| value_loss | 3.54e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10075 | -| time_elapsed | 57978 | -| total_timesteps | 1289600 | -| train/ | | -| approx_kl | 0.005498642 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 100740 | -| policy_gradient_loss | -0.000727 | -| std | 0.0409 | -| value_loss | 5.08e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10076 | -| time_elapsed | 57981 | -| total_timesteps | 1289728 | -| train/ | | -| approx_kl | 0.004832476 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | 0.0077 | -| n_updates | 100750 | -| policy_gradient_loss | 0.00293 | -| std | 0.0409 | -| value_loss | 6.22e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10077 | -| time_elapsed | 57983 | -| total_timesteps | 1289856 | -| train/ | | -| approx_kl | 0.00070818886 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 100760 | -| policy_gradient_loss | -0.0067 | -| std | 0.0409 | -| value_loss | 2.71e-11 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10078 | -| time_elapsed | 57986 | -| total_timesteps | 1289984 | -| train/ | | -| approx_kl | 0.0017373986 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 100770 | -| policy_gradient_loss | -0.0019 | -| std | 0.0409 | -| value_loss | 1.57e-11 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10079 | -| time_elapsed | 57990 | -| total_timesteps | 1290112 | -| train/ | | -| approx_kl | 0.00018470548 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 7.72e-05 | -| n_updates | 100780 | -| policy_gradient_loss | 0.00117 | -| std | 0.0409 | -| value_loss | 2.78e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10080 | -| time_elapsed | 57998 | -| total_timesteps | 1290240 | -| train/ | | -| approx_kl | 0.008627145 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 100790 | -| policy_gradient_loss | -0.0154 | -| std | 0.0409 | -| value_loss | 6.58e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10081 | -| time_elapsed | 58001 | -| total_timesteps | 1290368 | -| train/ | | -| approx_kl | 8.6962245e-05 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -280 | -| learning_rate | 0.0003 | -| loss | 1.36e-05 | -| n_updates | 100800 | -| policy_gradient_loss | 0.00265 | -| std | 0.0409 | -| value_loss | 1.42e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10082 | -| time_elapsed | 58005 | -| total_timesteps | 1290496 | -| train/ | | -| approx_kl | 0.00023314543 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -439 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 100810 | -| policy_gradient_loss | -0.00614 | -| std | 0.0408 | -| value_loss | 8.24e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10083 | -| time_elapsed | 58008 | -| total_timesteps | 1290624 | -| train/ | | -| approx_kl | 0.019679653 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -24 | -| learning_rate | 0.0003 | -| loss | -0.00377 | -| n_updates | 100820 | -| policy_gradient_loss | -0.00331 | -| std | 0.0408 | -| value_loss | 7.69e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10084 | -| time_elapsed | 58011 | -| total_timesteps | 1290752 | -| train/ | | -| approx_kl | 6.0437713e-05 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 1.78 | -| explained_variance | -29.3 | -| learning_rate | 0.0003 | -| loss | -0.000537 | -| n_updates | 100830 | -| policy_gradient_loss | 0.00179 | -| std | 0.0406 | -| value_loss | 1.26e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 22 | -| iterations | 10085 | -| time_elapsed | 58014 | -| total_timesteps | 1290880 | -| train/ | | -| approx_kl | 0.00028298376 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.702 | -| learning_rate | 0.0003 | -| loss | 0.00345 | -| n_updates | 100840 | -| policy_gradient_loss | -0.00224 | -| std | 0.0406 | -| value_loss | 1.01e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10086 | -| time_elapsed | 58016 | -| total_timesteps | 1291008 | -| train/ | | -| approx_kl | 0.0005572657 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.000227 | -| n_updates | 100850 | -| policy_gradient_loss | -8.85e-05 | -| std | 0.0404 | -| value_loss | 2e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10087 | -| time_elapsed | 58022 | -| total_timesteps | 1291136 | -| train/ | | -| approx_kl | 0.023847118 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | 0.951 | -| learning_rate | 0.0003 | -| loss | -0.00374 | -| n_updates | 100860 | -| policy_gradient_loss | -0.00308 | -| std | 0.0402 | -| value_loss | 0.000619 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10088 | -| time_elapsed | 58025 | -| total_timesteps | 1291264 | -| train/ | | -| approx_kl | 0.00023134518 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | 0.283 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 100870 | -| policy_gradient_loss | -0.0153 | -| std | 0.0401 | -| value_loss | 1.12e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10089 | -| time_elapsed | 58028 | -| total_timesteps | 1291392 | -| train/ | | -| approx_kl | 0.0046265353 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -1.58e+04 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 100880 | -| policy_gradient_loss | -0.0112 | -| std | 0.04 | -| value_loss | 5.53e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10090 | -| time_elapsed | 58031 | -| total_timesteps | 1291520 | -| train/ | | -| approx_kl | 0.10765526 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -165 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 100890 | -| policy_gradient_loss | 3.42e-05 | -| std | 0.04 | -| value_loss | 1.19e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10091 | -| time_elapsed | 58035 | -| total_timesteps | 1291648 | -| train/ | | -| approx_kl | 0.07524778 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -51.4 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 100900 | -| policy_gradient_loss | -0.00087 | -| std | 0.04 | -| value_loss | 7.16e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10092 | -| time_elapsed | 58038 | -| total_timesteps | 1291776 | -| train/ | | -| approx_kl | 8.284114e-05 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -18.2 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 100910 | -| policy_gradient_loss | -0.00773 | -| std | 0.04 | -| value_loss | 2.6e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10093 | -| time_elapsed | 58042 | -| total_timesteps | 1291904 | -| train/ | | -| approx_kl | 0.02070878 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.847 | -| learning_rate | 0.0003 | -| loss | 0.000532 | -| n_updates | 100920 | -| policy_gradient_loss | -0.000734 | -| std | 0.0401 | -| value_loss | 8.2e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10094 | -| time_elapsed | 58044 | -| total_timesteps | 1292032 | -| train/ | | -| approx_kl | 0.0017094822 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.0023 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 100930 | -| policy_gradient_loss | -0.00496 | -| std | 0.0401 | -| value_loss | 1.63e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10095 | -| time_elapsed | 58052 | -| total_timesteps | 1292160 | -| train/ | | -| approx_kl | 0.0092511885 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 100940 | -| policy_gradient_loss | -0.0144 | -| std | 0.0401 | -| value_loss | 0.000711 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10096 | -| time_elapsed | 58056 | -| total_timesteps | 1292288 | -| train/ | | -| approx_kl | 0.0026331851 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -86.9 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 100950 | -| policy_gradient_loss | -0.015 | -| std | 0.0402 | -| value_loss | 1.63e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10097 | -| time_elapsed | 58059 | -| total_timesteps | 1292416 | -| train/ | | -| approx_kl | 0.0007368331 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -946 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 100960 | -| policy_gradient_loss | -0.0018 | -| std | 0.0401 | -| value_loss | 1.14e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10098 | -| time_elapsed | 58063 | -| total_timesteps | 1292544 | -| train/ | | -| approx_kl | 0.03127025 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -88.3 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 100970 | -| policy_gradient_loss | -0.00767 | -| std | 0.0401 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10099 | -| time_elapsed | 58066 | -| total_timesteps | 1292672 | -| train/ | | -| approx_kl | 0.0054729036 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -15.3 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 100980 | -| policy_gradient_loss | -0.00173 | -| std | 0.0401 | -| value_loss | 1.24e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10100 | -| time_elapsed | 58069 | -| total_timesteps | 1292800 | -| train/ | | -| approx_kl | 0.005935139 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 100990 | -| policy_gradient_loss | -0.00274 | -| std | 0.04 | -| value_loss | 8.56e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 22 | -| iterations | 10101 | -| time_elapsed | 58072 | -| total_timesteps | 1292928 | -| train/ | | -| approx_kl | 0.001726679 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.489 | -| learning_rate | 0.0003 | -| loss | 0.000212 | -| n_updates | 101000 | -| policy_gradient_loss | 0.000575 | -| std | 0.04 | -| value_loss | 3.57e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10102 | -| time_elapsed | 58076 | -| total_timesteps | 1293056 | -| train/ | | -| approx_kl | 0.0017799293 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 101010 | -| policy_gradient_loss | 0.00209 | -| std | 0.0401 | -| value_loss | 7.97e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10103 | -| time_elapsed | 58081 | -| total_timesteps | 1293184 | -| train/ | | -| approx_kl | 0.021609904 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 101020 | -| policy_gradient_loss | -0.0133 | -| std | 0.0401 | -| value_loss | 0.000667 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10104 | -| time_elapsed | 58083 | -| total_timesteps | 1293312 | -| train/ | | -| approx_kl | 0.03773503 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -244 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 101030 | -| policy_gradient_loss | -0.000634 | -| std | 0.0401 | -| value_loss | 4.15e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10105 | -| time_elapsed | 58086 | -| total_timesteps | 1293440 | -| train/ | | -| approx_kl | 9.74494e-05 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -36 | -| learning_rate | 0.0003 | -| loss | -0.00023 | -| n_updates | 101040 | -| policy_gradient_loss | 0.000262 | -| std | 0.0402 | -| value_loss | 0.000163 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10106 | -| time_elapsed | 58088 | -| total_timesteps | 1293568 | -| train/ | | -| approx_kl | 0.0010655769 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.496 | -| learning_rate | 0.0003 | -| loss | -0.000466 | -| n_updates | 101050 | -| policy_gradient_loss | 0.00487 | -| std | 0.0402 | -| value_loss | 0.000741 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10107 | -| time_elapsed | 58091 | -| total_timesteps | 1293696 | -| train/ | | -| approx_kl | 0.010479951 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 101060 | -| policy_gradient_loss | -0.00153 | -| std | 0.0402 | -| value_loss | 2.42e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10108 | -| time_elapsed | 58094 | -| total_timesteps | 1293824 | -| train/ | | -| approx_kl | 0.016541362 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | 0.00448 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 101070 | -| policy_gradient_loss | -0.00822 | -| std | 0.0402 | -| value_loss | 1.68e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 22 | -| iterations | 10109 | -| time_elapsed | 58098 | -| total_timesteps | 1293952 | -| train/ | | -| approx_kl | 0.0010113181 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 101080 | -| policy_gradient_loss | -0.00664 | -| std | 0.0402 | -| value_loss | 6.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10110 | -| time_elapsed | 58102 | -| total_timesteps | 1294080 | -| train/ | | -| approx_kl | 7.773563e-05 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.000318 | -| n_updates | 101090 | -| policy_gradient_loss | -0.000389 | -| std | 0.0402 | -| value_loss | 5.8e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10111 | -| time_elapsed | 58110 | -| total_timesteps | 1294208 | -| train/ | | -| approx_kl | 0.016137201 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 101100 | -| policy_gradient_loss | -0.0133 | -| std | 0.0402 | -| value_loss | 0.000377 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10112 | -| time_elapsed | 58113 | -| total_timesteps | 1294336 | -| train/ | | -| approx_kl | 6.4544845e-05 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | 0.000282 | -| n_updates | 101110 | -| policy_gradient_loss | 0.00608 | -| std | 0.0402 | -| value_loss | 6.96e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10113 | -| time_elapsed | 58117 | -| total_timesteps | 1294464 | -| train/ | | -| approx_kl | 0.0071685533 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -3.98 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 101120 | -| policy_gradient_loss | -0.00315 | -| std | 0.0402 | -| value_loss | 2.31e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10114 | -| time_elapsed | 58122 | -| total_timesteps | 1294592 | -| train/ | | -| approx_kl | 0.0073356573 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.00444 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 101130 | -| policy_gradient_loss | -0.000672 | -| std | 0.0401 | -| value_loss | 3.58e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10115 | -| time_elapsed | 58125 | -| total_timesteps | 1294720 | -| train/ | | -| approx_kl | 0.011931579 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.412 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 101140 | -| policy_gradient_loss | 0.000248 | -| std | 0.0402 | -| value_loss | 2.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10116 | -| time_elapsed | 58129 | -| total_timesteps | 1294848 | -| train/ | | -| approx_kl | 0.004534351 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 101150 | -| policy_gradient_loss | 0.00188 | -| std | 0.0402 | -| value_loss | 5.02e-06 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10117 | -| time_elapsed | 58131 | -| total_timesteps | 1294976 | -| train/ | | -| approx_kl | 0.000102848746 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.336 | -| learning_rate | 0.0003 | -| loss | -0.000898 | -| n_updates | 101160 | -| policy_gradient_loss | -0.000256 | -| std | 0.0401 | -| value_loss | 3.68e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10118 | -| time_elapsed | 58134 | -| total_timesteps | 1295104 | -| train/ | | -| approx_kl | 0.030826794 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 101170 | -| policy_gradient_loss | 0.00304 | -| std | 0.0402 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10119 | -| time_elapsed | 58142 | -| total_timesteps | 1295232 | -| train/ | | -| approx_kl | 0.052271076 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 101180 | -| policy_gradient_loss | -0.0146 | -| std | 0.0403 | -| value_loss | 0.000263 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10120 | -| time_elapsed | 58145 | -| total_timesteps | 1295360 | -| train/ | | -| approx_kl | 0.0014206674 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -26.3 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 101190 | -| policy_gradient_loss | -0.01 | -| std | 0.0403 | -| value_loss | 4.4e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10121 | -| time_elapsed | 58148 | -| total_timesteps | 1295488 | -| train/ | | -| approx_kl | 0.0051102918 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -84.6 | -| learning_rate | 0.0003 | -| loss | -0.00773 | -| n_updates | 101200 | -| policy_gradient_loss | -0.00673 | -| std | 0.0404 | -| value_loss | 2.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10122 | -| time_elapsed | 58151 | -| total_timesteps | 1295616 | -| train/ | | -| approx_kl | 0.014749839 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -19.7 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 101210 | -| policy_gradient_loss | -0.0092 | -| std | 0.0404 | -| value_loss | 3.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10123 | -| time_elapsed | 58154 | -| total_timesteps | 1295744 | -| train/ | | -| approx_kl | 0.061604887 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -4.26 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 101220 | -| policy_gradient_loss | -0.00409 | -| std | 0.0403 | -| value_loss | 9.04e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10124 | -| time_elapsed | 58158 | -| total_timesteps | 1295872 | -| train/ | | -| approx_kl | 0.06996262 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.000843 | -| n_updates | 101230 | -| policy_gradient_loss | 0.000501 | -| std | 0.0404 | -| value_loss | 2.5e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10125 | -| time_elapsed | 58161 | -| total_timesteps | 1296000 | -| train/ | | -| approx_kl | 0.008475806 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 1.79 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 101240 | -| policy_gradient_loss | 0.000451 | -| std | 0.0403 | -| value_loss | 2.32e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10126 | -| time_elapsed | 58163 | -| total_timesteps | 1296128 | -| train/ | | -| approx_kl | 0.00038803834 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | 0.00208 | -| learning_rate | 0.0003 | -| loss | -0.000333 | -| n_updates | 101250 | -| policy_gradient_loss | 0.000665 | -| std | 0.0401 | -| value_loss | 3.23e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10127 | -| time_elapsed | 58171 | -| total_timesteps | 1296256 | -| train/ | | -| approx_kl | 0.004325999 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 101260 | -| policy_gradient_loss | -0.00694 | -| std | 0.04 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10128 | -| time_elapsed | 58176 | -| total_timesteps | 1296384 | -| train/ | | -| approx_kl | 0.012703653 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -2.05 | -| learning_rate | 0.0003 | -| loss | 0.000316 | -| n_updates | 101270 | -| policy_gradient_loss | -0.000813 | -| std | 0.0399 | -| value_loss | 3.74e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10129 | -| time_elapsed | 58180 | -| total_timesteps | 1296512 | -| train/ | | -| approx_kl | 5.2056275e-06 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.000162 | -| n_updates | 101280 | -| policy_gradient_loss | 0.00453 | -| std | 0.0399 | -| value_loss | 3.11e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10130 | -| time_elapsed | 58183 | -| total_timesteps | 1296640 | -| train/ | | -| approx_kl | 2.7627684e-05 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.000498 | -| n_updates | 101290 | -| policy_gradient_loss | -0.000809 | -| std | 0.0399 | -| value_loss | 2.36e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10131 | -| time_elapsed | 58187 | -| total_timesteps | 1296768 | -| train/ | | -| approx_kl | 0.0030788989 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | 0.00108 | -| n_updates | 101300 | -| policy_gradient_loss | 0.0016 | -| std | 0.0399 | -| value_loss | 7.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10132 | -| time_elapsed | 58189 | -| total_timesteps | 1296896 | -| train/ | | -| approx_kl | 0.006983259 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 101310 | -| policy_gradient_loss | 0.00314 | -| std | 0.0399 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10133 | -| time_elapsed | 58192 | -| total_timesteps | 1297024 | -| train/ | | -| approx_kl | 0.0014292006 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.315 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 101320 | -| policy_gradient_loss | 0.00123 | -| std | 0.0399 | -| value_loss | 1.21e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10134 | -| time_elapsed | 58198 | -| total_timesteps | 1297152 | -| train/ | | -| approx_kl | 0.09599692 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.758 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 101330 | -| policy_gradient_loss | -0.0121 | -| std | 0.0399 | -| value_loss | 0.00272 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10135 | -| time_elapsed | 58202 | -| total_timesteps | 1297280 | -| train/ | | -| approx_kl | 0.0020239581 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -2.5 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 101340 | -| policy_gradient_loss | -0.00159 | -| std | 0.0399 | -| value_loss | 0.000195 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10136 | -| time_elapsed | 58205 | -| total_timesteps | 1297408 | -| train/ | | -| approx_kl | 0.013327349 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 1.8 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.00312 | -| n_updates | 101350 | -| policy_gradient_loss | -0.000197 | -| std | 0.0398 | -| value_loss | 0.000849 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10137 | -| time_elapsed | 58209 | -| total_timesteps | 1297536 | -| train/ | | -| approx_kl | 0.0029590214 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 1.81 | -| explained_variance | -0.0988 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 101360 | -| policy_gradient_loss | -0.000247 | -| std | 0.0396 | -| value_loss | 0.000163 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10138 | -| time_elapsed | 58212 | -| total_timesteps | 1297664 | -| train/ | | -| approx_kl | 0.024071552 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 1.81 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.0066 | -| n_updates | 101370 | -| policy_gradient_loss | -0.00697 | -| std | 0.0395 | -| value_loss | 0.000253 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10139 | -| time_elapsed | 58214 | -| total_timesteps | 1297792 | -| train/ | | -| approx_kl | 0.001510019 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 1.82 | -| explained_variance | -34.8 | -| learning_rate | 0.0003 | -| loss | -0.000932 | -| n_updates | 101380 | -| policy_gradient_loss | -0.000395 | -| std | 0.0392 | -| value_loss | 6.2e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10140 | -| time_elapsed | 58218 | -| total_timesteps | 1297920 | -| train/ | | -| approx_kl | 0.0037801121 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.82 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | -0.00947 | -| n_updates | 101390 | -| policy_gradient_loss | -0.00548 | -| std | 0.0391 | -| value_loss | 5.23e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10141 | -| time_elapsed | 58221 | -| total_timesteps | 1298048 | -| train/ | | -| approx_kl | 0.016114792 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.82 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 101400 | -| policy_gradient_loss | -0.00136 | -| std | 0.039 | -| value_loss | 4.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10142 | -| time_elapsed | 58228 | -| total_timesteps | 1298176 | -| train/ | | -| approx_kl | 0.013927495 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 101410 | -| policy_gradient_loss | -0.0139 | -| std | 0.039 | -| value_loss | 0.000104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10143 | -| time_elapsed | 58231 | -| total_timesteps | 1298304 | -| train/ | | -| approx_kl | 0.000969497 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | 0.000894 | -| n_updates | 101420 | -| policy_gradient_loss | 0.00191 | -| std | 0.039 | -| value_loss | 6.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10144 | -| time_elapsed | 58234 | -| total_timesteps | 1298432 | -| train/ | | -| approx_kl | 0.0002214848 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -2.38 | -| learning_rate | 0.0003 | -| loss | -0.000416 | -| n_updates | 101430 | -| policy_gradient_loss | 0.000591 | -| std | 0.039 | -| value_loss | 8.6e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10145 | -| time_elapsed | 58237 | -| total_timesteps | 1298560 | -| train/ | | -| approx_kl | 0.008171428 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.09 | -| learning_rate | 0.0003 | -| loss | 0.00996 | -| n_updates | 101440 | -| policy_gradient_loss | 0.0082 | -| std | 0.039 | -| value_loss | 7.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10146 | -| time_elapsed | 58239 | -| total_timesteps | 1298688 | -| train/ | | -| approx_kl | 0.0046577794 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.00293 | -| n_updates | 101450 | -| policy_gradient_loss | 0.00617 | -| std | 0.039 | -| value_loss | 5.86e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10147 | -| time_elapsed | 58243 | -| total_timesteps | 1298816 | -| train/ | | -| approx_kl | 0.0017178068 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0691 | -| learning_rate | 0.0003 | -| loss | 0.00499 | -| n_updates | 101460 | -| policy_gradient_loss | 0.00111 | -| std | 0.039 | -| value_loss | 5.59e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10148 | -| time_elapsed | 58245 | -| total_timesteps | 1298944 | -| train/ | | -| approx_kl | 0.0059956377 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 101470 | -| policy_gradient_loss | -0.00113 | -| std | 0.039 | -| value_loss | 1.87e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10149 | -| time_elapsed | 58249 | -| total_timesteps | 1299072 | -| train/ | | -| approx_kl | 0.0061898483 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.000204 | -| n_updates | 101480 | -| policy_gradient_loss | 0.00013 | -| std | 0.0388 | -| value_loss | 2.08e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10150 | -| time_elapsed | 58255 | -| total_timesteps | 1299200 | -| train/ | | -| approx_kl | 0.04690655 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 101490 | -| policy_gradient_loss | -0.0131 | -| std | 0.0388 | -| value_loss | 0.00247 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10151 | -| time_elapsed | 58259 | -| total_timesteps | 1299328 | -| train/ | | -| approx_kl | 0.01648213 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -223 | -| learning_rate | 0.0003 | -| loss | -0.0074 | -| n_updates | 101500 | -| policy_gradient_loss | -0.00564 | -| std | 0.0387 | -| value_loss | 3.49e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10152 | -| time_elapsed | 58263 | -| total_timesteps | 1299456 | -| train/ | | -| approx_kl | 0.00032963278 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -83.5 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 101510 | -| policy_gradient_loss | -0.00681 | -| std | 0.0387 | -| value_loss | 9.29e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10153 | -| time_elapsed | 58266 | -| total_timesteps | 1299584 | -| train/ | | -| approx_kl | 0.00025329972 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -7.8 | -| learning_rate | 0.0003 | -| loss | 0.000974 | -| n_updates | 101520 | -| policy_gradient_loss | -0.000159 | -| std | 0.0387 | -| value_loss | 1.06e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10154 | -| time_elapsed | 58270 | -| total_timesteps | 1299712 | -| train/ | | -| approx_kl | 9.7780954e-05 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.000737 | -| n_updates | 101530 | -| policy_gradient_loss | -0.00112 | -| std | 0.0387 | -| value_loss | 3.21e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10155 | -| time_elapsed | 58273 | -| total_timesteps | 1299840 | -| train/ | | -| approx_kl | 0.004385224 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 101540 | -| policy_gradient_loss | -0.00455 | -| std | 0.0386 | -| value_loss | 2.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10156 | -| time_elapsed | 58278 | -| total_timesteps | 1299968 | -| train/ | | -| approx_kl | 0.009025819 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.00192 | -| learning_rate | 0.0003 | -| loss | 0.0002 | -| n_updates | 101550 | -| policy_gradient_loss | 0.000467 | -| std | 0.0387 | -| value_loss | 5.55e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10157 | -| time_elapsed | 58282 | -| total_timesteps | 1300096 | -| train/ | | -| approx_kl | 4.9695373e-06 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | 0.000858 | -| learning_rate | 0.0003 | -| loss | -0.00019 | -| n_updates | 101560 | -| policy_gradient_loss | 0.000891 | -| std | 0.0387 | -| value_loss | 4.88e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10158 | -| time_elapsed | 58291 | -| total_timesteps | 1300224 | -| train/ | | -| approx_kl | 0.016793542 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 101570 | -| policy_gradient_loss | -0.0121 | -| std | 0.0387 | -| value_loss | 0.000945 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10159 | -| time_elapsed | 58294 | -| total_timesteps | 1300352 | -| train/ | | -| approx_kl | 0.017950485 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | -6.44e-05 | -| n_updates | 101580 | -| policy_gradient_loss | 0.00442 | -| std | 0.0387 | -| value_loss | 5.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10160 | -| time_elapsed | 58298 | -| total_timesteps | 1300480 | -| train/ | | -| approx_kl | 0.014341613 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -1.94 | -| learning_rate | 0.0003 | -| loss | -0.00813 | -| n_updates | 101590 | -| policy_gradient_loss | 0.000651 | -| std | 0.0387 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10161 | -| time_elapsed | 58302 | -| total_timesteps | 1300608 | -| train/ | | -| approx_kl | 0.0088651655 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | -0.000442 | -| n_updates | 101600 | -| policy_gradient_loss | 0.00438 | -| std | 0.0388 | -| value_loss | 1.73e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10162 | -| time_elapsed | 58306 | -| total_timesteps | 1300736 | -| train/ | | -| approx_kl | 0.009335998 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.268 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 101610 | -| policy_gradient_loss | 0.00188 | -| std | 0.0388 | -| value_loss | 2.97e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10163 | -| time_elapsed | 58310 | -| total_timesteps | 1300864 | -| train/ | | -| approx_kl | 6.010756e-05 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0604 | -| learning_rate | 0.0003 | -| loss | -0.000863 | -| n_updates | 101620 | -| policy_gradient_loss | 0.000876 | -| std | 0.0388 | -| value_loss | 1.84e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10164 | -| time_elapsed | 58313 | -| total_timesteps | 1300992 | -| train/ | | -| approx_kl | 0.00050022453 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 101630 | -| policy_gradient_loss | -0.000342 | -| std | 0.0388 | -| value_loss | 1.16e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10165 | -| time_elapsed | 58317 | -| total_timesteps | 1301120 | -| train/ | | -| approx_kl | 0.0021875305 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 101640 | -| policy_gradient_loss | -0.00227 | -| std | 0.0388 | -| value_loss | 8.1e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10166 | -| time_elapsed | 58324 | -| total_timesteps | 1301248 | -| train/ | | -| approx_kl | 0.04516148 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 101650 | -| policy_gradient_loss | -0.0124 | -| std | 0.0388 | -| value_loss | 0.00236 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10167 | -| time_elapsed | 58327 | -| total_timesteps | 1301376 | -| train/ | | -| approx_kl | 0.003628688 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | -0.00682 | -| n_updates | 101660 | -| policy_gradient_loss | -0.00598 | -| std | 0.0388 | -| value_loss | 2.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10168 | -| time_elapsed | 58330 | -| total_timesteps | 1301504 | -| train/ | | -| approx_kl | 0.04276205 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -416 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 101670 | -| policy_gradient_loss | -0.00514 | -| std | 0.0388 | -| value_loss | 7.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10169 | -| time_elapsed | 58333 | -| total_timesteps | 1301632 | -| train/ | | -| approx_kl | 0.017906561 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -54.4 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 101680 | -| policy_gradient_loss | -0.00415 | -| std | 0.0388 | -| value_loss | 2.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10170 | -| time_elapsed | 58336 | -| total_timesteps | 1301760 | -| train/ | | -| approx_kl | 0.32931066 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -55.2 | -| learning_rate | 0.0003 | -| loss | 0.00596 | -| n_updates | 101690 | -| policy_gradient_loss | -0.000412 | -| std | 0.0388 | -| value_loss | 6.9e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10171 | -| time_elapsed | 58339 | -| total_timesteps | 1301888 | -| train/ | | -| approx_kl | 0.013154875 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -2.99 | -| learning_rate | 0.0003 | -| loss | -0.00994 | -| n_updates | 101700 | -| policy_gradient_loss | -0.00737 | -| std | 0.0388 | -| value_loss | 3.4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10172 | -| time_elapsed | 58342 | -| total_timesteps | 1302016 | -| train/ | | -| approx_kl | 0.014980279 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | -1.5e-05 | -| n_updates | 101710 | -| policy_gradient_loss | -0.000978 | -| std | 0.0389 | -| value_loss | 2.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10173 | -| time_elapsed | 58350 | -| total_timesteps | 1302144 | -| train/ | | -| approx_kl | 0.014065225 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 101720 | -| policy_gradient_loss | -0.0172 | -| std | 0.0389 | -| value_loss | 0.000124 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10174 | -| time_elapsed | 58353 | -| total_timesteps | 1302272 | -| train/ | | -| approx_kl | 0.00018198742 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -23.2 | -| learning_rate | 0.0003 | -| loss | -0.00063 | -| n_updates | 101730 | -| policy_gradient_loss | -0.00106 | -| std | 0.0388 | -| value_loss | 1.38e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10175 | -| time_elapsed | 58355 | -| total_timesteps | 1302400 | -| train/ | | -| approx_kl | 0.011521382 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -27.2 | -| learning_rate | 0.0003 | -| loss | -0.00594 | -| n_updates | 101740 | -| policy_gradient_loss | -0.00438 | -| std | 0.0387 | -| value_loss | 7.39e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10176 | -| time_elapsed | 58357 | -| total_timesteps | 1302528 | -| train/ | | -| approx_kl | 2.9951334e-06 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.000176 | -| n_updates | 101750 | -| policy_gradient_loss | -0.0051 | -| std | 0.0387 | -| value_loss | 5.45e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10177 | -| time_elapsed | 58360 | -| total_timesteps | 1302656 | -| train/ | | -| approx_kl | 0.004091938 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | -0.00646 | -| n_updates | 101760 | -| policy_gradient_loss | 0.011 | -| std | 0.0386 | -| value_loss | 9.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10178 | -| time_elapsed | 58363 | -| total_timesteps | 1302784 | -| train/ | | -| approx_kl | 0.008649163 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.00678 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 101770 | -| policy_gradient_loss | 0.000389 | -| std | 0.0387 | -| value_loss | 5.89e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10179 | -| time_elapsed | 58365 | -| total_timesteps | 1302912 | -| train/ | | -| approx_kl | 0.0049746116 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.00403 | -| n_updates | 101780 | -| policy_gradient_loss | 0.00498 | -| std | 0.0386 | -| value_loss | 6.41e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10180 | -| time_elapsed | 58368 | -| total_timesteps | 1303040 | -| train/ | | -| approx_kl | 0.025393339 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -0.00395 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 101790 | -| policy_gradient_loss | -0.0182 | -| std | 0.0386 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10181 | -| time_elapsed | 58375 | -| total_timesteps | 1303168 | -| train/ | | -| approx_kl | 0.003377303 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 101800 | -| policy_gradient_loss | -0.0146 | -| std | 0.0386 | -| value_loss | 0.000185 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10182 | -| time_elapsed | 58377 | -| total_timesteps | 1303296 | -| train/ | | -| approx_kl | 0.008693969 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 101810 | -| policy_gradient_loss | -0.000593 | -| std | 0.0386 | -| value_loss | 7.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10183 | -| time_elapsed | 58379 | -| total_timesteps | 1303424 | -| train/ | | -| approx_kl | 0.002650355 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -30.4 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 101820 | -| policy_gradient_loss | -0.00998 | -| std | 0.0386 | -| value_loss | 1.05e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10184 | -| time_elapsed | 58383 | -| total_timesteps | 1303552 | -| train/ | | -| approx_kl | 0.00016512442 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -44.8 | -| learning_rate | 0.0003 | -| loss | 0.00248 | -| n_updates | 101830 | -| policy_gradient_loss | -0.0047 | -| std | 0.0387 | -| value_loss | 1.59e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10185 | -| time_elapsed | 58386 | -| total_timesteps | 1303680 | -| train/ | | -| approx_kl | 0.0010696328 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 1.83 | -| explained_variance | -8.08 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 101840 | -| policy_gradient_loss | 0.00431 | -| std | 0.0386 | -| value_loss | 1.17e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10186 | -| time_elapsed | 58390 | -| total_timesteps | 1303808 | -| train/ | | -| approx_kl | 0.0001224773 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 101850 | -| policy_gradient_loss | 0.00159 | -| std | 0.0386 | -| value_loss | 4.15e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10187 | -| time_elapsed | 58393 | -| total_timesteps | 1303936 | -| train/ | | -| approx_kl | 6.4075924e-05 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | -0.00841 | -| learning_rate | 0.0003 | -| loss | -0.000531 | -| n_updates | 101860 | -| policy_gradient_loss | 0.00129 | -| std | 0.0386 | -| value_loss | 4.2e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10188 | -| time_elapsed | 58396 | -| total_timesteps | 1304064 | -| train/ | | -| approx_kl | 0.0016456963 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 101870 | -| policy_gradient_loss | -0.00445 | -| std | 0.0386 | -| value_loss | 2.27e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10189 | -| time_elapsed | 58401 | -| total_timesteps | 1304192 | -| train/ | | -| approx_kl | 0.02224678 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | 0.519 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 101880 | -| policy_gradient_loss | -0.0162 | -| std | 0.0386 | -| value_loss | 0.00101 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10190 | -| time_elapsed | 58404 | -| total_timesteps | 1304320 | -| train/ | | -| approx_kl | 0.008677977 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | -769 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 101890 | -| policy_gradient_loss | -0.00623 | -| std | 0.0385 | -| value_loss | 1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10191 | -| time_elapsed | 58407 | -| total_timesteps | 1304448 | -| train/ | | -| approx_kl | 4.064059e-05 | -| clip_fraction | 0.00156 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.000338 | -| n_updates | 101900 | -| policy_gradient_loss | -0.000146 | -| std | 0.0384 | -| value_loss | 3.72e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10192 | -| time_elapsed | 58411 | -| total_timesteps | 1304576 | -| train/ | | -| approx_kl | 0.0006474261 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.84 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.000139 | -| n_updates | 101910 | -| policy_gradient_loss | -7.21e-05 | -| std | 0.0381 | -| value_loss | 7.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10193 | -| time_elapsed | 58414 | -| total_timesteps | 1304704 | -| train/ | | -| approx_kl | 0.018064454 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 101920 | -| policy_gradient_loss | -0.00321 | -| std | 0.038 | -| value_loss | 4.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10194 | -| time_elapsed | 58417 | -| total_timesteps | 1304832 | -| train/ | | -| approx_kl | 0.004725391 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 101930 | -| policy_gradient_loss | 0.00241 | -| std | 0.038 | -| value_loss | 2.23e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10195 | -| time_elapsed | 58420 | -| total_timesteps | 1304960 | -| train/ | | -| approx_kl | 0.0068245577 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 101940 | -| policy_gradient_loss | 0.00281 | -| std | 0.0379 | -| value_loss | 9.53e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10196 | -| time_elapsed | 58423 | -| total_timesteps | 1305088 | -| train/ | | -| approx_kl | 0.0065895882 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | 0.00184 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 101950 | -| policy_gradient_loss | 0.00148 | -| std | 0.0379 | -| value_loss | 1.32e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10197 | -| time_elapsed | 58429 | -| total_timesteps | 1305216 | -| train/ | | -| approx_kl | 0.0975605 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 101960 | -| policy_gradient_loss | -0.011 | -| std | 0.0379 | -| value_loss | 8.68e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10198 | -| time_elapsed | 58433 | -| total_timesteps | 1305344 | -| train/ | | -| approx_kl | 0.0015142509 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 101970 | -| policy_gradient_loss | -0.00395 | -| std | 0.0379 | -| value_loss | 1.78e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10199 | -| time_elapsed | 58437 | -| total_timesteps | 1305472 | -| train/ | | -| approx_kl | 0.0005269316 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 1.85 | -| explained_variance | -2.45 | -| learning_rate | 0.0003 | -| loss | 0.00262 | -| n_updates | 101980 | -| policy_gradient_loss | 0.00224 | -| std | 0.0378 | -| value_loss | 1.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10200 | -| time_elapsed | 58441 | -| total_timesteps | 1305600 | -| train/ | | -| approx_kl | 0.008207836 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.681 | -| learning_rate | 0.0003 | -| loss | -0.0309 | -| n_updates | 101990 | -| policy_gradient_loss | -0.0257 | -| std | 0.0378 | -| value_loss | 5.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10201 | -| time_elapsed | 58444 | -| total_timesteps | 1305728 | -| train/ | | -| approx_kl | 0.011772472 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 102000 | -| policy_gradient_loss | -0.00477 | -| std | 0.0378 | -| value_loss | 2.59e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10202 | -| time_elapsed | 58448 | -| total_timesteps | 1305856 | -| train/ | | -| approx_kl | 0.0041210447 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 102010 | -| policy_gradient_loss | 0.000649 | -| std | 0.0378 | -| value_loss | 1.76e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10203 | -| time_elapsed | 58451 | -| total_timesteps | 1305984 | -| train/ | | -| approx_kl | 0.02045648 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 102020 | -| policy_gradient_loss | -0.000988 | -| std | 0.0377 | -| value_loss | 4.15e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10204 | -| time_elapsed | 58454 | -| total_timesteps | 1306112 | -| train/ | | -| approx_kl | 0.007632547 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -2.02 | -| learning_rate | 0.0003 | -| loss | 0.00316 | -| n_updates | 102030 | -| policy_gradient_loss | 0.00306 | -| std | 0.0377 | -| value_loss | 7.26e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10205 | -| time_elapsed | 58463 | -| total_timesteps | 1306240 | -| train/ | | -| approx_kl | 0.005803394 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 102040 | -| policy_gradient_loss | -0.015 | -| std | 0.0377 | -| value_loss | 0.00039 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10206 | -| time_elapsed | 58467 | -| total_timesteps | 1306368 | -| train/ | | -| approx_kl | 0.15167996 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -413 | -| learning_rate | 0.0003 | -| loss | 0.00323 | -| n_updates | 102050 | -| policy_gradient_loss | 0.000976 | -| std | 0.0378 | -| value_loss | 8.59e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10207 | -| time_elapsed | 58471 | -| total_timesteps | 1306496 | -| train/ | | -| approx_kl | 0.17742392 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -60.2 | -| learning_rate | 0.0003 | -| loss | -0.001 | -| n_updates | 102060 | -| policy_gradient_loss | -0.00292 | -| std | 0.0378 | -| value_loss | 2.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10208 | -| time_elapsed | 58474 | -| total_timesteps | 1306624 | -| train/ | | -| approx_kl | 0.021618098 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 102070 | -| policy_gradient_loss | -0.00853 | -| std | 0.0378 | -| value_loss | 5.91e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10209 | -| time_elapsed | 58477 | -| total_timesteps | 1306752 | -| train/ | | -| approx_kl | 0.0055155423 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -3.05 | -| learning_rate | 0.0003 | -| loss | -0.00946 | -| n_updates | 102080 | -| policy_gradient_loss | -0.00898 | -| std | 0.0378 | -| value_loss | 1.75e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10210 | -| time_elapsed | 58481 | -| total_timesteps | 1306880 | -| train/ | | -| approx_kl | 0.00018708687 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | -0.000319 | -| n_updates | 102090 | -| policy_gradient_loss | 0.00239 | -| std | 0.0378 | -| value_loss | 9.68e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10211 | -| time_elapsed | 58485 | -| total_timesteps | 1307008 | -| train/ | | -| approx_kl | 0.00045407377 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00203 | -| n_updates | 102100 | -| policy_gradient_loss | -0.000422 | -| std | 0.0378 | -| value_loss | 3.41e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10212 | -| time_elapsed | 58493 | -| total_timesteps | 1307136 | -| train/ | | -| approx_kl | 0.037526924 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 102110 | -| policy_gradient_loss | -0.0153 | -| std | 0.0378 | -| value_loss | 2.28e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10213 | -| time_elapsed | 58496 | -| total_timesteps | 1307264 | -| train/ | | -| approx_kl | 0.0018577459 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.512 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 102120 | -| policy_gradient_loss | -0.0134 | -| std | 0.0378 | -| value_loss | 1.35e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10214 | -| time_elapsed | 58498 | -| total_timesteps | 1307392 | -| train/ | | -| approx_kl | 0.0005775234 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -7.47e+03 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 102130 | -| policy_gradient_loss | -0.0105 | -| std | 0.0378 | -| value_loss | 1.92e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10215 | -| time_elapsed | 58500 | -| total_timesteps | 1307520 | -| train/ | | -| approx_kl | 0.009377596 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -20.6 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 102140 | -| policy_gradient_loss | -0.000935 | -| std | 0.0378 | -| value_loss | 5.59e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10216 | -| time_elapsed | 58504 | -| total_timesteps | 1307648 | -| train/ | | -| approx_kl | 0.0010375679 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 102150 | -| policy_gradient_loss | 0.000326 | -| std | 0.0377 | -| value_loss | 2.88e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10217 | -| time_elapsed | 58507 | -| total_timesteps | 1307776 | -| train/ | | -| approx_kl | 0.0007477328 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.00755 | -| learning_rate | 0.0003 | -| loss | 0.000685 | -| n_updates | 102160 | -| policy_gradient_loss | 0.00127 | -| std | 0.0377 | -| value_loss | 3e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10218 | -| time_elapsed | 58510 | -| total_timesteps | 1307904 | -| train/ | | -| approx_kl | 0.015833236 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | 0.00183 | -| learning_rate | 0.0003 | -| loss | 0.000178 | -| n_updates | 102170 | -| policy_gradient_loss | -0.00262 | -| std | 0.0377 | -| value_loss | 3.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10219 | -| time_elapsed | 58513 | -| total_timesteps | 1308032 | -| train/ | | -| approx_kl | 0.014277666 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.0074 | -| n_updates | 102180 | -| policy_gradient_loss | 0.00105 | -| std | 0.0376 | -| value_loss | 9.84e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10220 | -| time_elapsed | 58520 | -| total_timesteps | 1308160 | -| train/ | | -| approx_kl | 0.0036245175 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 102190 | -| policy_gradient_loss | -0.00479 | -| std | 0.0376 | -| value_loss | 7.04e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10221 | -| time_elapsed | 58524 | -| total_timesteps | 1308288 | -| train/ | | -| approx_kl | 0.0077239694 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | -0.00058 | -| n_updates | 102200 | -| policy_gradient_loss | 0.00384 | -| std | 0.0376 | -| value_loss | 6.9e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10222 | -| time_elapsed | 58527 | -| total_timesteps | 1308416 | -| train/ | | -| approx_kl | 0.00029610563 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.72 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 102210 | -| policy_gradient_loss | -0.00249 | -| std | 0.0375 | -| value_loss | 1.82e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10223 | -| time_elapsed | 58531 | -| total_timesteps | 1308544 | -| train/ | | -| approx_kl | 0.0009928448 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 102220 | -| policy_gradient_loss | 0.000186 | -| std | 0.0375 | -| value_loss | 2.73e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10224 | -| time_elapsed | 58534 | -| total_timesteps | 1308672 | -| train/ | | -| approx_kl | 2.71108e-06 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 5.23e-05 | -| n_updates | 102230 | -| policy_gradient_loss | 0.0038 | -| std | 0.0375 | -| value_loss | 7.41e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10225 | -| time_elapsed | 58538 | -| total_timesteps | 1308800 | -| train/ | | -| approx_kl | 0.00015796814 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.86 | -| explained_variance | -0.00967 | -| learning_rate | 0.0003 | -| loss | -0.000778 | -| n_updates | 102240 | -| policy_gradient_loss | 0.00148 | -| std | 0.0375 | -| value_loss | 3.31e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10226 | -| time_elapsed | 58541 | -| total_timesteps | 1308928 | -| train/ | | -| approx_kl | 0.004639367 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | -0.00963 | -| n_updates | 102250 | -| policy_gradient_loss | -0.00436 | -| std | 0.0374 | -| value_loss | 3.57e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10227 | -| time_elapsed | 58543 | -| total_timesteps | 1309056 | -| train/ | | -| approx_kl | 5.5210665e-05 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | 0.000855 | -| learning_rate | 0.0003 | -| loss | -0.000446 | -| n_updates | 102260 | -| policy_gradient_loss | 0.00635 | -| std | 0.0374 | -| value_loss | 1.82e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10228 | -| time_elapsed | 58549 | -| total_timesteps | 1309184 | -| train/ | | -| approx_kl | 0.08080038 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -9.91 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 102270 | -| policy_gradient_loss | -0.0121 | -| std | 0.0374 | -| value_loss | 0.00364 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10229 | -| time_elapsed | 58552 | -| total_timesteps | 1309312 | -| train/ | | -| approx_kl | 0.004025898 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -729 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 102280 | -| policy_gradient_loss | -0.00567 | -| std | 0.0374 | -| value_loss | 8.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10230 | -| time_elapsed | 58555 | -| total_timesteps | 1309440 | -| train/ | | -| approx_kl | 0.021745283 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -3.88e+03 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 102290 | -| policy_gradient_loss | -0.00179 | -| std | 0.0374 | -| value_loss | 4.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10231 | -| time_elapsed | 58558 | -| total_timesteps | 1309568 | -| train/ | | -| approx_kl | 0.0012335479 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 102300 | -| policy_gradient_loss | -0.00811 | -| std | 0.0374 | -| value_loss | 2.33e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10232 | -| time_elapsed | 58561 | -| total_timesteps | 1309696 | -| train/ | | -| approx_kl | 0.014414702 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -3 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 102310 | -| policy_gradient_loss | -0.0044 | -| std | 0.0373 | -| value_loss | 3.92e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10233 | -| time_elapsed | 58565 | -| total_timesteps | 1309824 | -| train/ | | -| approx_kl | 0.00644764 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -0.491 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 102320 | -| policy_gradient_loss | -0.00972 | -| std | 0.0373 | -| value_loss | 2.87e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10234 | -| time_elapsed | 58568 | -| total_timesteps | 1309952 | -| train/ | | -| approx_kl | 0.0029518385 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 102330 | -| policy_gradient_loss | -0.00369 | -| std | 0.0372 | -| value_loss | 1.2e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10235 | -| time_elapsed | 58571 | -| total_timesteps | 1310080 | -| train/ | | -| approx_kl | 0.008475713 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 1.87 | -| explained_variance | -0.0722 | -| learning_rate | 0.0003 | -| loss | 0.00291 | -| n_updates | 102340 | -| policy_gradient_loss | 0.00083 | -| std | 0.0371 | -| value_loss | 1.79e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10236 | -| time_elapsed | 58577 | -| total_timesteps | 1310208 | -| train/ | | -| approx_kl | 0.037790123 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 102350 | -| policy_gradient_loss | -0.013 | -| std | 0.037 | -| value_loss | 0.000825 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10237 | -| time_elapsed | 58581 | -| total_timesteps | 1310336 | -| train/ | | -| approx_kl | 1.5399419e-06 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -9.17 | -| learning_rate | 0.0003 | -| loss | 6.68e-05 | -| n_updates | 102360 | -| policy_gradient_loss | -0.00165 | -| std | 0.037 | -| value_loss | 2.21e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10238 | -| time_elapsed | 58585 | -| total_timesteps | 1310464 | -| train/ | | -| approx_kl | 0.0038676928 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -10.7 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 102370 | -| policy_gradient_loss | -0.00709 | -| std | 0.037 | -| value_loss | 2.65e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10239 | -| time_elapsed | 58588 | -| total_timesteps | 1310592 | -| train/ | | -| approx_kl | 0.008641107 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 102380 | -| policy_gradient_loss | -0.00953 | -| std | 0.037 | -| value_loss | 5.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10240 | -| time_elapsed | 58591 | -| total_timesteps | 1310720 | -| train/ | | -| approx_kl | 0.013471194 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -0.599 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 102390 | -| policy_gradient_loss | -0.00168 | -| std | 0.037 | -| value_loss | 2.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10241 | -| time_elapsed | 58594 | -| total_timesteps | 1310848 | -| train/ | | -| approx_kl | 0.017808588 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.00751 | -| n_updates | 102400 | -| policy_gradient_loss | 0.00121 | -| std | 0.037 | -| value_loss | 6.41e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 22 | -| iterations | 10242 | -| time_elapsed | 58597 | -| total_timesteps | 1310976 | -| train/ | | -| approx_kl | 0.0048887744 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -0.074 | -| learning_rate | 0.0003 | -| loss | 0.00438 | -| n_updates | 102410 | -| policy_gradient_loss | 0.004 | -| std | 0.037 | -| value_loss | 3.11e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10243 | -| time_elapsed | 58600 | -| total_timesteps | 1311104 | -| train/ | | -| approx_kl | 0.0143797975 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 102420 | -| policy_gradient_loss | -0.00972 | -| std | 0.037 | -| value_loss | 2.51e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10244 | -| time_elapsed | 58608 | -| total_timesteps | 1311232 | -| train/ | | -| approx_kl | 0.022026397 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 102430 | -| policy_gradient_loss | -0.015 | -| std | 0.037 | -| value_loss | 0.00236 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10245 | -| time_elapsed | 58612 | -| total_timesteps | 1311360 | -| train/ | | -| approx_kl | 0.00022023125 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -430 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 102440 | -| policy_gradient_loss | -0.0119 | -| std | 0.037 | -| value_loss | 7.36e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10246 | -| time_elapsed | 58615 | -| total_timesteps | 1311488 | -| train/ | | -| approx_kl | 0.00751991 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -457 | -| learning_rate | 0.0003 | -| loss | -0.00578 | -| n_updates | 102450 | -| policy_gradient_loss | -0.00458 | -| std | 0.037 | -| value_loss | 4.25e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10247 | -| time_elapsed | 58618 | -| total_timesteps | 1311616 | -| train/ | | -| approx_kl | 0.005097472 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -82.5 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 102460 | -| policy_gradient_loss | -0.0164 | -| std | 0.037 | -| value_loss | 6.26e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10248 | -| time_elapsed | 58620 | -| total_timesteps | 1311744 | -| train/ | | -| approx_kl | 2.1830201e-05 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -75.1 | -| learning_rate | 0.0003 | -| loss | -0.000621 | -| n_updates | 102470 | -| policy_gradient_loss | -0.0099 | -| std | 0.037 | -| value_loss | 7.48e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10249 | -| time_elapsed | 58623 | -| total_timesteps | 1311872 | -| train/ | | -| approx_kl | 9.652693e-06 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.000168 | -| n_updates | 102480 | -| policy_gradient_loss | -0.000171 | -| std | 0.037 | -| value_loss | 4.22e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10250 | -| time_elapsed | 58625 | -| total_timesteps | 1312000 | -| train/ | | -| approx_kl | 0.0050000334 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | -0.567 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 102490 | -| policy_gradient_loss | -0.00831 | -| std | 0.037 | -| value_loss | 1.03e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10251 | -| time_elapsed | 58627 | -| total_timesteps | 1312128 | -| train/ | | -| approx_kl | 0.0023216498 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | 0.00294 | -| learning_rate | 0.0003 | -| loss | -0.000161 | -| n_updates | 102500 | -| policy_gradient_loss | 0.000226 | -| std | 0.0369 | -| value_loss | 2.38e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10252 | -| time_elapsed | 58632 | -| total_timesteps | 1312256 | -| train/ | | -| approx_kl | 0.007430541 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 1.88 | -| explained_variance | 0.914 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 102510 | -| policy_gradient_loss | -0.00127 | -| std | 0.0368 | -| value_loss | 0.000824 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10253 | -| time_elapsed | 58635 | -| total_timesteps | 1312384 | -| train/ | | -| approx_kl | 0.0005703564 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -29.5 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 102520 | -| policy_gradient_loss | -0.00851 | -| std | 0.0367 | -| value_loss | 1.69e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10254 | -| time_elapsed | 58639 | -| total_timesteps | 1312512 | -| train/ | | -| approx_kl | 0.023833433 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 102530 | -| policy_gradient_loss | -0.00434 | -| std | 0.0366 | -| value_loss | 9.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10255 | -| time_elapsed | 58642 | -| total_timesteps | 1312640 | -| train/ | | -| approx_kl | 0.008344898 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -18.5 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 102540 | -| policy_gradient_loss | -0.00748 | -| std | 0.0366 | -| value_loss | 4.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10256 | -| time_elapsed | 58645 | -| total_timesteps | 1312768 | -| train/ | | -| approx_kl | 0.009680752 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -3.49 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 102550 | -| policy_gradient_loss | -0.00798 | -| std | 0.0366 | -| value_loss | 6.98e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10257 | -| time_elapsed | 58647 | -| total_timesteps | 1312896 | -| train/ | | -| approx_kl | 0.00026849378 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -0.448 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 102560 | -| policy_gradient_loss | 0.003 | -| std | 0.0366 | -| value_loss | 6.77e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10258 | -| time_elapsed | 58649 | -| total_timesteps | 1313024 | -| train/ | | -| approx_kl | 0.0018909154 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -0.0991 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 102570 | -| policy_gradient_loss | -0.0108 | -| std | 0.0366 | -| value_loss | 2.93e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10259 | -| time_elapsed | 58659 | -| total_timesteps | 1313152 | -| train/ | | -| approx_kl | 0.021376317 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -0.0733 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 102580 | -| policy_gradient_loss | -0.0149 | -| std | 0.0366 | -| value_loss | 0.00153 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10260 | -| time_elapsed | 58662 | -| total_timesteps | 1313280 | -| train/ | | -| approx_kl | 0.00093223713 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -2.35e+03 | -| learning_rate | 0.0003 | -| loss | -0.00585 | -| n_updates | 102590 | -| policy_gradient_loss | -0.0101 | -| std | 0.0366 | -| value_loss | 7.86e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10261 | -| time_elapsed | 58665 | -| total_timesteps | 1313408 | -| train/ | | -| approx_kl | 0.00049669016 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -1.61e+03 | -| learning_rate | 0.0003 | -| loss | 0.000596 | -| n_updates | 102600 | -| policy_gradient_loss | 0.000195 | -| std | 0.0366 | -| value_loss | 3.49e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10262 | -| time_elapsed | 58666 | -| total_timesteps | 1313536 | -| train/ | | -| approx_kl | 0.003147211 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -161 | -| learning_rate | 0.0003 | -| loss | -0.00419 | -| n_updates | 102610 | -| policy_gradient_loss | -0.00348 | -| std | 0.0365 | -| value_loss | 3.24e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10263 | -| time_elapsed | 58669 | -| total_timesteps | 1313664 | -| train/ | | -| approx_kl | 0.00025787577 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.89 | -| explained_variance | -15.3 | -| learning_rate | 0.0003 | -| loss | -0.000315 | -| n_updates | 102620 | -| policy_gradient_loss | -0.000118 | -| std | 0.0363 | -| value_loss | 4.6e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10264 | -| time_elapsed | 58672 | -| total_timesteps | 1313792 | -| train/ | | -| approx_kl | 0.0024803104 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 1.9 | -| explained_variance | -0.707 | -| learning_rate | 0.0003 | -| loss | -0.00043 | -| n_updates | 102630 | -| policy_gradient_loss | 2.19e-05 | -| std | 0.0361 | -| value_loss | 1.68e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10265 | -| time_elapsed | 58675 | -| total_timesteps | 1313920 | -| train/ | | -| approx_kl | 0.0004628473 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 1.9 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.00389 | -| n_updates | 102640 | -| policy_gradient_loss | 0.00858 | -| std | 0.0361 | -| value_loss | 1.08e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10266 | -| time_elapsed | 58680 | -| total_timesteps | 1314048 | -| train/ | | -| approx_kl | 0.003492346 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 1.9 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 102650 | -| policy_gradient_loss | 0.000239 | -| std | 0.036 | -| value_loss | 1.83e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10267 | -| time_elapsed | 58686 | -| total_timesteps | 1314176 | -| train/ | | -| approx_kl | 0.016583055 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | 0.782 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 102660 | -| policy_gradient_loss | -0.00923 | -| std | 0.0359 | -| value_loss | 0.0039 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10268 | -| time_elapsed | 58690 | -| total_timesteps | 1314304 | -| train/ | | -| approx_kl | 0.40162337 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -23 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 102670 | -| policy_gradient_loss | 0.00139 | -| std | 0.0359 | -| value_loss | 2.54e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10269 | -| time_elapsed | 58693 | -| total_timesteps | 1314432 | -| train/ | | -| approx_kl | 0.002937355 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 102680 | -| policy_gradient_loss | -0.00114 | -| std | 0.0359 | -| value_loss | 2.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10270 | -| time_elapsed | 58696 | -| total_timesteps | 1314560 | -| train/ | | -| approx_kl | 0.003156546 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 102690 | -| policy_gradient_loss | -0.00121 | -| std | 0.0359 | -| value_loss | 9.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10271 | -| time_elapsed | 58699 | -| total_timesteps | 1314688 | -| train/ | | -| approx_kl | 0.0039061378 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -3.83 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 102700 | -| policy_gradient_loss | -0.00148 | -| std | 0.0359 | -| value_loss | 3.7e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10272 | -| time_elapsed | 58703 | -| total_timesteps | 1314816 | -| train/ | | -| approx_kl | 2.6152935e-05 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.000811 | -| n_updates | 102710 | -| policy_gradient_loss | 0.00264 | -| std | 0.0359 | -| value_loss | 9.96e-08 | -------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10273 | -| time_elapsed | 58708 | -| total_timesteps | 1314944 | -| train/ | | -| approx_kl | 1.02003105e-05 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | -0.00067 | -| n_updates | 102720 | -| policy_gradient_loss | -0.00321 | -| std | 0.0359 | -| value_loss | 3.82e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10274 | -| time_elapsed | 58712 | -| total_timesteps | 1315072 | -| train/ | | -| approx_kl | 0.021515373 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 102730 | -| policy_gradient_loss | -0.00789 | -| std | 0.0359 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10275 | -| time_elapsed | 58719 | -| total_timesteps | 1315200 | -| train/ | | -| approx_kl | 0.0043922383 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | 0.847 | -| learning_rate | 0.0003 | -| loss | 8.32e-05 | -| n_updates | 102740 | -| policy_gradient_loss | -0.00132 | -| std | 0.0358 | -| value_loss | 0.00251 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10276 | -| time_elapsed | 58723 | -| total_timesteps | 1315328 | -| train/ | | -| approx_kl | 0.004879407 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 102750 | -| policy_gradient_loss | -0.00736 | -| std | 0.0357 | -| value_loss | 7.52e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10277 | -| time_elapsed | 58727 | -| total_timesteps | 1315456 | -| train/ | | -| approx_kl | 0.0017597461 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -40.5 | -| learning_rate | 0.0003 | -| loss | -0.000294 | -| n_updates | 102760 | -| policy_gradient_loss | -2.79e-05 | -| std | 0.0358 | -| value_loss | 3.06e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10278 | -| time_elapsed | 58730 | -| total_timesteps | 1315584 | -| train/ | | -| approx_kl | 0.02721393 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -2.92 | -| learning_rate | 0.0003 | -| loss | 0.00289 | -| n_updates | 102770 | -| policy_gradient_loss | 0.00397 | -| std | 0.0359 | -| value_loss | 5.68e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10279 | -| time_elapsed | 58733 | -| total_timesteps | 1315712 | -| train/ | | -| approx_kl | 0.035735413 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 102780 | -| policy_gradient_loss | 0.015 | -| std | 0.036 | -| value_loss | 8.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10280 | -| time_elapsed | 58736 | -| total_timesteps | 1315840 | -| train/ | | -| approx_kl | 0.022970976 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0934 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 102790 | -| policy_gradient_loss | -0.00154 | -| std | 0.036 | -| value_loss | 0.000352 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10281 | -| time_elapsed | 58739 | -| total_timesteps | 1315968 | -| train/ | | -| approx_kl | 0.016635058 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.342 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 102800 | -| policy_gradient_loss | -0.00244 | -| std | 0.036 | -| value_loss | 6.94e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10282 | -| time_elapsed | 58743 | -| total_timesteps | 1316096 | -| train/ | | -| approx_kl | 0.0013315161 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 1.9 | -| explained_variance | -0.00651 | -| learning_rate | 0.0003 | -| loss | 0.00394 | -| n_updates | 102810 | -| policy_gradient_loss | 0.00198 | -| std | 0.036 | -| value_loss | 6.8e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10283 | -| time_elapsed | 58750 | -| total_timesteps | 1316224 | -| train/ | | -| approx_kl | 0.005644582 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 1.9 | -| explained_variance | -14.2 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 102820 | -| policy_gradient_loss | -0.0134 | -| std | 0.036 | -| value_loss | 0.00543 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10284 | -| time_elapsed | 58755 | -| total_timesteps | 1316352 | -| train/ | | -| approx_kl | 0.0010190345 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.39 | -| learning_rate | 0.0003 | -| loss | -0.000916 | -| n_updates | 102830 | -| policy_gradient_loss | 0.00201 | -| std | 0.036 | -| value_loss | 2.65e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10285 | -| time_elapsed | 58758 | -| total_timesteps | 1316480 | -| train/ | | -| approx_kl | 0.000937846 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.955 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 102840 | -| policy_gradient_loss | 0.00118 | -| std | 0.0359 | -| value_loss | 6.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10286 | -| time_elapsed | 58761 | -| total_timesteps | 1316608 | -| train/ | | -| approx_kl | 0.007208988 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0897 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 102850 | -| policy_gradient_loss | -0.0104 | -| std | 0.0359 | -| value_loss | 3.63e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10287 | -| time_elapsed | 58764 | -| total_timesteps | 1316736 | -| train/ | | -| approx_kl | 3.9217994e-05 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | 0.000538 | -| learning_rate | 0.0003 | -| loss | -0.000317 | -| n_updates | 102860 | -| policy_gradient_loss | 0.00109 | -| std | 0.0359 | -| value_loss | 1.25e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10288 | -| time_elapsed | 58768 | -| total_timesteps | 1316864 | -| train/ | | -| approx_kl | 0.0003561685 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.00337 | -| learning_rate | 0.0003 | -| loss | 0.00064 | -| n_updates | 102870 | -| policy_gradient_loss | 0.000533 | -| std | 0.0358 | -| value_loss | 9.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10289 | -| time_elapsed | 58770 | -| total_timesteps | 1316992 | -| train/ | | -| approx_kl | 0.003196829 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 102880 | -| policy_gradient_loss | 0.005 | -| std | 0.0358 | -| value_loss | 2.96e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10290 | -| time_elapsed | 58773 | -| total_timesteps | 1317120 | -| train/ | | -| approx_kl | 8.079689e-06 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.00424 | -| learning_rate | 0.0003 | -| loss | -0.000168 | -| n_updates | 102890 | -| policy_gradient_loss | 0.0093 | -| std | 0.0358 | -| value_loss | 6.83e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10291 | -| time_elapsed | 58784 | -| total_timesteps | 1317248 | -| train/ | | -| approx_kl | 0.047476877 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 102900 | -| policy_gradient_loss | -0.0155 | -| std | 0.0358 | -| value_loss | 0.000105 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10292 | -| time_elapsed | 58788 | -| total_timesteps | 1317376 | -| train/ | | -| approx_kl | 0.0014885864 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -5.98 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 102910 | -| policy_gradient_loss | 0.000355 | -| std | 0.0357 | -| value_loss | 5.26e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10293 | -| time_elapsed | 58791 | -| total_timesteps | 1317504 | -| train/ | | -| approx_kl | 6.805174e-05 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -9.16 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 102920 | -| policy_gradient_loss | -0.00901 | -| std | 0.0357 | -| value_loss | 3.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10294 | -| time_elapsed | 58793 | -| total_timesteps | 1317632 | -| train/ | | -| approx_kl | 0.006365393 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.628 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 102930 | -| policy_gradient_loss | -0.00189 | -| std | 0.0357 | -| value_loss | 6.01e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10295 | -| time_elapsed | 58797 | -| total_timesteps | 1317760 | -| train/ | | -| approx_kl | 0.0028581633 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 102940 | -| policy_gradient_loss | -0.00153 | -| std | 0.0357 | -| value_loss | 1.76e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10296 | -| time_elapsed | 58800 | -| total_timesteps | 1317888 | -| train/ | | -| approx_kl | 0.00028897077 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.00201 | -| learning_rate | 0.0003 | -| loss | 0.000956 | -| n_updates | 102950 | -| policy_gradient_loss | -0.00013 | -| std | 0.0357 | -| value_loss | 1.07e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10297 | -| time_elapsed | 58803 | -| total_timesteps | 1318016 | -| train/ | | -| approx_kl | 0.0004503997 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 1.91 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.000786 | -| n_updates | 102960 | -| policy_gradient_loss | -0.000314 | -| std | 0.0356 | -| value_loss | 2.23e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10298 | -| time_elapsed | 58813 | -| total_timesteps | 1318144 | -| train/ | | -| approx_kl | 0.11861417 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.92 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 102970 | -| policy_gradient_loss | -0.0124 | -| std | 0.0354 | -| value_loss | 0.000538 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10299 | -| time_elapsed | 58816 | -| total_timesteps | 1318272 | -| train/ | | -| approx_kl | 0.00020643882 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 1.92 | -| explained_variance | -18.5 | -| learning_rate | 0.0003 | -| loss | 0.00363 | -| n_updates | 102980 | -| policy_gradient_loss | -0.00718 | -| std | 0.0353 | -| value_loss | 1.27e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10300 | -| time_elapsed | 58820 | -| total_timesteps | 1318400 | -| train/ | | -| approx_kl | 0.002997702 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.92 | -| explained_variance | -15.3 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 102990 | -| policy_gradient_loss | 0.000172 | -| std | 0.0353 | -| value_loss | 2.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10301 | -| time_elapsed | 58824 | -| total_timesteps | 1318528 | -| train/ | | -| approx_kl | 0.019583024 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | 0.000828 | -| n_updates | 103000 | -| policy_gradient_loss | -0.00147 | -| std | 0.0352 | -| value_loss | 1.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10302 | -| time_elapsed | 58826 | -| total_timesteps | 1318656 | -| train/ | | -| approx_kl | 0.009248024 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.00501 | -| n_updates | 103010 | -| policy_gradient_loss | 0.0051 | -| std | 0.0352 | -| value_loss | 1.2e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10303 | -| time_elapsed | 58828 | -| total_timesteps | 1318784 | -| train/ | | -| approx_kl | 0.0014981311 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.00104 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 103020 | -| policy_gradient_loss | -0.00454 | -| std | 0.0352 | -| value_loss | 2.26e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 22 | -| iterations | 10304 | -| time_elapsed | 58832 | -| total_timesteps | 1318912 | -| train/ | | -| approx_kl | 0.0028341496 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.00324 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 103030 | -| policy_gradient_loss | -0.0014 | -| std | 0.0352 | -| value_loss | 6.16e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10305 | -| time_elapsed | 58835 | -| total_timesteps | 1319040 | -| train/ | | -| approx_kl | 0.0027751266 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.000451 | -| n_updates | 103040 | -| policy_gradient_loss | 0.000759 | -| std | 0.0352 | -| value_loss | 2.48e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10306 | -| time_elapsed | 58843 | -| total_timesteps | 1319168 | -| train/ | | -| approx_kl | 0.046286244 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 103050 | -| policy_gradient_loss | -0.013 | -| std | 0.0351 | -| value_loss | 0.000193 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10307 | -| time_elapsed | 58848 | -| total_timesteps | 1319296 | -| train/ | | -| approx_kl | 3.7113205e-07 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -9.16e-06 | -| n_updates | 103060 | -| policy_gradient_loss | 0.00316 | -| std | 0.0351 | -| value_loss | 1.99e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10308 | -| time_elapsed | 58852 | -| total_timesteps | 1319424 | -| train/ | | -| approx_kl | 0.009435289 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.632 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 103070 | -| policy_gradient_loss | 0.0024 | -| std | 0.0351 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10309 | -| time_elapsed | 58856 | -| total_timesteps | 1319552 | -| train/ | | -| approx_kl | 0.028031701 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 103080 | -| policy_gradient_loss | -0.00999 | -| std | 0.0351 | -| value_loss | 1.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10310 | -| time_elapsed | 58859 | -| total_timesteps | 1319680 | -| train/ | | -| approx_kl | 0.018980198 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.00214 | -| learning_rate | 0.0003 | -| loss | 0.00552 | -| n_updates | 103090 | -| policy_gradient_loss | -0.000698 | -| std | 0.0351 | -| value_loss | 8.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10311 | -| time_elapsed | 58864 | -| total_timesteps | 1319808 | -| train/ | | -| approx_kl | 0.010950735 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.000552 | -| n_updates | 103100 | -| policy_gradient_loss | -0.00137 | -| std | 0.0352 | -| value_loss | 2.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10312 | -| time_elapsed | 58868 | -| total_timesteps | 1319936 | -| train/ | | -| approx_kl | 0.012740456 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 103110 | -| policy_gradient_loss | 0.00594 | -| std | 0.0352 | -| value_loss | 6.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10313 | -| time_elapsed | 58872 | -| total_timesteps | 1320064 | -| train/ | | -| approx_kl | 0.002278286 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 103120 | -| policy_gradient_loss | -0.0031 | -| std | 0.0352 | -| value_loss | 3.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10314 | -| time_elapsed | 58878 | -| total_timesteps | 1320192 | -| train/ | | -| approx_kl | 0.059731655 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 103130 | -| policy_gradient_loss | -0.0143 | -| std | 0.0352 | -| value_loss | 0.00215 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10315 | -| time_elapsed | 58883 | -| total_timesteps | 1320320 | -| train/ | | -| approx_kl | 0.035307344 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -20.1 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 103140 | -| policy_gradient_loss | -0.00999 | -| std | 0.0352 | -| value_loss | 0.000137 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10316 | -| time_elapsed | 58886 | -| total_timesteps | 1320448 | -| train/ | | -| approx_kl | 0.011436868 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -64.2 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 103150 | -| policy_gradient_loss | -0.0021 | -| std | 0.0352 | -| value_loss | 2.13e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10317 | -| time_elapsed | 58890 | -| total_timesteps | 1320576 | -| train/ | | -| approx_kl | 0.0077257156 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -71.4 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 103160 | -| policy_gradient_loss | -0.0091 | -| std | 0.0352 | -| value_loss | 2.75e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10318 | -| time_elapsed | 58895 | -| total_timesteps | 1320704 | -| train/ | | -| approx_kl | 0.00017993106 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 103170 | -| policy_gradient_loss | -0.00976 | -| std | 0.0352 | -| value_loss | 2.69e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10319 | -| time_elapsed | 58899 | -| total_timesteps | 1320832 | -| train/ | | -| approx_kl | 0.0042514126 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.00581 | -| learning_rate | 0.0003 | -| loss | -0.000864 | -| n_updates | 103180 | -| policy_gradient_loss | -0.000499 | -| std | 0.0352 | -| value_loss | 1.91e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10320 | -| time_elapsed | 58903 | -| total_timesteps | 1320960 | -| train/ | | -| approx_kl | 0.011256864 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 103190 | -| policy_gradient_loss | 0.00237 | -| std | 0.0351 | -| value_loss | 1.33e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10321 | -| time_elapsed | 58908 | -| total_timesteps | 1321088 | -| train/ | | -| approx_kl | 0.00087570585 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.00408 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 103200 | -| policy_gradient_loss | 0.00308 | -| std | 0.0351 | -| value_loss | 3.14e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10322 | -| time_elapsed | 58914 | -| total_timesteps | 1321216 | -| train/ | | -| approx_kl | 0.018188251 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 103210 | -| policy_gradient_loss | -0.0155 | -| std | 0.035 | -| value_loss | 2.9e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10323 | -| time_elapsed | 58916 | -| total_timesteps | 1321344 | -| train/ | | -| approx_kl | 0.0033181706 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 103220 | -| policy_gradient_loss | -0.0049 | -| std | 0.035 | -| value_loss | 9.62e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10324 | -| time_elapsed | 58918 | -| total_timesteps | 1321472 | -| train/ | | -| approx_kl | 0.0049656536 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | 0.00353 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 103230 | -| policy_gradient_loss | -0.0137 | -| std | 0.035 | -| value_loss | 2.06e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10325 | -| time_elapsed | 58922 | -| total_timesteps | 1321600 | -| train/ | | -| approx_kl | 0.0120778065 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 1.93 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 103240 | -| policy_gradient_loss | -0.000761 | -| std | 0.035 | -| value_loss | 7.47e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10326 | -| time_elapsed | 58924 | -| total_timesteps | 1321728 | -| train/ | | -| approx_kl | 0.006676124 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.00288 | -| learning_rate | 0.0003 | -| loss | -0.000978 | -| n_updates | 103250 | -| policy_gradient_loss | -0.000562 | -| std | 0.0349 | -| value_loss | 7.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10327 | -| time_elapsed | 58927 | -| total_timesteps | 1321856 | -| train/ | | -| approx_kl | 0.01844935 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.00922 | -| learning_rate | 0.0003 | -| loss | -0.0277 | -| n_updates | 103260 | -| policy_gradient_loss | -0.022 | -| std | 0.0349 | -| value_loss | 1.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10328 | -| time_elapsed | 58930 | -| total_timesteps | 1321984 | -| train/ | | -| approx_kl | 0.019924853 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00472 | -| n_updates | 103270 | -| policy_gradient_loss | -0.000529 | -| std | 0.0349 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10329 | -| time_elapsed | 58933 | -| total_timesteps | 1322112 | -| train/ | | -| approx_kl | 0.004947676 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 103280 | -| policy_gradient_loss | -0.00445 | -| std | 0.0348 | -| value_loss | 1.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10330 | -| time_elapsed | 58942 | -| total_timesteps | 1322240 | -| train/ | | -| approx_kl | 0.13642786 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 103290 | -| policy_gradient_loss | -0.0135 | -| std | 0.0348 | -| value_loss | 8.88e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10331 | -| time_elapsed | 58946 | -| total_timesteps | 1322368 | -| train/ | | -| approx_kl | 0.0051136105 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | -0.0249 | -| n_updates | 103300 | -| policy_gradient_loss | -0.0147 | -| std | 0.0348 | -| value_loss | 2.54e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10332 | -| time_elapsed | 58949 | -| total_timesteps | 1322496 | -| train/ | | -| approx_kl | 0.0009698821 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.365 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 103310 | -| policy_gradient_loss | 0.00272 | -| std | 0.0348 | -| value_loss | 1.92e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10333 | -| time_elapsed | 58954 | -| total_timesteps | 1322624 | -| train/ | | -| approx_kl | 0.0003030477 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 103320 | -| policy_gradient_loss | -0.00898 | -| std | 0.0348 | -| value_loss | 7.82e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10334 | -| time_elapsed | 58957 | -| total_timesteps | 1322752 | -| train/ | | -| approx_kl | 0.0012788256 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.558 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 103330 | -| policy_gradient_loss | -0.00815 | -| std | 0.0348 | -| value_loss | 7.39e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10335 | -| time_elapsed | 58961 | -| total_timesteps | 1322880 | -| train/ | | -| approx_kl | 0.00057858694 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.295 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 103340 | -| policy_gradient_loss | -0.00732 | -| std | 0.0348 | -| value_loss | 1.64e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10336 | -| time_elapsed | 58964 | -| total_timesteps | 1323008 | -| train/ | | -| approx_kl | 0.017318849 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 103350 | -| policy_gradient_loss | -0.00744 | -| std | 0.0348 | -| value_loss | 7.1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10337 | -| time_elapsed | 58973 | -| total_timesteps | 1323136 | -| train/ | | -| approx_kl | 0.23189533 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | 0.832 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 103360 | -| policy_gradient_loss | -0.0128 | -| std | 0.0349 | -| value_loss | 0.00069 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10338 | -| time_elapsed | 58977 | -| total_timesteps | 1323264 | -| train/ | | -| approx_kl | 0.02212562 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.598 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 103370 | -| policy_gradient_loss | -0.00824 | -| std | 0.0349 | -| value_loss | 1.12e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10339 | -| time_elapsed | 58981 | -| total_timesteps | 1323392 | -| train/ | | -| approx_kl | 0.01350143 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -4.8 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 103380 | -| policy_gradient_loss | -0.00399 | -| std | 0.0349 | -| value_loss | 1.82e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10340 | -| time_elapsed | 58984 | -| total_timesteps | 1323520 | -| train/ | | -| approx_kl | 0.0203659 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.508 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 103390 | -| policy_gradient_loss | -0.00445 | -| std | 0.0349 | -| value_loss | 5.94e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10341 | -| time_elapsed | 58987 | -| total_timesteps | 1323648 | -| train/ | | -| approx_kl | 0.00083259493 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | -0.00078 | -| n_updates | 103400 | -| policy_gradient_loss | -0.000428 | -| std | 0.0349 | -| value_loss | 3.83e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10342 | -| time_elapsed | 58989 | -| total_timesteps | 1323776 | -| train/ | | -| approx_kl | 0.0066450057 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | 0.00242 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 103410 | -| policy_gradient_loss | 0.000405 | -| std | 0.0349 | -| value_loss | 5.73e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10343 | -| time_elapsed | 58992 | -| total_timesteps | 1323904 | -| train/ | | -| approx_kl | 0.00716591 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0067 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 103420 | -| policy_gradient_loss | -0.000876 | -| std | 0.0349 | -| value_loss | 7.11e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10344 | -| time_elapsed | 58995 | -| total_timesteps | 1324032 | -| train/ | | -| approx_kl | 0.0010172576 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 103430 | -| policy_gradient_loss | -0.00142 | -| std | 0.0349 | -| value_loss | 2.92e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10345 | -| time_elapsed | 59003 | -| total_timesteps | 1324160 | -| train/ | | -| approx_kl | 0.05597055 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | 0.411 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 103440 | -| policy_gradient_loss | -0.0152 | -| std | 0.0348 | -| value_loss | 0.00134 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10346 | -| time_elapsed | 59005 | -| total_timesteps | 1324288 | -| train/ | | -| approx_kl | 0.0020265607 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -496 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 103450 | -| policy_gradient_loss | 0.000168 | -| std | 0.0348 | -| value_loss | 3.46e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10347 | -| time_elapsed | 59008 | -| total_timesteps | 1324416 | -| train/ | | -| approx_kl | 0.001466082 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -3.91e+03 | -| learning_rate | 0.0003 | -| loss | 0.00107 | -| n_updates | 103460 | -| policy_gradient_loss | 1.82e-06 | -| std | 0.0348 | -| value_loss | 6.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10348 | -| time_elapsed | 59011 | -| total_timesteps | 1324544 | -| train/ | | -| approx_kl | 0.010985742 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -8.92e+03 | -| learning_rate | 0.0003 | -| loss | -0.00905 | -| n_updates | 103470 | -| policy_gradient_loss | -0.00839 | -| std | 0.0347 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10349 | -| time_elapsed | 59015 | -| total_timesteps | 1324672 | -| train/ | | -| approx_kl | 0.0071010226 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 103480 | -| policy_gradient_loss | 0.00139 | -| std | 0.0347 | -| value_loss | 3.18e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10350 | -| time_elapsed | 59018 | -| total_timesteps | 1324800 | -| train/ | | -| approx_kl | 3.434345e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.94 | -| explained_variance | -0.0792 | -| learning_rate | 0.0003 | -| loss | -0.000426 | -| n_updates | 103490 | -| policy_gradient_loss | -0.000163 | -| std | 0.0346 | -| value_loss | 1.5e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 22 | -| iterations | 10351 | -| time_elapsed | 59020 | -| total_timesteps | 1324928 | -| train/ | | -| approx_kl | 0.0014002854 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 103500 | -| policy_gradient_loss | 0.00611 | -| std | 0.0344 | -| value_loss | 1.86e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10352 | -| time_elapsed | 59023 | -| total_timesteps | 1325056 | -| train/ | | -| approx_kl | 7.561082e-05 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -0.009 | -| learning_rate | 0.0003 | -| loss | 0.00116 | -| n_updates | 103510 | -| policy_gradient_loss | 0.00208 | -| std | 0.0343 | -| value_loss | 1.19e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10353 | -| time_elapsed | 59029 | -| total_timesteps | 1325184 | -| train/ | | -| approx_kl | 0.015624631 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 103520 | -| policy_gradient_loss | -0.0118 | -| std | 0.0343 | -| value_loss | 1.28e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10354 | -| time_elapsed | 59033 | -| total_timesteps | 1325312 | -| train/ | | -| approx_kl | 0.0009822571 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -16 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 103530 | -| policy_gradient_loss | -0.00597 | -| std | 0.0343 | -| value_loss | 6.44e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10355 | -| time_elapsed | 59036 | -| total_timesteps | 1325440 | -| train/ | | -| approx_kl | 0.04211829 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -5.85 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 103540 | -| policy_gradient_loss | -0.00926 | -| std | 0.0343 | -| value_loss | 1.75e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10356 | -| time_elapsed | 59040 | -| total_timesteps | 1325568 | -| train/ | | -| approx_kl | 0.0041268156 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -0.742 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 103550 | -| policy_gradient_loss | 0.00126 | -| std | 0.0343 | -| value_loss | 2.27e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10357 | -| time_elapsed | 59044 | -| total_timesteps | 1325696 | -| train/ | | -| approx_kl | 0.00010909652 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 103560 | -| policy_gradient_loss | 0.0033 | -| std | 0.0343 | -| value_loss | 8.09e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10358 | -| time_elapsed | 59048 | -| total_timesteps | 1325824 | -| train/ | | -| approx_kl | 0.006490632 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | 9.42e-05 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 103570 | -| policy_gradient_loss | -0.0129 | -| std | 0.0343 | -| value_loss | 1.09e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10359 | -| time_elapsed | 59051 | -| total_timesteps | 1325952 | -| train/ | | -| approx_kl | 0.0006152871 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -0.00317 | -| learning_rate | 0.0003 | -| loss | 0.000737 | -| n_updates | 103580 | -| policy_gradient_loss | 0.000883 | -| std | 0.0343 | -| value_loss | 1.71e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10360 | -| time_elapsed | 59053 | -| total_timesteps | 1326080 | -| train/ | | -| approx_kl | 8.3843246e-05 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 103590 | -| policy_gradient_loss | -0.00262 | -| std | 0.0343 | -| value_loss | 3.19e-11 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10361 | -| time_elapsed | 59059 | -| total_timesteps | 1326208 | -| train/ | | -| approx_kl | 0.08781189 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 103600 | -| policy_gradient_loss | -0.0144 | -| std | 0.0343 | -| value_loss | 3.34e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10362 | -| time_elapsed | 59062 | -| total_timesteps | 1326336 | -| train/ | | -| approx_kl | 0.0075328033 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -1.75e+03 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 103610 | -| policy_gradient_loss | -0.0123 | -| std | 0.0343 | -| value_loss | 4.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10363 | -| time_elapsed | 59065 | -| total_timesteps | 1326464 | -| train/ | | -| approx_kl | 0.0031175734 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 1.95 | -| explained_variance | -77.4 | -| learning_rate | 0.0003 | -| loss | -0.000805 | -| n_updates | 103620 | -| policy_gradient_loss | -0.000319 | -| std | 0.0342 | -| value_loss | 1.33e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10364 | -| time_elapsed | 59069 | -| total_timesteps | 1326592 | -| train/ | | -| approx_kl | 0.011090968 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 1.96 | -| explained_variance | -22.5 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 103630 | -| policy_gradient_loss | -2.54e-05 | -| std | 0.034 | -| value_loss | 3.95e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10365 | -| time_elapsed | 59072 | -| total_timesteps | 1326720 | -| train/ | | -| approx_kl | 0.0027061044 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.96 | -| explained_variance | -0.0035 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 103640 | -| policy_gradient_loss | 0.00272 | -| std | 0.0339 | -| value_loss | 2.74e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10366 | -| time_elapsed | 59076 | -| total_timesteps | 1326848 | -| train/ | | -| approx_kl | 0.0037079956 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 1.96 | -| explained_variance | -521 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 103650 | -| policy_gradient_loss | -0.0084 | -| std | 0.0339 | -| value_loss | 7.8e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10367 | -| time_elapsed | 59080 | -| total_timesteps | 1326976 | -| train/ | | -| approx_kl | 0.002151649 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 1.96 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 103660 | -| policy_gradient_loss | -0.000659 | -| std | 0.0339 | -| value_loss | 3.54e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10368 | -| time_elapsed | 59084 | -| total_timesteps | 1327104 | -| train/ | | -| approx_kl | 0.01298108 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 1.96 | -| explained_variance | -2.54 | -| learning_rate | 0.0003 | -| loss | 2.04e-05 | -| n_updates | 103670 | -| policy_gradient_loss | -0.000383 | -| std | 0.0339 | -| value_loss | 9.65e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10369 | -| time_elapsed | 59091 | -| total_timesteps | 1327232 | -| train/ | | -| approx_kl | 0.10011917 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 103680 | -| policy_gradient_loss | -0.0142 | -| std | 0.0339 | -| value_loss | 0.000452 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10370 | -| time_elapsed | 59094 | -| total_timesteps | 1327360 | -| train/ | | -| approx_kl | 0.0007682168 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -3.67 | -| learning_rate | 0.0003 | -| loss | -0.000116 | -| n_updates | 103690 | -| policy_gradient_loss | 0.000152 | -| std | 0.0338 | -| value_loss | 2.16e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10371 | -| time_elapsed | 59097 | -| total_timesteps | 1327488 | -| train/ | | -| approx_kl | 0.00019991584 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 103700 | -| policy_gradient_loss | -0.00308 | -| std | 0.0338 | -| value_loss | 0.00216 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10372 | -| time_elapsed | 59099 | -| total_timesteps | 1327616 | -| train/ | | -| approx_kl | 0.0012299484 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | 0.000896 | -| n_updates | 103710 | -| policy_gradient_loss | 0.00208 | -| std | 0.0337 | -| value_loss | 9.41e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10373 | -| time_elapsed | 59102 | -| total_timesteps | 1327744 | -| train/ | | -| approx_kl | 0.001089632 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | 0.00257 | -| learning_rate | 0.0003 | -| loss | 0.00246 | -| n_updates | 103720 | -| policy_gradient_loss | 0.00571 | -| std | 0.0337 | -| value_loss | 0.000158 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 22 | -| iterations | 10374 | -| time_elapsed | 59105 | -| total_timesteps | 1327872 | -| train/ | | -| approx_kl | 0.00052802684 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.00159 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 103730 | -| policy_gradient_loss | -0.00474 | -| std | 0.0337 | -| value_loss | 2.82e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10375 | -| time_elapsed | 59108 | -| total_timesteps | 1328000 | -| train/ | | -| approx_kl | 0.017429868 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 103740 | -| policy_gradient_loss | -0.000136 | -| std | 0.0337 | -| value_loss | 1.21e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10376 | -| time_elapsed | 59112 | -| total_timesteps | 1328128 | -| train/ | | -| approx_kl | 0.0046535837 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | 0.00233 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 103750 | -| policy_gradient_loss | -0.00614 | -| std | 0.0337 | -| value_loss | 5.05e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10377 | -| time_elapsed | 59120 | -| total_timesteps | 1328256 | -| train/ | | -| approx_kl | 0.002996441 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | 0.864 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 103760 | -| policy_gradient_loss | -0.00405 | -| std | 0.0336 | -| value_loss | 0.00186 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10378 | -| time_elapsed | 59123 | -| total_timesteps | 1328384 | -| train/ | | -| approx_kl | 0.01519833 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 103770 | -| policy_gradient_loss | -0.0137 | -| std | 0.0336 | -| value_loss | 0.000668 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10379 | -| time_elapsed | 59127 | -| total_timesteps | 1328512 | -| train/ | | -| approx_kl | 1.2792181e-05 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | 0.000381 | -| n_updates | 103780 | -| policy_gradient_loss | -0.000902 | -| std | 0.0336 | -| value_loss | 0.00179 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10380 | -| time_elapsed | 59130 | -| total_timesteps | 1328640 | -| train/ | | -| approx_kl | 0.007890064 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 103790 | -| policy_gradient_loss | -0.00195 | -| std | 0.0336 | -| value_loss | 0.000169 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10381 | -| time_elapsed | 59134 | -| total_timesteps | 1328768 | -| train/ | | -| approx_kl | 0.019132078 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | 0.00244 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 103800 | -| policy_gradient_loss | -0.0173 | -| std | 0.0335 | -| value_loss | 0.000956 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10382 | -| time_elapsed | 59137 | -| total_timesteps | 1328896 | -| train/ | | -| approx_kl | 0.0047120578 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -0.533 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 103810 | -| policy_gradient_loss | -0.0025 | -| std | 0.0335 | -| value_loss | 4.22e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10383 | -| time_elapsed | 59140 | -| total_timesteps | 1329024 | -| train/ | | -| approx_kl | 0.015759535 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.000449 | -| n_updates | 103820 | -| policy_gradient_loss | -0.000955 | -| std | 0.0336 | -| value_loss | 4.94e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10384 | -| time_elapsed | 59147 | -| total_timesteps | 1329152 | -| train/ | | -| approx_kl | 0.0048851534 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 103830 | -| policy_gradient_loss | 0.00322 | -| std | 0.0335 | -| value_loss | 0.000768 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10385 | -| time_elapsed | 59151 | -| total_timesteps | 1329280 | -| train/ | | -| approx_kl | 0.0021368428 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -3.06 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 103840 | -| policy_gradient_loss | 0.000547 | -| std | 0.0335 | -| value_loss | 5.5e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10386 | -| time_elapsed | 59154 | -| total_timesteps | 1329408 | -| train/ | | -| approx_kl | 0.0028865235 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -6.36 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 103850 | -| policy_gradient_loss | -0.00889 | -| std | 0.0335 | -| value_loss | 2.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10387 | -| time_elapsed | 59158 | -| total_timesteps | 1329536 | -| train/ | | -| approx_kl | 0.002376805 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -1.21 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 103860 | -| policy_gradient_loss | -9.17e-05 | -| std | 0.0335 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10388 | -| time_elapsed | 59161 | -| total_timesteps | 1329664 | -| train/ | | -| approx_kl | 0.0020529372 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -0.665 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 103870 | -| policy_gradient_loss | -0.00838 | -| std | 0.0335 | -| value_loss | 1.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10389 | -| time_elapsed | 59166 | -| total_timesteps | 1329792 | -| train/ | | -| approx_kl | 0.0035011065 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 103880 | -| policy_gradient_loss | -0.000564 | -| std | 0.0336 | -| value_loss | 2.86e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10390 | -| time_elapsed | 59170 | -| total_timesteps | 1329920 | -| train/ | | -| approx_kl | 0.0014588656 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | 0.0051 | -| n_updates | 103890 | -| policy_gradient_loss | -0.000119 | -| std | 0.0337 | -| value_loss | 6.91e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10391 | -| time_elapsed | 59173 | -| total_timesteps | 1330048 | -| train/ | | -| approx_kl | 0.009391764 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.00194 | -| learning_rate | 0.0003 | -| loss | 0.00254 | -| n_updates | 103900 | -| policy_gradient_loss | -0.00125 | -| std | 0.0337 | -| value_loss | 5.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10392 | -| time_elapsed | 59178 | -| total_timesteps | 1330176 | -| train/ | | -| approx_kl | 0.052298207 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | 0.0654 | -| learning_rate | 0.0003 | -| loss | -0.0219 | -| n_updates | 103910 | -| policy_gradient_loss | -0.0187 | -| std | 0.0337 | -| value_loss | 0.00162 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10393 | -| time_elapsed | 59181 | -| total_timesteps | 1330304 | -| train/ | | -| approx_kl | 9.92096e-05 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -18.9 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 103920 | -| policy_gradient_loss | -0.00526 | -| std | 0.0337 | -| value_loss | 1.91e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10394 | -| time_elapsed | 59184 | -| total_timesteps | 1330432 | -| train/ | | -| approx_kl | 0.0042390674 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -37.6 | -| learning_rate | 0.0003 | -| loss | 0.00892 | -| n_updates | 103930 | -| policy_gradient_loss | -0.00611 | -| std | 0.0337 | -| value_loss | 1.23e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10395 | -| time_elapsed | 59186 | -| total_timesteps | 1330560 | -| train/ | | -| approx_kl | 0.0044546244 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -5.02 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 103940 | -| policy_gradient_loss | 0.00125 | -| std | 0.0337 | -| value_loss | 2.63e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10396 | -| time_elapsed | 59189 | -| total_timesteps | 1330688 | -| train/ | | -| approx_kl | 0.00047106948 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.675 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 103950 | -| policy_gradient_loss | -0.00168 | -| std | 0.0337 | -| value_loss | 3.18e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10397 | -| time_elapsed | 59192 | -| total_timesteps | 1330816 | -| train/ | | -| approx_kl | 0.00072336104 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | 0.000821 | -| n_updates | 103960 | -| policy_gradient_loss | 0.00119 | -| std | 0.0337 | -| value_loss | 1.3e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10398 | -| time_elapsed | 59194 | -| total_timesteps | 1330944 | -| train/ | | -| approx_kl | 0.0022607874 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -0.00398 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 103970 | -| policy_gradient_loss | 0.000511 | -| std | 0.0337 | -| value_loss | 2.8e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10399 | -| time_elapsed | 59198 | -| total_timesteps | 1331072 | -| train/ | | -| approx_kl | 8.4433705e-06 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | 0.00269 | -| learning_rate | 0.0003 | -| loss | -0.000189 | -| n_updates | 103980 | -| policy_gradient_loss | 0.00458 | -| std | 0.0337 | -| value_loss | 7.83e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10400 | -| time_elapsed | 59203 | -| total_timesteps | 1331200 | -| train/ | | -| approx_kl | 0.053805552 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 103990 | -| policy_gradient_loss | -0.0147 | -| std | 0.0337 | -| value_loss | 0.00353 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10401 | -| time_elapsed | 59207 | -| total_timesteps | 1331328 | -| train/ | | -| approx_kl | 1.1324883e-06 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -210 | -| learning_rate | 0.0003 | -| loss | -9.68e-05 | -| n_updates | 104000 | -| policy_gradient_loss | 5.62e-05 | -| std | 0.0337 | -| value_loss | 1.4e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10402 | -| time_elapsed | 59210 | -| total_timesteps | 1331456 | -| train/ | | -| approx_kl | 0.012791725 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -1.21e+03 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 104010 | -| policy_gradient_loss | -0.00331 | -| std | 0.0336 | -| value_loss | 8.43e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10403 | -| time_elapsed | 59214 | -| total_timesteps | 1331584 | -| train/ | | -| approx_kl | 0.0009361161 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 1.97 | -| explained_variance | -1.81e+03 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 104020 | -| policy_gradient_loss | 0.00226 | -| std | 0.0336 | -| value_loss | 9.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10404 | -| time_elapsed | 59217 | -| total_timesteps | 1331712 | -| train/ | | -| approx_kl | 0.0024711364 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -4.99e+03 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 104030 | -| policy_gradient_loss | -0.00278 | -| std | 0.0336 | -| value_loss | 1.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10405 | -| time_elapsed | 59220 | -| total_timesteps | 1331840 | -| train/ | | -| approx_kl | 0.009158669 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -109 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 104040 | -| policy_gradient_loss | -0.00405 | -| std | 0.0335 | -| value_loss | 1.23e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 22 | -| iterations | 10406 | -| time_elapsed | 59223 | -| total_timesteps | 1331968 | -| train/ | | -| approx_kl | 0.00015098974 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -12.5 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 104050 | -| policy_gradient_loss | 0.000581 | -| std | 0.0335 | -| value_loss | 1.47e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10407 | -| time_elapsed | 59226 | -| total_timesteps | 1332096 | -| train/ | | -| approx_kl | 0.000576789 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -0.488 | -| learning_rate | 0.0003 | -| loss | 0.00364 | -| n_updates | 104060 | -| policy_gradient_loss | -0.00147 | -| std | 0.0335 | -| value_loss | 7.77e-11 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10408 | -| time_elapsed | 59235 | -| total_timesteps | 1332224 | -| train/ | | -| approx_kl | 0.0833963 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 104070 | -| policy_gradient_loss | -0.0159 | -| std | 0.0335 | -| value_loss | 0.00161 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10409 | -| time_elapsed | 59238 | -| total_timesteps | 1332352 | -| train/ | | -| approx_kl | 0.0004992075 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -640 | -| learning_rate | 0.0003 | -| loss | 0.000108 | -| n_updates | 104080 | -| policy_gradient_loss | 0.00118 | -| std | 0.0335 | -| value_loss | 3.62e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10410 | -| time_elapsed | 59242 | -| total_timesteps | 1332480 | -| train/ | | -| approx_kl | 0.000919085 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -977 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 104090 | -| policy_gradient_loss | -0.00271 | -| std | 0.0335 | -| value_loss | 1.02e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10411 | -| time_elapsed | 59246 | -| total_timesteps | 1332608 | -| train/ | | -| approx_kl | 3.5254285e-05 | -| clip_fraction | 0.00391 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -1.03e+03 | -| learning_rate | 0.0003 | -| loss | -0.000284 | -| n_updates | 104100 | -| policy_gradient_loss | -0.000119 | -| std | 0.0333 | -| value_loss | 1.21e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10412 | -| time_elapsed | 59250 | -| total_timesteps | 1332736 | -| train/ | | -| approx_kl | 0.007550221 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.98 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 104110 | -| policy_gradient_loss | -0.00647 | -| std | 0.0332 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10413 | -| time_elapsed | 59254 | -| total_timesteps | 1332864 | -| train/ | | -| approx_kl | 0.016158713 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 104120 | -| policy_gradient_loss | -0.00356 | -| std | 0.0332 | -| value_loss | 7.99e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10414 | -| time_elapsed | 59258 | -| total_timesteps | 1332992 | -| train/ | | -| approx_kl | 0.0013907123 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.00636 | -| n_updates | 104130 | -| policy_gradient_loss | -0.00345 | -| std | 0.0331 | -| value_loss | 6.47e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10415 | -| time_elapsed | 59262 | -| total_timesteps | 1333120 | -| train/ | | -| approx_kl | 0.0010305964 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -7.46 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 104140 | -| policy_gradient_loss | -0.00163 | -| std | 0.0331 | -| value_loss | 4.24e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10416 | -| time_elapsed | 59271 | -| total_timesteps | 1333248 | -| train/ | | -| approx_kl | 0.17929229 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | 0.00367 | -| n_updates | 104150 | -| policy_gradient_loss | -0.00474 | -| std | 0.0332 | -| value_loss | 0.000735 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10417 | -| time_elapsed | 59274 | -| total_timesteps | 1333376 | -| train/ | | -| approx_kl | 0.006575265 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.00721 | -| learning_rate | 0.0003 | -| loss | 0.000209 | -| n_updates | 104160 | -| policy_gradient_loss | 0.000134 | -| std | 0.0331 | -| value_loss | 9.68e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10418 | -| time_elapsed | 59276 | -| total_timesteps | 1333504 | -| train/ | | -| approx_kl | 0.0053772614 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.553 | -| learning_rate | 0.0003 | -| loss | 0.00427 | -| n_updates | 104170 | -| policy_gradient_loss | 0.00295 | -| std | 0.0331 | -| value_loss | 5.87e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10419 | -| time_elapsed | 59280 | -| total_timesteps | 1333632 | -| train/ | | -| approx_kl | 0.0020811078 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -6 | -| learning_rate | 0.0003 | -| loss | 0.00642 | -| n_updates | 104180 | -| policy_gradient_loss | -0.000525 | -| std | 0.0331 | -| value_loss | 2.61e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10420 | -| time_elapsed | 59284 | -| total_timesteps | 1333760 | -| train/ | | -| approx_kl | 0.00054787146 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 104190 | -| policy_gradient_loss | -0.00017 | -| std | 0.0331 | -| value_loss | 1.21e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10421 | -| time_elapsed | 59288 | -| total_timesteps | 1333888 | -| train/ | | -| approx_kl | 0.005249046 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0958 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 104200 | -| policy_gradient_loss | -0.000566 | -| std | 0.0331 | -| value_loss | 1.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10422 | -| time_elapsed | 59293 | -| total_timesteps | 1334016 | -| train/ | | -| approx_kl | 0.022480905 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 104210 | -| policy_gradient_loss | -0.00139 | -| std | 0.0331 | -| value_loss | 1.19e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10423 | -| time_elapsed | 59302 | -| total_timesteps | 1334144 | -| train/ | | -| approx_kl | 0.036724478 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 104220 | -| policy_gradient_loss | -0.0103 | -| std | 0.033 | -| value_loss | 0.000564 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10424 | -| time_elapsed | 59304 | -| total_timesteps | 1334272 | -| train/ | | -| approx_kl | 0.009036944 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | 0.044 | -| learning_rate | 0.0003 | -| loss | 0.000696 | -| n_updates | 104230 | -| policy_gradient_loss | -0.000199 | -| std | 0.033 | -| value_loss | 9.64e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10425 | -| time_elapsed | 59307 | -| total_timesteps | 1334400 | -| train/ | | -| approx_kl | 0.006658214 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | 0.00427 | -| n_updates | 104240 | -| policy_gradient_loss | 0.0108 | -| std | 0.033 | -| value_loss | 1.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10426 | -| time_elapsed | 59309 | -| total_timesteps | 1334528 | -| train/ | | -| approx_kl | 0.0024038805 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | 0.00467 | -| n_updates | 104250 | -| policy_gradient_loss | 0.00523 | -| std | 0.033 | -| value_loss | 7.57e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10427 | -| time_elapsed | 59312 | -| total_timesteps | 1334656 | -| train/ | | -| approx_kl | 0.009699538 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 104260 | -| policy_gradient_loss | -0.00102 | -| std | 0.033 | -| value_loss | 4.91e-07 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10428 | -| time_elapsed | 59315 | -| total_timesteps | 1334784 | -| train/ | | -| approx_kl | 0.000119773205 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.000574 | -| n_updates | 104270 | -| policy_gradient_loss | 0.00638 | -| std | 0.033 | -| value_loss | 1.91e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 22 | -| iterations | 10429 | -| time_elapsed | 59318 | -| total_timesteps | 1334912 | -| train/ | | -| approx_kl | 0.015000088 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 104280 | -| policy_gradient_loss | 0.000654 | -| std | 0.033 | -| value_loss | 9.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10430 | -| time_elapsed | 59321 | -| total_timesteps | 1335040 | -| train/ | | -| approx_kl | 0.015118506 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 104290 | -| policy_gradient_loss | 0.00104 | -| std | 0.033 | -| value_loss | 1.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10431 | -| time_elapsed | 59328 | -| total_timesteps | 1335168 | -| train/ | | -| approx_kl | 0.08262845 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 104300 | -| policy_gradient_loss | -0.00852 | -| std | 0.033 | -| value_loss | 0.000313 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10432 | -| time_elapsed | 59332 | -| total_timesteps | 1335296 | -| train/ | | -| approx_kl | 0.012279053 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | 0.147 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 104310 | -| policy_gradient_loss | -0.0047 | -| std | 0.033 | -| value_loss | 4.3e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10433 | -| time_elapsed | 59335 | -| total_timesteps | 1335424 | -| train/ | | -| approx_kl | 0.0007672012 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -3.34 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 104320 | -| policy_gradient_loss | -0.00394 | -| std | 0.033 | -| value_loss | 1.01e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10434 | -| time_elapsed | 59340 | -| total_timesteps | 1335552 | -| train/ | | -| approx_kl | 0.003950533 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0973 | -| learning_rate | 0.0003 | -| loss | -0.000851 | -| n_updates | 104330 | -| policy_gradient_loss | 0.000512 | -| std | 0.033 | -| value_loss | 1.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10435 | -| time_elapsed | 59343 | -| total_timesteps | 1335680 | -| train/ | | -| approx_kl | 0.003685804 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.00551 | -| n_updates | 104340 | -| policy_gradient_loss | 0.00481 | -| std | 0.033 | -| value_loss | 2.28e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10436 | -| time_elapsed | 59347 | -| total_timesteps | 1335808 | -| train/ | | -| approx_kl | 0.00065468857 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0016 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 104350 | -| policy_gradient_loss | -0.00732 | -| std | 0.033 | -| value_loss | 2.58e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10437 | -| time_elapsed | 59350 | -| total_timesteps | 1335936 | -| train/ | | -| approx_kl | 0.003227158 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 104360 | -| policy_gradient_loss | -0.0049 | -| std | 0.033 | -| value_loss | 1.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10438 | -| time_elapsed | 59353 | -| total_timesteps | 1336064 | -| train/ | | -| approx_kl | 0.013156219 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | -0.0257 | -| n_updates | 104370 | -| policy_gradient_loss | -0.0189 | -| std | 0.033 | -| value_loss | 8.08e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10439 | -| time_elapsed | 59358 | -| total_timesteps | 1336192 | -| train/ | | -| approx_kl | 0.0110830935 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 104380 | -| policy_gradient_loss | -0.00872 | -| std | 0.0331 | -| value_loss | 0.00139 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10440 | -| time_elapsed | 59362 | -| total_timesteps | 1336320 | -| train/ | | -| approx_kl | 0.005511598 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00995 | -| n_updates | 104390 | -| policy_gradient_loss | -0.00727 | -| std | 0.0331 | -| value_loss | 3.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10441 | -| time_elapsed | 59366 | -| total_timesteps | 1336448 | -| train/ | | -| approx_kl | 0.017827112 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | 0.000912 | -| n_updates | 104400 | -| policy_gradient_loss | -0.000168 | -| std | 0.0331 | -| value_loss | 1.18e-07 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10442 | -| time_elapsed | 59370 | -| total_timesteps | 1336576 | -| train/ | | -| approx_kl | 0.000114765484 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.986 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 104410 | -| policy_gradient_loss | 4.29e-05 | -| std | 0.0331 | -| value_loss | 4.74e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10443 | -| time_elapsed | 59375 | -| total_timesteps | 1336704 | -| train/ | | -| approx_kl | 0.013563146 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 104420 | -| policy_gradient_loss | 0.00143 | -| std | 0.0331 | -| value_loss | 6.04e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10444 | -| time_elapsed | 59378 | -| total_timesteps | 1336832 | -| train/ | | -| approx_kl | 0.0002703988 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 104430 | -| policy_gradient_loss | 0.000775 | -| std | 0.0331 | -| value_loss | 3.25e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10445 | -| time_elapsed | 59382 | -| total_timesteps | 1336960 | -| train/ | | -| approx_kl | 0.0038607563 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.00116 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 104440 | -| policy_gradient_loss | -0.00447 | -| std | 0.0331 | -| value_loss | 2.04e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10446 | -| time_elapsed | 59385 | -| total_timesteps | 1337088 | -| train/ | | -| approx_kl | 0.008134117 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.00792 | -| learning_rate | 0.0003 | -| loss | 0.00798 | -| n_updates | 104450 | -| policy_gradient_loss | 0.0071 | -| std | 0.0331 | -| value_loss | 1.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10447 | -| time_elapsed | 59390 | -| total_timesteps | 1337216 | -| train/ | | -| approx_kl | 0.085359335 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 104460 | -| policy_gradient_loss | -0.00805 | -| std | 0.0331 | -| value_loss | 0.000385 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10448 | -| time_elapsed | 59394 | -| total_timesteps | 1337344 | -| train/ | | -| approx_kl | 0.0037960154 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 104470 | -| policy_gradient_loss | -0.00867 | -| std | 0.0331 | -| value_loss | 4.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10449 | -| time_elapsed | 59398 | -| total_timesteps | 1337472 | -| train/ | | -| approx_kl | 0.014399856 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.00592 | -| learning_rate | 0.0003 | -| loss | -1.39e-06 | -| n_updates | 104480 | -| policy_gradient_loss | -0.00118 | -| std | 0.0331 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10450 | -| time_elapsed | 59402 | -| total_timesteps | 1337600 | -| train/ | | -| approx_kl | 0.004562274 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -0.00972 | -| n_updates | 104490 | -| policy_gradient_loss | -0.00645 | -| std | 0.0331 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10451 | -| time_elapsed | 59404 | -| total_timesteps | 1337728 | -| train/ | | -| approx_kl | 0.0043579643 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.00705 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 104500 | -| policy_gradient_loss | -0.000145 | -| std | 0.033 | -| value_loss | 1.21e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10452 | -| time_elapsed | 59407 | -| total_timesteps | 1337856 | -| train/ | | -| approx_kl | 0.00027275644 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 1.99 | -| explained_variance | -0.000867 | -| learning_rate | 0.0003 | -| loss | -0.000443 | -| n_updates | 104510 | -| policy_gradient_loss | -0.000199 | -| std | 0.0328 | -| value_loss | 1.77e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10453 | -| time_elapsed | 59410 | -| total_timesteps | 1337984 | -| train/ | | -| approx_kl | 0.004217078 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 104520 | -| policy_gradient_loss | 0.00611 | -| std | 0.0326 | -| value_loss | 1.95e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10454 | -| time_elapsed | 59413 | -| total_timesteps | 1338112 | -| train/ | | -| approx_kl | 0.0078451075 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | 0.000761 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 104530 | -| policy_gradient_loss | -0.000754 | -| std | 0.0326 | -| value_loss | 9.38e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10455 | -| time_elapsed | 59422 | -| total_timesteps | 1338240 | -| train/ | | -| approx_kl | 0.07747742 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 104540 | -| policy_gradient_loss | -0.0121 | -| std | 0.0327 | -| value_loss | 0.00194 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10456 | -| time_elapsed | 59425 | -| total_timesteps | 1338368 | -| train/ | | -| approx_kl | 0.00015588198 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0799 | -| learning_rate | 0.0003 | -| loss | -0.000791 | -| n_updates | 104550 | -| policy_gradient_loss | -0.000142 | -| std | 0.0327 | -| value_loss | 0.000992 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10457 | -| time_elapsed | 59429 | -| total_timesteps | 1338496 | -| train/ | | -| approx_kl | 0.012993827 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 104560 | -| policy_gradient_loss | 0.0107 | -| std | 0.0327 | -| value_loss | 1.59e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10458 | -| time_elapsed | 59432 | -| total_timesteps | 1338624 | -| train/ | | -| approx_kl | 0.0062504197 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.00452 | -| n_updates | 104570 | -| policy_gradient_loss | 0.00147 | -| std | 0.0327 | -| value_loss | 8.58e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10459 | -| time_elapsed | 59435 | -| total_timesteps | 1338752 | -| train/ | | -| approx_kl | 0.00038371515 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.000804 | -| n_updates | 104580 | -| policy_gradient_loss | -4.91e-05 | -| std | 0.0327 | -| value_loss | 5.53e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10460 | -| time_elapsed | 59439 | -| total_timesteps | 1338880 | -| train/ | | -| approx_kl | 0.0019374033 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.000361 | -| n_updates | 104590 | -| policy_gradient_loss | 0.000226 | -| std | 0.0326 | -| value_loss | 1.17e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10461 | -| time_elapsed | 59442 | -| total_timesteps | 1339008 | -| train/ | | -| approx_kl | 0.009036951 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.0007 | -| n_updates | 104600 | -| policy_gradient_loss | -0.000525 | -| std | 0.0326 | -| value_loss | 1.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10462 | -| time_elapsed | 59452 | -| total_timesteps | 1339136 | -| train/ | | -| approx_kl | 0.041487563 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | 0.869 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 104610 | -| policy_gradient_loss | -0.00664 | -| std | 0.0326 | -| value_loss | 0.000825 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10463 | -| time_elapsed | 59455 | -| total_timesteps | 1339264 | -| train/ | | -| approx_kl | 0.00012305658 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | 0.0246 | -| learning_rate | 0.0003 | -| loss | -0.000117 | -| n_updates | 104620 | -| policy_gradient_loss | 0.00559 | -| std | 0.0326 | -| value_loss | 0.00024 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10464 | -| time_elapsed | 59458 | -| total_timesteps | 1339392 | -| train/ | | -| approx_kl | 0.009859769 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 104630 | -| policy_gradient_loss | 0.00227 | -| std | 0.0326 | -| value_loss | 0.000102 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10465 | -| time_elapsed | 59461 | -| total_timesteps | 1339520 | -| train/ | | -| approx_kl | 0.0007392098 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -16.5 | -| learning_rate | 0.0003 | -| loss | 0.00357 | -| n_updates | 104640 | -| policy_gradient_loss | -0.00441 | -| std | 0.0327 | -| value_loss | 2.39e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10466 | -| time_elapsed | 59465 | -| total_timesteps | 1339648 | -| train/ | | -| approx_kl | 0.0128829 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.00312 | -| n_updates | 104650 | -| policy_gradient_loss | 0.00156 | -| std | 0.0326 | -| value_loss | 7.62e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10467 | -| time_elapsed | 59469 | -| total_timesteps | 1339776 | -| train/ | | -| approx_kl | 0.019549018 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.00472 | -| learning_rate | 0.0003 | -| loss | 0.00324 | -| n_updates | 104660 | -| policy_gradient_loss | -0.000658 | -| std | 0.0326 | -| value_loss | 2.05e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10468 | -| time_elapsed | 59472 | -| total_timesteps | 1339904 | -| train/ | | -| approx_kl | 0.0056834193 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.00648 | -| learning_rate | 0.0003 | -| loss | 0.00555 | -| n_updates | 104670 | -| policy_gradient_loss | 0.0101 | -| std | 0.0326 | -| value_loss | 6.47e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10469 | -| time_elapsed | 59476 | -| total_timesteps | 1340032 | -| train/ | | -| approx_kl | 0.0012787711 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -2.45 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 104680 | -| policy_gradient_loss | -0.00323 | -| std | 0.0326 | -| value_loss | 6.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10470 | -| time_elapsed | 59484 | -| total_timesteps | 1340160 | -| train/ | | -| approx_kl | 0.0030464567 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 104690 | -| policy_gradient_loss | -0.00825 | -| std | 0.0326 | -| value_loss | 0.00572 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10471 | -| time_elapsed | 59487 | -| total_timesteps | 1340288 | -| train/ | | -| approx_kl | 0.0007075616 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 104700 | -| policy_gradient_loss | 0.00194 | -| std | 0.0326 | -| value_loss | 8.51e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10472 | -| time_elapsed | 59490 | -| total_timesteps | 1340416 | -| train/ | | -| approx_kl | 0.02138061 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.00163 | -| n_updates | 104710 | -| policy_gradient_loss | -0.0025 | -| std | 0.0326 | -| value_loss | 5.16e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10473 | -| time_elapsed | 59493 | -| total_timesteps | 1340544 | -| train/ | | -| approx_kl | 0.0073896046 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0777 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 104720 | -| policy_gradient_loss | 0.00493 | -| std | 0.0326 | -| value_loss | 3.42e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10474 | -| time_elapsed | 59497 | -| total_timesteps | 1340672 | -| train/ | | -| approx_kl | 0.0016571074 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 104730 | -| policy_gradient_loss | -0.0129 | -| std | 0.0326 | -| value_loss | 2.66e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10475 | -| time_elapsed | 59500 | -| total_timesteps | 1340800 | -| train/ | | -| approx_kl | 0.0050102198 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.00712 | -| n_updates | 104740 | -| policy_gradient_loss | -0.00352 | -| std | 0.0326 | -| value_loss | 1.69e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 22 | -| iterations | 10476 | -| time_elapsed | 59505 | -| total_timesteps | 1340928 | -| train/ | | -| approx_kl | 0.0034818794 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 104750 | -| policy_gradient_loss | 0.00607 | -| std | 0.0327 | -| value_loss | 1.12e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10477 | -| time_elapsed | 59508 | -| total_timesteps | 1341056 | -| train/ | | -| approx_kl | 0.020817835 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.00494 | -| n_updates | 104760 | -| policy_gradient_loss | -0.000887 | -| std | 0.0325 | -| value_loss | 7.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10478 | -| time_elapsed | 59514 | -| total_timesteps | 1341184 | -| train/ | | -| approx_kl | 0.0118849175 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.606 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 104770 | -| policy_gradient_loss | -0.0177 | -| std | 0.0325 | -| value_loss | 0.00907 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10479 | -| time_elapsed | 59518 | -| total_timesteps | 1341312 | -| train/ | | -| approx_kl | 0.0012310343 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.00586 | -| learning_rate | 0.0003 | -| loss | -0.00199 | -| n_updates | 104780 | -| policy_gradient_loss | 0.00591 | -| std | 0.0325 | -| value_loss | 3.67e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10480 | -| time_elapsed | 59522 | -| total_timesteps | 1341440 | -| train/ | | -| approx_kl | 0.022858173 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0725 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 104790 | -| policy_gradient_loss | -0.00813 | -| std | 0.0325 | -| value_loss | 7.44e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10481 | -| time_elapsed | 59524 | -| total_timesteps | 1341568 | -| train/ | | -| approx_kl | 0.0013684309 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0851 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 104800 | -| policy_gradient_loss | -0.000812 | -| std | 0.0325 | -| value_loss | 4.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10482 | -| time_elapsed | 59526 | -| total_timesteps | 1341696 | -| train/ | | -| approx_kl | 0.013101965 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.000301 | -| n_updates | 104810 | -| policy_gradient_loss | -0.000412 | -| std | 0.0325 | -| value_loss | 2.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10483 | -| time_elapsed | 59529 | -| total_timesteps | 1341824 | -| train/ | | -| approx_kl | 0.0043267817 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 104820 | -| policy_gradient_loss | -0.0128 | -| std | 0.0325 | -| value_loss | 6.44e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10484 | -| time_elapsed | 59531 | -| total_timesteps | 1341952 | -| train/ | | -| approx_kl | 0.0032660621 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.000596 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 104830 | -| policy_gradient_loss | 0.000529 | -| std | 0.0325 | -| value_loss | 7.39e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10485 | -| time_elapsed | 59534 | -| total_timesteps | 1342080 | -| train/ | | -| approx_kl | 0.019861452 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 104840 | -| policy_gradient_loss | -0.00446 | -| std | 0.0325 | -| value_loss | 6.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10486 | -| time_elapsed | 59541 | -| total_timesteps | 1342208 | -| train/ | | -| approx_kl | 0.0077490816 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.632 | -| learning_rate | 0.0003 | -| loss | 0.00847 | -| n_updates | 104850 | -| policy_gradient_loss | -0.000177 | -| std | 0.0325 | -| value_loss | 0.00476 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10487 | -| time_elapsed | 59544 | -| total_timesteps | 1342336 | -| train/ | | -| approx_kl | 0.019015595 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0658 | -| learning_rate | 0.0003 | -| loss | 0.00601 | -| n_updates | 104860 | -| policy_gradient_loss | 0.000862 | -| std | 0.0325 | -| value_loss | 7.14e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10488 | -| time_elapsed | 59548 | -| total_timesteps | 1342464 | -| train/ | | -| approx_kl | 0.00043088198 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 104870 | -| policy_gradient_loss | -0.00559 | -| std | 0.0325 | -| value_loss | 2.5e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10489 | -| time_elapsed | 59551 | -| total_timesteps | 1342592 | -| train/ | | -| approx_kl | 0.0034067784 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0766 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 104880 | -| policy_gradient_loss | -0.00106 | -| std | 0.0325 | -| value_loss | 2.49e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10490 | -| time_elapsed | 59555 | -| total_timesteps | 1342720 | -| train/ | | -| approx_kl | 0.0011671609 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.00277 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 104890 | -| policy_gradient_loss | -0.000559 | -| std | 0.0325 | -| value_loss | 9.24e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10491 | -| time_elapsed | 59558 | -| total_timesteps | 1342848 | -| train/ | | -| approx_kl | 0.07541197 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.00502 | -| learning_rate | 0.0003 | -| loss | 0.0541 | -| n_updates | 104900 | -| policy_gradient_loss | 0.0201 | -| std | 0.0326 | -| value_loss | 4.39e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 22 | -| iterations | 10492 | -| time_elapsed | 59560 | -| total_timesteps | 1342976 | -| train/ | | -| approx_kl | 0.018674213 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.00704 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 104910 | -| policy_gradient_loss | -0.0129 | -| std | 0.0327 | -| value_loss | 5.62e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10493 | -| time_elapsed | 59563 | -| total_timesteps | 1343104 | -| train/ | | -| approx_kl | 0.0052623875 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.447 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 104920 | -| policy_gradient_loss | 0.000738 | -| std | 0.0326 | -| value_loss | 2.83e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10494 | -| time_elapsed | 59570 | -| total_timesteps | 1343232 | -| train/ | | -| approx_kl | 0.07394461 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 104930 | -| policy_gradient_loss | -0.0131 | -| std | 0.0326 | -| value_loss | 0.000615 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10495 | -| time_elapsed | 59575 | -| total_timesteps | 1343360 | -| train/ | | -| approx_kl | 0.0027467897 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -286 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 104940 | -| policy_gradient_loss | -0.00834 | -| std | 0.0326 | -| value_loss | 9.66e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10496 | -| time_elapsed | 59579 | -| total_timesteps | 1343488 | -| train/ | | -| approx_kl | 0.0037545497 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 104950 | -| policy_gradient_loss | -0.00047 | -| std | 0.0325 | -| value_loss | 4e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10497 | -| time_elapsed | 59582 | -| total_timesteps | 1343616 | -| train/ | | -| approx_kl | 0.0011946955 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.45 | -| learning_rate | 0.0003 | -| loss | -0.00434 | -| n_updates | 104960 | -| policy_gradient_loss | -0.00108 | -| std | 0.0324 | -| value_loss | 0.000177 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10498 | -| time_elapsed | 59586 | -| total_timesteps | 1343744 | -| train/ | | -| approx_kl | 0.00091809407 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.00134 | -| n_updates | 104970 | -| policy_gradient_loss | 0.000647 | -| std | 0.0323 | -| value_loss | 8.13e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 22 | -| iterations | 10499 | -| time_elapsed | 59590 | -| total_timesteps | 1343872 | -| train/ | | -| approx_kl | 0.0030087568 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0791 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 104980 | -| policy_gradient_loss | 0.00324 | -| std | 0.0323 | -| value_loss | 3.76e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10500 | -| time_elapsed | 59593 | -| total_timesteps | 1344000 | -| train/ | | -| approx_kl | 0.0012347908 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.000283 | -| n_updates | 104990 | -| policy_gradient_loss | 0.0048 | -| std | 0.0323 | -| value_loss | 7.51e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10501 | -| time_elapsed | 59596 | -| total_timesteps | 1344128 | -| train/ | | -| approx_kl | 0.0037483992 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | -0.00293 | -| learning_rate | 0.0003 | -| loss | 0.00675 | -| n_updates | 105000 | -| policy_gradient_loss | 0.0042 | -| std | 0.0323 | -| value_loss | 2.3e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10502 | -| time_elapsed | 59603 | -| total_timesteps | 1344256 | -| train/ | | -| approx_kl | 0.0027923295 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | -0.00975 | -| n_updates | 105010 | -| policy_gradient_loss | -0.00604 | -| std | 0.0323 | -| value_loss | 0.00332 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10503 | -| time_elapsed | 59607 | -| total_timesteps | 1344384 | -| train/ | | -| approx_kl | 1.4982186e-05 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | -0.000618 | -| n_updates | 105020 | -| policy_gradient_loss | -0.00114 | -| std | 0.0322 | -| value_loss | 3.1e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10504 | -| time_elapsed | 59610 | -| total_timesteps | 1344512 | -| train/ | | -| approx_kl | 0.0002765134 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.964 | -| learning_rate | 0.0003 | -| loss | 0.00195 | -| n_updates | 105030 | -| policy_gradient_loss | -0.000708 | -| std | 0.0322 | -| value_loss | 2.06e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10505 | -| time_elapsed | 59614 | -| total_timesteps | 1344640 | -| train/ | | -| approx_kl | 0.0044349274 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | 0.00143 | -| n_updates | 105040 | -| policy_gradient_loss | 0.0067 | -| std | 0.0322 | -| value_loss | 2.37e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10506 | -| time_elapsed | 59618 | -| total_timesteps | 1344768 | -| train/ | | -| approx_kl | 0.0060041468 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 105050 | -| policy_gradient_loss | 4.06e-05 | -| std | 0.0322 | -| value_loss | 9.88e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 22 | -| iterations | 10507 | -| time_elapsed | 59622 | -| total_timesteps | 1344896 | -| train/ | | -| approx_kl | 0.0014955322 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0969 | -| learning_rate | 0.0003 | -| loss | -0.00617 | -| n_updates | 105060 | -| policy_gradient_loss | -0.00254 | -| std | 0.0322 | -| value_loss | 2.95e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10508 | -| time_elapsed | 59625 | -| total_timesteps | 1345024 | -| train/ | | -| approx_kl | 0.015950052 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.00422 | -| n_updates | 105070 | -| policy_gradient_loss | -0.000206 | -| std | 0.0323 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10509 | -| time_elapsed | 59632 | -| total_timesteps | 1345152 | -| train/ | | -| approx_kl | 0.075288706 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.01 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 105080 | -| policy_gradient_loss | -0.016 | -| std | 0.0323 | -| value_loss | 0.000291 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10510 | -| time_elapsed | 59635 | -| total_timesteps | 1345280 | -| train/ | | -| approx_kl | 0.0054697716 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.435 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 105090 | -| policy_gradient_loss | -0.00457 | -| std | 0.0323 | -| value_loss | 1.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10511 | -| time_elapsed | 59638 | -| total_timesteps | 1345408 | -| train/ | | -| approx_kl | 0.005735785 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 105100 | -| policy_gradient_loss | -0.0011 | -| std | 0.0322 | -| value_loss | 9.43e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10512 | -| time_elapsed | 59641 | -| total_timesteps | 1345536 | -| train/ | | -| approx_kl | 0.0061179735 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 105110 | -| policy_gradient_loss | -0.000478 | -| std | 0.0322 | -| value_loss | 3.7e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10513 | -| time_elapsed | 59644 | -| total_timesteps | 1345664 | -| train/ | | -| approx_kl | 0.015476674 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.00768 | -| learning_rate | 0.0003 | -| loss | 0.00889 | -| n_updates | 105120 | -| policy_gradient_loss | 0.00166 | -| std | 0.0322 | -| value_loss | 1.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10514 | -| time_elapsed | 59647 | -| total_timesteps | 1345792 | -| train/ | | -| approx_kl | 0.0060111796 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | 0.00304 | -| learning_rate | 0.0003 | -| loss | -2.57e-05 | -| n_updates | 105130 | -| policy_gradient_loss | 0.00684 | -| std | 0.0322 | -| value_loss | 6.37e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 22 | -| iterations | 10515 | -| time_elapsed | 59649 | -| total_timesteps | 1345920 | -| train/ | | -| approx_kl | 0.004882086 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | 0.0034 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 105140 | -| policy_gradient_loss | -0.0134 | -| std | 0.0322 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10516 | -| time_elapsed | 59652 | -| total_timesteps | 1346048 | -| train/ | | -| approx_kl | 0.004018802 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.00859 | -| learning_rate | 0.0003 | -| loss | -0.00655 | -| n_updates | 105150 | -| policy_gradient_loss | -0.00609 | -| std | 0.0322 | -| value_loss | 4.12e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10517 | -| time_elapsed | 59659 | -| total_timesteps | 1346176 | -| train/ | | -| approx_kl | 1.4378689e-05 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | 0.823 | -| learning_rate | 0.0003 | -| loss | 0.000376 | -| n_updates | 105160 | -| policy_gradient_loss | -0.000676 | -| std | 0.0322 | -| value_loss | 0.00219 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10518 | -| time_elapsed | 59663 | -| total_timesteps | 1346304 | -| train/ | | -| approx_kl | 0.0004979926 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 105170 | -| policy_gradient_loss | 0.00174 | -| std | 0.0322 | -| value_loss | 4.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10519 | -| time_elapsed | 59667 | -| total_timesteps | 1346432 | -| train/ | | -| approx_kl | 0.006301803 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.000336 | -| n_updates | 105180 | -| policy_gradient_loss | 0.00104 | -| std | 0.0321 | -| value_loss | 1.96e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10520 | -| time_elapsed | 59670 | -| total_timesteps | 1346560 | -| train/ | | -| approx_kl | 0.0010593785 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.00823 | -| n_updates | 105190 | -| policy_gradient_loss | -0.00575 | -| std | 0.0321 | -| value_loss | 1.87e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10521 | -| time_elapsed | 59674 | -| total_timesteps | 1346688 | -| train/ | | -| approx_kl | 0.00020129094 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.000852 | -| n_updates | 105200 | -| policy_gradient_loss | -2.25e-05 | -| std | 0.0321 | -| value_loss | 9.22e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10522 | -| time_elapsed | 59676 | -| total_timesteps | 1346816 | -| train/ | | -| approx_kl | 0.002723372 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 105210 | -| policy_gradient_loss | -0.00291 | -| std | 0.0321 | -| value_loss | 6.34e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 22 | -| iterations | 10523 | -| time_elapsed | 59679 | -| total_timesteps | 1346944 | -| train/ | | -| approx_kl | 7.489696e-06 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.000198 | -| n_updates | 105220 | -| policy_gradient_loss | 0.00819 | -| std | 0.0321 | -| value_loss | 4.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10524 | -| time_elapsed | 59682 | -| total_timesteps | 1347072 | -| train/ | | -| approx_kl | 0.00053745694 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.000869 | -| n_updates | 105230 | -| policy_gradient_loss | 0.00692 | -| std | 0.0321 | -| value_loss | 3.15e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10525 | -| time_elapsed | 59687 | -| total_timesteps | 1347200 | -| train/ | | -| approx_kl | 0.020513965 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | 0.834 | -| learning_rate | 0.0003 | -| loss | -0.0076 | -| n_updates | 105240 | -| policy_gradient_loss | -0.00757 | -| std | 0.0321 | -| value_loss | 0.00192 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10526 | -| time_elapsed | 59690 | -| total_timesteps | 1347328 | -| train/ | | -| approx_kl | 0.017440543 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.00994 | -| learning_rate | 0.0003 | -| loss | 0.00428 | -| n_updates | 105250 | -| policy_gradient_loss | -0.00125 | -| std | 0.0321 | -| value_loss | 2.75e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10527 | -| time_elapsed | 59693 | -| total_timesteps | 1347456 | -| train/ | | -| approx_kl | 0.014504559 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 105260 | -| policy_gradient_loss | -0.00285 | -| std | 0.0321 | -| value_loss | 1.52e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10528 | -| time_elapsed | 59697 | -| total_timesteps | 1347584 | -| train/ | | -| approx_kl | 0.0014883028 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.364 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 105270 | -| policy_gradient_loss | -0.00281 | -| std | 0.032 | -| value_loss | 3.78e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10529 | -| time_elapsed | 59699 | -| total_timesteps | 1347712 | -| train/ | | -| approx_kl | 0.00027101813 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | 0.00283 | -| learning_rate | 0.0003 | -| loss | 0.000589 | -| n_updates | 105280 | -| policy_gradient_loss | 0.000106 | -| std | 0.032 | -| value_loss | 1.79e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10530 | -| time_elapsed | 59703 | -| total_timesteps | 1347840 | -| train/ | | -| approx_kl | 0.003458817 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.00494 | -| n_updates | 105290 | -| policy_gradient_loss | 0.00112 | -| std | 0.032 | -| value_loss | 4.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10531 | -| time_elapsed | 59706 | -| total_timesteps | 1347968 | -| train/ | | -| approx_kl | 0.010960041 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 105300 | -| policy_gradient_loss | -0.00689 | -| std | 0.032 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10532 | -| time_elapsed | 59709 | -| total_timesteps | 1348096 | -| train/ | | -| approx_kl | 0.0049643936 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 105310 | -| policy_gradient_loss | -0.00406 | -| std | 0.032 | -| value_loss | 1.91e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10533 | -| time_elapsed | 59717 | -| total_timesteps | 1348224 | -| train/ | | -| approx_kl | 0.013229163 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 105320 | -| policy_gradient_loss | -0.0103 | -| std | 0.032 | -| value_loss | 6.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10534 | -| time_elapsed | 59721 | -| total_timesteps | 1348352 | -| train/ | | -| approx_kl | 0.043179847 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 105330 | -| policy_gradient_loss | -0.0102 | -| std | 0.032 | -| value_loss | 2.04e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10535 | -| time_elapsed | 59724 | -| total_timesteps | 1348480 | -| train/ | | -| approx_kl | 0.00016365666 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | 0.000537 | -| n_updates | 105340 | -| policy_gradient_loss | -0.00117 | -| std | 0.032 | -| value_loss | 3.38e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10536 | -| time_elapsed | 59728 | -| total_timesteps | 1348608 | -| train/ | | -| approx_kl | 0.013255432 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.00781 | -| n_updates | 105350 | -| policy_gradient_loss | 0.0062 | -| std | 0.032 | -| value_loss | 1.02e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10537 | -| time_elapsed | 59731 | -| total_timesteps | 1348736 | -| train/ | | -| approx_kl | 1.1922792e-05 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.302 | -| learning_rate | 0.0003 | -| loss | 0.000307 | -| n_updates | 105360 | -| policy_gradient_loss | -0.00322 | -| std | 0.032 | -| value_loss | 5.65e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10538 | -| time_elapsed | 59735 | -| total_timesteps | 1348864 | -| train/ | | -| approx_kl | 0.004280857 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 105370 | -| policy_gradient_loss | -0.00934 | -| std | 0.032 | -| value_loss | 3.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 22 | -| iterations | 10539 | -| time_elapsed | 59737 | -| total_timesteps | 1348992 | -| train/ | | -| approx_kl | 0.016361495 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | -0.00374 | -| n_updates | 105380 | -| policy_gradient_loss | -0.00406 | -| std | 0.032 | -| value_loss | 1.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10540 | -| time_elapsed | 59741 | -| total_timesteps | 1349120 | -| train/ | | -| approx_kl | 0.015438493 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 105390 | -| policy_gradient_loss | 0.01 | -| std | 0.0319 | -| value_loss | 8.78e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10541 | -| time_elapsed | 59750 | -| total_timesteps | 1349248 | -| train/ | | -| approx_kl | 0.04403088 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -2.97 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 105400 | -| policy_gradient_loss | -0.0148 | -| std | 0.0319 | -| value_loss | 0.00208 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10542 | -| time_elapsed | 59754 | -| total_timesteps | 1349376 | -| train/ | | -| approx_kl | 0.00031421985 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | -0.000646 | -| n_updates | 105410 | -| policy_gradient_loss | 0.00627 | -| std | 0.0319 | -| value_loss | 2.83e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10543 | -| time_elapsed | 59757 | -| total_timesteps | 1349504 | -| train/ | | -| approx_kl | 0.0045981794 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 2.02 | -| explained_variance | -0.343 | -| learning_rate | 0.0003 | -| loss | 0.00434 | -| n_updates | 105420 | -| policy_gradient_loss | 0.00239 | -| std | 0.0319 | -| value_loss | 1.19e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10544 | -| time_elapsed | 59759 | -| total_timesteps | 1349632 | -| train/ | | -| approx_kl | 0.008998446 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.00101 | -| learning_rate | 0.0003 | -| loss | -0.00989 | -| n_updates | 105430 | -| policy_gradient_loss | -0.00677 | -| std | 0.0319 | -| value_loss | 4.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10545 | -| time_elapsed | 59761 | -| total_timesteps | 1349760 | -| train/ | | -| approx_kl | 0.009077333 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.00493 | -| learning_rate | 0.0003 | -| loss | -0.000491 | -| n_updates | 105440 | -| policy_gradient_loss | -0.000223 | -| std | 0.0319 | -| value_loss | 1.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10546 | -| time_elapsed | 59764 | -| total_timesteps | 1349888 | -| train/ | | -| approx_kl | 0.025335968 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.001 | -| learning_rate | 0.0003 | -| loss | 0.00651 | -| n_updates | 105450 | -| policy_gradient_loss | 0.000105 | -| std | 0.0319 | -| value_loss | 2.41e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10547 | -| time_elapsed | 59767 | -| total_timesteps | 1350016 | -| train/ | | -| approx_kl | 5.0202012e-05 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.00457 | -| learning_rate | 0.0003 | -| loss | 6.61e-05 | -| n_updates | 105460 | -| policy_gradient_loss | 0.00107 | -| std | 0.0319 | -| value_loss | 1.08e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10548 | -| time_elapsed | 59776 | -| total_timesteps | 1350144 | -| train/ | | -| approx_kl | 0.003938586 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | 0.0584 | -| n_updates | 105470 | -| policy_gradient_loss | 0.0207 | -| std | 0.0319 | -| value_loss | 0.000484 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10549 | -| time_elapsed | 59779 | -| total_timesteps | 1350272 | -| train/ | | -| approx_kl | 0.0253306 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.146 | -| learning_rate | 0.0003 | -| loss | -0.00931 | -| n_updates | 105480 | -| policy_gradient_loss | 0.00328 | -| std | 0.0318 | -| value_loss | 9e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10550 | -| time_elapsed | 59782 | -| total_timesteps | 1350400 | -| train/ | | -| approx_kl | 0.014911624 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | 0.00909 | -| n_updates | 105490 | -| policy_gradient_loss | 0.0125 | -| std | 0.0319 | -| value_loss | 1.5e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10551 | -| time_elapsed | 59785 | -| total_timesteps | 1350528 | -| train/ | | -| approx_kl | 0.0014589382 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.00257 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 105500 | -| policy_gradient_loss | -0.000282 | -| std | 0.0319 | -| value_loss | 6.07e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10552 | -| time_elapsed | 59788 | -| total_timesteps | 1350656 | -| train/ | | -| approx_kl | 0.007900154 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.000447 | -| n_updates | 105510 | -| policy_gradient_loss | 0.00335 | -| std | 0.0319 | -| value_loss | 3.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10553 | -| time_elapsed | 59792 | -| total_timesteps | 1350784 | -| train/ | | -| approx_kl | 0.03205525 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 105520 | -| policy_gradient_loss | -0.00791 | -| std | 0.0319 | -| value_loss | 9.19e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 22 | -| iterations | 10554 | -| time_elapsed | 59795 | -| total_timesteps | 1350912 | -| train/ | | -| approx_kl | 0.012114679 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.00437 | -| learning_rate | 0.0003 | -| loss | 0.00839 | -| n_updates | 105530 | -| policy_gradient_loss | 0.00916 | -| std | 0.0319 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10555 | -| time_elapsed | 59798 | -| total_timesteps | 1351040 | -| train/ | | -| approx_kl | 0.0028677736 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.0827 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 105540 | -| policy_gradient_loss | -0.00268 | -| std | 0.0319 | -| value_loss | 3.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10556 | -| time_elapsed | 59804 | -| total_timesteps | 1351168 | -| train/ | | -| approx_kl | 0.005486481 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.851 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 105550 | -| policy_gradient_loss | -0.0166 | -| std | 0.0319 | -| value_loss | 0.00155 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10557 | -| time_elapsed | 59807 | -| total_timesteps | 1351296 | -| train/ | | -| approx_kl | 0.0006017783 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 105560 | -| policy_gradient_loss | -0.00264 | -| std | 0.0319 | -| value_loss | 1.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10558 | -| time_elapsed | 59811 | -| total_timesteps | 1351424 | -| train/ | | -| approx_kl | 0.0020878413 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.378 | -| learning_rate | 0.0003 | -| loss | 0.000414 | -| n_updates | 105570 | -| policy_gradient_loss | 0.00548 | -| std | 0.0319 | -| value_loss | 4.08e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10559 | -| time_elapsed | 59815 | -| total_timesteps | 1351552 | -| train/ | | -| approx_kl | 0.0008987924 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 105580 | -| policy_gradient_loss | 0.000482 | -| std | 0.0318 | -| value_loss | 9.32e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10560 | -| time_elapsed | 59817 | -| total_timesteps | 1351680 | -| train/ | | -| approx_kl | 0.019975185 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.000753 | -| learning_rate | 0.0003 | -| loss | 0.00468 | -| n_updates | 105590 | -| policy_gradient_loss | 0.000326 | -| std | 0.0318 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10561 | -| time_elapsed | 59819 | -| total_timesteps | 1351808 | -| train/ | | -| approx_kl | 0.008461686 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.00964 | -| n_updates | 105600 | -| policy_gradient_loss | 0.00552 | -| std | 0.0317 | -| value_loss | 6.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10562 | -| time_elapsed | 59822 | -| total_timesteps | 1351936 | -| train/ | | -| approx_kl | 0.012389688 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 105610 | -| policy_gradient_loss | -0.0106 | -| std | 0.0317 | -| value_loss | 1.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10563 | -| time_elapsed | 59826 | -| total_timesteps | 1352064 | -| train/ | | -| approx_kl | 0.005534729 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 105620 | -| policy_gradient_loss | -0.017 | -| std | 0.0317 | -| value_loss | 4.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10564 | -| time_elapsed | 59832 | -| total_timesteps | 1352192 | -| train/ | | -| approx_kl | 0.0048847473 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 105630 | -| policy_gradient_loss | -0.0144 | -| std | 0.0317 | -| value_loss | 0.000263 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10565 | -| time_elapsed | 59836 | -| total_timesteps | 1352320 | -| train/ | | -| approx_kl | 0.00213522 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -0.335 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 105640 | -| policy_gradient_loss | 0.00776 | -| std | 0.0316 | -| value_loss | 4.73e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10566 | -| time_elapsed | 59838 | -| total_timesteps | 1352448 | -| train/ | | -| approx_kl | 0.027422877 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -4.76 | -| learning_rate | 0.0003 | -| loss | -0.00979 | -| n_updates | 105650 | -| policy_gradient_loss | -0.00738 | -| std | 0.0316 | -| value_loss | 2.74e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10567 | -| time_elapsed | 59843 | -| total_timesteps | 1352576 | -| train/ | | -| approx_kl | 0.0013081809 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -77.8 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 105660 | -| policy_gradient_loss | -0.00126 | -| std | 0.0316 | -| value_loss | 8.32e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10568 | -| time_elapsed | 59847 | -| total_timesteps | 1352704 | -| train/ | | -| approx_kl | 4.6703964e-05 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.03 | -| explained_variance | -548 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 105670 | -| policy_gradient_loss | -0.00677 | -| std | 0.0316 | -| value_loss | 1.45e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10569 | -| time_elapsed | 59851 | -| total_timesteps | 1352832 | -| train/ | | -| approx_kl | 0.002011998 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | -0.00567 | -| n_updates | 105680 | -| policy_gradient_loss | -0.0017 | -| std | 0.0316 | -| value_loss | 7.33e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 22 | -| iterations | 10570 | -| time_elapsed | 59853 | -| total_timesteps | 1352960 | -| train/ | | -| approx_kl | 4.079938e-05 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 105690 | -| policy_gradient_loss | -0.00108 | -| std | 0.0316 | -| value_loss | 2.5e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10571 | -| time_elapsed | 59857 | -| total_timesteps | 1353088 | -| train/ | | -| approx_kl | 0.00060165906 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 105700 | -| policy_gradient_loss | -0.000558 | -| std | 0.0316 | -| value_loss | 3.93e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10572 | -| time_elapsed | 59862 | -| total_timesteps | 1353216 | -| train/ | | -| approx_kl | 0.013391033 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.786 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 105710 | -| policy_gradient_loss | -0.0129 | -| std | 0.0316 | -| value_loss | 0.00327 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10573 | -| time_elapsed | 59865 | -| total_timesteps | 1353344 | -| train/ | | -| approx_kl | 0.009614809 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -77.8 | -| learning_rate | 0.0003 | -| loss | -0.00487 | -| n_updates | 105720 | -| policy_gradient_loss | -0.00494 | -| std | 0.0315 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10574 | -| time_elapsed | 59867 | -| total_timesteps | 1353472 | -| train/ | | -| approx_kl | 0.015434835 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -42.2 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 105730 | -| policy_gradient_loss | -0.00982 | -| std | 0.0315 | -| value_loss | 8e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10575 | -| time_elapsed | 59870 | -| total_timesteps | 1353600 | -| train/ | | -| approx_kl | 0.0029178932 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -3.74 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 105740 | -| policy_gradient_loss | 0.00718 | -| std | 0.0316 | -| value_loss | 4.53e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10576 | -| time_elapsed | 59873 | -| total_timesteps | 1353728 | -| train/ | | -| approx_kl | 0.00017650146 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.000379 | -| n_updates | 105750 | -| policy_gradient_loss | -1.75e-05 | -| std | 0.0315 | -| value_loss | 1.49e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10577 | -| time_elapsed | 59875 | -| total_timesteps | 1353856 | -| train/ | | -| approx_kl | 0.02307633 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.783 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 105760 | -| policy_gradient_loss | -0.0176 | -| std | 0.0315 | -| value_loss | 2.49e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10578 | -| time_elapsed | 59877 | -| total_timesteps | 1353984 | -| train/ | | -| approx_kl | 0.0014763745 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.002 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 105770 | -| policy_gradient_loss | -0.00233 | -| std | 0.0315 | -| value_loss | 3.81e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10579 | -| time_elapsed | 59880 | -| total_timesteps | 1354112 | -| train/ | | -| approx_kl | 0.00013041822 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 105780 | -| policy_gradient_loss | -0.00242 | -| std | 0.0315 | -| value_loss | 1.1e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10580 | -| time_elapsed | 59888 | -| total_timesteps | 1354240 | -| train/ | | -| approx_kl | 0.042786412 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 105790 | -| policy_gradient_loss | -0.0147 | -| std | 0.0315 | -| value_loss | 0.00243 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10581 | -| time_elapsed | 59892 | -| total_timesteps | 1354368 | -| train/ | | -| approx_kl | 0.0131235905 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.000813 | -| n_updates | 105800 | -| policy_gradient_loss | 0.000197 | -| std | 0.0315 | -| value_loss | 4.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10582 | -| time_elapsed | 59894 | -| total_timesteps | 1354496 | -| train/ | | -| approx_kl | 0.027234469 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 105810 | -| policy_gradient_loss | -0.00234 | -| std | 0.0315 | -| value_loss | 6.29e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10583 | -| time_elapsed | 59898 | -| total_timesteps | 1354624 | -| train/ | | -| approx_kl | 0.00025494443 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 105820 | -| policy_gradient_loss | -0.000208 | -| std | 0.0315 | -| value_loss | 6.71e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10584 | -| time_elapsed | 59901 | -| total_timesteps | 1354752 | -| train/ | | -| approx_kl | 0.0013152389 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 105830 | -| policy_gradient_loss | -0.000917 | -| std | 0.0314 | -| value_loss | 9.05e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10585 | -| time_elapsed | 59904 | -| total_timesteps | 1354880 | -| train/ | | -| approx_kl | 4.2145606e-05 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 105840 | -| policy_gradient_loss | 0.00229 | -| std | 0.0314 | -| value_loss | 2.12e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10586 | -| time_elapsed | 59907 | -| total_timesteps | 1355008 | -| train/ | | -| approx_kl | 0.00227866 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 105850 | -| policy_gradient_loss | -0.00191 | -| std | 0.0314 | -| value_loss | 1.05e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10587 | -| time_elapsed | 59916 | -| total_timesteps | 1355136 | -| train/ | | -| approx_kl | 0.00037376117 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | 0.00191 | -| n_updates | 105860 | -| policy_gradient_loss | 0.000334 | -| std | 0.0314 | -| value_loss | 0.00307 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10588 | -| time_elapsed | 59918 | -| total_timesteps | 1355264 | -| train/ | | -| approx_kl | 0.021912247 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.254 | -| learning_rate | 0.0003 | -| loss | 0.00037 | -| n_updates | 105870 | -| policy_gradient_loss | 0.000616 | -| std | 0.0314 | -| value_loss | 6.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10589 | -| time_elapsed | 59922 | -| total_timesteps | 1355392 | -| train/ | | -| approx_kl | 0.0042876787 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.969 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 105880 | -| policy_gradient_loss | -0.00466 | -| std | 0.0314 | -| value_loss | 4.06e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10590 | -| time_elapsed | 59926 | -| total_timesteps | 1355520 | -| train/ | | -| approx_kl | 0.0006950209 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.436 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 105890 | -| policy_gradient_loss | 0.00018 | -| std | 0.0314 | -| value_loss | 2.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10591 | -| time_elapsed | 59931 | -| total_timesteps | 1355648 | -| train/ | | -| approx_kl | 0.0024439176 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 105900 | -| policy_gradient_loss | -0.00304 | -| std | 0.0314 | -| value_loss | 4.01e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10592 | -| time_elapsed | 59933 | -| total_timesteps | 1355776 | -| train/ | | -| approx_kl | 0.00027055293 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.000619 | -| n_updates | 105910 | -| policy_gradient_loss | 0.00225 | -| std | 0.0314 | -| value_loss | 3.1e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 22 | -| iterations | 10593 | -| time_elapsed | 59936 | -| total_timesteps | 1355904 | -| train/ | | -| approx_kl | 0.0017015818 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 105920 | -| policy_gradient_loss | -0.00469 | -| std | 0.0313 | -| value_loss | 5.94e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10594 | -| time_elapsed | 59939 | -| total_timesteps | 1356032 | -| train/ | | -| approx_kl | 7.758755e-05 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.00554 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 105930 | -| policy_gradient_loss | -0.00493 | -| std | 0.0313 | -| value_loss | 1.22e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10595 | -| time_elapsed | 59948 | -| total_timesteps | 1356160 | -| train/ | | -| approx_kl | 0.01915685 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.741 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 105940 | -| policy_gradient_loss | -0.0135 | -| std | 0.0314 | -| value_loss | 0.000748 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10596 | -| time_elapsed | 59952 | -| total_timesteps | 1356288 | -| train/ | | -| approx_kl | 0.006864763 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -5.8 | -| learning_rate | 0.0003 | -| loss | 0.0073 | -| n_updates | 105950 | -| policy_gradient_loss | 0.00124 | -| std | 0.0314 | -| value_loss | 2.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10597 | -| time_elapsed | 59956 | -| total_timesteps | 1356416 | -| train/ | | -| approx_kl | 0.009310496 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 105960 | -| policy_gradient_loss | -0.000691 | -| std | 0.0313 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10598 | -| time_elapsed | 59960 | -| total_timesteps | 1356544 | -| train/ | | -| approx_kl | 0.027271515 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -2.32 | -| learning_rate | 0.0003 | -| loss | 0.00577 | -| n_updates | 105970 | -| policy_gradient_loss | -0.000616 | -| std | 0.0312 | -| value_loss | 1.27e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10599 | -| time_elapsed | 59963 | -| total_timesteps | 1356672 | -| train/ | | -| approx_kl | 0.00037060212 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 105980 | -| policy_gradient_loss | 0.00406 | -| std | 0.0312 | -| value_loss | 4.63e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10600 | -| time_elapsed | 59966 | -| total_timesteps | 1356800 | -| train/ | | -| approx_kl | 0.00772905 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 105990 | -| policy_gradient_loss | -0.00942 | -| std | 0.0312 | -| value_loss | 8.89e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 22 | -| iterations | 10601 | -| time_elapsed | 59968 | -| total_timesteps | 1356928 | -| train/ | | -| approx_kl | 0.012374755 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.000534 | -| learning_rate | 0.0003 | -| loss | 0.000654 | -| n_updates | 106000 | -| policy_gradient_loss | 0.00133 | -| std | 0.0312 | -| value_loss | 1.27e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10602 | -| time_elapsed | 59971 | -| total_timesteps | 1357056 | -| train/ | | -| approx_kl | 0.0024231747 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 106010 | -| policy_gradient_loss | -0.00489 | -| std | 0.0312 | -| value_loss | 5.05e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10603 | -| time_elapsed | 59977 | -| total_timesteps | 1357184 | -| train/ | | -| approx_kl | 0.0028887377 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -13.4 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 106020 | -| policy_gradient_loss | -0.0158 | -| std | 0.0312 | -| value_loss | 0.00368 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10604 | -| time_elapsed | 59980 | -| total_timesteps | 1357312 | -| train/ | | -| approx_kl | 0.0001847432 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -85.9 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 106030 | -| policy_gradient_loss | -0.00953 | -| std | 0.0312 | -| value_loss | 5e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10605 | -| time_elapsed | 59983 | -| total_timesteps | 1357440 | -| train/ | | -| approx_kl | 0.023306586 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -225 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 106040 | -| policy_gradient_loss | -0.0091 | -| std | 0.0312 | -| value_loss | 1.83e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10606 | -| time_elapsed | 59986 | -| total_timesteps | 1357568 | -| train/ | | -| approx_kl | 0.0017562234 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 106050 | -| policy_gradient_loss | -0.00109 | -| std | 0.0312 | -| value_loss | 4.84e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10607 | -| time_elapsed | 59990 | -| total_timesteps | 1357696 | -| train/ | | -| approx_kl | 9.2538074e-05 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | 0.000432 | -| n_updates | 106060 | -| policy_gradient_loss | 0.000415 | -| std | 0.0312 | -| value_loss | 1.16e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10608 | -| time_elapsed | 59994 | -| total_timesteps | 1357824 | -| train/ | | -| approx_kl | 7.172581e-05 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.000434 | -| n_updates | 106070 | -| policy_gradient_loss | 0.00115 | -| std | 0.0312 | -| value_loss | 7.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 22 | -| iterations | 10609 | -| time_elapsed | 59998 | -| total_timesteps | 1357952 | -| train/ | | -| approx_kl | 0.008256816 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 106080 | -| policy_gradient_loss | 0.0011 | -| std | 0.0312 | -| value_loss | 1.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10610 | -| time_elapsed | 60001 | -| total_timesteps | 1358080 | -| train/ | | -| approx_kl | 0.013248234 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.00286 | -| n_updates | 106090 | -| policy_gradient_loss | 0.000445 | -| std | 0.0312 | -| value_loss | 1.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10611 | -| time_elapsed | 60008 | -| total_timesteps | 1358208 | -| train/ | | -| approx_kl | 0.029684618 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 106100 | -| policy_gradient_loss | -0.0169 | -| std | 0.0312 | -| value_loss | 0.000266 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10612 | -| time_elapsed | 60012 | -| total_timesteps | 1358336 | -| train/ | | -| approx_kl | 0.0024530543 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -3.24 | -| learning_rate | 0.0003 | -| loss | 0.00845 | -| n_updates | 106110 | -| policy_gradient_loss | -0.00497 | -| std | 0.0311 | -| value_loss | 6.82e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10613 | -| time_elapsed | 60015 | -| total_timesteps | 1358464 | -| train/ | | -| approx_kl | 0.019507414 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | 0.00474 | -| n_updates | 106120 | -| policy_gradient_loss | 0.00104 | -| std | 0.0311 | -| value_loss | 6.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10614 | -| time_elapsed | 60018 | -| total_timesteps | 1358592 | -| train/ | | -| approx_kl | 0.03161578 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.0139 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 106130 | -| policy_gradient_loss | 0.000979 | -| std | 0.0311 | -| value_loss | 1.16e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10615 | -| time_elapsed | 60022 | -| total_timesteps | 1358720 | -| train/ | | -| approx_kl | 0.0020940867 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000576 | -| n_updates | 106140 | -| policy_gradient_loss | 0.00276 | -| std | 0.0311 | -| value_loss | 5.78e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10616 | -| time_elapsed | 60025 | -| total_timesteps | 1358848 | -| train/ | | -| approx_kl | 0.0111571625 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.000144 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 106150 | -| policy_gradient_loss | -0.00355 | -| std | 0.0311 | -| value_loss | 1.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 22 | -| iterations | 10617 | -| time_elapsed | 60028 | -| total_timesteps | 1358976 | -| train/ | | -| approx_kl | 0.007226784 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.00646 | -| n_updates | 106160 | -| policy_gradient_loss | 0.00382 | -| std | 0.0311 | -| value_loss | 2.06e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10618 | -| time_elapsed | 60032 | -| total_timesteps | 1359104 | -| train/ | | -| approx_kl | 0.0003754287 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.749 | -| learning_rate | 0.0003 | -| loss | -0.000826 | -| n_updates | 106170 | -| policy_gradient_loss | 0.00091 | -| std | 0.0313 | -| value_loss | 7.41e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10619 | -| time_elapsed | 60040 | -| total_timesteps | 1359232 | -| train/ | | -| approx_kl | 0.019138642 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 106180 | -| policy_gradient_loss | -0.0144 | -| std | 0.0313 | -| value_loss | 0.000819 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10620 | -| time_elapsed | 60043 | -| total_timesteps | 1359360 | -| train/ | | -| approx_kl | 0.016520746 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.0709 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 106190 | -| policy_gradient_loss | 0.00555 | -| std | 0.0313 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10621 | -| time_elapsed | 60046 | -| total_timesteps | 1359488 | -| train/ | | -| approx_kl | 0.0027472982 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 2.04 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.000416 | -| n_updates | 106200 | -| policy_gradient_loss | 5.82e-05 | -| std | 0.0312 | -| value_loss | 1.14e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10622 | -| time_elapsed | 60050 | -| total_timesteps | 1359616 | -| train/ | | -| approx_kl | 0.003163834 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 106210 | -| policy_gradient_loss | 0.0028 | -| std | 0.0311 | -| value_loss | 2.46e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10623 | -| time_elapsed | 60053 | -| total_timesteps | 1359744 | -| train/ | | -| approx_kl | 0.0031128237 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.00031 | -| n_updates | 106220 | -| policy_gradient_loss | 0.000959 | -| std | 0.0311 | -| value_loss | 4.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10624 | -| time_elapsed | 60056 | -| total_timesteps | 1359872 | -| train/ | | -| approx_kl | 0.012120642 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.00457 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 106230 | -| policy_gradient_loss | -0.0055 | -| std | 0.0311 | -| value_loss | 5.44e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10625 | -| time_elapsed | 60059 | -| total_timesteps | 1360000 | -| train/ | | -| approx_kl | 0.0013445485 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.00617 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 106240 | -| policy_gradient_loss | -0.00482 | -| std | 0.0311 | -| value_loss | 4.82e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10626 | -| time_elapsed | 60063 | -| total_timesteps | 1360128 | -| train/ | | -| approx_kl | 0.0012498037 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.00363 | -| learning_rate | 0.0003 | -| loss | 0.00487 | -| n_updates | 106250 | -| policy_gradient_loss | -0.00145 | -| std | 0.0311 | -| value_loss | 1.95e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10627 | -| time_elapsed | 60071 | -| total_timesteps | 1360256 | -| train/ | | -| approx_kl | 0.064613245 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 106260 | -| policy_gradient_loss | -0.0111 | -| std | 0.0311 | -| value_loss | 0.000323 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10628 | -| time_elapsed | 60074 | -| total_timesteps | 1360384 | -| train/ | | -| approx_kl | 0.004912903 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 106270 | -| policy_gradient_loss | 0.000689 | -| std | 0.0311 | -| value_loss | 5.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10629 | -| time_elapsed | 60078 | -| total_timesteps | 1360512 | -| train/ | | -| approx_kl | 0.013992868 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.00362 | -| learning_rate | 0.0003 | -| loss | 0.00457 | -| n_updates | 106280 | -| policy_gradient_loss | 0.00123 | -| std | 0.0311 | -| value_loss | 5.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10630 | -| time_elapsed | 60080 | -| total_timesteps | 1360640 | -| train/ | | -| approx_kl | 0.02654566 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.00135 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 106290 | -| policy_gradient_loss | 0.00123 | -| std | 0.0311 | -| value_loss | 4.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10631 | -| time_elapsed | 60083 | -| total_timesteps | 1360768 | -| train/ | | -| approx_kl | 0.0025435588 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.000275 | -| learning_rate | 0.0003 | -| loss | 0.00177 | -| n_updates | 106300 | -| policy_gradient_loss | 0.00293 | -| std | 0.0311 | -| value_loss | 5.54e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 22 | -| iterations | 10632 | -| time_elapsed | 60087 | -| total_timesteps | 1360896 | -| train/ | | -| approx_kl | 0.0037387079 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.00644 | -| n_updates | 106310 | -| policy_gradient_loss | 0.00337 | -| std | 0.0311 | -| value_loss | 2.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10633 | -| time_elapsed | 60090 | -| total_timesteps | 1361024 | -| train/ | | -| approx_kl | 0.008302184 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 106320 | -| policy_gradient_loss | -0.00345 | -| std | 0.0311 | -| value_loss | 1.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10634 | -| time_elapsed | 60099 | -| total_timesteps | 1361152 | -| train/ | | -| approx_kl | 0.012307171 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.768 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 106330 | -| policy_gradient_loss | -0.0123 | -| std | 0.0311 | -| value_loss | 0.00319 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10635 | -| time_elapsed | 60103 | -| total_timesteps | 1361280 | -| train/ | | -| approx_kl | 0.02604401 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 106340 | -| policy_gradient_loss | -0.00512 | -| std | 0.031 | -| value_loss | 2.53e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10636 | -| time_elapsed | 60106 | -| total_timesteps | 1361408 | -| train/ | | -| approx_kl | 0.0134020485 | -| clip_fraction | 0.551 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -35.6 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 106350 | -| policy_gradient_loss | -0.00837 | -| std | 0.031 | -| value_loss | 3.76e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10637 | -| time_elapsed | 60108 | -| total_timesteps | 1361536 | -| train/ | | -| approx_kl | 0.0029643797 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -25.3 | -| learning_rate | 0.0003 | -| loss | -0.00762 | -| n_updates | 106360 | -| policy_gradient_loss | -0.0062 | -| std | 0.031 | -| value_loss | 7.02e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10638 | -| time_elapsed | 60111 | -| total_timesteps | 1361664 | -| train/ | | -| approx_kl | 0.0023781406 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -10.7 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 106370 | -| policy_gradient_loss | 0.00133 | -| std | 0.031 | -| value_loss | 1.13e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10639 | -| time_elapsed | 60114 | -| total_timesteps | 1361792 | -| train/ | | -| approx_kl | 0.0040326207 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | -0.000388 | -| n_updates | 106380 | -| policy_gradient_loss | 0.000301 | -| std | 0.0311 | -| value_loss | 5.75e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 22 | -| iterations | 10640 | -| time_elapsed | 60116 | -| total_timesteps | 1361920 | -| train/ | | -| approx_kl | 0.027076328 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.00249 | -| n_updates | 106390 | -| policy_gradient_loss | 0.00049 | -| std | 0.0312 | -| value_loss | 7.83e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10641 | -| time_elapsed | 60119 | -| total_timesteps | 1362048 | -| train/ | | -| approx_kl | 0.0037777363 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | 0.00233 | -| n_updates | 106400 | -| policy_gradient_loss | 0.00735 | -| std | 0.0312 | -| value_loss | 2.18e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10642 | -| time_elapsed | 60123 | -| total_timesteps | 1362176 | -| train/ | | -| approx_kl | 0.032098304 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | 0.818 | -| learning_rate | 0.0003 | -| loss | -0.0253 | -| n_updates | 106410 | -| policy_gradient_loss | -0.0215 | -| std | 0.0312 | -| value_loss | 0.000781 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10643 | -| time_elapsed | 60126 | -| total_timesteps | 1362304 | -| train/ | | -| approx_kl | 0.0046496717 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 106420 | -| policy_gradient_loss | 0.00231 | -| std | 0.0312 | -| value_loss | 7.62e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10644 | -| time_elapsed | 60129 | -| total_timesteps | 1362432 | -| train/ | | -| approx_kl | 0.00057615805 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 106430 | -| policy_gradient_loss | -0.00317 | -| std | 0.0311 | -| value_loss | 1.13e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10645 | -| time_elapsed | 60133 | -| total_timesteps | 1362560 | -| train/ | | -| approx_kl | 0.001319644 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 106440 | -| policy_gradient_loss | 0.000543 | -| std | 0.0311 | -| value_loss | 4.98e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10646 | -| time_elapsed | 60136 | -| total_timesteps | 1362688 | -| train/ | | -| approx_kl | 1.5676953e-05 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | 0.000371 | -| n_updates | 106450 | -| policy_gradient_loss | 0.00213 | -| std | 0.0311 | -| value_loss | 2.13e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10647 | -| time_elapsed | 60139 | -| total_timesteps | 1362816 | -| train/ | | -| approx_kl | 0.00026060548 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | -0.000327 | -| n_updates | 106460 | -| policy_gradient_loss | 0.0061 | -| std | 0.0311 | -| value_loss | 1.95e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 22 | -| iterations | 10648 | -| time_elapsed | 60141 | -| total_timesteps | 1362944 | -| train/ | | -| approx_kl | 0.009609923 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.05 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 106470 | -| policy_gradient_loss | -3.73e-05 | -| std | 0.0309 | -| value_loss | 8.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10649 | -| time_elapsed | 60144 | -| total_timesteps | 1363072 | -| train/ | | -| approx_kl | 0.017248977 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.06 | -| explained_variance | 0.00716 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 106480 | -| policy_gradient_loss | -0.0143 | -| std | 0.0307 | -| value_loss | 1.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10650 | -| time_elapsed | 60148 | -| total_timesteps | 1363200 | -| train/ | | -| approx_kl | 0.014229579 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.06 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 106490 | -| policy_gradient_loss | -0.0148 | -| std | 0.0307 | -| value_loss | 0.000568 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10651 | -| time_elapsed | 60152 | -| total_timesteps | 1363328 | -| train/ | | -| approx_kl | 5.9226528e-05 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.06 | -| explained_variance | -0.957 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 106500 | -| policy_gradient_loss | -0.00948 | -| std | 0.0307 | -| value_loss | 4.08e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10652 | -| time_elapsed | 60155 | -| total_timesteps | 1363456 | -| train/ | | -| approx_kl | 0.00046000117 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 106510 | -| policy_gradient_loss | -0.00901 | -| std | 0.0307 | -| value_loss | 7.9e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10653 | -| time_elapsed | 60158 | -| total_timesteps | 1363584 | -| train/ | | -| approx_kl | 0.00018346217 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 106520 | -| policy_gradient_loss | 0.00246 | -| std | 0.0307 | -| value_loss | 4.97e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10654 | -| time_elapsed | 60161 | -| total_timesteps | 1363712 | -| train/ | | -| approx_kl | 0.02438369 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.00414 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 106530 | -| policy_gradient_loss | -0.0133 | -| std | 0.0307 | -| value_loss | 1.9e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10655 | -| time_elapsed | 60164 | -| total_timesteps | 1363840 | -| train/ | | -| approx_kl | 0.0062023564 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00728 | -| n_updates | 106540 | -| policy_gradient_loss | 0.00853 | -| std | 0.0307 | -| value_loss | 6.73e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 22 | -| iterations | 10656 | -| time_elapsed | 60166 | -| total_timesteps | 1363968 | -| train/ | | -| approx_kl | 0.01946344 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | 0.00518 | -| n_updates | 106550 | -| policy_gradient_loss | 0.000631 | -| std | 0.0307 | -| value_loss | 1.87e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10657 | -| time_elapsed | 60169 | -| total_timesteps | 1364096 | -| train/ | | -| approx_kl | 0.008092303 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.0071 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 106560 | -| policy_gradient_loss | 0.00269 | -| std | 0.0306 | -| value_loss | 6.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10658 | -| time_elapsed | 60177 | -| total_timesteps | 1364224 | -| train/ | | -| approx_kl | 0.003038195 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.692 | -| learning_rate | 0.0003 | -| loss | -0.0091 | -| n_updates | 106570 | -| policy_gradient_loss | -0.00943 | -| std | 0.0306 | -| value_loss | 0.00629 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10659 | -| time_elapsed | 60181 | -| total_timesteps | 1364352 | -| train/ | | -| approx_kl | 0.0011500539 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0099 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 106580 | -| policy_gradient_loss | -0.00986 | -| std | 0.0306 | -| value_loss | 0.00072 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10660 | -| time_elapsed | 60185 | -| total_timesteps | 1364480 | -| train/ | | -| approx_kl | 9.97656e-05 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -5.71 | -| learning_rate | 0.0003 | -| loss | 0.00027 | -| n_updates | 106590 | -| policy_gradient_loss | 0.0032 | -| std | 0.0306 | -| value_loss | 5.12e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10661 | -| time_elapsed | 60188 | -| total_timesteps | 1364608 | -| train/ | | -| approx_kl | 8.268654e-05 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 106600 | -| policy_gradient_loss | -0.00703 | -| std | 0.0306 | -| value_loss | 7.58e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10662 | -| time_elapsed | 60190 | -| total_timesteps | 1364736 | -| train/ | | -| approx_kl | 0.007488687 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0082 | -| learning_rate | 0.0003 | -| loss | -0.00882 | -| n_updates | 106610 | -| policy_gradient_loss | -0.00449 | -| std | 0.0306 | -| value_loss | 1.54e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10663 | -| time_elapsed | 60194 | -| total_timesteps | 1364864 | -| train/ | | -| approx_kl | 0.004855106 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 106620 | -| policy_gradient_loss | -0.00112 | -| std | 0.0306 | -| value_loss | 1.85e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 22 | -| iterations | 10664 | -| time_elapsed | 60197 | -| total_timesteps | 1364992 | -| train/ | | -| approx_kl | 2.7961098e-05 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.000137 | -| n_updates | 106630 | -| policy_gradient_loss | -0.000106 | -| std | 0.0306 | -| value_loss | 7.66e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10665 | -| time_elapsed | 60200 | -| total_timesteps | 1365120 | -| train/ | | -| approx_kl | 0.018041171 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.00235 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 106640 | -| policy_gradient_loss | -0.0169 | -| std | 0.0306 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10666 | -| time_elapsed | 60210 | -| total_timesteps | 1365248 | -| train/ | | -| approx_kl | 0.0014641136 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.812 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 106650 | -| policy_gradient_loss | -0.0151 | -| std | 0.0306 | -| value_loss | 0.0036 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10667 | -| time_elapsed | 60214 | -| total_timesteps | 1365376 | -| train/ | | -| approx_kl | 0.0010351106 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 106660 | -| policy_gradient_loss | 0.00115 | -| std | 0.0306 | -| value_loss | 4.77e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10668 | -| time_elapsed | 60219 | -| total_timesteps | 1365504 | -| train/ | | -| approx_kl | 0.0032008342 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | 0.000815 | -| n_updates | 106670 | -| policy_gradient_loss | 0.00335 | -| std | 0.0306 | -| value_loss | 1.53e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10669 | -| time_elapsed | 60222 | -| total_timesteps | 1365632 | -| train/ | | -| approx_kl | 0.0224844 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -2.78 | -| learning_rate | 0.0003 | -| loss | 0.00575 | -| n_updates | 106680 | -| policy_gradient_loss | 0.00363 | -| std | 0.0305 | -| value_loss | 3.15e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10670 | -| time_elapsed | 60226 | -| total_timesteps | 1365760 | -| train/ | | -| approx_kl | 0.001550843 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.488 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 106690 | -| policy_gradient_loss | 0.00194 | -| std | 0.0305 | -| value_loss | 4.2e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 22 | -| iterations | 10671 | -| time_elapsed | 60230 | -| total_timesteps | 1365888 | -| train/ | | -| approx_kl | 0.0038312203 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 106700 | -| policy_gradient_loss | -0.0129 | -| std | 0.0305 | -| value_loss | 2.81e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10672 | -| time_elapsed | 60233 | -| total_timesteps | 1366016 | -| train/ | | -| approx_kl | 0.00045699207 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 106710 | -| policy_gradient_loss | -0.00453 | -| std | 0.0305 | -| value_loss | 3.8e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10673 | -| time_elapsed | 60242 | -| total_timesteps | 1366144 | -| train/ | | -| approx_kl | 0.054651476 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 106720 | -| policy_gradient_loss | -0.0168 | -| std | 0.0305 | -| value_loss | 0.000799 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10674 | -| time_elapsed | 60245 | -| total_timesteps | 1366272 | -| train/ | | -| approx_kl | 0.018597659 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.186 | -| learning_rate | 0.0003 | -| loss | -5.99e-05 | -| n_updates | 106730 | -| policy_gradient_loss | -0.00255 | -| std | 0.0305 | -| value_loss | 1.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10675 | -| time_elapsed | 60248 | -| total_timesteps | 1366400 | -| train/ | | -| approx_kl | 0.019460462 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -105 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 106740 | -| policy_gradient_loss | -0.000618 | -| std | 0.0305 | -| value_loss | 4.58e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10676 | -| time_elapsed | 60251 | -| total_timesteps | 1366528 | -| train/ | | -| approx_kl | 0.0023346818 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -16.7 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 106750 | -| policy_gradient_loss | -0.00046 | -| std | 0.0305 | -| value_loss | 6.28e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10677 | -| time_elapsed | 60256 | -| total_timesteps | 1366656 | -| train/ | | -| approx_kl | 1.0980293e-06 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -3.34 | -| learning_rate | 0.0003 | -| loss | -9.21e-05 | -| n_updates | 106760 | -| policy_gradient_loss | -0.00153 | -| std | 0.0305 | -| value_loss | 2.03e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10678 | -| time_elapsed | 60259 | -| total_timesteps | 1366784 | -| train/ | | -| approx_kl | 0.0024779956 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0956 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 106770 | -| policy_gradient_loss | 0.00695 | -| std | 0.0305 | -| value_loss | 8.62e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10679 | -| time_elapsed | 60261 | -| total_timesteps | 1366912 | -| train/ | | -| approx_kl | 0.0011083246 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 106780 | -| policy_gradient_loss | 0.00769 | -| std | 0.0305 | -| value_loss | 9.45e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10680 | -| time_elapsed | 60265 | -| total_timesteps | 1367040 | -| train/ | | -| approx_kl | 0.0032584798 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -7.56e-05 | -| n_updates | 106790 | -| policy_gradient_loss | 9.04e-05 | -| std | 0.0304 | -| value_loss | 3.27e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10681 | -| time_elapsed | 60271 | -| total_timesteps | 1367168 | -| train/ | | -| approx_kl | 0.12037909 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 2.07 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 106800 | -| policy_gradient_loss | -0.0115 | -| std | 0.0304 | -| value_loss | 0.000199 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10682 | -| time_elapsed | 60275 | -| total_timesteps | 1367296 | -| train/ | | -| approx_kl | 0.014932621 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.00673 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 106810 | -| policy_gradient_loss | 0.000118 | -| std | 0.0303 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10683 | -| time_elapsed | 60278 | -| total_timesteps | 1367424 | -| train/ | | -| approx_kl | 0.008736539 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 106820 | -| policy_gradient_loss | -0.00071 | -| std | 0.0303 | -| value_loss | 9.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10684 | -| time_elapsed | 60281 | -| total_timesteps | 1367552 | -| train/ | | -| approx_kl | 0.013672188 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 106830 | -| policy_gradient_loss | -0.0054 | -| std | 0.0302 | -| value_loss | 1.23e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10685 | -| time_elapsed | 60284 | -| total_timesteps | 1367680 | -| train/ | | -| approx_kl | 0.00035474822 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 106840 | -| policy_gradient_loss | 0.00632 | -| std | 0.0302 | -| value_loss | 1.29e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10686 | -| time_elapsed | 60288 | -| total_timesteps | 1367808 | -| train/ | | -| approx_kl | 0.011465933 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0978 | -| learning_rate | 0.0003 | -| loss | 0.0049 | -| n_updates | 106850 | -| policy_gradient_loss | 0.00204 | -| std | 0.0302 | -| value_loss | 1.19e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 22 | -| iterations | 10687 | -| time_elapsed | 60292 | -| total_timesteps | 1367936 | -| train/ | | -| approx_kl | 0.0015832023 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.000885 | -| n_updates | 106860 | -| policy_gradient_loss | 0.00292 | -| std | 0.0302 | -| value_loss | 1.72e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10688 | -| time_elapsed | 60296 | -| total_timesteps | 1368064 | -| train/ | | -| approx_kl | 0.007816667 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | -0.00546 | -| n_updates | 106870 | -| policy_gradient_loss | -0.00255 | -| std | 0.0303 | -| value_loss | 5.45e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10689 | -| time_elapsed | 60301 | -| total_timesteps | 1368192 | -| train/ | | -| approx_kl | 0.011513822 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.0072 | -| n_updates | 106880 | -| policy_gradient_loss | -0.00877 | -| std | 0.0303 | -| value_loss | 0.00247 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10690 | -| time_elapsed | 60305 | -| total_timesteps | 1368320 | -| train/ | | -| approx_kl | 0.00062021334 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.543 | -| learning_rate | 0.0003 | -| loss | 0.00338 | -| n_updates | 106890 | -| policy_gradient_loss | 0.00404 | -| std | 0.0303 | -| value_loss | 1.05e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10691 | -| time_elapsed | 60309 | -| total_timesteps | 1368448 | -| train/ | | -| approx_kl | 0.00017838739 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.727 | -| learning_rate | 0.0003 | -| loss | -0.00361 | -| n_updates | 106900 | -| policy_gradient_loss | -0.0103 | -| std | 0.0303 | -| value_loss | 3.73e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10692 | -| time_elapsed | 60312 | -| total_timesteps | 1368576 | -| train/ | | -| approx_kl | 0.007965708 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 106910 | -| policy_gradient_loss | 0.000213 | -| std | 0.0303 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10693 | -| time_elapsed | 60315 | -| total_timesteps | 1368704 | -| train/ | | -| approx_kl | 7.782597e-05 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0949 | -| learning_rate | 0.0003 | -| loss | -0.000595 | -| n_updates | 106920 | -| policy_gradient_loss | 0.00382 | -| std | 0.0302 | -| value_loss | 1.59e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10694 | -| time_elapsed | 60318 | -| total_timesteps | 1368832 | -| train/ | | -| approx_kl | 0.0051960973 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 106930 | -| policy_gradient_loss | 9.39e-05 | -| std | 0.0302 | -| value_loss | 2.25e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 22 | -| iterations | 10695 | -| time_elapsed | 60321 | -| total_timesteps | 1368960 | -| train/ | | -| approx_kl | 0.016252926 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | 0.00723 | -| learning_rate | 0.0003 | -| loss | 0.00823 | -| n_updates | 106940 | -| policy_gradient_loss | 0.0045 | -| std | 0.0302 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10696 | -| time_elapsed | 60324 | -| total_timesteps | 1369088 | -| train/ | | -| approx_kl | 0.0028987397 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | -0.000517 | -| n_updates | 106950 | -| policy_gradient_loss | 0.000411 | -| std | 0.0301 | -| value_loss | 1.7e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10697 | -| time_elapsed | 60332 | -| total_timesteps | 1369216 | -| train/ | | -| approx_kl | 0.016091743 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | 0.717 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 106960 | -| policy_gradient_loss | -0.0147 | -| std | 0.0301 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10698 | -| time_elapsed | 60335 | -| total_timesteps | 1369344 | -| train/ | | -| approx_kl | 0.0006587398 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.406 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 106970 | -| policy_gradient_loss | 0.00272 | -| std | 0.0301 | -| value_loss | 5.28e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10699 | -| time_elapsed | 60339 | -| total_timesteps | 1369472 | -| train/ | | -| approx_kl | 0.0064488184 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 106980 | -| policy_gradient_loss | 0.00182 | -| std | 0.0301 | -| value_loss | 7.65e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10700 | -| time_elapsed | 60341 | -| total_timesteps | 1369600 | -| train/ | | -| approx_kl | 0.0035024341 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 106990 | -| policy_gradient_loss | 0.012 | -| std | 0.0301 | -| value_loss | 9.39e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10701 | -| time_elapsed | 60345 | -| total_timesteps | 1369728 | -| train/ | | -| approx_kl | 0.00080759404 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | 0.00203 | -| learning_rate | 0.0003 | -| loss | -0.0059 | -| n_updates | 107000 | -| policy_gradient_loss | -0.00543 | -| std | 0.0301 | -| value_loss | 3.47e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10702 | -| time_elapsed | 60348 | -| total_timesteps | 1369856 | -| train/ | | -| approx_kl | 0.0047099716 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.08 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 107010 | -| policy_gradient_loss | 0.00013 | -| std | 0.0301 | -| value_loss | 1.98e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 22 | -| iterations | 10703 | -| time_elapsed | 60351 | -| total_timesteps | 1369984 | -| train/ | | -| approx_kl | 0.0019068648 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.00196 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 107020 | -| policy_gradient_loss | 0.00573 | -| std | 0.03 | -| value_loss | 2.66e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10704 | -| time_elapsed | 60354 | -| total_timesteps | 1370112 | -| train/ | | -| approx_kl | 0.0030404772 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | -0.00555 | -| n_updates | 107030 | -| policy_gradient_loss | -0.0036 | -| std | 0.03 | -| value_loss | 5.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10705 | -| time_elapsed | 60363 | -| total_timesteps | 1370240 | -| train/ | | -| approx_kl | 0.005641807 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 107040 | -| policy_gradient_loss | -0.00805 | -| std | 0.03 | -| value_loss | 0.00268 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10706 | -| time_elapsed | 60367 | -| total_timesteps | 1370368 | -| train/ | | -| approx_kl | 0.0025691926 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 107050 | -| policy_gradient_loss | -0.000109 | -| std | 0.03 | -| value_loss | 0.000235 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10707 | -| time_elapsed | 60370 | -| total_timesteps | 1370496 | -| train/ | | -| approx_kl | 0.0017281328 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.865 | -| learning_rate | 0.0003 | -| loss | 0.00405 | -| n_updates | 107060 | -| policy_gradient_loss | 0.000469 | -| std | 0.0299 | -| value_loss | 0.00249 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10708 | -| time_elapsed | 60373 | -| total_timesteps | 1370624 | -| train/ | | -| approx_kl | 0.00078811636 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 107070 | -| policy_gradient_loss | -0.000753 | -| std | 0.0299 | -| value_loss | 1.98e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10709 | -| time_elapsed | 60376 | -| total_timesteps | 1370752 | -| train/ | | -| approx_kl | 0.010455776 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 107080 | -| policy_gradient_loss | -0.00128 | -| std | 0.0299 | -| value_loss | 9.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 22 | -| iterations | 10710 | -| time_elapsed | 60378 | -| total_timesteps | 1370880 | -| train/ | | -| approx_kl | 0.004496355 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 107090 | -| policy_gradient_loss | -0.00228 | -| std | 0.0299 | -| value_loss | 1.03e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10711 | -| time_elapsed | 60382 | -| total_timesteps | 1371008 | -| train/ | | -| approx_kl | 0.00019704085 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | -0.000636 | -| n_updates | 107100 | -| policy_gradient_loss | -0.000477 | -| std | 0.0298 | -| value_loss | 0.000116 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10712 | -| time_elapsed | 60392 | -| total_timesteps | 1371136 | -| train/ | | -| approx_kl | 0.0053846375 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.0288 | -| n_updates | 107110 | -| policy_gradient_loss | -0.0184 | -| std | 0.0298 | -| value_loss | 0.0027 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10713 | -| time_elapsed | 60396 | -| total_timesteps | 1371264 | -| train/ | | -| approx_kl | 0.0003267927 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | 0.0656 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 107120 | -| policy_gradient_loss | -0.000639 | -| std | 0.0298 | -| value_loss | 0.00129 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10714 | -| time_elapsed | 60400 | -| total_timesteps | 1371392 | -| train/ | | -| approx_kl | 8.611241e-05 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.721 | -| learning_rate | 0.0003 | -| loss | 0.000897 | -| n_updates | 107130 | -| policy_gradient_loss | 0.00476 | -| std | 0.0298 | -| value_loss | 3.57e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10715 | -| time_elapsed | 60404 | -| total_timesteps | 1371520 | -| train/ | | -| approx_kl | 0.00026541622 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00289 | -| n_updates | 107140 | -| policy_gradient_loss | -0.00582 | -| std | 0.0298 | -| value_loss | 5.2e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10716 | -| time_elapsed | 60407 | -| total_timesteps | 1371648 | -| train/ | | -| approx_kl | 0.005568067 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | -0.00975 | -| n_updates | 107150 | -| policy_gradient_loss | -0.0031 | -| std | 0.0298 | -| value_loss | 1.93e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10717 | -| time_elapsed | 60411 | -| total_timesteps | 1371776 | -| train/ | | -| approx_kl | 0.0022495412 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.00263 | -| n_updates | 107160 | -| policy_gradient_loss | 0.0014 | -| std | 0.0298 | -| value_loss | 7.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10718 | -| time_elapsed | 60413 | -| total_timesteps | 1371904 | -| train/ | | -| approx_kl | 0.0031697112 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 107170 | -| policy_gradient_loss | 0.002 | -| std | 0.0298 | -| value_loss | 8e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10719 | -| time_elapsed | 60416 | -| total_timesteps | 1372032 | -| train/ | | -| approx_kl | 1.8943101e-06 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.000115 | -| n_updates | 107180 | -| policy_gradient_loss | 0.00466 | -| std | 0.0298 | -| value_loss | 2.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10720 | -| time_elapsed | 60422 | -| total_timesteps | 1372160 | -| train/ | | -| approx_kl | 0.012390135 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 107190 | -| policy_gradient_loss | -0.00716 | -| std | 0.0298 | -| value_loss | 0.000656 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10721 | -| time_elapsed | 60426 | -| total_timesteps | 1372288 | -| train/ | | -| approx_kl | 0.0002553966 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 2.09 | -| explained_variance | -0.902 | -| learning_rate | 0.0003 | -| loss | 2.39e-05 | -| n_updates | 107200 | -| policy_gradient_loss | 0.000481 | -| std | 0.0298 | -| value_loss | 3.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10722 | -| time_elapsed | 60429 | -| total_timesteps | 1372416 | -| train/ | | -| approx_kl | 0.0018020426 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 107210 | -| policy_gradient_loss | 0.000715 | -| std | 0.0297 | -| value_loss | 3.67e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10723 | -| time_elapsed | 60433 | -| total_timesteps | 1372544 | -| train/ | | -| approx_kl | 0.014603297 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00439 | -| n_updates | 107220 | -| policy_gradient_loss | -0.00215 | -| std | 0.0297 | -| value_loss | 9.42e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10724 | -| time_elapsed | 60436 | -| total_timesteps | 1372672 | -| train/ | | -| approx_kl | 0.00027099764 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | 0.00363 | -| learning_rate | 0.0003 | -| loss | 0.00115 | -| n_updates | 107230 | -| policy_gradient_loss | 0.00773 | -| std | 0.0297 | -| value_loss | 1.46e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10725 | -| time_elapsed | 60439 | -| total_timesteps | 1372800 | -| train/ | | -| approx_kl | 0.0001209937 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -3.41 | -| learning_rate | 0.0003 | -| loss | -0.000594 | -| n_updates | 107240 | -| policy_gradient_loss | 0.00347 | -| std | 0.0297 | -| value_loss | 2.08e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10726 | -| time_elapsed | 60442 | -| total_timesteps | 1372928 | -| train/ | | -| approx_kl | 0.0047185356 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.00504 | -| n_updates | 107250 | -| policy_gradient_loss | 0.00291 | -| std | 0.0297 | -| value_loss | 1.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10727 | -| time_elapsed | 60445 | -| total_timesteps | 1373056 | -| train/ | | -| approx_kl | 0.0005022548 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 107260 | -| policy_gradient_loss | -0.00272 | -| std | 0.0297 | -| value_loss | 1.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10728 | -| time_elapsed | 60451 | -| total_timesteps | 1373184 | -| train/ | | -| approx_kl | 0.009246144 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.42 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 107270 | -| policy_gradient_loss | -0.0112 | -| std | 0.0297 | -| value_loss | 0.00266 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10729 | -| time_elapsed | 60455 | -| total_timesteps | 1373312 | -| train/ | | -| approx_kl | 0.0020384523 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 107280 | -| policy_gradient_loss | -0.00563 | -| std | 0.0297 | -| value_loss | 1.71e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10730 | -| time_elapsed | 60458 | -| total_timesteps | 1373440 | -| train/ | | -| approx_kl | 0.013106339 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -13.6 | -| learning_rate | 0.0003 | -| loss | 0.00859 | -| n_updates | 107290 | -| policy_gradient_loss | 0.00291 | -| std | 0.0297 | -| value_loss | 1.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10731 | -| time_elapsed | 60462 | -| total_timesteps | 1373568 | -| train/ | | -| approx_kl | 0.00833081 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 107300 | -| policy_gradient_loss | 0.00155 | -| std | 0.0297 | -| value_loss | 2.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10732 | -| time_elapsed | 60464 | -| total_timesteps | 1373696 | -| train/ | | -| approx_kl | 0.009422941 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | -0.00979 | -| n_updates | 107310 | -| policy_gradient_loss | -0.00406 | -| std | 0.0297 | -| value_loss | 5.42e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10733 | -| time_elapsed | 60467 | -| total_timesteps | 1373824 | -| train/ | | -| approx_kl | 0.0115395095 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.00356 | -| learning_rate | 0.0003 | -| loss | -0.000655 | -| n_updates | 107320 | -| policy_gradient_loss | 0.00625 | -| std | 0.0297 | -| value_loss | 3.6e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 22 | -| iterations | 10734 | -| time_elapsed | 60470 | -| total_timesteps | 1373952 | -| train/ | | -| approx_kl | 0.028204275 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | 0.00649 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 107330 | -| policy_gradient_loss | -0.00298 | -| std | 0.0296 | -| value_loss | 3.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10735 | -| time_elapsed | 60474 | -| total_timesteps | 1374080 | -| train/ | | -| approx_kl | 0.014713727 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 107340 | -| policy_gradient_loss | 0.00726 | -| std | 0.0296 | -| value_loss | 7.84e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10736 | -| time_elapsed | 60480 | -| total_timesteps | 1374208 | -| train/ | | -| approx_kl | 0.00076624565 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 107350 | -| policy_gradient_loss | -0.00805 | -| std | 0.0295 | -| value_loss | 0.000437 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10737 | -| time_elapsed | 60483 | -| total_timesteps | 1374336 | -| train/ | | -| approx_kl | 0.029682973 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -254 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 107360 | -| policy_gradient_loss | -0.00763 | -| std | 0.0295 | -| value_loss | 2.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10738 | -| time_elapsed | 60487 | -| total_timesteps | 1374464 | -| train/ | | -| approx_kl | 0.0021212515 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -16.3 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 107370 | -| policy_gradient_loss | -0.0101 | -| std | 0.0295 | -| value_loss | 8.17e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10739 | -| time_elapsed | 60490 | -| total_timesteps | 1374592 | -| train/ | | -| approx_kl | 0.025351858 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -4.26 | -| learning_rate | 0.0003 | -| loss | 0.00712 | -| n_updates | 107380 | -| policy_gradient_loss | 0.00245 | -| std | 0.0295 | -| value_loss | 1.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10740 | -| time_elapsed | 60493 | -| total_timesteps | 1374720 | -| train/ | | -| approx_kl | 0.020289473 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -1.54 | -| learning_rate | 0.0003 | -| loss | -0.000436 | -| n_updates | 107390 | -| policy_gradient_loss | -0.00234 | -| std | 0.0295 | -| value_loss | 6e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10741 | -| time_elapsed | 60496 | -| total_timesteps | 1374848 | -| train/ | | -| approx_kl | 0.00082746195 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 2.1 | -| explained_variance | -0.572 | -| learning_rate | 0.0003 | -| loss | -0.000547 | -| n_updates | 107400 | -| policy_gradient_loss | -0.000383 | -| std | 0.0294 | -| value_loss | 1.24e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10742 | -| time_elapsed | 60500 | -| total_timesteps | 1374976 | -| train/ | | -| approx_kl | 0.0046374034 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 107410 | -| policy_gradient_loss | 0.00127 | -| std | 0.0294 | -| value_loss | 1.82e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10743 | -| time_elapsed | 60502 | -| total_timesteps | 1375104 | -| train/ | | -| approx_kl | 0.0017050914 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | -0.077 | -| learning_rate | 0.0003 | -| loss | 0.00506 | -| n_updates | 107420 | -| policy_gradient_loss | 0.00685 | -| std | 0.0293 | -| value_loss | 1.25e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10744 | -| time_elapsed | 60510 | -| total_timesteps | 1375232 | -| train/ | | -| approx_kl | 0.0021018656 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 107430 | -| policy_gradient_loss | -0.0159 | -| std | 0.0293 | -| value_loss | 0.000116 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10745 | -| time_elapsed | 60512 | -| total_timesteps | 1375360 | -| train/ | | -| approx_kl | 0.008334739 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 107440 | -| policy_gradient_loss | -0.00341 | -| std | 0.0293 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10746 | -| time_elapsed | 60516 | -| total_timesteps | 1375488 | -| train/ | | -| approx_kl | 0.012761787 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 107450 | -| policy_gradient_loss | 0.00207 | -| std | 0.0293 | -| value_loss | 1.22e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10747 | -| time_elapsed | 60521 | -| total_timesteps | 1375616 | -| train/ | | -| approx_kl | 3.1744596e-05 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | -0.0837 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 107460 | -| policy_gradient_loss | 0.0078 | -| std | 0.0292 | -| value_loss | 1.84e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10748 | -| time_elapsed | 60525 | -| total_timesteps | 1375744 | -| train/ | | -| approx_kl | 0.015770305 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 2.11 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.00457 | -| n_updates | 107470 | -| policy_gradient_loss | 0.000534 | -| std | 0.0291 | -| value_loss | 2.83e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 22 | -| iterations | 10749 | -| time_elapsed | 60528 | -| total_timesteps | 1375872 | -| train/ | | -| approx_kl | 0.00016133208 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.12 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 107480 | -| policy_gradient_loss | -0.000644 | -| std | 0.0291 | -| value_loss | 3.01e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10750 | -| time_elapsed | 60532 | -| total_timesteps | 1376000 | -| train/ | | -| approx_kl | 0.0013452861 | -| clip_fraction | 0.0148 | -| clip_range | 0.2 | -| entropy_loss | 2.12 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | -0.000883 | -| n_updates | 107490 | -| policy_gradient_loss | 2.71e-05 | -| std | 0.029 | -| value_loss | 1.62e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10751 | -| time_elapsed | 60536 | -| total_timesteps | 1376128 | -| train/ | | -| approx_kl | 0.020874165 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.12 | -| explained_variance | 0.00528 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 107500 | -| policy_gradient_loss | -0.00819 | -| std | 0.0289 | -| value_loss | 2.82e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10752 | -| time_elapsed | 60542 | -| total_timesteps | 1376256 | -| train/ | | -| approx_kl | 0.0031012022 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 107510 | -| policy_gradient_loss | -0.0135 | -| std | 0.0288 | -| value_loss | 0.00101 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10753 | -| time_elapsed | 60546 | -| total_timesteps | 1376384 | -| train/ | | -| approx_kl | 0.004344036 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | 0.0042 | -| n_updates | 107520 | -| policy_gradient_loss | -0.000346 | -| std | 0.0288 | -| value_loss | 2.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10754 | -| time_elapsed | 60549 | -| total_timesteps | 1376512 | -| train/ | | -| approx_kl | 0.014811426 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.791 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 107530 | -| policy_gradient_loss | -0.00409 | -| std | 0.0288 | -| value_loss | 1.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10755 | -| time_elapsed | 60552 | -| total_timesteps | 1376640 | -| train/ | | -| approx_kl | 0.012586964 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 107540 | -| policy_gradient_loss | 0.00556 | -| std | 0.0288 | -| value_loss | 1.93e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10756 | -| time_elapsed | 60555 | -| total_timesteps | 1376768 | -| train/ | | -| approx_kl | 0.0077307387 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 107550 | -| policy_gradient_loss | 0.00366 | -| std | 0.0287 | -| value_loss | 4.64e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10757 | -| time_elapsed | 60557 | -| total_timesteps | 1376896 | -| train/ | | -| approx_kl | 0.006342903 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 107560 | -| policy_gradient_loss | -0.0145 | -| std | 0.0287 | -| value_loss | 3.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10758 | -| time_elapsed | 60561 | -| total_timesteps | 1377024 | -| train/ | | -| approx_kl | 0.0002419618 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.427 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 107570 | -| policy_gradient_loss | -0.00484 | -| std | 0.0287 | -| value_loss | 1.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10759 | -| time_elapsed | 60570 | -| total_timesteps | 1377152 | -| train/ | | -| approx_kl | 0.005312661 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 107580 | -| policy_gradient_loss | -0.00243 | -| std | 0.0287 | -| value_loss | 0.00281 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10760 | -| time_elapsed | 60573 | -| total_timesteps | 1377280 | -| train/ | | -| approx_kl | 0.016738959 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 107590 | -| policy_gradient_loss | -0.00657 | -| std | 0.0287 | -| value_loss | 2.53e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10761 | -| time_elapsed | 60576 | -| total_timesteps | 1377408 | -| train/ | | -| approx_kl | 0.022008684 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.549 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 107600 | -| policy_gradient_loss | 0.00807 | -| std | 0.0287 | -| value_loss | 7.98e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10762 | -| time_elapsed | 60580 | -| total_timesteps | 1377536 | -| train/ | | -| approx_kl | 8.643139e-06 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.000224 | -| n_updates | 107610 | -| policy_gradient_loss | -0.00198 | -| std | 0.0287 | -| value_loss | 9.9e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10763 | -| time_elapsed | 60583 | -| total_timesteps | 1377664 | -| train/ | | -| approx_kl | 0.001892637 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 107620 | -| policy_gradient_loss | -0.00713 | -| std | 0.0287 | -| value_loss | 1.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10764 | -| time_elapsed | 60587 | -| total_timesteps | 1377792 | -| train/ | | -| approx_kl | 0.010099052 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 107630 | -| policy_gradient_loss | -0.0032 | -| std | 0.0287 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10765 | -| time_elapsed | 60591 | -| total_timesteps | 1377920 | -| train/ | | -| approx_kl | 0.030898387 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 107640 | -| policy_gradient_loss | 0.000317 | -| std | 0.0287 | -| value_loss | 2.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10766 | -| time_elapsed | 60594 | -| total_timesteps | 1378048 | -| train/ | | -| approx_kl | 0.0024414044 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | 0.000543 | -| n_updates | 107650 | -| policy_gradient_loss | 0.00583 | -| std | 0.0287 | -| value_loss | 2.28e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10767 | -| time_elapsed | 60598 | -| total_timesteps | 1378176 | -| train/ | | -| approx_kl | 0.001650257 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.0057 | -| n_updates | 107660 | -| policy_gradient_loss | -0.00526 | -| std | 0.0288 | -| value_loss | 0.0022 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10768 | -| time_elapsed | 60602 | -| total_timesteps | 1378304 | -| train/ | | -| approx_kl | 0.0046858396 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 107670 | -| policy_gradient_loss | -0.00634 | -| std | 0.0288 | -| value_loss | 4.65e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10769 | -| time_elapsed | 60605 | -| total_timesteps | 1378432 | -| train/ | | -| approx_kl | 0.010180627 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -18.9 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 107680 | -| policy_gradient_loss | -0.00291 | -| std | 0.0288 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10770 | -| time_elapsed | 60609 | -| total_timesteps | 1378560 | -| train/ | | -| approx_kl | 0.008412961 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 107690 | -| policy_gradient_loss | 0.00155 | -| std | 0.0288 | -| value_loss | 1.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10771 | -| time_elapsed | 60612 | -| total_timesteps | 1378688 | -| train/ | | -| approx_kl | 0.007911839 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 107700 | -| policy_gradient_loss | -0.0192 | -| std | 0.0288 | -| value_loss | 3.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10772 | -| time_elapsed | 60615 | -| total_timesteps | 1378816 | -| train/ | | -| approx_kl | 0.0002951366 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.976 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 107710 | -| policy_gradient_loss | -0.00344 | -| std | 0.0288 | -| value_loss | 1e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10773 | -| time_elapsed | 60619 | -| total_timesteps | 1378944 | -| train/ | | -| approx_kl | 0.0001599635 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | 0.00385 | -| n_updates | 107720 | -| policy_gradient_loss | -0.00234 | -| std | 0.0288 | -| value_loss | 1.04e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10774 | -| time_elapsed | 60623 | -| total_timesteps | 1379072 | -| train/ | | -| approx_kl | 0.00035140896 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | 0.00745 | -| learning_rate | 0.0003 | -| loss | -0.00492 | -| n_updates | 107730 | -| policy_gradient_loss | -0.00646 | -| std | 0.0288 | -| value_loss | 8.79e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10775 | -| time_elapsed | 60630 | -| total_timesteps | 1379200 | -| train/ | | -| approx_kl | 0.020962484 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 107740 | -| policy_gradient_loss | 0.00298 | -| std | 0.0288 | -| value_loss | 0.00075 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10776 | -| time_elapsed | 60633 | -| total_timesteps | 1379328 | -| train/ | | -| approx_kl | 0.008731284 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.857 | -| learning_rate | 0.0003 | -| loss | -0.000861 | -| n_updates | 107750 | -| policy_gradient_loss | 0.000814 | -| std | 0.0288 | -| value_loss | 0.00017 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10777 | -| time_elapsed | 60636 | -| total_timesteps | 1379456 | -| train/ | | -| approx_kl | 0.0019098455 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -548 | -| learning_rate | 0.0003 | -| loss | -0.000363 | -| n_updates | 107760 | -| policy_gradient_loss | -0.00014 | -| std | 0.0287 | -| value_loss | 7.76e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10778 | -| time_elapsed | 60640 | -| total_timesteps | 1379584 | -| train/ | | -| approx_kl | 0.044052623 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -185 | -| learning_rate | 0.0003 | -| loss | 2.61e-06 | -| n_updates | 107770 | -| policy_gradient_loss | -0.00199 | -| std | 0.0287 | -| value_loss | 7.83e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10779 | -| time_elapsed | 60642 | -| total_timesteps | 1379712 | -| train/ | | -| approx_kl | 0.008610584 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -3.96 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 107780 | -| policy_gradient_loss | -0.0118 | -| std | 0.0287 | -| value_loss | 6.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10780 | -| time_elapsed | 60645 | -| total_timesteps | 1379840 | -| train/ | | -| approx_kl | 0.003605945 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 107790 | -| policy_gradient_loss | 0.00225 | -| std | 0.0287 | -| value_loss | 6.76e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 22 | -| iterations | 10781 | -| time_elapsed | 60648 | -| total_timesteps | 1379968 | -| train/ | | -| approx_kl | 0.02140102 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 2.13 | -| explained_variance | 0.0034 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 107800 | -| policy_gradient_loss | 0.00254 | -| std | 0.0286 | -| value_loss | 2.07e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10782 | -| time_elapsed | 60650 | -| total_timesteps | 1380096 | -| train/ | | -| approx_kl | 0.0006127567 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.00693 | -| learning_rate | 0.0003 | -| loss | 0.00258 | -| n_updates | 107810 | -| policy_gradient_loss | 0.00876 | -| std | 0.0285 | -| value_loss | 2.87e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10783 | -| time_elapsed | 60656 | -| total_timesteps | 1380224 | -| train/ | | -| approx_kl | 0.003508152 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 107820 | -| policy_gradient_loss | -0.0106 | -| std | 0.0285 | -| value_loss | 0.000379 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10784 | -| time_elapsed | 60659 | -| total_timesteps | 1380352 | -| train/ | | -| approx_kl | 5.569542e-05 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | -0.000382 | -| n_updates | 107830 | -| policy_gradient_loss | 0.00304 | -| std | 0.0285 | -| value_loss | 2.32e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10785 | -| time_elapsed | 60662 | -| total_timesteps | 1380480 | -| train/ | | -| approx_kl | 0.0027385163 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 107840 | -| policy_gradient_loss | -0.00529 | -| std | 0.0285 | -| value_loss | 1.65e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10786 | -| time_elapsed | 60666 | -| total_timesteps | 1380608 | -| train/ | | -| approx_kl | 1.9261148e-05 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.738 | -| learning_rate | 0.0003 | -| loss | 0.000429 | -| n_updates | 107850 | -| policy_gradient_loss | 0.00486 | -| std | 0.0285 | -| value_loss | 1.75e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10787 | -| time_elapsed | 60669 | -| total_timesteps | 1380736 | -| train/ | | -| approx_kl | 0.0005800775 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | 0.00273 | -| n_updates | 107860 | -| policy_gradient_loss | 0.00344 | -| std | 0.0285 | -| value_loss | 2.32e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10788 | -| time_elapsed | 60673 | -| total_timesteps | 1380864 | -| train/ | | -| approx_kl | 0.00026611052 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 107870 | -| policy_gradient_loss | 0.00539 | -| std | 0.0285 | -| value_loss | 5.68e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 10789 | -| time_elapsed | 60677 | -| total_timesteps | 1380992 | -| train/ | | -| approx_kl | 0.00795221 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0843 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 107880 | -| policy_gradient_loss | 0.00377 | -| std | 0.0284 | -| value_loss | 4.52e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10790 | -| time_elapsed | 60680 | -| total_timesteps | 1381120 | -| train/ | | -| approx_kl | 0.0019547744 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0807 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 107890 | -| policy_gradient_loss | 0.0017 | -| std | 0.0284 | -| value_loss | 2.17e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10791 | -| time_elapsed | 60690 | -| total_timesteps | 1381248 | -| train/ | | -| approx_kl | 0.027179152 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.025 | -| n_updates | 107900 | -| policy_gradient_loss | -0.0172 | -| std | 0.0284 | -| value_loss | 0.00139 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10792 | -| time_elapsed | 60693 | -| total_timesteps | 1381376 | -| train/ | | -| approx_kl | 0.023723463 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -99.1 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 107910 | -| policy_gradient_loss | -0.00667 | -| std | 0.0284 | -| value_loss | 2.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10793 | -| time_elapsed | 60695 | -| total_timesteps | 1381504 | -| train/ | | -| approx_kl | 0.005869493 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -75.9 | -| learning_rate | 0.0003 | -| loss | 0.00203 | -| n_updates | 107920 | -| policy_gradient_loss | 0.00342 | -| std | 0.0284 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10794 | -| time_elapsed | 60697 | -| total_timesteps | 1381632 | -| train/ | | -| approx_kl | 0.0011019697 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -6.05 | -| learning_rate | 0.0003 | -| loss | -0.00387 | -| n_updates | 107930 | -| policy_gradient_loss | -0.00421 | -| std | 0.0284 | -| value_loss | 1.29e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10795 | -| time_elapsed | 60699 | -| total_timesteps | 1381760 | -| train/ | | -| approx_kl | 0.006379061 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.425 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 107940 | -| policy_gradient_loss | -0.00362 | -| std | 0.0284 | -| value_loss | 2.99e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 22 | -| iterations | 10796 | -| time_elapsed | 60701 | -| total_timesteps | 1381888 | -| train/ | | -| approx_kl | 0.0016350374 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.00462 | -| learning_rate | 0.0003 | -| loss | -0.000994 | -| n_updates | 107950 | -| policy_gradient_loss | 0.00675 | -| std | 0.0284 | -| value_loss | 2.75e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10797 | -| time_elapsed | 60702 | -| total_timesteps | 1382016 | -| train/ | | -| approx_kl | 0.0039792056 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.000478 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 107960 | -| policy_gradient_loss | -0.00477 | -| std | 0.0284 | -| value_loss | 6.31e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10798 | -| time_elapsed | 60712 | -| total_timesteps | 1382144 | -| train/ | | -| approx_kl | 0.00041019125 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 107970 | -| policy_gradient_loss | -0.00423 | -| std | 0.0284 | -| value_loss | 0.000132 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10799 | -| time_elapsed | 60716 | -| total_timesteps | 1382272 | -| train/ | | -| approx_kl | 0.0077757617 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 107980 | -| policy_gradient_loss | -0.00535 | -| std | 0.0284 | -| value_loss | 9.89e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10800 | -| time_elapsed | 60720 | -| total_timesteps | 1382400 | -| train/ | | -| approx_kl | 0.00015789643 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.378 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 107990 | -| policy_gradient_loss | -0.00311 | -| std | 0.0284 | -| value_loss | 1.1e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10801 | -| time_elapsed | 60724 | -| total_timesteps | 1382528 | -| train/ | | -| approx_kl | 5.2386895e-07 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 108000 | -| policy_gradient_loss | -0.00631 | -| std | 0.0285 | -| value_loss | 6.05e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10802 | -| time_elapsed | 60727 | -| total_timesteps | 1382656 | -| train/ | | -| approx_kl | 0.0022516828 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 108010 | -| policy_gradient_loss | -0.0159 | -| std | 0.0285 | -| value_loss | 4.15e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10803 | -| time_elapsed | 60731 | -| total_timesteps | 1382784 | -| train/ | | -| approx_kl | 0.00027652737 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0982 | -| learning_rate | 0.0003 | -| loss | 0.00207 | -| n_updates | 108020 | -| policy_gradient_loss | -0.000754 | -| std | 0.0285 | -| value_loss | 2.53e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 22 | -| iterations | 10804 | -| time_elapsed | 60734 | -| total_timesteps | 1382912 | -| train/ | | -| approx_kl | 0.0050154855 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.00836 | -| n_updates | 108030 | -| policy_gradient_loss | 0.00294 | -| std | 0.0285 | -| value_loss | 1.26e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10805 | -| time_elapsed | 60736 | -| total_timesteps | 1383040 | -| train/ | | -| approx_kl | 0.006214944 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 108040 | -| policy_gradient_loss | 0.00223 | -| std | 0.0284 | -| value_loss | 1.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10806 | -| time_elapsed | 60743 | -| total_timesteps | 1383168 | -| train/ | | -| approx_kl | 0.018077306 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 108050 | -| policy_gradient_loss | -0.0103 | -| std | 0.0284 | -| value_loss | 0.00312 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10807 | -| time_elapsed | 60745 | -| total_timesteps | 1383296 | -| train/ | | -| approx_kl | 0.002509064 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -108 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 108060 | -| policy_gradient_loss | 0.0048 | -| std | 0.0284 | -| value_loss | 6.72e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10808 | -| time_elapsed | 60748 | -| total_timesteps | 1383424 | -| train/ | | -| approx_kl | 0.0005696099 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -121 | -| learning_rate | 0.0003 | -| loss | -0.00561 | -| n_updates | 108070 | -| policy_gradient_loss | -0.0116 | -| std | 0.0284 | -| value_loss | 2.87e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10809 | -| time_elapsed | 60751 | -| total_timesteps | 1383552 | -| train/ | | -| approx_kl | 0.006518698 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -42.6 | -| learning_rate | 0.0003 | -| loss | -0.00831 | -| n_updates | 108080 | -| policy_gradient_loss | -0.00567 | -| std | 0.0284 | -| value_loss | 3.57e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10810 | -| time_elapsed | 60754 | -| total_timesteps | 1383680 | -| train/ | | -| approx_kl | 0.0028321347 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -7.65 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 108090 | -| policy_gradient_loss | -0.0129 | -| std | 0.0284 | -| value_loss | 1.74e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10811 | -| time_elapsed | 60758 | -| total_timesteps | 1383808 | -| train/ | | -| approx_kl | 0.009724343 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | 0.00267 | -| n_updates | 108100 | -| policy_gradient_loss | 0.00184 | -| std | 0.0284 | -| value_loss | 9.7e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 10812 | -| time_elapsed | 60762 | -| total_timesteps | 1383936 | -| train/ | | -| approx_kl | 4.8160087e-05 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0845 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 108110 | -| policy_gradient_loss | -0.00278 | -| std | 0.0284 | -| value_loss | 6.9e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10813 | -| time_elapsed | 60765 | -| total_timesteps | 1384064 | -| train/ | | -| approx_kl | 0.0051879794 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.00128 | -| n_updates | 108120 | -| policy_gradient_loss | 0.00356 | -| std | 0.0283 | -| value_loss | 3.73e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10814 | -| time_elapsed | 60771 | -| total_timesteps | 1384192 | -| train/ | | -| approx_kl | 0.01922436 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.14 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 108130 | -| policy_gradient_loss | -0.00853 | -| std | 0.0283 | -| value_loss | 0.000273 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10815 | -| time_elapsed | 60776 | -| total_timesteps | 1384320 | -| train/ | | -| approx_kl | 0.007150598 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -600 | -| learning_rate | 0.0003 | -| loss | -6.93e-05 | -| n_updates | 108140 | -| policy_gradient_loss | 6.99e-05 | -| std | 0.0283 | -| value_loss | 2.48e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10816 | -| time_elapsed | 60778 | -| total_timesteps | 1384448 | -| train/ | | -| approx_kl | 0.0074231992 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -624 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 108150 | -| policy_gradient_loss | -0.00273 | -| std | 0.0283 | -| value_loss | 1.3e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10817 | -| time_elapsed | 60782 | -| total_timesteps | 1384576 | -| train/ | | -| approx_kl | 0.0011348715 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -94.2 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 108160 | -| policy_gradient_loss | -0.00198 | -| std | 0.0282 | -| value_loss | 1.84e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10818 | -| time_elapsed | 60785 | -| total_timesteps | 1384704 | -| train/ | | -| approx_kl | 0.02587972 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -17.1 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 108170 | -| policy_gradient_loss | -0.00791 | -| std | 0.0282 | -| value_loss | 2.73e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10819 | -| time_elapsed | 60788 | -| total_timesteps | 1384832 | -| train/ | | -| approx_kl | 0.016470283 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -25.5 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 108180 | -| policy_gradient_loss | -0.00955 | -| std | 0.0282 | -| value_loss | 2.71e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10820 | -| time_elapsed | 60792 | -| total_timesteps | 1384960 | -| train/ | | -| approx_kl | 0.0071323104 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.561 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 108190 | -| policy_gradient_loss | 0.00483 | -| std | 0.0282 | -| value_loss | 6.95e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10821 | -| time_elapsed | 60795 | -| total_timesteps | 1385088 | -| train/ | | -| approx_kl | 0.04287276 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 108200 | -| policy_gradient_loss | -0.00902 | -| std | 0.0282 | -| value_loss | 3.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10822 | -| time_elapsed | 60802 | -| total_timesteps | 1385216 | -| train/ | | -| approx_kl | 0.0154129015 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 108210 | -| policy_gradient_loss | -0.00875 | -| std | 0.0282 | -| value_loss | 5.21e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10823 | -| time_elapsed | 60806 | -| total_timesteps | 1385344 | -| train/ | | -| approx_kl | 0.02358045 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.294 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 108220 | -| policy_gradient_loss | 0.00126 | -| std | 0.0282 | -| value_loss | 9.13e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10824 | -| time_elapsed | 60809 | -| total_timesteps | 1385472 | -| train/ | | -| approx_kl | 0.00044678105 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.0044 | -| n_updates | 108230 | -| policy_gradient_loss | 0.00753 | -| std | 0.0282 | -| value_loss | 1.43e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10825 | -| time_elapsed | 60814 | -| total_timesteps | 1385600 | -| train/ | | -| approx_kl | 2.1932647e-06 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | 0.000351 | -| n_updates | 108240 | -| policy_gradient_loss | -0.0056 | -| std | 0.0282 | -| value_loss | 4.46e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10826 | -| time_elapsed | 60819 | -| total_timesteps | 1385728 | -| train/ | | -| approx_kl | 0.0090222405 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 108250 | -| policy_gradient_loss | -0.0113 | -| std | 0.0282 | -| value_loss | 2.81e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10827 | -| time_elapsed | 60823 | -| total_timesteps | 1385856 | -| train/ | | -| approx_kl | 0.015178211 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.00882 | -| n_updates | 108260 | -| policy_gradient_loss | 0.00473 | -| std | 0.0282 | -| value_loss | 1.34e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10828 | -| time_elapsed | 60826 | -| total_timesteps | 1385984 | -| train/ | | -| approx_kl | 0.001868675 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 108270 | -| policy_gradient_loss | -0.00184 | -| std | 0.0282 | -| value_loss | 1.49e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10829 | -| time_elapsed | 60831 | -| total_timesteps | 1386112 | -| train/ | | -| approx_kl | 0.018804723 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 108280 | -| policy_gradient_loss | 0.000469 | -| std | 0.0282 | -| value_loss | 6.94e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10830 | -| time_elapsed | 60840 | -| total_timesteps | 1386240 | -| train/ | | -| approx_kl | 0.041343905 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 108290 | -| policy_gradient_loss | -0.0161 | -| std | 0.0282 | -| value_loss | 7.56e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10831 | -| time_elapsed | 60843 | -| total_timesteps | 1386368 | -| train/ | | -| approx_kl | 0.004564232 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -3.88 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 108300 | -| policy_gradient_loss | 0.00261 | -| std | 0.0281 | -| value_loss | 4.66e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10832 | -| time_elapsed | 60846 | -| total_timesteps | 1386496 | -| train/ | | -| approx_kl | 3.3359043e-05 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -3.19 | -| learning_rate | 0.0003 | -| loss | -0.000337 | -| n_updates | 108310 | -| policy_gradient_loss | 0.00442 | -| std | 0.0281 | -| value_loss | 8.8e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10833 | -| time_elapsed | 60850 | -| total_timesteps | 1386624 | -| train/ | | -| approx_kl | 0.0001799725 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 108320 | -| policy_gradient_loss | -0.00164 | -| std | 0.0281 | -| value_loss | 1.18e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10834 | -| time_elapsed | 60853 | -| total_timesteps | 1386752 | -| train/ | | -| approx_kl | 0.005879221 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.634 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 108330 | -| policy_gradient_loss | -0.0148 | -| std | 0.0281 | -| value_loss | 5.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10835 | -| time_elapsed | 60857 | -| total_timesteps | 1386880 | -| train/ | | -| approx_kl | 0.002435491 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 108340 | -| policy_gradient_loss | 0.00238 | -| std | 0.0281 | -| value_loss | 2.02e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10836 | -| time_elapsed | 60860 | -| total_timesteps | 1387008 | -| train/ | | -| approx_kl | 0.032145113 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 108350 | -| policy_gradient_loss | -0.00858 | -| std | 0.0281 | -| value_loss | 2.89e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10837 | -| time_elapsed | 60868 | -| total_timesteps | 1387136 | -| train/ | | -| approx_kl | 0.014047794 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 108360 | -| policy_gradient_loss | -0.0111 | -| std | 0.0281 | -| value_loss | 0.00228 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10838 | -| time_elapsed | 60871 | -| total_timesteps | 1387264 | -| train/ | | -| approx_kl | 0.029401109 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | 0.372 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 108370 | -| policy_gradient_loss | -0.000247 | -| std | 0.028 | -| value_loss | 1.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10839 | -| time_elapsed | 60874 | -| total_timesteps | 1387392 | -| train/ | | -| approx_kl | 0.024016388 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -2.5 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 108380 | -| policy_gradient_loss | -0.00693 | -| std | 0.0281 | -| value_loss | 3.8e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10840 | -| time_elapsed | 60876 | -| total_timesteps | 1387520 | -| train/ | | -| approx_kl | 0.0023798654 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | 0.00259 | -| n_updates | 108390 | -| policy_gradient_loss | 0.00591 | -| std | 0.0281 | -| value_loss | 2.64e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10841 | -| time_elapsed | 60879 | -| total_timesteps | 1387648 | -| train/ | | -| approx_kl | 0.0036109732 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 2.15 | -| explained_variance | -0.518 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 108400 | -| policy_gradient_loss | 6.55e-06 | -| std | 0.0281 | -| value_loss | 3.71e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10842 | -| time_elapsed | 60882 | -| total_timesteps | 1387776 | -| train/ | | -| approx_kl | 0.019198816 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 2.84e-05 | -| n_updates | 108410 | -| policy_gradient_loss | -0.00202 | -| std | 0.028 | -| value_loss | 2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10843 | -| time_elapsed | 60885 | -| total_timesteps | 1387904 | -| train/ | | -| approx_kl | 0.007391278 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | 0.00331 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 108420 | -| policy_gradient_loss | -0.00209 | -| std | 0.028 | -| value_loss | 2.29e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10844 | -| time_elapsed | 60889 | -| total_timesteps | 1388032 | -| train/ | | -| approx_kl | 0.0072415546 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 108430 | -| policy_gradient_loss | 0.00388 | -| std | 0.028 | -| value_loss | 1.2e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10845 | -| time_elapsed | 60896 | -| total_timesteps | 1388160 | -| train/ | | -| approx_kl | 0.0007013222 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | 0.765 | -| learning_rate | 0.0003 | -| loss | 0.00678 | -| n_updates | 108440 | -| policy_gradient_loss | -0.00755 | -| std | 0.028 | -| value_loss | 0.00309 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10846 | -| time_elapsed | 60900 | -| total_timesteps | 1388288 | -| train/ | | -| approx_kl | 0.010344046 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.426 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 108450 | -| policy_gradient_loss | -0.00897 | -| std | 0.028 | -| value_loss | 0.000162 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10847 | -| time_elapsed | 60903 | -| total_timesteps | 1388416 | -| train/ | | -| approx_kl | 0.0047909752 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.447 | -| learning_rate | 0.0003 | -| loss | -0.0094 | -| n_updates | 108460 | -| policy_gradient_loss | -0.00805 | -| std | 0.028 | -| value_loss | 0.000106 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10848 | -| time_elapsed | 60905 | -| total_timesteps | 1388544 | -| train/ | | -| approx_kl | 0.00044104317 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0096 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 108470 | -| policy_gradient_loss | -0.00492 | -| std | 0.028 | -| value_loss | 0.000115 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10849 | -| time_elapsed | 60909 | -| total_timesteps | 1388672 | -| train/ | | -| approx_kl | 0.00207996 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -5.35 | -| learning_rate | 0.0003 | -| loss | -0.00729 | -| n_updates | 108480 | -| policy_gradient_loss | -0.00877 | -| std | 0.0279 | -| value_loss | 0.000155 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10850 | -| time_elapsed | 60911 | -| total_timesteps | 1388800 | -| train/ | | -| approx_kl | 0.00010536285 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -11 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 108490 | -| policy_gradient_loss | 0.00517 | -| std | 0.0279 | -| value_loss | 4.22e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10851 | -| time_elapsed | 60914 | -| total_timesteps | 1388928 | -| train/ | | -| approx_kl | 0.00088853994 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.413 | -| learning_rate | 0.0003 | -| loss | 0.00521 | -| n_updates | 108500 | -| policy_gradient_loss | 0.00146 | -| std | 0.0279 | -| value_loss | 8.88e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10852 | -| time_elapsed | 60917 | -| total_timesteps | 1389056 | -| train/ | | -| approx_kl | 0.046718914 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -17.8 | -| learning_rate | 0.0003 | -| loss | -0.00615 | -| n_updates | 108510 | -| policy_gradient_loss | -0.00478 | -| std | 0.0279 | -| value_loss | 2.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10853 | -| time_elapsed | 60923 | -| total_timesteps | 1389184 | -| train/ | | -| approx_kl | 0.016392939 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 108520 | -| policy_gradient_loss | -0.0142 | -| std | 0.0279 | -| value_loss | 0.00111 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10854 | -| time_elapsed | 60926 | -| total_timesteps | 1389312 | -| train/ | | -| approx_kl | 0.028142964 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -30.3 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 108530 | -| policy_gradient_loss | -0.0182 | -| std | 0.0279 | -| value_loss | 2.48e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10855 | -| time_elapsed | 60930 | -| total_timesteps | 1389440 | -| train/ | | -| approx_kl | 0.033571493 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -208 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 108540 | -| policy_gradient_loss | -0.0022 | -| std | 0.0279 | -| value_loss | 0.000141 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10856 | -| time_elapsed | 60934 | -| total_timesteps | 1389568 | -| train/ | | -| approx_kl | 0.011483533 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.575 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 108550 | -| policy_gradient_loss | 0.00189 | -| std | 0.0279 | -| value_loss | 0.00104 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10857 | -| time_elapsed | 60936 | -| total_timesteps | 1389696 | -| train/ | | -| approx_kl | 0.0014416515 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 108560 | -| policy_gradient_loss | -0.00407 | -| std | 0.0279 | -| value_loss | 0.0022 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10858 | -| time_elapsed | 60939 | -| total_timesteps | 1389824 | -| train/ | | -| approx_kl | 0.030936245 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 108570 | -| policy_gradient_loss | -0.00589 | -| std | 0.0279 | -| value_loss | 0.000225 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10859 | -| time_elapsed | 60943 | -| total_timesteps | 1389952 | -| train/ | | -| approx_kl | 0.011995006 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 108580 | -| policy_gradient_loss | 0.00111 | -| std | 0.0279 | -| value_loss | 9.9e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10860 | -| time_elapsed | 60947 | -| total_timesteps | 1390080 | -| train/ | | -| approx_kl | 0.0061438335 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0781 | -| learning_rate | 0.0003 | -| loss | 0.0044 | -| n_updates | 108590 | -| policy_gradient_loss | 0.0122 | -| std | 0.0279 | -| value_loss | 0.000111 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10861 | -| time_elapsed | 60955 | -| total_timesteps | 1390208 | -| train/ | | -| approx_kl | 0.09624585 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 108600 | -| policy_gradient_loss | -0.0104 | -| std | 0.0279 | -| value_loss | 0.00104 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10862 | -| time_elapsed | 60957 | -| total_timesteps | 1390336 | -| train/ | | -| approx_kl | 0.003124319 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 108610 | -| policy_gradient_loss | -0.000709 | -| std | 0.0279 | -| value_loss | 1.68e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10863 | -| time_elapsed | 60962 | -| total_timesteps | 1390464 | -| train/ | | -| approx_kl | 0.013828067 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.0742 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 108620 | -| policy_gradient_loss | -0.000179 | -| std | 0.0278 | -| value_loss | 4.93e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10864 | -| time_elapsed | 60966 | -| total_timesteps | 1390592 | -| train/ | | -| approx_kl | 0.0028384905 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 2.16 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 108630 | -| policy_gradient_loss | -0.005 | -| std | 0.0278 | -| value_loss | 7.02e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10865 | -| time_elapsed | 60970 | -| total_timesteps | 1390720 | -| train/ | | -| approx_kl | 0.020956691 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | 0.00778 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 108640 | -| policy_gradient_loss | 0.0152 | -| std | 0.0277 | -| value_loss | 6.94e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10866 | -| time_elapsed | 60973 | -| total_timesteps | 1390848 | -| train/ | | -| approx_kl | 0.0058928654 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.0523 | -| learning_rate | 0.0003 | -| loss | 0.00709 | -| n_updates | 108650 | -| policy_gradient_loss | 0.0106 | -| std | 0.0277 | -| value_loss | 3.44e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10867 | -| time_elapsed | 60976 | -| total_timesteps | 1390976 | -| train/ | | -| approx_kl | 0.015554655 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.000139 | -| n_updates | 108660 | -| policy_gradient_loss | -0.000271 | -| std | 0.0277 | -| value_loss | 7.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10868 | -| time_elapsed | 60980 | -| total_timesteps | 1391104 | -| train/ | | -| approx_kl | 0.035887435 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 108670 | -| policy_gradient_loss | -0.00861 | -| std | 0.0277 | -| value_loss | 2.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10869 | -| time_elapsed | 60987 | -| total_timesteps | 1391232 | -| train/ | | -| approx_kl | 0.11432444 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.376 | -| learning_rate | 0.0003 | -| loss | 0.00115 | -| n_updates | 108680 | -| policy_gradient_loss | -0.0023 | -| std | 0.0277 | -| value_loss | 0.00268 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10870 | -| time_elapsed | 60991 | -| total_timesteps | 1391360 | -| train/ | | -| approx_kl | 0.022570198 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 108690 | -| policy_gradient_loss | -0.0127 | -| std | 0.0277 | -| value_loss | 7.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10871 | -| time_elapsed | 60994 | -| total_timesteps | 1391488 | -| train/ | | -| approx_kl | 0.010205828 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -6.36 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 108700 | -| policy_gradient_loss | -0.00717 | -| std | 0.0277 | -| value_loss | 9.18e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10872 | -| time_elapsed | 60998 | -| total_timesteps | 1391616 | -| train/ | | -| approx_kl | 0.0047024074 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -1.96 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 108710 | -| policy_gradient_loss | -0.00108 | -| std | 0.0277 | -| value_loss | 2.53e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10873 | -| time_elapsed | 61002 | -| total_timesteps | 1391744 | -| train/ | | -| approx_kl | 0.00494761 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.888 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 108720 | -| policy_gradient_loss | 0.00643 | -| std | 0.0276 | -| value_loss | 1.15e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10874 | -| time_elapsed | 61006 | -| total_timesteps | 1391872 | -| train/ | | -| approx_kl | 3.1101517e-05 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.652 | -| learning_rate | 0.0003 | -| loss | -0.000773 | -| n_updates | 108730 | -| policy_gradient_loss | 0.00481 | -| std | 0.0275 | -| value_loss | 2.26e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10875 | -| time_elapsed | 61010 | -| total_timesteps | 1392000 | -| train/ | | -| approx_kl | 0.00017024018 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 108740 | -| policy_gradient_loss | -0.0072 | -| std | 0.0275 | -| value_loss | 3.74e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10876 | -| time_elapsed | 61015 | -| total_timesteps | 1392128 | -| train/ | | -| approx_kl | 0.012786906 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | 0.00598 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 108750 | -| policy_gradient_loss | -0.000661 | -| std | 0.0275 | -| value_loss | 4.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10877 | -| time_elapsed | 61022 | -| total_timesteps | 1392256 | -| train/ | | -| approx_kl | 0.020370921 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | 0.708 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 108760 | -| policy_gradient_loss | -0.00785 | -| std | 0.0275 | -| value_loss | 0.00106 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10878 | -| time_elapsed | 61025 | -| total_timesteps | 1392384 | -| train/ | | -| approx_kl | 2.6850495e-05 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -23.9 | -| learning_rate | 0.0003 | -| loss | 0.000782 | -| n_updates | 108770 | -| policy_gradient_loss | -0.00194 | -| std | 0.0275 | -| value_loss | 2.43e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10879 | -| time_elapsed | 61029 | -| total_timesteps | 1392512 | -| train/ | | -| approx_kl | 0.080999225 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 108780 | -| policy_gradient_loss | -0.00457 | -| std | 0.0275 | -| value_loss | 1.58e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10880 | -| time_elapsed | 61033 | -| total_timesteps | 1392640 | -| train/ | | -| approx_kl | 0.00041011441 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.17 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | -0.000837 | -| n_updates | 108790 | -| policy_gradient_loss | -0.000289 | -| std | 0.0275 | -| value_loss | 1.73e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10881 | -| time_elapsed | 61036 | -| total_timesteps | 1392768 | -| train/ | | -| approx_kl | 0.016532702 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.0375 | -| n_updates | 108800 | -| policy_gradient_loss | 0.0108 | -| std | 0.0275 | -| value_loss | 1.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 22 | -| iterations | 10882 | -| time_elapsed | 61040 | -| total_timesteps | 1392896 | -| train/ | | -| approx_kl | 0.009789839 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.81 | -| learning_rate | 0.0003 | -| loss | -0.000299 | -| n_updates | 108810 | -| policy_gradient_loss | 7.78e-05 | -| std | 0.0274 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10883 | -| time_elapsed | 61043 | -| total_timesteps | 1393024 | -| train/ | | -| approx_kl | 0.009357199 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | -0.00837 | -| n_updates | 108820 | -| policy_gradient_loss | -0.00293 | -| std | 0.0274 | -| value_loss | 3.83e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10884 | -| time_elapsed | 61053 | -| total_timesteps | 1393152 | -| train/ | | -| approx_kl | 0.015466515 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 108830 | -| policy_gradient_loss | -0.0127 | -| std | 0.0274 | -| value_loss | 0.00102 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10885 | -| time_elapsed | 61057 | -| total_timesteps | 1393280 | -| train/ | | -| approx_kl | 0.00044003734 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.000646 | -| n_updates | 108840 | -| policy_gradient_loss | 0.00172 | -| std | 0.0274 | -| value_loss | 6.27e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10886 | -| time_elapsed | 61061 | -| total_timesteps | 1393408 | -| train/ | | -| approx_kl | 0.028294431 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -50 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 108850 | -| policy_gradient_loss | -0.0187 | -| std | 0.0274 | -| value_loss | 7.21e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10887 | -| time_elapsed | 61064 | -| total_timesteps | 1393536 | -| train/ | | -| approx_kl | 0.0039775223 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | 0.000873 | -| n_updates | 108860 | -| policy_gradient_loss | 0.00311 | -| std | 0.0274 | -| value_loss | 1.98e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10888 | -| time_elapsed | 61068 | -| total_timesteps | 1393664 | -| train/ | | -| approx_kl | 5.881302e-07 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.532 | -| learning_rate | 0.0003 | -| loss | -1.9e-05 | -| n_updates | 108870 | -| policy_gradient_loss | 0.00287 | -| std | 0.0274 | -| value_loss | 3.06e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10889 | -| time_elapsed | 61071 | -| total_timesteps | 1393792 | -| train/ | | -| approx_kl | 0.038882755 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 108880 | -| policy_gradient_loss | 0.00207 | -| std | 0.0274 | -| value_loss | 1.36e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10890 | -| time_elapsed | 61075 | -| total_timesteps | 1393920 | -| train/ | | -| approx_kl | 0.0076529253 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0882 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 108890 | -| policy_gradient_loss | -0.00239 | -| std | 0.0274 | -| value_loss | 9.02e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10891 | -| time_elapsed | 61077 | -| total_timesteps | 1394048 | -| train/ | | -| approx_kl | 0.0038548466 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 108900 | -| policy_gradient_loss | -0.00118 | -| std | 0.0274 | -| value_loss | 5.67e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10892 | -| time_elapsed | 61084 | -| total_timesteps | 1394176 | -| train/ | | -| approx_kl | 0.0038355272 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 108910 | -| policy_gradient_loss | -0.012 | -| std | 0.0274 | -| value_loss | 0.000321 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10893 | -| time_elapsed | 61087 | -| total_timesteps | 1394304 | -| train/ | | -| approx_kl | 0.03807524 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.826 | -| learning_rate | 0.0003 | -| loss | 0.0067 | -| n_updates | 108920 | -| policy_gradient_loss | -0.000353 | -| std | 0.0274 | -| value_loss | 7.13e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10894 | -| time_elapsed | 61090 | -| total_timesteps | 1394432 | -| train/ | | -| approx_kl | 1.7522369e-05 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.423 | -| learning_rate | 0.0003 | -| loss | 0.000303 | -| n_updates | 108930 | -| policy_gradient_loss | -0.00259 | -| std | 0.0273 | -| value_loss | 1.42e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10895 | -| time_elapsed | 61094 | -| total_timesteps | 1394560 | -| train/ | | -| approx_kl | 0.022215748 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.00191 | -| n_updates | 108940 | -| policy_gradient_loss | -0.00156 | -| std | 0.0273 | -| value_loss | 2.81e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10896 | -| time_elapsed | 61097 | -| total_timesteps | 1394688 | -| train/ | | -| approx_kl | 0.006718991 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.000945 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 108950 | -| policy_gradient_loss | -0.00101 | -| std | 0.0273 | -| value_loss | 8.86e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10897 | -| time_elapsed | 61099 | -| total_timesteps | 1394816 | -| train/ | | -| approx_kl | 0.0034304461 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.000685 | -| n_updates | 108960 | -| policy_gradient_loss | 0.000457 | -| std | 0.0273 | -| value_loss | 7.31e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 22 | -| iterations | 10898 | -| time_elapsed | 61103 | -| total_timesteps | 1394944 | -| train/ | | -| approx_kl | 0.0008561867 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.00777 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 108970 | -| policy_gradient_loss | -0.00575 | -| std | 0.0274 | -| value_loss | 1.45e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10899 | -| time_elapsed | 61107 | -| total_timesteps | 1395072 | -| train/ | | -| approx_kl | 0.026528604 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.0245 | -| n_updates | 108980 | -| policy_gradient_loss | -0.0187 | -| std | 0.0274 | -| value_loss | 1.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10900 | -| time_elapsed | 61113 | -| total_timesteps | 1395200 | -| train/ | | -| approx_kl | 0.01784224 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.847 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 108990 | -| policy_gradient_loss | -0.0103 | -| std | 0.0274 | -| value_loss | 0.00342 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10901 | -| time_elapsed | 61116 | -| total_timesteps | 1395328 | -| train/ | | -| approx_kl | 0.024245122 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.0056 | -| n_updates | 109000 | -| policy_gradient_loss | -2.15e-05 | -| std | 0.0274 | -| value_loss | 4.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10902 | -| time_elapsed | 61120 | -| total_timesteps | 1395456 | -| train/ | | -| approx_kl | 0.027787346 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.722 | -| learning_rate | 0.0003 | -| loss | 0.00865 | -| n_updates | 109010 | -| policy_gradient_loss | 0.00229 | -| std | 0.0274 | -| value_loss | 1.88e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10903 | -| time_elapsed | 61122 | -| total_timesteps | 1395584 | -| train/ | | -| approx_kl | 0.00013836939 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | 0.00164 | -| n_updates | 109020 | -| policy_gradient_loss | 0.000595 | -| std | 0.0274 | -| value_loss | 7.64e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10904 | -| time_elapsed | 61126 | -| total_timesteps | 1395712 | -| train/ | | -| approx_kl | 0.008977145 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 109030 | -| policy_gradient_loss | 0.00112 | -| std | 0.0274 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10905 | -| time_elapsed | 61129 | -| total_timesteps | 1395840 | -| train/ | | -| approx_kl | 0.0001675142 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0973 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 109040 | -| policy_gradient_loss | -0.000755 | -| std | 0.0274 | -| value_loss | 1.25e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 22 | -| iterations | 10906 | -| time_elapsed | 61132 | -| total_timesteps | 1395968 | -| train/ | | -| approx_kl | 0.0025807694 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 109050 | -| policy_gradient_loss | -0.00551 | -| std | 0.0274 | -| value_loss | 6.48e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10907 | -| time_elapsed | 61135 | -| total_timesteps | 1396096 | -| train/ | | -| approx_kl | 8.877832e-06 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | 0.000647 | -| n_updates | 109060 | -| policy_gradient_loss | 0.00175 | -| std | 0.0274 | -| value_loss | 7.29e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10908 | -| time_elapsed | 61142 | -| total_timesteps | 1396224 | -| train/ | | -| approx_kl | 0.00017666304 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | -0.00561 | -| n_updates | 109070 | -| policy_gradient_loss | -0.00519 | -| std | 0.0274 | -| value_loss | 0.00157 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10909 | -| time_elapsed | 61144 | -| total_timesteps | 1396352 | -| train/ | | -| approx_kl | 0.003965406 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.00743 | -| n_updates | 109080 | -| policy_gradient_loss | 0.00191 | -| std | 0.0274 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10910 | -| time_elapsed | 61147 | -| total_timesteps | 1396480 | -| train/ | | -| approx_kl | 0.002624345 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | 0.00284 | -| n_updates | 109090 | -| policy_gradient_loss | 0.00452 | -| std | 0.0274 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10911 | -| time_elapsed | 61150 | -| total_timesteps | 1396608 | -| train/ | | -| approx_kl | 0.00781453 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 109100 | -| policy_gradient_loss | 0.00178 | -| std | 0.0274 | -| value_loss | 8.94e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10912 | -| time_elapsed | 61153 | -| total_timesteps | 1396736 | -| train/ | | -| approx_kl | 0.0002950565 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0816 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 109110 | -| policy_gradient_loss | 4.12e-05 | -| std | 0.0274 | -| value_loss | 3.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10913 | -| time_elapsed | 61157 | -| total_timesteps | 1396864 | -| train/ | | -| approx_kl | 0.0123861395 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 109120 | -| policy_gradient_loss | 0.00108 | -| std | 0.0274 | -| value_loss | 2.56e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 10914 | -| time_elapsed | 61160 | -| total_timesteps | 1396992 | -| train/ | | -| approx_kl | 0.00010295259 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 109130 | -| policy_gradient_loss | -0.00901 | -| std | 0.0273 | -| value_loss | 3.23e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10915 | -| time_elapsed | 61163 | -| total_timesteps | 1397120 | -| train/ | | -| approx_kl | 0.011572849 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 109140 | -| policy_gradient_loss | 0.00272 | -| std | 0.0273 | -| value_loss | 2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10916 | -| time_elapsed | 61173 | -| total_timesteps | 1397248 | -| train/ | | -| approx_kl | 0.018235244 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.257 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 109150 | -| policy_gradient_loss | -0.0113 | -| std | 0.0273 | -| value_loss | 0.00195 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10917 | -| time_elapsed | 61175 | -| total_timesteps | 1397376 | -| train/ | | -| approx_kl | 0.027476158 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 109160 | -| policy_gradient_loss | -0.00896 | -| std | 0.0273 | -| value_loss | 4.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10918 | -| time_elapsed | 61179 | -| total_timesteps | 1397504 | -| train/ | | -| approx_kl | 0.03010137 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 109170 | -| policy_gradient_loss | -0.0087 | -| std | 0.0273 | -| value_loss | 5.65e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10919 | -| time_elapsed | 61182 | -| total_timesteps | 1397632 | -| train/ | | -| approx_kl | 0.012980493 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -1.96 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 109180 | -| policy_gradient_loss | -0.00463 | -| std | 0.0273 | -| value_loss | 3.45e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10920 | -| time_elapsed | 61185 | -| total_timesteps | 1397760 | -| train/ | | -| approx_kl | 0.0112438 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.519 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 109190 | -| policy_gradient_loss | 0.000209 | -| std | 0.0273 | -| value_loss | 7.85e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 10921 | -| time_elapsed | 61188 | -| total_timesteps | 1397888 | -| train/ | | -| approx_kl | 0.021389505 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0867 | -| learning_rate | 0.0003 | -| loss | 0.00017 | -| n_updates | 109200 | -| policy_gradient_loss | -0.00171 | -| std | 0.0273 | -| value_loss | 1.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10922 | -| time_elapsed | 61191 | -| total_timesteps | 1398016 | -| train/ | | -| approx_kl | 0.004453654 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 109210 | -| policy_gradient_loss | -0.00047 | -| std | 0.0273 | -| value_loss | 3.4e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10923 | -| time_elapsed | 61199 | -| total_timesteps | 1398144 | -| train/ | | -| approx_kl | 0.14217961 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.867 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 109220 | -| policy_gradient_loss | 0.00386 | -| std | 0.0272 | -| value_loss | 0.00285 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10924 | -| time_elapsed | 61202 | -| total_timesteps | 1398272 | -| train/ | | -| approx_kl | 0.02311871 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | 0.0582 | -| learning_rate | 0.0003 | -| loss | 0.00823 | -| n_updates | 109230 | -| policy_gradient_loss | 0.00325 | -| std | 0.0272 | -| value_loss | 4.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10925 | -| time_elapsed | 61205 | -| total_timesteps | 1398400 | -| train/ | | -| approx_kl | 0.03233947 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.435 | -| learning_rate | 0.0003 | -| loss | 0.00357 | -| n_updates | 109240 | -| policy_gradient_loss | -0.00101 | -| std | 0.0272 | -| value_loss | 4.17e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10926 | -| time_elapsed | 61209 | -| total_timesteps | 1398528 | -| train/ | | -| approx_kl | 2.72654e-05 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.000822 | -| n_updates | 109250 | -| policy_gradient_loss | 0.00102 | -| std | 0.0272 | -| value_loss | 2.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10927 | -| time_elapsed | 61211 | -| total_timesteps | 1398656 | -| train/ | | -| approx_kl | 0.026713002 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | 0.000398 | -| n_updates | 109260 | -| policy_gradient_loss | -0.00202 | -| std | 0.0272 | -| value_loss | 1.76e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10928 | -| time_elapsed | 61213 | -| total_timesteps | 1398784 | -| train/ | | -| approx_kl | 0.00033629267 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | 0.000679 | -| n_updates | 109270 | -| policy_gradient_loss | 0.000987 | -| std | 0.0272 | -| value_loss | 2.02e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10929 | -| time_elapsed | 61216 | -| total_timesteps | 1398912 | -| train/ | | -| approx_kl | 0.0071884994 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -1.58 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 109280 | -| policy_gradient_loss | -0.000263 | -| std | 0.0272 | -| value_loss | 9.54e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10930 | -| time_elapsed | 61217 | -| total_timesteps | 1399040 | -| train/ | | -| approx_kl | 0.012311969 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.00066 | -| n_updates | 109290 | -| policy_gradient_loss | 0.00169 | -| std | 0.0272 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10931 | -| time_elapsed | 61225 | -| total_timesteps | 1399168 | -| train/ | | -| approx_kl | 0.0025675166 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -0.000704 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 109300 | -| policy_gradient_loss | -0.0081 | -| std | 0.0272 | -| value_loss | 0.00225 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10932 | -| time_elapsed | 61228 | -| total_timesteps | 1399296 | -| train/ | | -| approx_kl | 0.00095965574 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -6.32 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 109310 | -| policy_gradient_loss | -0.000466 | -| std | 0.0272 | -| value_loss | 7.99e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10933 | -| time_elapsed | 61231 | -| total_timesteps | 1399424 | -| train/ | | -| approx_kl | 0.026917648 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.18 | -| explained_variance | -86.4 | -| learning_rate | 0.0003 | -| loss | 0.000323 | -| n_updates | 109320 | -| policy_gradient_loss | -0.00126 | -| std | 0.0272 | -| value_loss | 2.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10934 | -| time_elapsed | 61234 | -| total_timesteps | 1399552 | -| train/ | | -| approx_kl | 0.011659973 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -2.69 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 109330 | -| policy_gradient_loss | 4.59e-05 | -| std | 0.0272 | -| value_loss | 6.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10935 | -| time_elapsed | 61238 | -| total_timesteps | 1399680 | -| train/ | | -| approx_kl | 0.012146204 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 109340 | -| policy_gradient_loss | -0.00292 | -| std | 0.0272 | -| value_loss | 1.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10936 | -| time_elapsed | 61241 | -| total_timesteps | 1399808 | -| train/ | | -| approx_kl | 6.357208e-05 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | 0.00451 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 109350 | -| policy_gradient_loss | 0.00317 | -| std | 0.0272 | -| value_loss | 1.75e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 22 | -| iterations | 10937 | -| time_elapsed | 61244 | -| total_timesteps | 1399936 | -| train/ | | -| approx_kl | 0.006732607 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.00361 | -| learning_rate | 0.0003 | -| loss | 0.00646 | -| n_updates | 109360 | -| policy_gradient_loss | 0.00387 | -| std | 0.0272 | -| value_loss | 1.31e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10938 | -| time_elapsed | 61248 | -| total_timesteps | 1400064 | -| train/ | | -| approx_kl | 0.00013947021 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | -0.000235 | -| n_updates | 109370 | -| policy_gradient_loss | -6.6e-05 | -| std | 0.0271 | -| value_loss | 4.65e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10939 | -| time_elapsed | 61253 | -| total_timesteps | 1400192 | -| train/ | | -| approx_kl | 0.003340642 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.00784 | -| n_updates | 109380 | -| policy_gradient_loss | -0.00485 | -| std | 0.0269 | -| value_loss | 0.00206 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10940 | -| time_elapsed | 61257 | -| total_timesteps | 1400320 | -| train/ | | -| approx_kl | 0.0033321711 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -9.69 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 109390 | -| policy_gradient_loss | -0.00864 | -| std | 0.0268 | -| value_loss | 4.21e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10941 | -| time_elapsed | 61261 | -| total_timesteps | 1400448 | -| train/ | | -| approx_kl | 0.030111223 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -7.93 | -| learning_rate | 0.0003 | -| loss | -0.000418 | -| n_updates | 109400 | -| policy_gradient_loss | -0.00394 | -| std | 0.0268 | -| value_loss | 1.41e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10942 | -| time_elapsed | 61265 | -| total_timesteps | 1400576 | -| train/ | | -| approx_kl | 0.019342575 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | 0.00304 | -| n_updates | 109410 | -| policy_gradient_loss | -9.42e-05 | -| std | 0.0268 | -| value_loss | 4.67e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10943 | -| time_elapsed | 61269 | -| total_timesteps | 1400704 | -| train/ | | -| approx_kl | 0.0006432147 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 109420 | -| policy_gradient_loss | -0.00464 | -| std | 0.0268 | -| value_loss | 5.31e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10944 | -| time_elapsed | 61271 | -| total_timesteps | 1400832 | -| train/ | | -| approx_kl | 0.0011269273 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | 0.000137 | -| n_updates | 109430 | -| policy_gradient_loss | 0.00336 | -| std | 0.0268 | -| value_loss | 1.24e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10945 | -| time_elapsed | 61275 | -| total_timesteps | 1400960 | -| train/ | | -| approx_kl | 0.014366753 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 109440 | -| policy_gradient_loss | 0.00801 | -| std | 0.0269 | -| value_loss | 0.00186 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10946 | -| time_elapsed | 61279 | -| total_timesteps | 1401088 | -| train/ | | -| approx_kl | 0.0013815863 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 109450 | -| policy_gradient_loss | 0.00408 | -| std | 0.0269 | -| value_loss | 0.000868 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10947 | -| time_elapsed | 61287 | -| total_timesteps | 1401216 | -| train/ | | -| approx_kl | 0.02303911 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 109460 | -| policy_gradient_loss | -0.0166 | -| std | 0.0269 | -| value_loss | 0.000325 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10948 | -| time_elapsed | 61290 | -| total_timesteps | 1401344 | -| train/ | | -| approx_kl | 0.022706352 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | 0.00579 | -| n_updates | 109470 | -| policy_gradient_loss | 0.000774 | -| std | 0.0269 | -| value_loss | 5.72e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10949 | -| time_elapsed | 61293 | -| total_timesteps | 1401472 | -| train/ | | -| approx_kl | 0.06976984 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.092 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 109480 | -| policy_gradient_loss | 0.0119 | -| std | 0.0269 | -| value_loss | 1.87e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10950 | -| time_elapsed | 61295 | -| total_timesteps | 1401600 | -| train/ | | -| approx_kl | 0.013729977 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 109490 | -| policy_gradient_loss | 0.00778 | -| std | 0.027 | -| value_loss | 2.93e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10951 | -| time_elapsed | 61298 | -| total_timesteps | 1401728 | -| train/ | | -| approx_kl | 6.31162e-05 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.000943 | -| n_updates | 109500 | -| policy_gradient_loss | -0.00408 | -| std | 0.027 | -| value_loss | 1.33e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10952 | -| time_elapsed | 61301 | -| total_timesteps | 1401856 | -| train/ | | -| approx_kl | 0.020809155 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.0782 | -| learning_rate | 0.0003 | -| loss | 0.00597 | -| n_updates | 109510 | -| policy_gradient_loss | -0.00115 | -| std | 0.027 | -| value_loss | 1.56e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 10953 | -| time_elapsed | 61304 | -| total_timesteps | 1401984 | -| train/ | | -| approx_kl | 0.025007367 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | 0.00494 | -| learning_rate | 0.0003 | -| loss | 0.00517 | -| n_updates | 109520 | -| policy_gradient_loss | -0.00152 | -| std | 0.027 | -| value_loss | 7.87e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10954 | -| time_elapsed | 61307 | -| total_timesteps | 1402112 | -| train/ | | -| approx_kl | 0.00784569 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | 0.00289 | -| learning_rate | 0.0003 | -| loss | -0.000888 | -| n_updates | 109530 | -| policy_gradient_loss | -0.00017 | -| std | 0.027 | -| value_loss | 1.23e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10955 | -| time_elapsed | 61316 | -| total_timesteps | 1402240 | -| train/ | | -| approx_kl | 0.027010664 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.931 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 109540 | -| policy_gradient_loss | -0.0112 | -| std | 0.027 | -| value_loss | 0.00344 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10956 | -| time_elapsed | 61320 | -| total_timesteps | 1402368 | -| train/ | | -| approx_kl | 1.0105781e-05 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.000409 | -| n_updates | 109550 | -| policy_gradient_loss | -0.00115 | -| std | 0.027 | -| value_loss | 6.13e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10957 | -| time_elapsed | 61323 | -| total_timesteps | 1402496 | -| train/ | | -| approx_kl | 0.006178257 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -8.03 | -| learning_rate | 0.0003 | -| loss | 0.00589 | -| n_updates | 109560 | -| policy_gradient_loss | 0.00483 | -| std | 0.027 | -| value_loss | 1.92e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10958 | -| time_elapsed | 61327 | -| total_timesteps | 1402624 | -| train/ | | -| approx_kl | 1.3330951e-05 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -1.22 | -| learning_rate | 0.0003 | -| loss | -0.000359 | -| n_updates | 109570 | -| policy_gradient_loss | 0.00744 | -| std | 0.027 | -| value_loss | 5.34e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10959 | -| time_elapsed | 61330 | -| total_timesteps | 1402752 | -| train/ | | -| approx_kl | 0.01624487 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.604 | -| learning_rate | 0.0003 | -| loss | 0.00721 | -| n_updates | 109580 | -| policy_gradient_loss | 0.00146 | -| std | 0.027 | -| value_loss | 1.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 10960 | -| time_elapsed | 61334 | -| total_timesteps | 1402880 | -| train/ | | -| approx_kl | 0.009788232 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.19 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 109590 | -| policy_gradient_loss | 0.00712 | -| std | 0.0269 | -| value_loss | 4.34e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10961 | -| time_elapsed | 61337 | -| total_timesteps | 1403008 | -| train/ | | -| approx_kl | 0.0085616745 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 109600 | -| policy_gradient_loss | 0.00661 | -| std | 0.0269 | -| value_loss | 5.08e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10962 | -| time_elapsed | 61347 | -| total_timesteps | 1403136 | -| train/ | | -| approx_kl | 0.00080204196 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -1.54 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 109610 | -| policy_gradient_loss | -0.014 | -| std | 0.0269 | -| value_loss | 0.0031 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10963 | -| time_elapsed | 61350 | -| total_timesteps | 1403264 | -| train/ | | -| approx_kl | 5.5879354e-08 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.0472 | -| learning_rate | 0.0003 | -| loss | 0.000221 | -| n_updates | 109620 | -| policy_gradient_loss | 0.00527 | -| std | 0.0269 | -| value_loss | 0.000427 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10964 | -| time_elapsed | 61353 | -| total_timesteps | 1403392 | -| train/ | | -| approx_kl | 0.036470626 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -4.84 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 109630 | -| policy_gradient_loss | -0.015 | -| std | 0.0269 | -| value_loss | 3.23e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10965 | -| time_elapsed | 61357 | -| total_timesteps | 1403520 | -| train/ | | -| approx_kl | 0.0029126317 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 109640 | -| policy_gradient_loss | -0.00037 | -| std | 0.0269 | -| value_loss | 3.01e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10966 | -| time_elapsed | 61359 | -| total_timesteps | 1403648 | -| train/ | | -| approx_kl | 0.0017821053 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.00442 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 109650 | -| policy_gradient_loss | 0.00139 | -| std | 0.0269 | -| value_loss | 4.12e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10967 | -| time_elapsed | 61363 | -| total_timesteps | 1403776 | -| train/ | | -| approx_kl | 0.004256364 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0902 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 109660 | -| policy_gradient_loss | -0.00713 | -| std | 0.0269 | -| value_loss | 3.33e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 10968 | -| time_elapsed | 61367 | -| total_timesteps | 1403904 | -| train/ | | -| approx_kl | 0.0054585123 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.00502 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 109670 | -| policy_gradient_loss | -0.00121 | -| std | 0.0269 | -| value_loss | 3.68e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10969 | -| time_elapsed | 61370 | -| total_timesteps | 1404032 | -| train/ | | -| approx_kl | 0.0032634283 | -| clip_fraction | 0.00781 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.000136 | -| n_updates | 109680 | -| policy_gradient_loss | -0.000102 | -| std | 0.0269 | -| value_loss | 1.53e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10970 | -| time_elapsed | 61377 | -| total_timesteps | 1404160 | -| train/ | | -| approx_kl | 0.0009134882 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 109690 | -| policy_gradient_loss | -0.012 | -| std | 0.0268 | -| value_loss | 0.00055 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10971 | -| time_elapsed | 61380 | -| total_timesteps | 1404288 | -| train/ | | -| approx_kl | 0.00941056 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.0058 | -| n_updates | 109700 | -| policy_gradient_loss | 0.00966 | -| std | 0.0267 | -| value_loss | 1.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10972 | -| time_elapsed | 61383 | -| total_timesteps | 1404416 | -| train/ | | -| approx_kl | 0.025867714 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -34.9 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 109710 | -| policy_gradient_loss | -0.0126 | -| std | 0.0267 | -| value_loss | 3.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10973 | -| time_elapsed | 61387 | -| total_timesteps | 1404544 | -| train/ | | -| approx_kl | 0.00249882 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.00946 | -| n_updates | 109720 | -| policy_gradient_loss | -0.00427 | -| std | 0.0267 | -| value_loss | 1.86e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10974 | -| time_elapsed | 61390 | -| total_timesteps | 1404672 | -| train/ | | -| approx_kl | 0.005829152 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.00151 | -| learning_rate | 0.0003 | -| loss | -0.00845 | -| n_updates | 109730 | -| policy_gradient_loss | -0.00385 | -| std | 0.0267 | -| value_loss | 4.28e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10975 | -| time_elapsed | 61394 | -| total_timesteps | 1404800 | -| train/ | | -| approx_kl | 0.0023029959 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.00933 | -| learning_rate | 0.0003 | -| loss | -0.00431 | -| n_updates | 109740 | -| policy_gradient_loss | 0.00603 | -| std | 0.0267 | -| value_loss | 4.59e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 22 | -| iterations | 10976 | -| time_elapsed | 61396 | -| total_timesteps | 1404928 | -| train/ | | -| approx_kl | 0.0034361933 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 109750 | -| policy_gradient_loss | -0.00238 | -| std | 0.0267 | -| value_loss | 2.3e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10977 | -| time_elapsed | 61398 | -| total_timesteps | 1405056 | -| train/ | | -| approx_kl | 0.00042329542 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 109760 | -| policy_gradient_loss | -0.00105 | -| std | 0.0267 | -| value_loss | 5.85e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10978 | -| time_elapsed | 61405 | -| total_timesteps | 1405184 | -| train/ | | -| approx_kl | 0.01513715 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 109770 | -| policy_gradient_loss | -0.00848 | -| std | 0.0267 | -| value_loss | 0.00434 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10979 | -| time_elapsed | 61409 | -| total_timesteps | 1405312 | -| train/ | | -| approx_kl | 0.00014448818 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.000856 | -| n_updates | 109780 | -| policy_gradient_loss | -0.0018 | -| std | 0.0267 | -| value_loss | 8.69e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10980 | -| time_elapsed | 61414 | -| total_timesteps | 1405440 | -| train/ | | -| approx_kl | 0.025569662 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.78 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 109790 | -| policy_gradient_loss | 0.00201 | -| std | 0.0267 | -| value_loss | 6.97e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10981 | -| time_elapsed | 61417 | -| total_timesteps | 1405568 | -| train/ | | -| approx_kl | 4.3486245e-05 | -| clip_fraction | 0.00313 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | 5.6e-05 | -| n_updates | 109800 | -| policy_gradient_loss | -8.6e-05 | -| std | 0.0267 | -| value_loss | 7.12e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10982 | -| time_elapsed | 61421 | -| total_timesteps | 1405696 | -| train/ | | -| approx_kl | 0.0011367584 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | 0.00485 | -| n_updates | 109810 | -| policy_gradient_loss | 0.000849 | -| std | 0.0267 | -| value_loss | 3.1e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10983 | -| time_elapsed | 61424 | -| total_timesteps | 1405824 | -| train/ | | -| approx_kl | 0.0012419452 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 109820 | -| policy_gradient_loss | -0.00325 | -| std | 0.0267 | -| value_loss | 1.97e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 10984 | -| time_elapsed | 61427 | -| total_timesteps | 1405952 | -| train/ | | -| approx_kl | 7.140217e-05 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.00705 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 109830 | -| policy_gradient_loss | -0.00312 | -| std | 0.0267 | -| value_loss | 1.25e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10985 | -| time_elapsed | 61430 | -| total_timesteps | 1406080 | -| train/ | | -| approx_kl | 8.0205034e-05 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.00441 | -| learning_rate | 0.0003 | -| loss | -0.000876 | -| n_updates | 109840 | -| policy_gradient_loss | -0.000235 | -| std | 0.0267 | -| value_loss | 1.78e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10986 | -| time_elapsed | 61436 | -| total_timesteps | 1406208 | -| train/ | | -| approx_kl | 0.005630895 | -| clip_fraction | 0.0328 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | 0.805 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 109850 | -| policy_gradient_loss | -0.00944 | -| std | 0.0267 | -| value_loss | 0.0035 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10987 | -| time_elapsed | 61439 | -| total_timesteps | 1406336 | -| train/ | | -| approx_kl | 0.0048401807 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 109860 | -| policy_gradient_loss | 0.000248 | -| std | 0.0268 | -| value_loss | 0.000272 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10988 | -| time_elapsed | 61443 | -| total_timesteps | 1406464 | -| train/ | | -| approx_kl | 0.00061428035 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -2.86 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 109870 | -| policy_gradient_loss | -0.000856 | -| std | 0.0268 | -| value_loss | 0.000394 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10989 | -| time_elapsed | 61447 | -| total_timesteps | 1406592 | -| train/ | | -| approx_kl | 0.0047028544 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -74.6 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 109880 | -| policy_gradient_loss | -0.000148 | -| std | 0.0267 | -| value_loss | 6.77e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10990 | -| time_elapsed | 61451 | -| total_timesteps | 1406720 | -| train/ | | -| approx_kl | 0.03471911 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.2 | -| explained_variance | -0.294 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 109890 | -| policy_gradient_loss | 0.00203 | -| std | 0.0267 | -| value_loss | 0.00194 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10991 | -| time_elapsed | 61455 | -| total_timesteps | 1406848 | -| train/ | | -| approx_kl | 0.0002846308 | -| clip_fraction | 0.0141 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.000677 | -| n_updates | 109900 | -| policy_gradient_loss | -0.000191 | -| std | 0.0266 | -| value_loss | 0.000271 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 10992 | -| time_elapsed | 61458 | -| total_timesteps | 1406976 | -| train/ | | -| approx_kl | 0.00010307366 | -| clip_fraction | 0.00469 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | -0.000189 | -| n_updates | 109910 | -| policy_gradient_loss | -0.00182 | -| std | 0.0265 | -| value_loss | 0.00151 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10993 | -| time_elapsed | 61462 | -| total_timesteps | 1407104 | -| train/ | | -| approx_kl | 0.0020063487 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.00822 | -| learning_rate | 0.0003 | -| loss | 0.00296 | -| n_updates | 109920 | -| policy_gradient_loss | 0.00392 | -| std | 0.0264 | -| value_loss | 0.00105 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10994 | -| time_elapsed | 61471 | -| total_timesteps | 1407232 | -| train/ | | -| approx_kl | 0.0004035649 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 109930 | -| policy_gradient_loss | -0.0028 | -| std | 0.0264 | -| value_loss | 0.000737 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10995 | -| time_elapsed | 61474 | -| total_timesteps | 1407360 | -| train/ | | -| approx_kl | 0.0010446673 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 109940 | -| policy_gradient_loss | 0.000401 | -| std | 0.0264 | -| value_loss | 0.000152 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10996 | -| time_elapsed | 61478 | -| total_timesteps | 1407488 | -| train/ | | -| approx_kl | 0.012577605 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.00735 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 109950 | -| policy_gradient_loss | -0.0014 | -| std | 0.0264 | -| value_loss | 9.86e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10997 | -| time_elapsed | 61480 | -| total_timesteps | 1407616 | -| train/ | | -| approx_kl | 0.00081681134 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0691 | -| learning_rate | 0.0003 | -| loss | 0.00355 | -| n_updates | 109960 | -| policy_gradient_loss | 0.00955 | -| std | 0.0264 | -| value_loss | 6.98e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10998 | -| time_elapsed | 61484 | -| total_timesteps | 1407744 | -| train/ | | -| approx_kl | 0.0017786673 | -| clip_fraction | 0.0359 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.00315 | -| n_updates | 109970 | -| policy_gradient_loss | -0.00166 | -| std | 0.0264 | -| value_loss | 4.31e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 10999 | -| time_elapsed | 61486 | -| total_timesteps | 1407872 | -| train/ | | -| approx_kl | 0.0037776702 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 109980 | -| policy_gradient_loss | -0.00318 | -| std | 0.0264 | -| value_loss | 3.46e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11000 | -| time_elapsed | 61488 | -| total_timesteps | 1408000 | -| train/ | | -| approx_kl | 0.012206994 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0643 | -| learning_rate | 0.0003 | -| loss | 0.000207 | -| n_updates | 109990 | -| policy_gradient_loss | -0.000615 | -| std | 0.0264 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11001 | -| time_elapsed | 61490 | -| total_timesteps | 1408128 | -| train/ | | -| approx_kl | 0.004675898 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.00445 | -| learning_rate | 0.0003 | -| loss | -0.00062 | -| n_updates | 110000 | -| policy_gradient_loss | 0.0036 | -| std | 0.0265 | -| value_loss | 5.32e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11002 | -| time_elapsed | 61496 | -| total_timesteps | 1408256 | -| train/ | | -| approx_kl | 0.0020287079 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -9.04 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 110010 | -| policy_gradient_loss | -0.00911 | -| std | 0.0265 | -| value_loss | 0.00388 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11003 | -| time_elapsed | 61500 | -| total_timesteps | 1408384 | -| train/ | | -| approx_kl | 0.007924221 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 110020 | -| policy_gradient_loss | 0.00692 | -| std | 0.0265 | -| value_loss | 9.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11004 | -| time_elapsed | 61503 | -| total_timesteps | 1408512 | -| train/ | | -| approx_kl | 0.008394673 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 110030 | -| policy_gradient_loss | -0.000567 | -| std | 0.0265 | -| value_loss | 0.000149 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11005 | -| time_elapsed | 61508 | -| total_timesteps | 1408640 | -| train/ | | -| approx_kl | 0.005896508 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | 0.00819 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 110040 | -| policy_gradient_loss | 0.00137 | -| std | 0.0265 | -| value_loss | 5.75e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11006 | -| time_elapsed | 61511 | -| total_timesteps | 1408768 | -| train/ | | -| approx_kl | 0.0051764036 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | 0.00884 | -| learning_rate | 0.0003 | -| loss | 0.00864 | -| n_updates | 110050 | -| policy_gradient_loss | 0.01 | -| std | 0.0265 | -| value_loss | 5.69e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11007 | -| time_elapsed | 61514 | -| total_timesteps | 1408896 | -| train/ | | -| approx_kl | 0.013983186 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.00335 | -| n_updates | 110060 | -| policy_gradient_loss | 0.00176 | -| std | 0.0265 | -| value_loss | 1.96e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11008 | -| time_elapsed | 61517 | -| total_timesteps | 1409024 | -| train/ | | -| approx_kl | 0.042861704 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 110070 | -| policy_gradient_loss | -0.00737 | -| std | 0.0265 | -| value_loss | 2.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11009 | -| time_elapsed | 61526 | -| total_timesteps | 1409152 | -| train/ | | -| approx_kl | 0.028022204 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 110080 | -| policy_gradient_loss | -0.011 | -| std | 0.0265 | -| value_loss | 0.0016 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11010 | -| time_elapsed | 61530 | -| total_timesteps | 1409280 | -| train/ | | -| approx_kl | 0.033759065 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.00153 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 110090 | -| policy_gradient_loss | 0.00236 | -| std | 0.0265 | -| value_loss | 1.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11011 | -| time_elapsed | 61532 | -| total_timesteps | 1409408 | -| train/ | | -| approx_kl | 0.006979709 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 110100 | -| policy_gradient_loss | 0.00204 | -| std | 0.0265 | -| value_loss | 1.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11012 | -| time_elapsed | 61535 | -| total_timesteps | 1409536 | -| train/ | | -| approx_kl | 0.004115766 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 110110 | -| policy_gradient_loss | -0.00148 | -| std | 0.0264 | -| value_loss | 4.15e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11013 | -| time_elapsed | 61537 | -| total_timesteps | 1409664 | -| train/ | | -| approx_kl | 0.00079441816 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.21 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 110120 | -| policy_gradient_loss | -0.00479 | -| std | 0.0264 | -| value_loss | 7.9e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11014 | -| time_elapsed | 61539 | -| total_timesteps | 1409792 | -| train/ | | -| approx_kl | 8.294592e-05 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.00287 | -| n_updates | 110130 | -| policy_gradient_loss | -0.0127 | -| std | 0.0264 | -| value_loss | 1.79e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 22 | -| iterations | 11015 | -| time_elapsed | 61542 | -| total_timesteps | 1409920 | -| train/ | | -| approx_kl | 0.00261159 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 110140 | -| policy_gradient_loss | -0.00738 | -| std | 0.0263 | -| value_loss | 1.36e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11016 | -| time_elapsed | 61545 | -| total_timesteps | 1410048 | -| train/ | | -| approx_kl | 0.0063590263 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 110150 | -| policy_gradient_loss | -0.00562 | -| std | 0.0263 | -| value_loss | 9.04e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11017 | -| time_elapsed | 61551 | -| total_timesteps | 1410176 | -| train/ | | -| approx_kl | 0.028418712 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.418 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 110160 | -| policy_gradient_loss | -0.0157 | -| std | 0.0263 | -| value_loss | 0.00116 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11018 | -| time_elapsed | 61556 | -| total_timesteps | 1410304 | -| train/ | | -| approx_kl | 0.004491708 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -7.83 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 110170 | -| policy_gradient_loss | 0.00569 | -| std | 0.0263 | -| value_loss | 7.76e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11019 | -| time_elapsed | 61561 | -| total_timesteps | 1410432 | -| train/ | | -| approx_kl | 0.0015506535 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.00788 | -| n_updates | 110180 | -| policy_gradient_loss | -0.0111 | -| std | 0.0263 | -| value_loss | 1.75e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11020 | -| time_elapsed | 61564 | -| total_timesteps | 1410560 | -| train/ | | -| approx_kl | 0.0008689123 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 110190 | -| policy_gradient_loss | -0.00633 | -| std | 0.0263 | -| value_loss | 2.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11021 | -| time_elapsed | 61567 | -| total_timesteps | 1410688 | -| train/ | | -| approx_kl | 0.027674917 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -7.96 | -| learning_rate | 0.0003 | -| loss | 9.84e-05 | -| n_updates | 110200 | -| policy_gradient_loss | -0.000843 | -| std | 0.0263 | -| value_loss | 2.36e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11022 | -| time_elapsed | 61570 | -| total_timesteps | 1410816 | -| train/ | | -| approx_kl | 0.010297598 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.0341 | -| n_updates | 110210 | -| policy_gradient_loss | -0.0269 | -| std | 0.0263 | -| value_loss | 1.1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11023 | -| time_elapsed | 61574 | -| total_timesteps | 1410944 | -| train/ | | -| approx_kl | 0.031282842 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | -0.0062 | -| n_updates | 110220 | -| policy_gradient_loss | -0.0085 | -| std | 0.0263 | -| value_loss | 2.97e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11024 | -| time_elapsed | 61577 | -| total_timesteps | 1411072 | -| train/ | | -| approx_kl | 0.00890221 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.00588 | -| n_updates | 110230 | -| policy_gradient_loss | -0.00469 | -| std | 0.0263 | -| value_loss | 2.11e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11025 | -| time_elapsed | 61583 | -| total_timesteps | 1411200 | -| train/ | | -| approx_kl | 0.0018679746 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.00888 | -| n_updates | 110240 | -| policy_gradient_loss | -0.00324 | -| std | 0.0263 | -| value_loss | 0.000558 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11026 | -| time_elapsed | 61587 | -| total_timesteps | 1411328 | -| train/ | | -| approx_kl | 0.00590155 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.455 | -| learning_rate | 0.0003 | -| loss | -0.000995 | -| n_updates | 110250 | -| policy_gradient_loss | 0.000216 | -| std | 0.0263 | -| value_loss | 1.47e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11027 | -| time_elapsed | 61591 | -| total_timesteps | 1411456 | -| train/ | | -| approx_kl | 0.008627614 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00186 | -| n_updates | 110260 | -| policy_gradient_loss | 0.000953 | -| std | 0.0263 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11028 | -| time_elapsed | 61596 | -| total_timesteps | 1411584 | -| train/ | | -| approx_kl | 0.003974332 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | -0.000545 | -| n_updates | 110270 | -| policy_gradient_loss | 0.000528 | -| std | 0.0263 | -| value_loss | 8.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11029 | -| time_elapsed | 61599 | -| total_timesteps | 1411712 | -| train/ | | -| approx_kl | 0.007884622 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.00593 | -| learning_rate | 0.0003 | -| loss | -0.000524 | -| n_updates | 110280 | -| policy_gradient_loss | 0.000781 | -| std | 0.0263 | -| value_loss | 1.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11030 | -| time_elapsed | 61603 | -| total_timesteps | 1411840 | -| train/ | | -| approx_kl | 0.025837194 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 110290 | -| policy_gradient_loss | -0.00952 | -| std | 0.0263 | -| value_loss | 5.67e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 22 | -| iterations | 11031 | -| time_elapsed | 61605 | -| total_timesteps | 1411968 | -| train/ | | -| approx_kl | 0.011930434 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.00349 | -| learning_rate | 0.0003 | -| loss | -0.000813 | -| n_updates | 110300 | -| policy_gradient_loss | -0.00199 | -| std | 0.0263 | -| value_loss | 2.11e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11032 | -| time_elapsed | 61608 | -| total_timesteps | 1412096 | -| train/ | | -| approx_kl | 0.00018112408 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.000193 | -| n_updates | 110310 | -| policy_gradient_loss | 7.89e-05 | -| std | 0.0262 | -| value_loss | 1.03e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11033 | -| time_elapsed | 61615 | -| total_timesteps | 1412224 | -| train/ | | -| approx_kl | 0.0055547524 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.844 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 110320 | -| policy_gradient_loss | -0.00493 | -| std | 0.0262 | -| value_loss | 0.00231 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11034 | -| time_elapsed | 61619 | -| total_timesteps | 1412352 | -| train/ | | -| approx_kl | 0.0015059663 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | -0.00624 | -| n_updates | 110330 | -| policy_gradient_loss | -0.00302 | -| std | 0.0261 | -| value_loss | 7.88e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11035 | -| time_elapsed | 61622 | -| total_timesteps | 1412480 | -| train/ | | -| approx_kl | 0.01804167 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.00369 | -| n_updates | 110340 | -| policy_gradient_loss | 0.00337 | -| std | 0.0261 | -| value_loss | 7.69e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11036 | -| time_elapsed | 61623 | -| total_timesteps | 1412608 | -| train/ | | -| approx_kl | 0.002722918 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 110350 | -| policy_gradient_loss | -0.00771 | -| std | 0.0261 | -| value_loss | 6.5e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11037 | -| time_elapsed | 61625 | -| total_timesteps | 1412736 | -| train/ | | -| approx_kl | 0.0004193196 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.068 | -| learning_rate | 0.0003 | -| loss | -0.000506 | -| n_updates | 110360 | -| policy_gradient_loss | 0.00181 | -| std | 0.0262 | -| value_loss | 3.63e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11038 | -| time_elapsed | 61628 | -| total_timesteps | 1412864 | -| train/ | | -| approx_kl | 0.00028177258 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.00303 | -| n_updates | 110370 | -| policy_gradient_loss | 0.00778 | -| std | 0.0262 | -| value_loss | 9.58e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11039 | -| time_elapsed | 61631 | -| total_timesteps | 1412992 | -| train/ | | -| approx_kl | 0.02160919 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.00266 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 110380 | -| policy_gradient_loss | -0.0043 | -| std | 0.0262 | -| value_loss | 5.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11040 | -| time_elapsed | 61634 | -| total_timesteps | 1413120 | -| train/ | | -| approx_kl | 0.013203079 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 110390 | -| policy_gradient_loss | 0.00354 | -| std | 0.0262 | -| value_loss | 1.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11041 | -| time_elapsed | 61644 | -| total_timesteps | 1413248 | -| train/ | | -| approx_kl | 0.041069757 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.749 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 110400 | -| policy_gradient_loss | -0.00524 | -| std | 0.0262 | -| value_loss | 0.00557 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11042 | -| time_elapsed | 61647 | -| total_timesteps | 1413376 | -| train/ | | -| approx_kl | 0.019275999 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.00503 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 110410 | -| policy_gradient_loss | -0.00658 | -| std | 0.0262 | -| value_loss | 2.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11043 | -| time_elapsed | 61651 | -| total_timesteps | 1413504 | -| train/ | | -| approx_kl | 0.003227755 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 110420 | -| policy_gradient_loss | 0.00305 | -| std | 0.0262 | -| value_loss | 4.61e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11044 | -| time_elapsed | 61654 | -| total_timesteps | 1413632 | -| train/ | | -| approx_kl | 4.2375177e-08 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 3.17e-05 | -| n_updates | 110430 | -| policy_gradient_loss | 0.00962 | -| std | 0.0262 | -| value_loss | 3e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11045 | -| time_elapsed | 61658 | -| total_timesteps | 1413760 | -| train/ | | -| approx_kl | 0.00032244856 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | -0.000903 | -| n_updates | 110440 | -| policy_gradient_loss | 0.00886 | -| std | 0.0262 | -| value_loss | 1.22e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 22 | -| iterations | 11046 | -| time_elapsed | 61661 | -| total_timesteps | 1413888 | -| train/ | | -| approx_kl | 0.03032925 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0719 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 110450 | -| policy_gradient_loss | -0.0116 | -| std | 0.0262 | -| value_loss | 9.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11047 | -| time_elapsed | 61664 | -| total_timesteps | 1414016 | -| train/ | | -| approx_kl | 0.02217483 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.00616 | -| n_updates | 110460 | -| policy_gradient_loss | -0.000879 | -| std | 0.0262 | -| value_loss | 4.64e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11048 | -| time_elapsed | 61674 | -| total_timesteps | 1414144 | -| train/ | | -| approx_kl | 0.019855501 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -2.88 | -| learning_rate | 0.0003 | -| loss | -0.00617 | -| n_updates | 110470 | -| policy_gradient_loss | -0.00982 | -| std | 0.0263 | -| value_loss | 0.00268 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11049 | -| time_elapsed | 61677 | -| total_timesteps | 1414272 | -| train/ | | -| approx_kl | 0.017624501 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0696 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 110480 | -| policy_gradient_loss | -0.00966 | -| std | 0.0263 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11050 | -| time_elapsed | 61681 | -| total_timesteps | 1414400 | -| train/ | | -| approx_kl | 0.047011413 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -29.3 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 110490 | -| policy_gradient_loss | -0.00499 | -| std | 0.0263 | -| value_loss | 5.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11051 | -| time_elapsed | 61684 | -| total_timesteps | 1414528 | -| train/ | | -| approx_kl | 0.024642847 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -4.46 | -| learning_rate | 0.0003 | -| loss | -0.00611 | -| n_updates | 110500 | -| policy_gradient_loss | -0.00133 | -| std | 0.0263 | -| value_loss | 1.16e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11052 | -| time_elapsed | 61687 | -| total_timesteps | 1414656 | -| train/ | | -| approx_kl | 0.02259346 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.541 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 110510 | -| policy_gradient_loss | 0.000885 | -| std | 0.0263 | -| value_loss | 2.6e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11053 | -| time_elapsed | 61690 | -| total_timesteps | 1414784 | -| train/ | | -| approx_kl | 9.0165995e-06 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0092 | -| learning_rate | 0.0003 | -| loss | 2.49e-05 | -| n_updates | 110520 | -| policy_gradient_loss | 0.00829 | -| std | 0.0263 | -| value_loss | 8.05e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 22 | -| iterations | 11054 | -| time_elapsed | 61694 | -| total_timesteps | 1414912 | -| train/ | | -| approx_kl | 0.011508275 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.00861 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 110530 | -| policy_gradient_loss | 0.00185 | -| std | 0.0263 | -| value_loss | 1.56e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11055 | -| time_elapsed | 61697 | -| total_timesteps | 1415040 | -| train/ | | -| approx_kl | 0.0013997401 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0715 | -| learning_rate | 0.0003 | -| loss | 0.0071 | -| n_updates | 110540 | -| policy_gradient_loss | 0.000111 | -| std | 0.0263 | -| value_loss | 1.37e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11056 | -| time_elapsed | 61703 | -| total_timesteps | 1415168 | -| train/ | | -| approx_kl | 0.0016353852 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | 0.726 | -| learning_rate | 0.0003 | -| loss | 0.0089 | -| n_updates | 110550 | -| policy_gradient_loss | -0.00584 | -| std | 0.0263 | -| value_loss | 0.00669 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11057 | -| time_elapsed | 61706 | -| total_timesteps | 1415296 | -| train/ | | -| approx_kl | 0.01645525 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 110560 | -| policy_gradient_loss | -0.00674 | -| std | 0.0263 | -| value_loss | 3.59e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11058 | -| time_elapsed | 61709 | -| total_timesteps | 1415424 | -| train/ | | -| approx_kl | 0.007438032 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.000562 | -| n_updates | 110570 | -| policy_gradient_loss | 0.00435 | -| std | 0.0263 | -| value_loss | 5.43e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11059 | -| time_elapsed | 61712 | -| total_timesteps | 1415552 | -| train/ | | -| approx_kl | 4.7297217e-06 | -| clip_fraction | 0.0219 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.00797 | -| learning_rate | 0.0003 | -| loss | -0.000181 | -| n_updates | 110580 | -| policy_gradient_loss | -9.06e-06 | -| std | 0.0262 | -| value_loss | 8.79e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11060 | -| time_elapsed | 61715 | -| total_timesteps | 1415680 | -| train/ | | -| approx_kl | 0.02070456 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.22 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00924 | -| n_updates | 110590 | -| policy_gradient_loss | 0.00396 | -| std | 0.0261 | -| value_loss | 2.33e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11061 | -| time_elapsed | 61719 | -| total_timesteps | 1415808 | -| train/ | | -| approx_kl | 0.015951373 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.00753 | -| learning_rate | 0.0003 | -| loss | 0.00723 | -| n_updates | 110600 | -| policy_gradient_loss | 0.00227 | -| std | 0.0261 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 22 | -| iterations | 11062 | -| time_elapsed | 61723 | -| total_timesteps | 1415936 | -| train/ | | -| approx_kl | 0.020720923 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.00187 | -| n_updates | 110610 | -| policy_gradient_loss | -0.000407 | -| std | 0.0261 | -| value_loss | 4.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11063 | -| time_elapsed | 61726 | -| total_timesteps | 1416064 | -| train/ | | -| approx_kl | 0.000228283 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 110620 | -| policy_gradient_loss | -0.00734 | -| std | 0.0261 | -| value_loss | 1.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11064 | -| time_elapsed | 61732 | -| total_timesteps | 1416192 | -| train/ | | -| approx_kl | 0.055581987 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.715 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 110630 | -| policy_gradient_loss | -0.0112 | -| std | 0.0261 | -| value_loss | 0.000733 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11065 | -| time_elapsed | 61736 | -| total_timesteps | 1416320 | -| train/ | | -| approx_kl | 0.0048623187 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.00582 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 110640 | -| policy_gradient_loss | 0.00909 | -| std | 0.0261 | -| value_loss | 3.94e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11066 | -| time_elapsed | 61740 | -| total_timesteps | 1416448 | -| train/ | | -| approx_kl | 0.0006007594 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.00249 | -| n_updates | 110650 | -| policy_gradient_loss | 0.00206 | -| std | 0.0261 | -| value_loss | 8.81e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11067 | -| time_elapsed | 61741 | -| total_timesteps | 1416576 | -| train/ | | -| approx_kl | 0.00090770517 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.0079 | -| learning_rate | 0.0003 | -| loss | 0.000777 | -| n_updates | 110660 | -| policy_gradient_loss | 0.0136 | -| std | 0.026 | -| value_loss | 1.98e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11068 | -| time_elapsed | 61743 | -| total_timesteps | 1416704 | -| train/ | | -| approx_kl | 0.16098952 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0064 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 110670 | -| policy_gradient_loss | 0.0365 | -| std | 0.0261 | -| value_loss | 1.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11069 | -| time_elapsed | 61745 | -| total_timesteps | 1416832 | -| train/ | | -| approx_kl | 0.031048061 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.00549 | -| learning_rate | 0.0003 | -| loss | 0.00894 | -| n_updates | 110680 | -| policy_gradient_loss | 0.000545 | -| std | 0.0261 | -| value_loss | 2.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 22 | -| iterations | 11070 | -| time_elapsed | 61748 | -| total_timesteps | 1416960 | -| train/ | | -| approx_kl | 0.012801111 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.00769 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 110690 | -| policy_gradient_loss | 0.00816 | -| std | 0.0261 | -| value_loss | 2.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11071 | -| time_elapsed | 61751 | -| total_timesteps | 1417088 | -| train/ | | -| approx_kl | 0.004977728 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 110700 | -| policy_gradient_loss | 0.00851 | -| std | 0.0261 | -| value_loss | 4.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11072 | -| time_elapsed | 61758 | -| total_timesteps | 1417216 | -| train/ | | -| approx_kl | 0.007623673 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 110710 | -| policy_gradient_loss | -0.00412 | -| std | 0.026 | -| value_loss | 0.00284 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11073 | -| time_elapsed | 61762 | -| total_timesteps | 1417344 | -| train/ | | -| approx_kl | 0.004662635 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -26.8 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 110720 | -| policy_gradient_loss | -0.00185 | -| std | 0.026 | -| value_loss | 4.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11074 | -| time_elapsed | 61767 | -| total_timesteps | 1417472 | -| train/ | | -| approx_kl | 0.01762525 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 110730 | -| policy_gradient_loss | -0.00704 | -| std | 0.026 | -| value_loss | 2.08e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11075 | -| time_elapsed | 61771 | -| total_timesteps | 1417600 | -| train/ | | -| approx_kl | 0.0022730716 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -120 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 110740 | -| policy_gradient_loss | -0.0101 | -| std | 0.026 | -| value_loss | 2.69e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11076 | -| time_elapsed | 61775 | -| total_timesteps | 1417728 | -| train/ | | -| approx_kl | 2.2654422e-06 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -245 | -| learning_rate | 0.0003 | -| loss | 0.00031 | -| n_updates | 110750 | -| policy_gradient_loss | -0.000391 | -| std | 0.026 | -| value_loss | 1.42e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11077 | -| time_elapsed | 61779 | -| total_timesteps | 1417856 | -| train/ | | -| approx_kl | 0.00028244965 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -4.46 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 110760 | -| policy_gradient_loss | -2.08e-05 | -| std | 0.026 | -| value_loss | 5.92e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 22 | -| iterations | 11078 | -| time_elapsed | 61782 | -| total_timesteps | 1417984 | -| train/ | | -| approx_kl | 0.007548518 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | -0.00537 | -| n_updates | 110770 | -| policy_gradient_loss | 0.00233 | -| std | 0.026 | -| value_loss | 1.83e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11079 | -| time_elapsed | 61785 | -| total_timesteps | 1418112 | -| train/ | | -| approx_kl | 0.00083247386 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.00502 | -| learning_rate | 0.0003 | -| loss | 0.00054 | -| n_updates | 110780 | -| policy_gradient_loss | 0.00252 | -| std | 0.026 | -| value_loss | 1.26e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11080 | -| time_elapsed | 61793 | -| total_timesteps | 1418240 | -| train/ | | -| approx_kl | 0.0035550045 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 110790 | -| policy_gradient_loss | -0.000266 | -| std | 0.026 | -| value_loss | 0.00278 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11081 | -| time_elapsed | 61796 | -| total_timesteps | 1418368 | -| train/ | | -| approx_kl | 0.007967261 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00758 | -| n_updates | 110800 | -| policy_gradient_loss | -0.00232 | -| std | 0.026 | -| value_loss | 3.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11082 | -| time_elapsed | 61798 | -| total_timesteps | 1418496 | -| train/ | | -| approx_kl | 0.0131690465 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | -0.00742 | -| n_updates | 110810 | -| policy_gradient_loss | -0.00113 | -| std | 0.0261 | -| value_loss | 1.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11083 | -| time_elapsed | 61801 | -| total_timesteps | 1418624 | -| train/ | | -| approx_kl | 0.0007180064 | -| clip_fraction | 0.00703 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | -2.86e-05 | -| n_updates | 110820 | -| policy_gradient_loss | -4.44e-06 | -| std | 0.026 | -| value_loss | 2.6e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11084 | -| time_elapsed | 61804 | -| total_timesteps | 1418752 | -| train/ | | -| approx_kl | 0.0077022933 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0829 | -| learning_rate | 0.0003 | -| loss | -0.000719 | -| n_updates | 110830 | -| policy_gradient_loss | -3.4e-05 | -| std | 0.026 | -| value_loss | 4.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 22 | -| iterations | 11085 | -| time_elapsed | 61808 | -| total_timesteps | 1418880 | -| train/ | | -| approx_kl | 0.008693984 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.000627 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 110840 | -| policy_gradient_loss | -0.0017 | -| std | 0.026 | -| value_loss | 5.88e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11086 | -| time_elapsed | 61810 | -| total_timesteps | 1419008 | -| train/ | | -| approx_kl | 0.0124498755 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 110850 | -| policy_gradient_loss | -0.00555 | -| std | 0.026 | -| value_loss | 2.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11087 | -| time_elapsed | 61819 | -| total_timesteps | 1419136 | -| train/ | | -| approx_kl | 0.010554152 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.00969 | -| n_updates | 110860 | -| policy_gradient_loss | -0.00643 | -| std | 0.026 | -| value_loss | 0.00323 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11088 | -| time_elapsed | 61823 | -| total_timesteps | 1419264 | -| train/ | | -| approx_kl | 0.0001198682 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.11 | -| learning_rate | 0.0003 | -| loss | -1.73e-05 | -| n_updates | 110870 | -| policy_gradient_loss | 0.0197 | -| std | 0.026 | -| value_loss | 0.000237 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11089 | -| time_elapsed | 61826 | -| total_timesteps | 1419392 | -| train/ | | -| approx_kl | 0.00024059694 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 110880 | -| policy_gradient_loss | 0.00344 | -| std | 0.0259 | -| value_loss | 1.65e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11090 | -| time_elapsed | 61830 | -| total_timesteps | 1419520 | -| train/ | | -| approx_kl | 0.006083816 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.000552 | -| n_updates | 110890 | -| policy_gradient_loss | 0.00739 | -| std | 0.0259 | -| value_loss | 8.24e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11091 | -| time_elapsed | 61833 | -| total_timesteps | 1419648 | -| train/ | | -| approx_kl | 0.0010499116 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.00693 | -| learning_rate | 0.0003 | -| loss | 0.0011 | -| n_updates | 110900 | -| policy_gradient_loss | 0.0059 | -| std | 0.0259 | -| value_loss | 0.000119 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11092 | -| time_elapsed | 61836 | -| total_timesteps | 1419776 | -| train/ | | -| approx_kl | 0.0008049109 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | 0.00292 | -| n_updates | 110910 | -| policy_gradient_loss | 0.00938 | -| std | 0.0259 | -| value_loss | 5.32e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11093 | -| time_elapsed | 61840 | -| total_timesteps | 1419904 | -| train/ | | -| approx_kl | 0.0006659669 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.409 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 110920 | -| policy_gradient_loss | 0.000306 | -| std | 0.0259 | -| value_loss | 8.7e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11094 | -| time_elapsed | 61844 | -| total_timesteps | 1420032 | -| train/ | | -| approx_kl | 0.0074382154 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.00905 | -| learning_rate | 0.0003 | -| loss | 0.00107 | -| n_updates | 110930 | -| policy_gradient_loss | 0.0104 | -| std | 0.0259 | -| value_loss | 4.79e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11095 | -| time_elapsed | 61852 | -| total_timesteps | 1420160 | -| train/ | | -| approx_kl | 0.0095493905 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 110940 | -| policy_gradient_loss | -0.0129 | -| std | 0.026 | -| value_loss | 0.000657 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11096 | -| time_elapsed | 61856 | -| total_timesteps | 1420288 | -| train/ | | -| approx_kl | 0.00041551655 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.443 | -| learning_rate | 0.0003 | -| loss | 0.00466 | -| n_updates | 110950 | -| policy_gradient_loss | -0.00626 | -| std | 0.026 | -| value_loss | 8.01e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11097 | -| time_elapsed | 61858 | -| total_timesteps | 1420416 | -| train/ | | -| approx_kl | 0.016220186 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -310 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 110960 | -| policy_gradient_loss | 0.0026 | -| std | 0.026 | -| value_loss | 8.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11098 | -| time_elapsed | 61862 | -| total_timesteps | 1420544 | -| train/ | | -| approx_kl | 0.01599634 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 110970 | -| policy_gradient_loss | -0.000369 | -| std | 0.026 | -| value_loss | 1.43e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11099 | -| time_elapsed | 61866 | -| total_timesteps | 1420672 | -| train/ | | -| approx_kl | 0.02212332 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -273 | -| learning_rate | 0.0003 | -| loss | -1.84e-05 | -| n_updates | 110980 | -| policy_gradient_loss | -0.000559 | -| std | 0.026 | -| value_loss | 4.95e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11100 | -| time_elapsed | 61870 | -| total_timesteps | 1420800 | -| train/ | | -| approx_kl | 0.01641172 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.767 | -| learning_rate | 0.0003 | -| loss | -0.000758 | -| n_updates | 110990 | -| policy_gradient_loss | -0.00104 | -| std | 0.026 | -| value_loss | 8.79e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 22 | -| iterations | 11101 | -| time_elapsed | 61873 | -| total_timesteps | 1420928 | -| train/ | | -| approx_kl | 0.01788511 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.0047 | -| learning_rate | 0.0003 | -| loss | 0.00621 | -| n_updates | 111000 | -| policy_gradient_loss | 0.002 | -| std | 0.026 | -| value_loss | 2.79e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11102 | -| time_elapsed | 61876 | -| total_timesteps | 1421056 | -| train/ | | -| approx_kl | 0.005860876 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.00134 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 111010 | -| policy_gradient_loss | 0.000694 | -| std | 0.026 | -| value_loss | 6.28e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11103 | -| time_elapsed | 61882 | -| total_timesteps | 1421184 | -| train/ | | -| approx_kl | 0.00036270078 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 111020 | -| policy_gradient_loss | -0.0103 | -| std | 0.026 | -| value_loss | 0.000145 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11104 | -| time_elapsed | 61887 | -| total_timesteps | 1421312 | -| train/ | | -| approx_kl | 0.012287549 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.00613 | -| n_updates | 111030 | -| policy_gradient_loss | -0.00357 | -| std | 0.026 | -| value_loss | 7.61e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11105 | -| time_elapsed | 61891 | -| total_timesteps | 1421440 | -| train/ | | -| approx_kl | 0.00912138 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 111040 | -| policy_gradient_loss | 0.0136 | -| std | 0.0259 | -| value_loss | 1.89e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11106 | -| time_elapsed | 61894 | -| total_timesteps | 1421568 | -| train/ | | -| approx_kl | 0.010577619 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | 0.00173 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 111050 | -| policy_gradient_loss | -0.00155 | -| std | 0.0259 | -| value_loss | 2.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11107 | -| time_elapsed | 61897 | -| total_timesteps | 1421696 | -| train/ | | -| approx_kl | 0.013329853 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 111060 | -| policy_gradient_loss | -0.00179 | -| std | 0.0259 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11108 | -| time_elapsed | 61900 | -| total_timesteps | 1421824 | -| train/ | | -| approx_kl | 0.019168323 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.000805 | -| n_updates | 111070 | -| policy_gradient_loss | -0.00165 | -| std | 0.0259 | -| value_loss | 4.35e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 22 | -| iterations | 11109 | -| time_elapsed | 61903 | -| total_timesteps | 1421952 | -| train/ | | -| approx_kl | 0.00029884 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.0741 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 111080 | -| policy_gradient_loss | -0.00648 | -| std | 0.0259 | -| value_loss | 3.56e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11110 | -| time_elapsed | 61906 | -| total_timesteps | 1422080 | -| train/ | | -| approx_kl | 0.014423326 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 111090 | -| policy_gradient_loss | 0.011 | -| std | 0.0259 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11111 | -| time_elapsed | 61912 | -| total_timesteps | 1422208 | -| train/ | | -| approx_kl | 0.024909165 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 111100 | -| policy_gradient_loss | -0.0124 | -| std | 0.0259 | -| value_loss | 0.000613 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11112 | -| time_elapsed | 61916 | -| total_timesteps | 1422336 | -| train/ | | -| approx_kl | 0.019354431 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00513 | -| n_updates | 111110 | -| policy_gradient_loss | 0.00135 | -| std | 0.0259 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11113 | -| time_elapsed | 61920 | -| total_timesteps | 1422464 | -| train/ | | -| approx_kl | 0.0021616742 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 111120 | -| policy_gradient_loss | -0.0048 | -| std | 0.0259 | -| value_loss | 5.25e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11114 | -| time_elapsed | 61923 | -| total_timesteps | 1422592 | -| train/ | | -| approx_kl | 2.1457672e-06 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | 0.000151 | -| n_updates | 111130 | -| policy_gradient_loss | -0.000221 | -| std | 0.0259 | -| value_loss | 1.42e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11115 | -| time_elapsed | 61927 | -| total_timesteps | 1422720 | -| train/ | | -| approx_kl | 0.04199702 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 111140 | -| policy_gradient_loss | -0.00864 | -| std | 0.0259 | -| value_loss | 3.87e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11116 | -| time_elapsed | 61930 | -| total_timesteps | 1422848 | -| train/ | | -| approx_kl | 0.0075442744 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 111150 | -| policy_gradient_loss | 0.00225 | -| std | 0.0259 | -| value_loss | 1.28e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 22 | -| iterations | 11117 | -| time_elapsed | 61934 | -| total_timesteps | 1422976 | -| train/ | | -| approx_kl | 0.009643199 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.00454 | -| n_updates | 111160 | -| policy_gradient_loss | 0.00217 | -| std | 0.0259 | -| value_loss | 4.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11118 | -| time_elapsed | 61937 | -| total_timesteps | 1423104 | -| train/ | | -| approx_kl | 0.032357752 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.0798 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 111170 | -| policy_gradient_loss | 0.0104 | -| std | 0.0259 | -| value_loss | 2.35e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11119 | -| time_elapsed | 61944 | -| total_timesteps | 1423232 | -| train/ | | -| approx_kl | 0.029084 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 111180 | -| policy_gradient_loss | -0.0119 | -| std | 0.0259 | -| value_loss | 0.00501 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11120 | -| time_elapsed | 61947 | -| total_timesteps | 1423360 | -| train/ | | -| approx_kl | 0.00208044 | -| clip_fraction | 0.0289 | -| clip_range | 0.2 | -| entropy_loss | 2.23 | -| explained_variance | -0.00881 | -| learning_rate | 0.0003 | -| loss | -0.000933 | -| n_updates | 111190 | -| policy_gradient_loss | 0.000515 | -| std | 0.0258 | -| value_loss | 9.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11121 | -| time_elapsed | 61950 | -| total_timesteps | 1423488 | -| train/ | | -| approx_kl | 0.017758206 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.893 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 111200 | -| policy_gradient_loss | 0.00392 | -| std | 0.0257 | -| value_loss | 9.73e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11122 | -| time_elapsed | 61954 | -| total_timesteps | 1423616 | -| train/ | | -| approx_kl | 0.0007294449 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 6.49e-05 | -| n_updates | 111210 | -| policy_gradient_loss | -0.00088 | -| std | 0.0257 | -| value_loss | 0.000315 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11123 | -| time_elapsed | 61957 | -| total_timesteps | 1423744 | -| train/ | | -| approx_kl | 0.04711558 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | -0.00863 | -| n_updates | 111220 | -| policy_gradient_loss | -0.0125 | -| std | 0.0257 | -| value_loss | 6.35e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 22 | -| iterations | 11124 | -| time_elapsed | 61961 | -| total_timesteps | 1423872 | -| train/ | | -| approx_kl | 0.01101644 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | 0.00878 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 111230 | -| policy_gradient_loss | -0.00852 | -| std | 0.0257 | -| value_loss | 0.00011 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11125 | -| time_elapsed | 61964 | -| total_timesteps | 1424000 | -| train/ | | -| approx_kl | 0.0021309983 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | 0.00477 | -| learning_rate | 0.0003 | -| loss | 0.00495 | -| n_updates | 111240 | -| policy_gradient_loss | 0.00925 | -| std | 0.0257 | -| value_loss | 1.62e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11126 | -| time_elapsed | 61968 | -| total_timesteps | 1424128 | -| train/ | | -| approx_kl | 0.006470478 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | 0.00832 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 111250 | -| policy_gradient_loss | 0.00255 | -| std | 0.0257 | -| value_loss | 1.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11127 | -| time_elapsed | 61977 | -| total_timesteps | 1424256 | -| train/ | | -| approx_kl | 0.010266629 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -1.67 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 111260 | -| policy_gradient_loss | -0.00735 | -| std | 0.0257 | -| value_loss | 0.00302 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11128 | -| time_elapsed | 61981 | -| total_timesteps | 1424384 | -| train/ | | -| approx_kl | 0.026713463 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -169 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 111270 | -| policy_gradient_loss | -0.0112 | -| std | 0.0257 | -| value_loss | 8.42e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11129 | -| time_elapsed | 61984 | -| total_timesteps | 1424512 | -| train/ | | -| approx_kl | 0.0031080772 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -194 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 111280 | -| policy_gradient_loss | 0.00418 | -| std | 0.0256 | -| value_loss | 1.87e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11130 | -| time_elapsed | 61987 | -| total_timesteps | 1424640 | -| train/ | | -| approx_kl | 0.0113858115 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -53.1 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 111290 | -| policy_gradient_loss | -0.0166 | -| std | 0.0256 | -| value_loss | 2.23e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11131 | -| time_elapsed | 61991 | -| total_timesteps | 1424768 | -| train/ | | -| approx_kl | 0.018485684 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.24 | -| explained_variance | -9.72 | -| learning_rate | 0.0003 | -| loss | 0.00425 | -| n_updates | 111300 | -| policy_gradient_loss | 0.00236 | -| std | 0.0256 | -| value_loss | 4.65e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 22 | -| iterations | 11132 | -| time_elapsed | 61994 | -| total_timesteps | 1424896 | -| train/ | | -| approx_kl | 0.019834405 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.805 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 111310 | -| policy_gradient_loss | -0.0172 | -| std | 0.0256 | -| value_loss | 1.21e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11133 | -| time_elapsed | 61997 | -| total_timesteps | 1425024 | -| train/ | | -| approx_kl | 0.0024509965 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.00702 | -| n_updates | 111320 | -| policy_gradient_loss | 0.00636 | -| std | 0.0256 | -| value_loss | 1.91e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11134 | -| time_elapsed | 62005 | -| total_timesteps | 1425152 | -| train/ | | -| approx_kl | 0.0024801637 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | 0.716 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 111330 | -| policy_gradient_loss | -0.0142 | -| std | 0.0256 | -| value_loss | 0.000919 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11135 | -| time_elapsed | 62009 | -| total_timesteps | 1425280 | -| train/ | | -| approx_kl | 0.012876091 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.448 | -| learning_rate | 0.0003 | -| loss | 0.000846 | -| n_updates | 111340 | -| policy_gradient_loss | 0.00738 | -| std | 0.0255 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11136 | -| time_elapsed | 62012 | -| total_timesteps | 1425408 | -| train/ | | -| approx_kl | 0.001304355 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -5.27 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 111350 | -| policy_gradient_loss | -0.000113 | -| std | 0.0255 | -| value_loss | 4.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11137 | -| time_elapsed | 62016 | -| total_timesteps | 1425536 | -| train/ | | -| approx_kl | 0.026145354 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 111360 | -| policy_gradient_loss | -0.00701 | -| std | 0.0255 | -| value_loss | 9.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11138 | -| time_elapsed | 62019 | -| total_timesteps | 1425664 | -| train/ | | -| approx_kl | 0.002090707 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.424 | -| learning_rate | 0.0003 | -| loss | -0.000756 | -| n_updates | 111370 | -| policy_gradient_loss | 0.00697 | -| std | 0.0255 | -| value_loss | 1.68e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11139 | -| time_elapsed | 62022 | -| total_timesteps | 1425792 | -| train/ | | -| approx_kl | 2.0185951e-05 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.00687 | -| learning_rate | 0.0003 | -| loss | 0.000348 | -| n_updates | 111380 | -| policy_gradient_loss | 0.00432 | -| std | 0.0255 | -| value_loss | 1.23e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 22 | -| iterations | 11140 | -| time_elapsed | 62026 | -| total_timesteps | 1425920 | -| train/ | | -| approx_kl | 0.03958632 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | 0.00829 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 111390 | -| policy_gradient_loss | -0.00748 | -| std | 0.0256 | -| value_loss | 1.09e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11141 | -| time_elapsed | 62029 | -| total_timesteps | 1426048 | -| train/ | | -| approx_kl | 0.0029421998 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 111400 | -| policy_gradient_loss | -0.000134 | -| std | 0.0256 | -| value_loss | 2.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11142 | -| time_elapsed | 62035 | -| total_timesteps | 1426176 | -| train/ | | -| approx_kl | 0.025162453 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.00343 | -| n_updates | 111410 | -| policy_gradient_loss | -0.00364 | -| std | 0.0255 | -| value_loss | 0.00455 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11143 | -| time_elapsed | 62038 | -| total_timesteps | 1426304 | -| train/ | | -| approx_kl | 0.014029882 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -141 | -| learning_rate | 0.0003 | -| loss | -0.00921 | -| n_updates | 111420 | -| policy_gradient_loss | -0.00349 | -| std | 0.0254 | -| value_loss | 2.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11144 | -| time_elapsed | 62041 | -| total_timesteps | 1426432 | -| train/ | | -| approx_kl | 0.033313572 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -121 | -| learning_rate | 0.0003 | -| loss | 0.0055 | -| n_updates | 111430 | -| policy_gradient_loss | 0.00112 | -| std | 0.0255 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11145 | -| time_elapsed | 62045 | -| total_timesteps | 1426560 | -| train/ | | -| approx_kl | 0.016502481 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -19.7 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 111440 | -| policy_gradient_loss | -0.00163 | -| std | 0.0255 | -| value_loss | 4.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11146 | -| time_elapsed | 62048 | -| total_timesteps | 1426688 | -| train/ | | -| approx_kl | 0.042480603 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 111450 | -| policy_gradient_loss | -0.000703 | -| std | 0.0256 | -| value_loss | 5.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11147 | -| time_elapsed | 62052 | -| total_timesteps | 1426816 | -| train/ | | -| approx_kl | 0.007572494 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.000873 | -| n_updates | 111460 | -| policy_gradient_loss | 0.00402 | -| std | 0.0256 | -| value_loss | 1.91e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 22 | -| iterations | 11148 | -| time_elapsed | 62055 | -| total_timesteps | 1426944 | -| train/ | | -| approx_kl | 0.00059534935 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.7 | -| learning_rate | 0.0003 | -| loss | -0.00444 | -| n_updates | 111470 | -| policy_gradient_loss | -0.00733 | -| std | 0.0256 | -| value_loss | 2.35e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11149 | -| time_elapsed | 62059 | -| total_timesteps | 1427072 | -| train/ | | -| approx_kl | 0.012421229 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 111480 | -| policy_gradient_loss | 0.00122 | -| std | 0.0256 | -| value_loss | 5.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11150 | -| time_elapsed | 62065 | -| total_timesteps | 1427200 | -| train/ | | -| approx_kl | 0.011250615 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 111490 | -| policy_gradient_loss | -0.0125 | -| std | 0.0256 | -| value_loss | 0.000261 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11151 | -| time_elapsed | 62068 | -| total_timesteps | 1427328 | -| train/ | | -| approx_kl | 0.02052732 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | 0.000948 | -| n_updates | 111500 | -| policy_gradient_loss | -0.00475 | -| std | 0.0256 | -| value_loss | 9.07e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11152 | -| time_elapsed | 62071 | -| total_timesteps | 1427456 | -| train/ | | -| approx_kl | 0.00017107278 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 111510 | -| policy_gradient_loss | 6.51e-05 | -| std | 0.0256 | -| value_loss | 3.29e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11153 | -| time_elapsed | 62074 | -| total_timesteps | 1427584 | -| train/ | | -| approx_kl | 0.009853207 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | -0.0323 | -| n_updates | 111520 | -| policy_gradient_loss | -0.0188 | -| std | 0.0256 | -| value_loss | 1.66e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11154 | -| time_elapsed | 62077 | -| total_timesteps | 1427712 | -| train/ | | -| approx_kl | 0.0054991017 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | -0.00916 | -| n_updates | 111530 | -| policy_gradient_loss | -0.00522 | -| std | 0.0256 | -| value_loss | 4.91e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 22 | -| iterations | 11155 | -| time_elapsed | 62080 | -| total_timesteps | 1427840 | -| train/ | | -| approx_kl | 0.009974487 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.000461 | -| n_updates | 111540 | -| policy_gradient_loss | 0.000526 | -| std | 0.0256 | -| value_loss | 1.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 11156 | -| time_elapsed | 62084 | -| total_timesteps | 1427968 | -| train/ | | -| approx_kl | 0.009915359 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 111550 | -| policy_gradient_loss | 0.00637 | -| std | 0.0256 | -| value_loss | 2.51e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11157 | -| time_elapsed | 62087 | -| total_timesteps | 1428096 | -| train/ | | -| approx_kl | 0.0007282668 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.00448 | -| learning_rate | 0.0003 | -| loss | -0.00338 | -| n_updates | 111560 | -| policy_gradient_loss | 5.85e-05 | -| std | 0.0256 | -| value_loss | 3.96e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11158 | -| time_elapsed | 62095 | -| total_timesteps | 1428224 | -| train/ | | -| approx_kl | 0.009853355 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.663 | -| learning_rate | 0.0003 | -| loss | -0.0258 | -| n_updates | 111570 | -| policy_gradient_loss | -0.0191 | -| std | 0.0256 | -| value_loss | 0.00317 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11159 | -| time_elapsed | 62098 | -| total_timesteps | 1428352 | -| train/ | | -| approx_kl | 0.0008316105 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 111580 | -| policy_gradient_loss | -0.00333 | -| std | 0.0256 | -| value_loss | 0.000843 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11160 | -| time_elapsed | 62101 | -| total_timesteps | 1428480 | -| train/ | | -| approx_kl | 0.0019383761 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -19.7 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 111590 | -| policy_gradient_loss | -0.00032 | -| std | 0.0255 | -| value_loss | 0.000639 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11161 | -| time_elapsed | 62104 | -| total_timesteps | 1428608 | -| train/ | | -| approx_kl | 0.0016135494 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -2.46 | -| learning_rate | 0.0003 | -| loss | 0.00465 | -| n_updates | 111600 | -| policy_gradient_loss | -0.00084 | -| std | 0.0255 | -| value_loss | 0.000198 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11162 | -| time_elapsed | 62108 | -| total_timesteps | 1428736 | -| train/ | | -| approx_kl | 0.0041549555 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -41.9 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 111610 | -| policy_gradient_loss | -0.00408 | -| std | 0.0255 | -| value_loss | 4.45e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11163 | -| time_elapsed | 62112 | -| total_timesteps | 1428864 | -| train/ | | -| approx_kl | 0.002542465 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.592 | -| learning_rate | 0.0003 | -| loss | 0.00404 | -| n_updates | 111620 | -| policy_gradient_loss | 0.00552 | -| std | 0.0255 | -| value_loss | 8.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 11164 | -| time_elapsed | 62115 | -| total_timesteps | 1428992 | -| train/ | | -| approx_kl | 0.003486359 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -7.66 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 111630 | -| policy_gradient_loss | -0.00125 | -| std | 0.0256 | -| value_loss | 2.18e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11165 | -| time_elapsed | 62118 | -| total_timesteps | 1429120 | -| train/ | | -| approx_kl | 4.1407533e-05 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -67.3 | -| learning_rate | 0.0003 | -| loss | -0.000835 | -| n_updates | 111640 | -| policy_gradient_loss | -0.00474 | -| std | 0.0256 | -| value_loss | 1.31e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11166 | -| time_elapsed | 62127 | -| total_timesteps | 1429248 | -| train/ | | -| approx_kl | 0.00656587 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | 0.819 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 111650 | -| policy_gradient_loss | -0.00367 | -| std | 0.0256 | -| value_loss | 0.00375 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11167 | -| time_elapsed | 62131 | -| total_timesteps | 1429376 | -| train/ | | -| approx_kl | 0.010114528 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.00013 | -| n_updates | 111660 | -| policy_gradient_loss | 4.83e-05 | -| std | 0.0256 | -| value_loss | 9.66e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11168 | -| time_elapsed | 62134 | -| total_timesteps | 1429504 | -| train/ | | -| approx_kl | 0.0030110325 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 111670 | -| policy_gradient_loss | -0.00579 | -| std | 0.0256 | -| value_loss | 2.56e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11169 | -| time_elapsed | 62138 | -| total_timesteps | 1429632 | -| train/ | | -| approx_kl | 0.00096001895 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | -0.000328 | -| n_updates | 111680 | -| policy_gradient_loss | 0.000402 | -| std | 0.0256 | -| value_loss | 1.2e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11170 | -| time_elapsed | 62142 | -| total_timesteps | 1429760 | -| train/ | | -| approx_kl | 6.97691e-05 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 111690 | -| policy_gradient_loss | -0.00463 | -| std | 0.0255 | -| value_loss | 9.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 11171 | -| time_elapsed | 62145 | -| total_timesteps | 1429888 | -| train/ | | -| approx_kl | 0.002267933 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.0924 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 111700 | -| policy_gradient_loss | -0.00347 | -| std | 0.0254 | -| value_loss | 7.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11172 | -| time_elapsed | 62148 | -| total_timesteps | 1430016 | -| train/ | | -| approx_kl | 0.026365628 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 111710 | -| policy_gradient_loss | -0.0133 | -| std | 0.0254 | -| value_loss | 2.51e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11173 | -| time_elapsed | 62155 | -| total_timesteps | 1430144 | -| train/ | | -| approx_kl | 0.0049462486 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | 0.000519 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 111720 | -| policy_gradient_loss | -0.0184 | -| std | 0.0254 | -| value_loss | 0.00178 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11174 | -| time_elapsed | 62159 | -| total_timesteps | 1430272 | -| train/ | | -| approx_kl | 1.5753321e-06 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.000156 | -| n_updates | 111730 | -| policy_gradient_loss | -0.00159 | -| std | 0.0254 | -| value_loss | 2.31e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11175 | -| time_elapsed | 62162 | -| total_timesteps | 1430400 | -| train/ | | -| approx_kl | 0.01072358 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -1.77 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 111740 | -| policy_gradient_loss | -0.00616 | -| std | 0.0254 | -| value_loss | 1.29e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11176 | -| time_elapsed | 62165 | -| total_timesteps | 1430528 | -| train/ | | -| approx_kl | 0.011917989 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.00367 | -| learning_rate | 0.0003 | -| loss | 0.00684 | -| n_updates | 111750 | -| policy_gradient_loss | 0.00507 | -| std | 0.0253 | -| value_loss | 9.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11177 | -| time_elapsed | 62169 | -| total_timesteps | 1430656 | -| train/ | | -| approx_kl | 0.009900099 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.581 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 111760 | -| policy_gradient_loss | -0.000292 | -| std | 0.0253 | -| value_loss | 9.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11178 | -| time_elapsed | 62173 | -| total_timesteps | 1430784 | -| train/ | | -| approx_kl | 0.020774776 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.435 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 111770 | -| policy_gradient_loss | -0.0026 | -| std | 0.0253 | -| value_loss | 3.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11179 | -| time_elapsed | 62176 | -| total_timesteps | 1430912 | -| train/ | | -| approx_kl | 0.01009818 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 111780 | -| policy_gradient_loss | 0.00871 | -| std | 0.0253 | -| value_loss | 7.31e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11180 | -| time_elapsed | 62179 | -| total_timesteps | 1431040 | -| train/ | | -| approx_kl | 0.0011260537 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.506 | -| learning_rate | 0.0003 | -| loss | -0.000473 | -| n_updates | 111790 | -| policy_gradient_loss | -9.37e-06 | -| std | 0.0253 | -| value_loss | 1.93e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11181 | -| time_elapsed | 62185 | -| total_timesteps | 1431168 | -| train/ | | -| approx_kl | 0.022928614 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -8.91 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 111800 | -| policy_gradient_loss | -0.0151 | -| std | 0.0254 | -| value_loss | 0.00373 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11182 | -| time_elapsed | 62190 | -| total_timesteps | 1431296 | -| train/ | | -| approx_kl | 0.0007394925 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -0.601 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 111810 | -| policy_gradient_loss | -0.00454 | -| std | 0.0254 | -| value_loss | 7.75e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11183 | -| time_elapsed | 62193 | -| total_timesteps | 1431424 | -| train/ | | -| approx_kl | 0.0023200656 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -208 | -| learning_rate | 0.0003 | -| loss | 0.00539 | -| n_updates | 111820 | -| policy_gradient_loss | 0.00118 | -| std | 0.0254 | -| value_loss | 2.35e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11184 | -| time_elapsed | 62197 | -| total_timesteps | 1431552 | -| train/ | | -| approx_kl | 5.1091425e-05 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -52.1 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 111830 | -| policy_gradient_loss | -0.00379 | -| std | 0.0254 | -| value_loss | 4.51e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11185 | -| time_elapsed | 62200 | -| total_timesteps | 1431680 | -| train/ | | -| approx_kl | 0.0061668195 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -105 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 111840 | -| policy_gradient_loss | -0.000978 | -| std | 0.0254 | -| value_loss | 5.15e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11186 | -| time_elapsed | 62204 | -| total_timesteps | 1431808 | -| train/ | | -| approx_kl | 0.08688685 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | 0.00368 | -| n_updates | 111850 | -| policy_gradient_loss | 0.00705 | -| std | 0.0254 | -| value_loss | 2.55e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11187 | -| time_elapsed | 62208 | -| total_timesteps | 1431936 | -| train/ | | -| approx_kl | 0.0037198788 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 2.25 | -| explained_variance | -226 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 111860 | -| policy_gradient_loss | -0.00267 | -| std | 0.0254 | -| value_loss | 4.81e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11188 | -| time_elapsed | 62212 | -| total_timesteps | 1432064 | -| train/ | | -| approx_kl | 0.0101429075 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.93 | -| learning_rate | 0.0003 | -| loss | -0.000868 | -| n_updates | 111870 | -| policy_gradient_loss | 0.000201 | -| std | 0.0253 | -| value_loss | 3.34e-11 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11189 | -| time_elapsed | 62219 | -| total_timesteps | 1432192 | -| train/ | | -| approx_kl | 0.0073149395 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | 0.766 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 111880 | -| policy_gradient_loss | -0.00711 | -| std | 0.0252 | -| value_loss | 0.00516 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11190 | -| time_elapsed | 62223 | -| total_timesteps | 1432320 | -| train/ | | -| approx_kl | 0.00080115907 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 111890 | -| policy_gradient_loss | 0.0021 | -| std | 0.0252 | -| value_loss | 8.33e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11191 | -| time_elapsed | 62225 | -| total_timesteps | 1432448 | -| train/ | | -| approx_kl | 0.030898144 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 111900 | -| policy_gradient_loss | -0.00358 | -| std | 0.0252 | -| value_loss | 1.8e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11192 | -| time_elapsed | 62229 | -| total_timesteps | 1432576 | -| train/ | | -| approx_kl | 0.00024728058 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 9.22e-05 | -| n_updates | 111910 | -| policy_gradient_loss | 0.000904 | -| std | 0.0252 | -| value_loss | 1.06e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11193 | -| time_elapsed | 62232 | -| total_timesteps | 1432704 | -| train/ | | -| approx_kl | 0.022413202 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.00367 | -| n_updates | 111920 | -| policy_gradient_loss | -1.71e-06 | -| std | 0.0253 | -| value_loss | 7.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11194 | -| time_elapsed | 62236 | -| total_timesteps | 1432832 | -| train/ | | -| approx_kl | 0.01565545 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 111930 | -| policy_gradient_loss | -0.00296 | -| std | 0.0253 | -| value_loss | 4.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 11195 | -| time_elapsed | 62239 | -| total_timesteps | 1432960 | -| train/ | | -| approx_kl | 0.005339807 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0656 | -| learning_rate | 0.0003 | -| loss | 0.000433 | -| n_updates | 111940 | -| policy_gradient_loss | 0.000674 | -| std | 0.0253 | -| value_loss | 3.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11196 | -| time_elapsed | 62243 | -| total_timesteps | 1433088 | -| train/ | | -| approx_kl | 0.03146489 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | 0.00798 | -| n_updates | 111950 | -| policy_gradient_loss | 0.00538 | -| std | 0.0253 | -| value_loss | 1.72e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11197 | -| time_elapsed | 62248 | -| total_timesteps | 1433216 | -| train/ | | -| approx_kl | 0.0034506721 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | 0.519 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 111960 | -| policy_gradient_loss | -0.0148 | -| std | 0.0253 | -| value_loss | 0.00111 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11198 | -| time_elapsed | 62252 | -| total_timesteps | 1433344 | -| train/ | | -| approx_kl | 0.023117013 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 111970 | -| policy_gradient_loss | -0.00209 | -| std | 0.0253 | -| value_loss | 3.83e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11199 | -| time_elapsed | 62255 | -| total_timesteps | 1433472 | -| train/ | | -| approx_kl | 0.007953191 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0914 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 111980 | -| policy_gradient_loss | -0.00012 | -| std | 0.0253 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11200 | -| time_elapsed | 62259 | -| total_timesteps | 1433600 | -| train/ | | -| approx_kl | 0.007818814 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | 0.00888 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 111990 | -| policy_gradient_loss | 0.00767 | -| std | 0.0253 | -| value_loss | 1.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11201 | -| time_elapsed | 62262 | -| total_timesteps | 1433728 | -| train/ | | -| approx_kl | 0.015092401 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.00198 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 112000 | -| policy_gradient_loss | -0.00397 | -| std | 0.0253 | -| value_loss | 7.83e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11202 | -| time_elapsed | 62265 | -| total_timesteps | 1433856 | -| train/ | | -| approx_kl | 0.012420052 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 112010 | -| policy_gradient_loss | -0.00363 | -| std | 0.0253 | -| value_loss | 4.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11203 | -| time_elapsed | 62268 | -| total_timesteps | 1433984 | -| train/ | | -| approx_kl | 0.018115573 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.000534 | -| n_updates | 112020 | -| policy_gradient_loss | 0.00893 | -| std | 0.0253 | -| value_loss | 2.87e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11204 | -| time_elapsed | 62271 | -| total_timesteps | 1434112 | -| train/ | | -| approx_kl | 0.0020735255 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | 0.00335 | -| n_updates | 112030 | -| policy_gradient_loss | 0.0044 | -| std | 0.0253 | -| value_loss | 2.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11205 | -| time_elapsed | 62279 | -| total_timesteps | 1434240 | -| train/ | | -| approx_kl | 0.009729423 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | 0.00429 | -| n_updates | 112040 | -| policy_gradient_loss | -0.00541 | -| std | 0.0253 | -| value_loss | 0.00312 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11206 | -| time_elapsed | 62283 | -| total_timesteps | 1434368 | -| train/ | | -| approx_kl | 0.0057753487 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 112050 | -| policy_gradient_loss | 0.00457 | -| std | 0.0253 | -| value_loss | 2.09e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11207 | -| time_elapsed | 62287 | -| total_timesteps | 1434496 | -| train/ | | -| approx_kl | 0.0024323524 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 112060 | -| policy_gradient_loss | 0.00239 | -| std | 0.0253 | -| value_loss | 9.18e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11208 | -| time_elapsed | 62290 | -| total_timesteps | 1434624 | -| train/ | | -| approx_kl | 0.0012819176 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 112070 | -| policy_gradient_loss | -0.00691 | -| std | 0.0253 | -| value_loss | 1.48e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11209 | -| time_elapsed | 62294 | -| total_timesteps | 1434752 | -| train/ | | -| approx_kl | 0.02614801 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 112080 | -| policy_gradient_loss | -0.00195 | -| std | 0.0253 | -| value_loss | 2.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11210 | -| time_elapsed | 62297 | -| total_timesteps | 1434880 | -| train/ | | -| approx_kl | 0.014415555 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0993 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 112090 | -| policy_gradient_loss | -0.00167 | -| std | 0.0253 | -| value_loss | 1.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11211 | -| time_elapsed | 62301 | -| total_timesteps | 1435008 | -| train/ | | -| approx_kl | 0.015560529 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 112100 | -| policy_gradient_loss | 0.000963 | -| std | 0.0253 | -| value_loss | 2.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11212 | -| time_elapsed | 62309 | -| total_timesteps | 1435136 | -| train/ | | -| approx_kl | 0.007394753 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 112110 | -| policy_gradient_loss | -0.00474 | -| std | 0.0253 | -| value_loss | 0.00127 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11213 | -| time_elapsed | 62312 | -| total_timesteps | 1435264 | -| train/ | | -| approx_kl | 0.00047839247 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | 0.0561 | -| learning_rate | 0.0003 | -| loss | -0.000398 | -| n_updates | 112120 | -| policy_gradient_loss | 0.00212 | -| std | 0.0252 | -| value_loss | 0.00113 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11214 | -| time_elapsed | 62315 | -| total_timesteps | 1435392 | -| train/ | | -| approx_kl | 0.00018099183 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | 0.000715 | -| n_updates | 112130 | -| policy_gradient_loss | 0.0126 | -| std | 0.0252 | -| value_loss | 2.95e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11215 | -| time_elapsed | 62319 | -| total_timesteps | 1435520 | -| train/ | | -| approx_kl | 0.00050788885 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0999 | -| learning_rate | 0.0003 | -| loss | -0.00345 | -| n_updates | 112140 | -| policy_gradient_loss | 8.79e-05 | -| std | 0.0252 | -| value_loss | 6.11e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11216 | -| time_elapsed | 62322 | -| total_timesteps | 1435648 | -| train/ | | -| approx_kl | 0.007369682 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | 0.00076 | -| n_updates | 112150 | -| policy_gradient_loss | 0.00379 | -| std | 0.0252 | -| value_loss | 8.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11217 | -| time_elapsed | 62325 | -| total_timesteps | 1435776 | -| train/ | | -| approx_kl | 0.012798367 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0928 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 112160 | -| policy_gradient_loss | -0.0132 | -| std | 0.0252 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11218 | -| time_elapsed | 62328 | -| total_timesteps | 1435904 | -| train/ | | -| approx_kl | 0.013033643 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 112170 | -| policy_gradient_loss | 0.00641 | -| std | 0.0252 | -| value_loss | 2.24e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11219 | -| time_elapsed | 62332 | -| total_timesteps | 1436032 | -| train/ | | -| approx_kl | 0.0017058044 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 112180 | -| policy_gradient_loss | 0.00406 | -| std | 0.0252 | -| value_loss | 3.83e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11220 | -| time_elapsed | 62339 | -| total_timesteps | 1436160 | -| train/ | | -| approx_kl | 0.0040123938 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 112190 | -| policy_gradient_loss | -0.00571 | -| std | 0.0252 | -| value_loss | 0.00189 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11221 | -| time_elapsed | 62342 | -| total_timesteps | 1436288 | -| train/ | | -| approx_kl | 0.008163003 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 112200 | -| policy_gradient_loss | -0.000622 | -| std | 0.0253 | -| value_loss | 7.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11222 | -| time_elapsed | 62345 | -| total_timesteps | 1436416 | -| train/ | | -| approx_kl | 0.010264162 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 112210 | -| policy_gradient_loss | -0.00131 | -| std | 0.0252 | -| value_loss | 5.19e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11223 | -| time_elapsed | 62349 | -| total_timesteps | 1436544 | -| train/ | | -| approx_kl | 0.015489663 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.906 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 112220 | -| policy_gradient_loss | 0.00477 | -| std | 0.0252 | -| value_loss | 2.79e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11224 | -| time_elapsed | 62352 | -| total_timesteps | 1436672 | -| train/ | | -| approx_kl | 0.023082873 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.26 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | 0.00885 | -| n_updates | 112230 | -| policy_gradient_loss | 0.00416 | -| std | 0.0251 | -| value_loss | 9.73e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11225 | -| time_elapsed | 62355 | -| total_timesteps | 1436800 | -| train/ | | -| approx_kl | 0.0004071556 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.47 | -| learning_rate | 0.0003 | -| loss | -0.000719 | -| n_updates | 112240 | -| policy_gradient_loss | -0.000158 | -| std | 0.025 | -| value_loss | 5.84e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11226 | -| time_elapsed | 62357 | -| total_timesteps | 1436928 | -| train/ | | -| approx_kl | 0.00019772071 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.0845 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 112250 | -| policy_gradient_loss | 0.00465 | -| std | 0.0248 | -| value_loss | 0.000737 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11227 | -| time_elapsed | 62361 | -| total_timesteps | 1437056 | -| train/ | | -| approx_kl | 0.00023397338 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.608 | -| learning_rate | 0.0003 | -| loss | 0.00234 | -| n_updates | 112260 | -| policy_gradient_loss | 0.0139 | -| std | 0.0248 | -| value_loss | 0.00012 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11228 | -| time_elapsed | 62367 | -| total_timesteps | 1437184 | -| train/ | | -| approx_kl | 0.013939898 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 112270 | -| policy_gradient_loss | -0.00641 | -| std | 0.0248 | -| value_loss | 0.000803 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11229 | -| time_elapsed | 62370 | -| total_timesteps | 1437312 | -| train/ | | -| approx_kl | 0.011787621 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 112280 | -| policy_gradient_loss | 0.0107 | -| std | 0.0248 | -| value_loss | 4.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11230 | -| time_elapsed | 62374 | -| total_timesteps | 1437440 | -| train/ | | -| approx_kl | 0.009130297 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 112290 | -| policy_gradient_loss | -0.00263 | -| std | 0.0248 | -| value_loss | 2.99e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11231 | -| time_elapsed | 62377 | -| total_timesteps | 1437568 | -| train/ | | -| approx_kl | 0.0035806317 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0863 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 112300 | -| policy_gradient_loss | 0.00333 | -| std | 0.0248 | -| value_loss | 4.1e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11232 | -| time_elapsed | 62380 | -| total_timesteps | 1437696 | -| train/ | | -| approx_kl | 0.015872356 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.000706 | -| n_updates | 112310 | -| policy_gradient_loss | -0.000189 | -| std | 0.0248 | -| value_loss | 2.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11233 | -| time_elapsed | 62383 | -| total_timesteps | 1437824 | -| train/ | | -| approx_kl | 0.017766135 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 112320 | -| policy_gradient_loss | -0.00234 | -| std | 0.0248 | -| value_loss | 4.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11234 | -| time_elapsed | 62385 | -| total_timesteps | 1437952 | -| train/ | | -| approx_kl | 0.024485184 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.00645 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 112330 | -| policy_gradient_loss | 0.000297 | -| std | 0.0248 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11235 | -| time_elapsed | 62389 | -| total_timesteps | 1438080 | -| train/ | | -| approx_kl | 0.020225132 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | -0.00492 | -| n_updates | 112340 | -| policy_gradient_loss | -0.00472 | -| std | 0.0248 | -| value_loss | 9.52e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11236 | -| time_elapsed | 62396 | -| total_timesteps | 1438208 | -| train/ | | -| approx_kl | 0.04604739 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | -0.000308 | -| n_updates | 112350 | -| policy_gradient_loss | -0.00416 | -| std | 0.0248 | -| value_loss | 0.000664 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11237 | -| time_elapsed | 62399 | -| total_timesteps | 1438336 | -| train/ | | -| approx_kl | 0.0019127247 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 112360 | -| policy_gradient_loss | 8.25e-05 | -| std | 0.0248 | -| value_loss | 3.32e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11238 | -| time_elapsed | 62403 | -| total_timesteps | 1438464 | -| train/ | | -| approx_kl | 0.01727239 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | -0.00682 | -| n_updates | 112370 | -| policy_gradient_loss | -0.00293 | -| std | 0.0248 | -| value_loss | 1.58e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11239 | -| time_elapsed | 62406 | -| total_timesteps | 1438592 | -| train/ | | -| approx_kl | 0.0038003647 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.000191 | -| n_updates | 112380 | -| policy_gradient_loss | 0.00478 | -| std | 0.0247 | -| value_loss | 8.84e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11240 | -| time_elapsed | 62410 | -| total_timesteps | 1438720 | -| train/ | | -| approx_kl | 0.00497886 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | 0.00474 | -| n_updates | 112390 | -| policy_gradient_loss | 0.00291 | -| std | 0.0247 | -| value_loss | 6.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11241 | -| time_elapsed | 62413 | -| total_timesteps | 1438848 | -| train/ | | -| approx_kl | 0.004849525 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -1.97 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 112400 | -| policy_gradient_loss | 0.00317 | -| std | 0.0248 | -| value_loss | 3.61e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11242 | -| time_elapsed | 62417 | -| total_timesteps | 1438976 | -| train/ | | -| approx_kl | 0.00563427 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.00856 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 112410 | -| policy_gradient_loss | -4.62e-07 | -| std | 0.0248 | -| value_loss | 5.96e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11243 | -| time_elapsed | 62420 | -| total_timesteps | 1439104 | -| train/ | | -| approx_kl | 0.0011172136 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | 0.00715 | -| n_updates | 112420 | -| policy_gradient_loss | 0.00399 | -| std | 0.0248 | -| value_loss | 7.1e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11244 | -| time_elapsed | 62428 | -| total_timesteps | 1439232 | -| train/ | | -| approx_kl | 0.035987806 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.153 | -| learning_rate | 0.0003 | -| loss | 7.15e-06 | -| n_updates | 112430 | -| policy_gradient_loss | -0.014 | -| std | 0.0248 | -| value_loss | 0.00162 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11245 | -| time_elapsed | 62432 | -| total_timesteps | 1439360 | -| train/ | | -| approx_kl | 0.0013368083 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.466 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 112440 | -| policy_gradient_loss | -0.00763 | -| std | 0.0248 | -| value_loss | 1.3e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11246 | -| time_elapsed | 62435 | -| total_timesteps | 1439488 | -| train/ | | -| approx_kl | 0.0002798224 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.00471 | -| n_updates | 112450 | -| policy_gradient_loss | -0.000873 | -| std | 0.0248 | -| value_loss | 2.19e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11247 | -| time_elapsed | 62438 | -| total_timesteps | 1439616 | -| train/ | | -| approx_kl | 0.025151512 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 112460 | -| policy_gradient_loss | 0.00467 | -| std | 0.0248 | -| value_loss | 7.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11248 | -| time_elapsed | 62441 | -| total_timesteps | 1439744 | -| train/ | | -| approx_kl | 0.014614059 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.00576 | -| n_updates | 112470 | -| policy_gradient_loss | 0.00187 | -| std | 0.0248 | -| value_loss | 1.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11249 | -| time_elapsed | 62444 | -| total_timesteps | 1439872 | -| train/ | | -| approx_kl | 0.013355094 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 112480 | -| policy_gradient_loss | -0.00566 | -| std | 0.0248 | -| value_loss | 4.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11250 | -| time_elapsed | 62447 | -| total_timesteps | 1440000 | -| train/ | | -| approx_kl | 0.002040253 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.00131 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 112490 | -| policy_gradient_loss | 0.00412 | -| std | 0.0248 | -| value_loss | 2.25e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11251 | -| time_elapsed | 62450 | -| total_timesteps | 1440128 | -| train/ | | -| approx_kl | 0.0018056966 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.0067 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 112500 | -| policy_gradient_loss | 0.00197 | -| std | 0.0248 | -| value_loss | 2.25e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11252 | -| time_elapsed | 62458 | -| total_timesteps | 1440256 | -| train/ | | -| approx_kl | 0.0024692803 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -6.66 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 112510 | -| policy_gradient_loss | -0.0153 | -| std | 0.0248 | -| value_loss | 0.00333 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11253 | -| time_elapsed | 62463 | -| total_timesteps | 1440384 | -| train/ | | -| approx_kl | 0.0028284267 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.479 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 112520 | -| policy_gradient_loss | 0.0072 | -| std | 0.0248 | -| value_loss | 2.84e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11254 | -| time_elapsed | 62467 | -| total_timesteps | 1440512 | -| train/ | | -| approx_kl | 1.2656674e-06 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -30.6 | -| learning_rate | 0.0003 | -| loss | 0.000331 | -| n_updates | 112530 | -| policy_gradient_loss | -0.000759 | -| std | 0.0248 | -| value_loss | 2.97e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11255 | -| time_elapsed | 62471 | -| total_timesteps | 1440640 | -| train/ | | -| approx_kl | 0.00031717587 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.456 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 112540 | -| policy_gradient_loss | 0.00692 | -| std | 0.0248 | -| value_loss | 2.04e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11256 | -| time_elapsed | 62473 | -| total_timesteps | 1440768 | -| train/ | | -| approx_kl | 0.00889644 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.773 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 112550 | -| policy_gradient_loss | -0.00612 | -| std | 0.0248 | -| value_loss | 8.97e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 11257 | -| time_elapsed | 62476 | -| total_timesteps | 1440896 | -| train/ | | -| approx_kl | 0.002987519 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0726 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 112560 | -| policy_gradient_loss | 0.000445 | -| std | 0.0248 | -| value_loss | 4.27e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11258 | -| time_elapsed | 62480 | -| total_timesteps | 1441024 | -| train/ | | -| approx_kl | 0.0033635027 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0898 | -| learning_rate | 0.0003 | -| loss | 0.000725 | -| n_updates | 112570 | -| policy_gradient_loss | 0.00475 | -| std | 0.0248 | -| value_loss | 1.65e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11259 | -| time_elapsed | 62488 | -| total_timesteps | 1441152 | -| train/ | | -| approx_kl | 0.0012055733 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -0.00871 | -| n_updates | 112580 | -| policy_gradient_loss | -0.00561 | -| std | 0.0248 | -| value_loss | 0.00156 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11260 | -| time_elapsed | 62492 | -| total_timesteps | 1441280 | -| train/ | | -| approx_kl | 0.0033663805 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 112590 | -| policy_gradient_loss | 0.00124 | -| std | 0.0248 | -| value_loss | 5.23e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11261 | -| time_elapsed | 62494 | -| total_timesteps | 1441408 | -| train/ | | -| approx_kl | 0.0020337221 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0709 | -| learning_rate | 0.0003 | -| loss | 0.00422 | -| n_updates | 112600 | -| policy_gradient_loss | 0.00351 | -| std | 0.0248 | -| value_loss | 2.37e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11262 | -| time_elapsed | 62496 | -| total_timesteps | 1441536 | -| train/ | | -| approx_kl | 0.03330594 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.416 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 112610 | -| policy_gradient_loss | -0.0125 | -| std | 0.0248 | -| value_loss | 3.27e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11263 | -| time_elapsed | 62500 | -| total_timesteps | 1441664 | -| train/ | | -| approx_kl | 0.01062277 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 112620 | -| policy_gradient_loss | -0.0114 | -| std | 0.0248 | -| value_loss | 7.87e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11264 | -| time_elapsed | 62502 | -| total_timesteps | 1441792 | -| train/ | | -| approx_kl | 0.0049442677 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0656 | -| learning_rate | 0.0003 | -| loss | -0.00831 | -| n_updates | 112630 | -| policy_gradient_loss | -0.0038 | -| std | 0.0248 | -| value_loss | 6.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 11265 | -| time_elapsed | 62505 | -| total_timesteps | 1441920 | -| train/ | | -| approx_kl | 0.010414127 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.000926 | -| n_updates | 112640 | -| policy_gradient_loss | 0.000345 | -| std | 0.0248 | -| value_loss | 3.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11266 | -| time_elapsed | 62509 | -| total_timesteps | 1442048 | -| train/ | | -| approx_kl | 0.011576318 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | 0.00559 | -| n_updates | 112650 | -| policy_gradient_loss | 0.00978 | -| std | 0.0248 | -| value_loss | 2.47e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11267 | -| time_elapsed | 62514 | -| total_timesteps | 1442176 | -| train/ | | -| approx_kl | 0.0127674155 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 112660 | -| policy_gradient_loss | -0.00585 | -| std | 0.0248 | -| value_loss | 0.000329 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11268 | -| time_elapsed | 62517 | -| total_timesteps | 1442304 | -| train/ | | -| approx_kl | 0.011914513 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00195 | -| n_updates | 112670 | -| policy_gradient_loss | 0.00176 | -| std | 0.0248 | -| value_loss | 5.23e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11269 | -| time_elapsed | 62521 | -| total_timesteps | 1442432 | -| train/ | | -| approx_kl | 2.0217616e-05 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0975 | -| learning_rate | 0.0003 | -| loss | -0.000201 | -| n_updates | 112680 | -| policy_gradient_loss | 0.0127 | -| std | 0.0249 | -| value_loss | 1.89e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11270 | -| time_elapsed | 62524 | -| total_timesteps | 1442560 | -| train/ | | -| approx_kl | 0.0017741802 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0727 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 112690 | -| policy_gradient_loss | 0.000224 | -| std | 0.0249 | -| value_loss | 8.53e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11271 | -| time_elapsed | 62528 | -| total_timesteps | 1442688 | -| train/ | | -| approx_kl | 0.009448677 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 112700 | -| policy_gradient_loss | 0.0118 | -| std | 0.0249 | -| value_loss | 2.27e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11272 | -| time_elapsed | 62531 | -| total_timesteps | 1442816 | -| train/ | | -| approx_kl | 0.0051627997 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -55.8 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 112710 | -| policy_gradient_loss | -0.0012 | -| std | 0.0249 | -| value_loss | 5.87e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11273 | -| time_elapsed | 62535 | -| total_timesteps | 1442944 | -| train/ | | -| approx_kl | 0.013631925 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | 0.00592 | -| learning_rate | 0.0003 | -| loss | -0.00794 | -| n_updates | 112720 | -| policy_gradient_loss | -0.00337 | -| std | 0.0249 | -| value_loss | 1.06e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11274 | -| time_elapsed | 62538 | -| total_timesteps | 1443072 | -| train/ | | -| approx_kl | 0.0005394113 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.785 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 112730 | -| policy_gradient_loss | -0.000499 | -| std | 0.025 | -| value_loss | 2.52e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11275 | -| time_elapsed | 62544 | -| total_timesteps | 1443200 | -| train/ | | -| approx_kl | 0.04147446 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 112740 | -| policy_gradient_loss | -0.0201 | -| std | 0.0249 | -| value_loss | 0.00102 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11276 | -| time_elapsed | 62547 | -| total_timesteps | 1443328 | -| train/ | | -| approx_kl | 0.02849086 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 112750 | -| policy_gradient_loss | -0.00489 | -| std | 0.0249 | -| value_loss | 1.74e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11277 | -| time_elapsed | 62551 | -| total_timesteps | 1443456 | -| train/ | | -| approx_kl | 0.006059552 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 112760 | -| policy_gradient_loss | -0.00151 | -| std | 0.0249 | -| value_loss | 3.71e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11278 | -| time_elapsed | 62555 | -| total_timesteps | 1443584 | -| train/ | | -| approx_kl | 0.00014211796 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 112770 | -| policy_gradient_loss | -0.00285 | -| std | 0.0249 | -| value_loss | 1.23e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11279 | -| time_elapsed | 62559 | -| total_timesteps | 1443712 | -| train/ | | -| approx_kl | 0.008601384 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | 0.00171 | -| learning_rate | 0.0003 | -| loss | 0.00461 | -| n_updates | 112780 | -| policy_gradient_loss | 0.0062 | -| std | 0.0249 | -| value_loss | 3.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11280 | -| time_elapsed | 62562 | -| total_timesteps | 1443840 | -| train/ | | -| approx_kl | 0.006115397 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.0903 | -| learning_rate | 0.0003 | -| loss | -0.000938 | -| n_updates | 112790 | -| policy_gradient_loss | 0.00319 | -| std | 0.0249 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 11281 | -| time_elapsed | 62565 | -| total_timesteps | 1443968 | -| train/ | | -| approx_kl | 0.016339928 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.006 | -| n_updates | 112800 | -| policy_gradient_loss | 0.00287 | -| std | 0.0249 | -| value_loss | 4.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11282 | -| time_elapsed | 62568 | -| total_timesteps | 1444096 | -| train/ | | -| approx_kl | 0.016033674 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.0602 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 112810 | -| policy_gradient_loss | -0.00293 | -| std | 0.0249 | -| value_loss | 3.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11283 | -| time_elapsed | 62576 | -| total_timesteps | 1444224 | -| train/ | | -| approx_kl | 0.022517545 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 112820 | -| policy_gradient_loss | -0.0171 | -| std | 0.0249 | -| value_loss | 0.00391 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11284 | -| time_elapsed | 62579 | -| total_timesteps | 1444352 | -| train/ | | -| approx_kl | 0.024572147 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.00897 | -| learning_rate | 0.0003 | -| loss | 0.000929 | -| n_updates | 112830 | -| policy_gradient_loss | -0.00411 | -| std | 0.0249 | -| value_loss | 2.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11285 | -| time_elapsed | 62583 | -| total_timesteps | 1444480 | -| train/ | | -| approx_kl | 0.017437106 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.318 | -| learning_rate | 0.0003 | -| loss | -0.00861 | -| n_updates | 112840 | -| policy_gradient_loss | -0.00679 | -| std | 0.0249 | -| value_loss | 2.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11286 | -| time_elapsed | 62586 | -| total_timesteps | 1444608 | -| train/ | | -| approx_kl | 0.010099306 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.27 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.000864 | -| n_updates | 112850 | -| policy_gradient_loss | 0.00511 | -| std | 0.0249 | -| value_loss | 9.17e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11287 | -| time_elapsed | 62590 | -| total_timesteps | 1444736 | -| train/ | | -| approx_kl | 0.00057450123 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0858 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 112860 | -| policy_gradient_loss | 0.00257 | -| std | 0.0249 | -| value_loss | 7.41e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11288 | -| time_elapsed | 62593 | -| total_timesteps | 1444864 | -| train/ | | -| approx_kl | 0.015360077 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 112870 | -| policy_gradient_loss | -6.28e-05 | -| std | 0.0249 | -| value_loss | 3.75e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11289 | -| time_elapsed | 62597 | -| total_timesteps | 1444992 | -| train/ | | -| approx_kl | 9.2204195e-05 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0574 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 112880 | -| policy_gradient_loss | -0.000962 | -| std | 0.0249 | -| value_loss | 2.06e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11290 | -| time_elapsed | 62601 | -| total_timesteps | 1445120 | -| train/ | | -| approx_kl | 0.008021164 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | 0.0088 | -| n_updates | 112890 | -| policy_gradient_loss | 0.00336 | -| std | 0.0249 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11291 | -| time_elapsed | 62609 | -| total_timesteps | 1445248 | -| train/ | | -| approx_kl | 0.015999682 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.861 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 112900 | -| policy_gradient_loss | -0.0119 | -| std | 0.0248 | -| value_loss | 0.00175 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11292 | -| time_elapsed | 62613 | -| total_timesteps | 1445376 | -| train/ | | -| approx_kl | 0.01586522 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0691 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 112910 | -| policy_gradient_loss | 0.000294 | -| std | 0.0248 | -| value_loss | 6.71e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11293 | -| time_elapsed | 62617 | -| total_timesteps | 1445504 | -| train/ | | -| approx_kl | 0.0010375706 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.00627 | -| n_updates | 112920 | -| policy_gradient_loss | 0.00763 | -| std | 0.0248 | -| value_loss | 2.87e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11294 | -| time_elapsed | 62620 | -| total_timesteps | 1445632 | -| train/ | | -| approx_kl | 0.0181012 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0007 | -| n_updates | 112930 | -| policy_gradient_loss | -0.0017 | -| std | 0.0248 | -| value_loss | 1.5e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11295 | -| time_elapsed | 62623 | -| total_timesteps | 1445760 | -| train/ | | -| approx_kl | 0.014318852 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | -0.00513 | -| n_updates | 112940 | -| policy_gradient_loss | -0.00278 | -| std | 0.0248 | -| value_loss | 9.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11296 | -| time_elapsed | 62625 | -| total_timesteps | 1445888 | -| train/ | | -| approx_kl | 0.020217098 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | 0.000234 | -| n_updates | 112950 | -| policy_gradient_loss | -0.00186 | -| std | 0.0248 | -| value_loss | 5.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11297 | -| time_elapsed | 62629 | -| total_timesteps | 1446016 | -| train/ | | -| approx_kl | 0.010967189 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0489 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 112960 | -| policy_gradient_loss | 0.00539 | -| std | 0.0248 | -| value_loss | 3.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11298 | -| time_elapsed | 62636 | -| total_timesteps | 1446144 | -| train/ | | -| approx_kl | 0.060757592 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.718 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 112970 | -| policy_gradient_loss | -0.0113 | -| std | 0.0248 | -| value_loss | 0.000784 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11299 | -| time_elapsed | 62639 | -| total_timesteps | 1446272 | -| train/ | | -| approx_kl | 0.004335871 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.0498 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 112980 | -| policy_gradient_loss | 0.00467 | -| std | 0.0248 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11300 | -| time_elapsed | 62642 | -| total_timesteps | 1446400 | -| train/ | | -| approx_kl | 0.0051596644 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.799 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 112990 | -| policy_gradient_loss | -0.000722 | -| std | 0.0247 | -| value_loss | 3.49e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11301 | -| time_elapsed | 62645 | -| total_timesteps | 1446528 | -| train/ | | -| approx_kl | 0.021987323 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -5.66 | -| learning_rate | 0.0003 | -| loss | -4.44e-05 | -| n_updates | 113000 | -| policy_gradient_loss | -0.00106 | -| std | 0.0247 | -| value_loss | 4.92e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11302 | -| time_elapsed | 62648 | -| total_timesteps | 1446656 | -| train/ | | -| approx_kl | 0.020819757 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 113010 | -| policy_gradient_loss | 0.00711 | -| std | 0.0246 | -| value_loss | 3.08e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11303 | -| time_elapsed | 62651 | -| total_timesteps | 1446784 | -| train/ | | -| approx_kl | 0.007217743 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 113020 | -| policy_gradient_loss | 0.00294 | -| std | 0.0246 | -| value_loss | 1.54e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11304 | -| time_elapsed | 62656 | -| total_timesteps | 1446912 | -| train/ | | -| approx_kl | 0.0009779548 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.573 | -| learning_rate | 0.0003 | -| loss | -0.000223 | -| n_updates | 113030 | -| policy_gradient_loss | -0.001 | -| std | 0.0247 | -| value_loss | 1.49e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11305 | -| time_elapsed | 62660 | -| total_timesteps | 1447040 | -| train/ | | -| approx_kl | 0.01906731 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.00297 | -| n_updates | 113040 | -| policy_gradient_loss | 0.012 | -| std | 0.0248 | -| value_loss | 1.12e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11306 | -| time_elapsed | 62667 | -| total_timesteps | 1447168 | -| train/ | | -| approx_kl | 0.03464846 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | 0.00608 | -| n_updates | 113050 | -| policy_gradient_loss | 0.0176 | -| std | 0.0248 | -| value_loss | 0.00157 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11307 | -| time_elapsed | 62670 | -| total_timesteps | 1447296 | -| train/ | | -| approx_kl | 0.022087928 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.599 | -| learning_rate | 0.0003 | -| loss | -0.000821 | -| n_updates | 113060 | -| policy_gradient_loss | -0.00563 | -| std | 0.0248 | -| value_loss | 6.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11308 | -| time_elapsed | 62674 | -| total_timesteps | 1447424 | -| train/ | | -| approx_kl | 0.027240576 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 113070 | -| policy_gradient_loss | -0.00128 | -| std | 0.0248 | -| value_loss | 3.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11309 | -| time_elapsed | 62677 | -| total_timesteps | 1447552 | -| train/ | | -| approx_kl | 0.009176457 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.271 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 113080 | -| policy_gradient_loss | 0.00397 | -| std | 0.0248 | -| value_loss | 9.82e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11310 | -| time_elapsed | 62680 | -| total_timesteps | 1447680 | -| train/ | | -| approx_kl | 2.2585038e-05 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 2.28 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | -0.000943 | -| n_updates | 113090 | -| policy_gradient_loss | 0.000677 | -| std | 0.0246 | -| value_loss | 5.68e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11311 | -| time_elapsed | 62684 | -| total_timesteps | 1447808 | -| train/ | | -| approx_kl | 0.008292616 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 113100 | -| policy_gradient_loss | 0.00612 | -| std | 0.0246 | -| value_loss | 2.12e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11312 | -| time_elapsed | 62687 | -| total_timesteps | 1447936 | -| train/ | | -| approx_kl | 0.00054949336 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 113110 | -| policy_gradient_loss | -0.00253 | -| std | 0.0245 | -| value_loss | 2.33e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11313 | -| time_elapsed | 62691 | -| total_timesteps | 1448064 | -| train/ | | -| approx_kl | 0.0021345215 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 113120 | -| policy_gradient_loss | 0.00103 | -| std | 0.0245 | -| value_loss | 9.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11314 | -| time_elapsed | 62698 | -| total_timesteps | 1448192 | -| train/ | | -| approx_kl | 0.005383211 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 113130 | -| policy_gradient_loss | -0.00565 | -| std | 0.0245 | -| value_loss | 0.00213 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11315 | -| time_elapsed | 62702 | -| total_timesteps | 1448320 | -| train/ | | -| approx_kl | 0.00549808 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 113140 | -| policy_gradient_loss | -0.0057 | -| std | 0.0245 | -| value_loss | 1.96e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11316 | -| time_elapsed | 62705 | -| total_timesteps | 1448448 | -| train/ | | -| approx_kl | 7.910188e-06 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.313 | -| learning_rate | 0.0003 | -| loss | 0.000218 | -| n_updates | 113150 | -| policy_gradient_loss | -0.00258 | -| std | 0.0245 | -| value_loss | 1.53e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11317 | -| time_elapsed | 62708 | -| total_timesteps | 1448576 | -| train/ | | -| approx_kl | 0.00560508 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.000226 | -| n_updates | 113160 | -| policy_gradient_loss | 0.00126 | -| std | 0.0245 | -| value_loss | 1.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11318 | -| time_elapsed | 62711 | -| total_timesteps | 1448704 | -| train/ | | -| approx_kl | 0.010885036 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | 0.00503 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 113170 | -| policy_gradient_loss | -0.00473 | -| std | 0.0245 | -| value_loss | 3.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11319 | -| time_elapsed | 62714 | -| total_timesteps | 1448832 | -| train/ | | -| approx_kl | 0.01693181 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 113180 | -| policy_gradient_loss | 0.000487 | -| std | 0.0245 | -| value_loss | 9.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 11320 | -| time_elapsed | 62716 | -| total_timesteps | 1448960 | -| train/ | | -| approx_kl | 0.010105284 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.09 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 113190 | -| policy_gradient_loss | 0.00952 | -| std | 0.0245 | -| value_loss | 0.000264 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11321 | -| time_elapsed | 62718 | -| total_timesteps | 1449088 | -| train/ | | -| approx_kl | 0.003255669 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.000549 | -| n_updates | 113200 | -| policy_gradient_loss | 0.000292 | -| std | 0.0245 | -| value_loss | 4.56e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11322 | -| time_elapsed | 62724 | -| total_timesteps | 1449216 | -| train/ | | -| approx_kl | 0.23618251 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -3.69 | -| learning_rate | 0.0003 | -| loss | 0.00677 | -| n_updates | 113210 | -| policy_gradient_loss | -0.00323 | -| std | 0.0245 | -| value_loss | 0.00333 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11323 | -| time_elapsed | 62726 | -| total_timesteps | 1449344 | -| train/ | | -| approx_kl | 0.044518765 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.38 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 113220 | -| policy_gradient_loss | -0.00878 | -| std | 0.0245 | -| value_loss | 5.75e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11324 | -| time_elapsed | 62728 | -| total_timesteps | 1449472 | -| train/ | | -| approx_kl | 0.001987773 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.000894 | -| n_updates | 113230 | -| policy_gradient_loss | 0.000464 | -| std | 0.0245 | -| value_loss | 6.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11325 | -| time_elapsed | 62732 | -| total_timesteps | 1449600 | -| train/ | | -| approx_kl | 0.024301503 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.00396 | -| n_updates | 113240 | -| policy_gradient_loss | -0.00115 | -| std | 0.0245 | -| value_loss | 1.62e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11326 | -| time_elapsed | 62735 | -| total_timesteps | 1449728 | -| train/ | | -| approx_kl | 0.04213273 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.00972 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 113250 | -| policy_gradient_loss | 0.000707 | -| std | 0.0245 | -| value_loss | 4.23e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11327 | -| time_elapsed | 62739 | -| total_timesteps | 1449856 | -| train/ | | -| approx_kl | 0.0008001905 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0618 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 113260 | -| policy_gradient_loss | -0.00211 | -| std | 0.0245 | -| value_loss | 2.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11328 | -| time_elapsed | 62743 | -| total_timesteps | 1449984 | -| train/ | | -| approx_kl | 0.006494868 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | 0.000622 | -| n_updates | 113270 | -| policy_gradient_loss | 0.00258 | -| std | 0.0245 | -| value_loss | 2.06e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11329 | -| time_elapsed | 62746 | -| total_timesteps | 1450112 | -| train/ | | -| approx_kl | 0.0225939 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | 0.00192 | -| learning_rate | 0.0003 | -| loss | -0.000644 | -| n_updates | 113280 | -| policy_gradient_loss | 0.000161 | -| std | 0.0245 | -| value_loss | 4.37e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11330 | -| time_elapsed | 62755 | -| total_timesteps | 1450240 | -| train/ | | -| approx_kl | 0.025544886 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 113290 | -| policy_gradient_loss | -0.00746 | -| std | 0.0245 | -| value_loss | 0.000231 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11331 | -| time_elapsed | 62757 | -| total_timesteps | 1450368 | -| train/ | | -| approx_kl | 0.038045622 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | 0.00277 | -| learning_rate | 0.0003 | -| loss | 0.00844 | -| n_updates | 113300 | -| policy_gradient_loss | -0.000682 | -| std | 0.0245 | -| value_loss | 9.93e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11332 | -| time_elapsed | 62760 | -| total_timesteps | 1450496 | -| train/ | | -| approx_kl | 0.00026220828 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.00579 | -| learning_rate | 0.0003 | -| loss | 0.00118 | -| n_updates | 113310 | -| policy_gradient_loss | 0.0047 | -| std | 0.0245 | -| value_loss | 3.15e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11333 | -| time_elapsed | 62764 | -| total_timesteps | 1450624 | -| train/ | | -| approx_kl | 0.0028814655 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00887 | -| n_updates | 113320 | -| policy_gradient_loss | -0.00508 | -| std | 0.0244 | -| value_loss | 1.46e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11334 | -| time_elapsed | 62768 | -| total_timesteps | 1450752 | -| train/ | | -| approx_kl | 0.002963155 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -5.91 | -| learning_rate | 0.0003 | -| loss | 0.00253 | -| n_updates | 113330 | -| policy_gradient_loss | 0.00382 | -| std | 0.0244 | -| value_loss | 6.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11335 | -| time_elapsed | 62772 | -| total_timesteps | 1450880 | -| train/ | | -| approx_kl | 0.0006868886 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -31.1 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 113340 | -| policy_gradient_loss | -0.000762 | -| std | 0.0244 | -| value_loss | 6.01e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11336 | -| time_elapsed | 62775 | -| total_timesteps | 1451008 | -| train/ | | -| approx_kl | 0.027615862 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 2.29 | -| explained_variance | -0.092 | -| learning_rate | 0.0003 | -| loss | 0.00841 | -| n_updates | 113350 | -| policy_gradient_loss | 0.00122 | -| std | 0.0244 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11337 | -| time_elapsed | 62784 | -| total_timesteps | 1451136 | -| train/ | | -| approx_kl | 0.027758092 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 113360 | -| policy_gradient_loss | -0.0121 | -| std | 0.0243 | -| value_loss | 1.42e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11338 | -| time_elapsed | 62788 | -| total_timesteps | 1451264 | -| train/ | | -| approx_kl | 0.001498641 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | 0.291 | -| learning_rate | 0.0003 | -| loss | 0.0054 | -| n_updates | 113370 | -| policy_gradient_loss | -0.000985 | -| std | 0.0243 | -| value_loss | 1.14e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11339 | -| time_elapsed | 62792 | -| total_timesteps | 1451392 | -| train/ | | -| approx_kl | 0.034772377 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.00293 | -| learning_rate | 0.0003 | -| loss | -0.000394 | -| n_updates | 113380 | -| policy_gradient_loss | -0.00488 | -| std | 0.0243 | -| value_loss | 4.35e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11340 | -| time_elapsed | 62795 | -| total_timesteps | 1451520 | -| train/ | | -| approx_kl | 0.0141874915 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | 0.00276 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 113390 | -| policy_gradient_loss | 0.00979 | -| std | 0.0243 | -| value_loss | 1.93e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11341 | -| time_elapsed | 62799 | -| total_timesteps | 1451648 | -| train/ | | -| approx_kl | 0.013264375 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.00169 | -| learning_rate | 0.0003 | -| loss | 0.0051 | -| n_updates | 113400 | -| policy_gradient_loss | 0.001 | -| std | 0.0243 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11342 | -| time_elapsed | 62803 | -| total_timesteps | 1451776 | -| train/ | | -| approx_kl | 0.0009283782 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | 0.00577 | -| learning_rate | 0.0003 | -| loss | 0.00436 | -| n_updates | 113410 | -| policy_gradient_loss | 0.00289 | -| std | 0.0242 | -| value_loss | 4.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11343 | -| time_elapsed | 62808 | -| total_timesteps | 1451904 | -| train/ | | -| approx_kl | 0.019568138 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.00365 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 113420 | -| policy_gradient_loss | -0.00391 | -| std | 0.0242 | -| value_loss | 1.13e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11344 | -| time_elapsed | 62812 | -| total_timesteps | 1452032 | -| train/ | | -| approx_kl | 0.00040459726 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | -0.00465 | -| n_updates | 113430 | -| policy_gradient_loss | -0.00275 | -| std | 0.0242 | -| value_loss | 4.8e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11345 | -| time_elapsed | 62819 | -| total_timesteps | 1452160 | -| train/ | | -| approx_kl | 0.049945325 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 113440 | -| policy_gradient_loss | 0.0297 | -| std | 0.0242 | -| value_loss | 0.000129 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11346 | -| time_elapsed | 62824 | -| total_timesteps | 1452288 | -| train/ | | -| approx_kl | 0.0011594249 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.828 | -| learning_rate | 0.0003 | -| loss | 0.00398 | -| n_updates | 113450 | -| policy_gradient_loss | 0.00888 | -| std | 0.0242 | -| value_loss | 9.55e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11347 | -| time_elapsed | 62827 | -| total_timesteps | 1452416 | -| train/ | | -| approx_kl | 0.0007304093 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.00542 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 113460 | -| policy_gradient_loss | -0.00178 | -| std | 0.0242 | -| value_loss | 1.43e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11348 | -| time_elapsed | 62831 | -| total_timesteps | 1452544 | -| train/ | | -| approx_kl | 0.0048235 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.077 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 113470 | -| policy_gradient_loss | 0.00326 | -| std | 0.0242 | -| value_loss | 1.3e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11349 | -| time_elapsed | 62835 | -| total_timesteps | 1452672 | -| train/ | | -| approx_kl | 0.0327769 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | 0.0018 | -| learning_rate | 0.0003 | -| loss | 0.0454 | -| n_updates | 113480 | -| policy_gradient_loss | 0.0133 | -| std | 0.0242 | -| value_loss | 1.1e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11350 | -| time_elapsed | 62839 | -| total_timesteps | 1452800 | -| train/ | | -| approx_kl | 4.125759e-07 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 2.3 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | -8.73e-05 | -| n_updates | 113490 | -| policy_gradient_loss | -0.00546 | -| std | 0.0241 | -| value_loss | 9.39e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11351 | -| time_elapsed | 62844 | -| total_timesteps | 1452928 | -| train/ | | -| approx_kl | 0.018341184 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 113500 | -| policy_gradient_loss | 0.00372 | -| std | 0.0241 | -| value_loss | 4.66e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11352 | -| time_elapsed | 62847 | -| total_timesteps | 1453056 | -| train/ | | -| approx_kl | 0.0038662879 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 113510 | -| policy_gradient_loss | 0.000911 | -| std | 0.0241 | -| value_loss | 1.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11353 | -| time_elapsed | 62853 | -| total_timesteps | 1453184 | -| train/ | | -| approx_kl | 0.023274451 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | 0.0413 | -| n_updates | 113520 | -| policy_gradient_loss | 0.0159 | -| std | 0.0241 | -| value_loss | 0.00335 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11354 | -| time_elapsed | 62857 | -| total_timesteps | 1453312 | -| train/ | | -| approx_kl | 0.017461233 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.00267 | -| n_updates | 113530 | -| policy_gradient_loss | -0.00137 | -| std | 0.0241 | -| value_loss | 2.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11355 | -| time_elapsed | 62860 | -| total_timesteps | 1453440 | -| train/ | | -| approx_kl | 0.011191613 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00816 | -| n_updates | 113540 | -| policy_gradient_loss | 0.00202 | -| std | 0.0241 | -| value_loss | 2.88e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11356 | -| time_elapsed | 62862 | -| total_timesteps | 1453568 | -| train/ | | -| approx_kl | 1.898082e-05 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | -0.000164 | -| n_updates | 113550 | -| policy_gradient_loss | -6.55e-05 | -| std | 0.024 | -| value_loss | 5.57e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11357 | -| time_elapsed | 62865 | -| total_timesteps | 1453696 | -| train/ | | -| approx_kl | 4.0647108e-05 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.31 | -| explained_variance | -0.0792 | -| learning_rate | 0.0003 | -| loss | 0.000363 | -| n_updates | 113560 | -| policy_gradient_loss | 0.00202 | -| std | 0.0239 | -| value_loss | 7.02e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11358 | -| time_elapsed | 62868 | -| total_timesteps | 1453824 | -| train/ | | -| approx_kl | 0.00047261082 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -1.97 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 113570 | -| policy_gradient_loss | 0.00292 | -| std | 0.0239 | -| value_loss | 2.45e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11359 | -| time_elapsed | 62872 | -| total_timesteps | 1453952 | -| train/ | | -| approx_kl | 0.0077374685 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 113580 | -| policy_gradient_loss | 0.000112 | -| std | 0.0239 | -| value_loss | 9.13e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11360 | -| time_elapsed | 62875 | -| total_timesteps | 1454080 | -| train/ | | -| approx_kl | 0.036547992 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -7.53 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 113590 | -| policy_gradient_loss | -0.00188 | -| std | 0.0239 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11361 | -| time_elapsed | 62880 | -| total_timesteps | 1454208 | -| train/ | | -| approx_kl | 0.035169974 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 113600 | -| policy_gradient_loss | -0.00814 | -| std | 0.0239 | -| value_loss | 0.00436 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11362 | -| time_elapsed | 62883 | -| total_timesteps | 1454336 | -| train/ | | -| approx_kl | 0.019945275 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.454 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 113610 | -| policy_gradient_loss | 0.00541 | -| std | 0.0239 | -| value_loss | 7.15e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11363 | -| time_elapsed | 62886 | -| total_timesteps | 1454464 | -| train/ | | -| approx_kl | 0.018694347 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.00861 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 113620 | -| policy_gradient_loss | 0.0243 | -| std | 0.0239 | -| value_loss | 5.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11364 | -| time_elapsed | 62889 | -| total_timesteps | 1454592 | -| train/ | | -| approx_kl | 0.028016763 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | 0.0088 | -| n_updates | 113630 | -| policy_gradient_loss | -0.0019 | -| std | 0.0239 | -| value_loss | 4.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11365 | -| time_elapsed | 62893 | -| total_timesteps | 1454720 | -| train/ | | -| approx_kl | 0.017061135 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | -0.00648 | -| n_updates | 113640 | -| policy_gradient_loss | -0.00513 | -| std | 0.0239 | -| value_loss | 2.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11366 | -| time_elapsed | 62896 | -| total_timesteps | 1454848 | -| train/ | | -| approx_kl | 0.010005057 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 113650 | -| policy_gradient_loss | 0.00292 | -| std | 0.0239 | -| value_loss | 1.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 11367 | -| time_elapsed | 62900 | -| total_timesteps | 1454976 | -| train/ | | -| approx_kl | 0.02162003 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.00784 | -| n_updates | 113660 | -| policy_gradient_loss | 0.00358 | -| std | 0.0239 | -| value_loss | 1.32e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11368 | -| time_elapsed | 62904 | -| total_timesteps | 1455104 | -| train/ | | -| approx_kl | 0.0493701 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | -0.00827 | -| n_updates | 113670 | -| policy_gradient_loss | -0.00965 | -| std | 0.0239 | -| value_loss | 7.37e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11369 | -| time_elapsed | 62911 | -| total_timesteps | 1455232 | -| train/ | | -| approx_kl | 0.015306883 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | -0.0268 | -| n_updates | 113680 | -| policy_gradient_loss | -0.0177 | -| std | 0.0239 | -| value_loss | 0.00078 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11370 | -| time_elapsed | 62914 | -| total_timesteps | 1455360 | -| train/ | | -| approx_kl | 0.019259438 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 113690 | -| policy_gradient_loss | -0.00822 | -| std | 0.0239 | -| value_loss | 8.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11371 | -| time_elapsed | 62916 | -| total_timesteps | 1455488 | -| train/ | | -| approx_kl | 0.017717147 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 113700 | -| policy_gradient_loss | -0.011 | -| std | 0.0239 | -| value_loss | 3.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11372 | -| time_elapsed | 62919 | -| total_timesteps | 1455616 | -| train/ | | -| approx_kl | 0.022766605 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | 0.00624 | -| n_updates | 113710 | -| policy_gradient_loss | -0.00131 | -| std | 0.0239 | -| value_loss | 8.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11373 | -| time_elapsed | 62921 | -| total_timesteps | 1455744 | -| train/ | | -| approx_kl | 0.002007912 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 113720 | -| policy_gradient_loss | 0.00476 | -| std | 0.0239 | -| value_loss | 5.78e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11374 | -| time_elapsed | 62924 | -| total_timesteps | 1455872 | -| train/ | | -| approx_kl | 0.00045761606 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.00332 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 113730 | -| policy_gradient_loss | 0.00268 | -| std | 0.0239 | -| value_loss | 8.52e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11375 | -| time_elapsed | 62927 | -| total_timesteps | 1456000 | -| train/ | | -| approx_kl | 0.008108611 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0889 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 113740 | -| policy_gradient_loss | 0.00299 | -| std | 0.0238 | -| value_loss | 3.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11376 | -| time_elapsed | 62930 | -| total_timesteps | 1456128 | -| train/ | | -| approx_kl | 0.009916497 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.00299 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 113750 | -| policy_gradient_loss | 0.0001 | -| std | 0.0238 | -| value_loss | 1.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11377 | -| time_elapsed | 62938 | -| total_timesteps | 1456256 | -| train/ | | -| approx_kl | 0.005602926 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | 0.0294 | -| n_updates | 113760 | -| policy_gradient_loss | 0.00425 | -| std | 0.0238 | -| value_loss | 0.00277 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11378 | -| time_elapsed | 62942 | -| total_timesteps | 1456384 | -| train/ | | -| approx_kl | 0.007125127 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.000379 | -| n_updates | 113770 | -| policy_gradient_loss | 0.0029 | -| std | 0.0238 | -| value_loss | 0.000187 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11379 | -| time_elapsed | 62946 | -| total_timesteps | 1456512 | -| train/ | | -| approx_kl | 0.0133590065 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -6.64 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 113780 | -| policy_gradient_loss | -8.83e-06 | -| std | 0.0237 | -| value_loss | 1.1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11380 | -| time_elapsed | 62950 | -| total_timesteps | 1456640 | -| train/ | | -| approx_kl | 0.028287249 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.00639 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 113790 | -| policy_gradient_loss | -0.000995 | -| std | 0.0237 | -| value_loss | 1.62e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11381 | -| time_elapsed | 62953 | -| total_timesteps | 1456768 | -| train/ | | -| approx_kl | 0.00012525264 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.000203 | -| n_updates | 113800 | -| policy_gradient_loss | 0.000291 | -| std | 0.0237 | -| value_loss | 1.11e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 11382 | -| time_elapsed | 62956 | -| total_timesteps | 1456896 | -| train/ | | -| approx_kl | 0.0003039078 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 113810 | -| policy_gradient_loss | -0.00188 | -| std | 0.0237 | -| value_loss | 5.77e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11383 | -| time_elapsed | 62959 | -| total_timesteps | 1457024 | -| train/ | | -| approx_kl | 0.013265461 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 113820 | -| policy_gradient_loss | 0.0159 | -| std | 0.0237 | -| value_loss | 3.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11384 | -| time_elapsed | 62967 | -| total_timesteps | 1457152 | -| train/ | | -| approx_kl | 0.055143442 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 113830 | -| policy_gradient_loss | -0.0134 | -| std | 0.0238 | -| value_loss | 0.00185 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11385 | -| time_elapsed | 62970 | -| total_timesteps | 1457280 | -| train/ | | -| approx_kl | 0.018939782 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -14.4 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 113840 | -| policy_gradient_loss | -0.00926 | -| std | 0.0238 | -| value_loss | 4.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11386 | -| time_elapsed | 62973 | -| total_timesteps | 1457408 | -| train/ | | -| approx_kl | 0.0016343952 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -11.7 | -| learning_rate | 0.0003 | -| loss | -0.00453 | -| n_updates | 113850 | -| policy_gradient_loss | -0.00432 | -| std | 0.0238 | -| value_loss | 4.75e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11387 | -| time_elapsed | 62977 | -| total_timesteps | 1457536 | -| train/ | | -| approx_kl | 3.763335e-05 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | 0.000467 | -| n_updates | 113860 | -| policy_gradient_loss | 0.0124 | -| std | 0.0238 | -| value_loss | 2.16e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11388 | -| time_elapsed | 62980 | -| total_timesteps | 1457664 | -| train/ | | -| approx_kl | 0.0022611916 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.000214 | -| n_updates | 113870 | -| policy_gradient_loss | 0.000388 | -| std | 0.0237 | -| value_loss | 1.35e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11389 | -| time_elapsed | 62983 | -| total_timesteps | 1457792 | -| train/ | | -| approx_kl | 0.0019586426 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.00188 | -| n_updates | 113880 | -| policy_gradient_loss | 0.000749 | -| std | 0.0237 | -| value_loss | 1.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11390 | -| time_elapsed | 62986 | -| total_timesteps | 1457920 | -| train/ | | -| approx_kl | 0.020214487 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 113890 | -| policy_gradient_loss | -0.00247 | -| std | 0.0237 | -| value_loss | 2.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11391 | -| time_elapsed | 62989 | -| total_timesteps | 1458048 | -| train/ | | -| approx_kl | 0.007419088 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00991 | -| n_updates | 113900 | -| policy_gradient_loss | -0.00439 | -| std | 0.0237 | -| value_loss | 8.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11392 | -| time_elapsed | 62995 | -| total_timesteps | 1458176 | -| train/ | | -| approx_kl | 0.017454244 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | 0.0604 | -| n_updates | 113910 | -| policy_gradient_loss | 0.0237 | -| std | 0.0237 | -| value_loss | 0.000604 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11393 | -| time_elapsed | 62998 | -| total_timesteps | 1458304 | -| train/ | | -| approx_kl | 0.009646293 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.473 | -| learning_rate | 0.0003 | -| loss | -0.000111 | -| n_updates | 113920 | -| policy_gradient_loss | 0.00231 | -| std | 0.0237 | -| value_loss | 2.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11394 | -| time_elapsed | 63003 | -| total_timesteps | 1458432 | -| train/ | | -| approx_kl | 0.010057669 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0908 | -| learning_rate | 0.0003 | -| loss | -0.00986 | -| n_updates | 113930 | -| policy_gradient_loss | -0.00672 | -| std | 0.0237 | -| value_loss | 2.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11395 | -| time_elapsed | 63007 | -| total_timesteps | 1458560 | -| train/ | | -| approx_kl | 0.012027385 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.46 | -| learning_rate | 0.0003 | -| loss | -0.0246 | -| n_updates | 113940 | -| policy_gradient_loss | -0.0168 | -| std | 0.0237 | -| value_loss | 3.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11396 | -| time_elapsed | 63011 | -| total_timesteps | 1458688 | -| train/ | | -| approx_kl | 0.004933515 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.661 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 113950 | -| policy_gradient_loss | 0.0016 | -| std | 0.0237 | -| value_loss | 2.06e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11397 | -| time_elapsed | 63014 | -| total_timesteps | 1458816 | -| train/ | | -| approx_kl | 0.0132041555 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.00352 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 113960 | -| policy_gradient_loss | -0.00459 | -| std | 0.0237 | -| value_loss | 7.19e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11398 | -| time_elapsed | 63019 | -| total_timesteps | 1458944 | -| train/ | | -| approx_kl | 0.0021496303 | -| clip_fraction | 0.00859 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.781 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 113970 | -| policy_gradient_loss | -0.000968 | -| std | 0.0238 | -| value_loss | 3.13e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11399 | -| time_elapsed | 63022 | -| total_timesteps | 1459072 | -| train/ | | -| approx_kl | 0.00396115 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.00743 | -| learning_rate | 0.0003 | -| loss | -8.39e-05 | -| n_updates | 113980 | -| policy_gradient_loss | -1.85e-05 | -| std | 0.0238 | -| value_loss | 8.7e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11400 | -| time_elapsed | 63027 | -| total_timesteps | 1459200 | -| train/ | | -| approx_kl | 0.0021494431 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.851 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 113990 | -| policy_gradient_loss | -0.0125 | -| std | 0.0238 | -| value_loss | 0.00294 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11401 | -| time_elapsed | 63031 | -| total_timesteps | 1459328 | -| train/ | | -| approx_kl | 0.00035674125 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 114000 | -| policy_gradient_loss | 0.004 | -| std | 0.0238 | -| value_loss | 4.66e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11402 | -| time_elapsed | 63035 | -| total_timesteps | 1459456 | -| train/ | | -| approx_kl | 0.044946536 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.749 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 114010 | -| policy_gradient_loss | -0.00174 | -| std | 0.0238 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11403 | -| time_elapsed | 63038 | -| total_timesteps | 1459584 | -| train/ | | -| approx_kl | 0.043004192 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 114020 | -| policy_gradient_loss | 0.000264 | -| std | 0.0238 | -| value_loss | 5.59e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11404 | -| time_elapsed | 63043 | -| total_timesteps | 1459712 | -| train/ | | -| approx_kl | 0.0070618633 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0879 | -| learning_rate | 0.0003 | -| loss | -5.74e-05 | -| n_updates | 114030 | -| policy_gradient_loss | 0.0033 | -| std | 0.0237 | -| value_loss | 4.99e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11405 | -| time_elapsed | 63046 | -| total_timesteps | 1459840 | -| train/ | | -| approx_kl | 0.019533813 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | 0.00683 | -| n_updates | 114040 | -| policy_gradient_loss | 0.00318 | -| std | 0.0237 | -| value_loss | 1.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11406 | -| time_elapsed | 63049 | -| total_timesteps | 1459968 | -| train/ | | -| approx_kl | 0.010715446 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.00646 | -| n_updates | 114050 | -| policy_gradient_loss | 0.00011 | -| std | 0.0237 | -| value_loss | 3.29e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11407 | -| time_elapsed | 63052 | -| total_timesteps | 1460096 | -| train/ | | -| approx_kl | 0.0005751839 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 114060 | -| policy_gradient_loss | 0.0016 | -| std | 0.0237 | -| value_loss | 2.11e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11408 | -| time_elapsed | 63060 | -| total_timesteps | 1460224 | -| train/ | | -| approx_kl | 0.03211065 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | 0.783 | -| learning_rate | 0.0003 | -| loss | -0.00414 | -| n_updates | 114070 | -| policy_gradient_loss | -0.0118 | -| std | 0.0237 | -| value_loss | 0.00607 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11409 | -| time_elapsed | 63064 | -| total_timesteps | 1460352 | -| train/ | | -| approx_kl | 0.028925927 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.0219 | -| n_updates | 114080 | -| policy_gradient_loss | -0.0136 | -| std | 0.0237 | -| value_loss | 0.000241 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11410 | -| time_elapsed | 63068 | -| total_timesteps | 1460480 | -| train/ | | -| approx_kl | 0.0024651955 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.32 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.00611 | -| n_updates | 114090 | -| policy_gradient_loss | 0.00454 | -| std | 0.0236 | -| value_loss | 0.0018 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11411 | -| time_elapsed | 63072 | -| total_timesteps | 1460608 | -| train/ | | -| approx_kl | 0.0001429827 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.00048 | -| n_updates | 114100 | -| policy_gradient_loss | 0.00828 | -| std | 0.0236 | -| value_loss | 0.000535 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11412 | -| time_elapsed | 63077 | -| total_timesteps | 1460736 | -| train/ | | -| approx_kl | 0.010428244 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00364 | -| n_updates | 114110 | -| policy_gradient_loss | 7.68e-05 | -| std | 0.0236 | -| value_loss | 0.000534 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11413 | -| time_elapsed | 63080 | -| total_timesteps | 1460864 | -| train/ | | -| approx_kl | 0.024683377 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.00542 | -| n_updates | 114120 | -| policy_gradient_loss | -0.000852 | -| std | 0.0236 | -| value_loss | 0.000174 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11414 | -| time_elapsed | 63082 | -| total_timesteps | 1460992 | -| train/ | | -| approx_kl | 0.043486953 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 114130 | -| policy_gradient_loss | 0.00193 | -| std | 0.0235 | -| value_loss | 5.58e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11415 | -| time_elapsed | 63086 | -| total_timesteps | 1461120 | -| train/ | | -| approx_kl | 0.009525681 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0653 | -| learning_rate | 0.0003 | -| loss | 0.0038 | -| n_updates | 114140 | -| policy_gradient_loss | 0.00593 | -| std | 0.0235 | -| value_loss | 3.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11416 | -| time_elapsed | 63097 | -| total_timesteps | 1461248 | -| train/ | | -| approx_kl | 0.055496104 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 114150 | -| policy_gradient_loss | 0.0215 | -| std | 0.0235 | -| value_loss | 0.00168 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11417 | -| time_elapsed | 63101 | -| total_timesteps | 1461376 | -| train/ | | -| approx_kl | 0.02989395 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 114160 | -| policy_gradient_loss | 0.0324 | -| std | 0.0235 | -| value_loss | 1.41e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11418 | -| time_elapsed | 63105 | -| total_timesteps | 1461504 | -| train/ | | -| approx_kl | 0.009426344 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0853 | -| learning_rate | 0.0003 | -| loss | 0.000807 | -| n_updates | 114170 | -| policy_gradient_loss | 0.000683 | -| std | 0.0235 | -| value_loss | 7.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11419 | -| time_elapsed | 63109 | -| total_timesteps | 1461632 | -| train/ | | -| approx_kl | 0.009497363 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.00286 | -| n_updates | 114180 | -| policy_gradient_loss | 0.00327 | -| std | 0.0235 | -| value_loss | 8.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11420 | -| time_elapsed | 63113 | -| total_timesteps | 1461760 | -| train/ | | -| approx_kl | 0.012419781 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | 0.000591 | -| n_updates | 114190 | -| policy_gradient_loss | 0.000421 | -| std | 0.0235 | -| value_loss | 4.53e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11421 | -| time_elapsed | 63117 | -| total_timesteps | 1461888 | -| train/ | | -| approx_kl | 0.02159205 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0878 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 114200 | -| policy_gradient_loss | -0.00568 | -| std | 0.0235 | -| value_loss | 3.54e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11422 | -| time_elapsed | 63120 | -| total_timesteps | 1462016 | -| train/ | | -| approx_kl | 0.0043673273 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.33 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 114210 | -| policy_gradient_loss | -0.00799 | -| std | 0.0234 | -| value_loss | 2.87e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11423 | -| time_elapsed | 63129 | -| total_timesteps | 1462144 | -| train/ | | -| approx_kl | 0.12756342 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 114220 | -| policy_gradient_loss | 0.00971 | -| std | 0.0234 | -| value_loss | 0.000701 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11424 | -| time_elapsed | 63134 | -| total_timesteps | 1462272 | -| train/ | | -| approx_kl | 0.029047204 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | 0.211 | -| learning_rate | 0.0003 | -| loss | 0.0456 | -| n_updates | 114230 | -| policy_gradient_loss | 0.0216 | -| std | 0.0234 | -| value_loss | 1.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11425 | -| time_elapsed | 63138 | -| total_timesteps | 1462400 | -| train/ | | -| approx_kl | 0.009795172 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -0.87 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 114240 | -| policy_gradient_loss | -0.000522 | -| std | 0.0233 | -| value_loss | 2.41e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11426 | -| time_elapsed | 63140 | -| total_timesteps | 1462528 | -| train/ | | -| approx_kl | 0.0046957503 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 114250 | -| policy_gradient_loss | 0.00106 | -| std | 0.0233 | -| value_loss | 8.8e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11427 | -| time_elapsed | 63145 | -| total_timesteps | 1462656 | -| train/ | | -| approx_kl | 0.005616693 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 114260 | -| policy_gradient_loss | -0.00724 | -| std | 0.0233 | -| value_loss | 3.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11428 | -| time_elapsed | 63148 | -| total_timesteps | 1462784 | -| train/ | | -| approx_kl | 0.018910415 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -0.0801 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 114270 | -| policy_gradient_loss | 0.00369 | -| std | 0.0233 | -| value_loss | 4.72e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11429 | -| time_elapsed | 63152 | -| total_timesteps | 1462912 | -| train/ | | -| approx_kl | 4.7114212e-05 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 114280 | -| policy_gradient_loss | -0.00825 | -| std | 0.0233 | -| value_loss | 7.3e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11430 | -| time_elapsed | 63155 | -| total_timesteps | 1463040 | -| train/ | | -| approx_kl | 0.005618941 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 114290 | -| policy_gradient_loss | 0.000889 | -| std | 0.0233 | -| value_loss | 3.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11431 | -| time_elapsed | 63161 | -| total_timesteps | 1463168 | -| train/ | | -| approx_kl | 0.038518142 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | 0.951 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 114300 | -| policy_gradient_loss | -0.0138 | -| std | 0.0233 | -| value_loss | 0.000457 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11432 | -| time_elapsed | 63164 | -| total_timesteps | 1463296 | -| train/ | | -| approx_kl | 0.0024208487 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -90.2 | -| learning_rate | 0.0003 | -| loss | 0.00224 | -| n_updates | 114310 | -| policy_gradient_loss | 0.00177 | -| std | 0.0233 | -| value_loss | 8.15e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11433 | -| time_elapsed | 63168 | -| total_timesteps | 1463424 | -| train/ | | -| approx_kl | 0.0019258885 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -53.5 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 114320 | -| policy_gradient_loss | -0.00201 | -| std | 0.0232 | -| value_loss | 2.48e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11434 | -| time_elapsed | 63172 | -| total_timesteps | 1463552 | -| train/ | | -| approx_kl | 0.00029201806 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.34 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | 0.000322 | -| n_updates | 114330 | -| policy_gradient_loss | 8.72e-05 | -| std | 0.0232 | -| value_loss | 5.38e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11435 | -| time_elapsed | 63175 | -| total_timesteps | 1463680 | -| train/ | | -| approx_kl | 2.844911e-05 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -0.869 | -| learning_rate | 0.0003 | -| loss | -0.000421 | -| n_updates | 114340 | -| policy_gradient_loss | 0.00368 | -| std | 0.0232 | -| value_loss | 1.46e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11436 | -| time_elapsed | 63179 | -| total_timesteps | 1463808 | -| train/ | | -| approx_kl | 0.008251096 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | 0.00774 | -| n_updates | 114350 | -| policy_gradient_loss | 0.00501 | -| std | 0.0232 | -| value_loss | 2.52e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11437 | -| time_elapsed | 63183 | -| total_timesteps | 1463936 | -| train/ | | -| approx_kl | 0.0035196561 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -0.00106 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 114360 | -| policy_gradient_loss | 0.00823 | -| std | 0.0231 | -| value_loss | 3.84e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11438 | -| time_elapsed | 63186 | -| total_timesteps | 1464064 | -| train/ | | -| approx_kl | 0.005048562 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -0.0955 | -| learning_rate | 0.0003 | -| loss | 0.00459 | -| n_updates | 114370 | -| policy_gradient_loss | 0.0079 | -| std | 0.0231 | -| value_loss | 1.05e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11439 | -| time_elapsed | 63193 | -| total_timesteps | 1464192 | -| train/ | | -| approx_kl | 0.026358714 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | 0.876 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 114380 | -| policy_gradient_loss | -0.00677 | -| std | 0.0231 | -| value_loss | 0.00228 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11440 | -| time_elapsed | 63197 | -| total_timesteps | 1464320 | -| train/ | | -| approx_kl | 0.014256541 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 114390 | -| policy_gradient_loss | 1.96e-05 | -| std | 0.0231 | -| value_loss | 3.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11441 | -| time_elapsed | 63201 | -| total_timesteps | 1464448 | -| train/ | | -| approx_kl | 0.040225618 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -7.98 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 114400 | -| policy_gradient_loss | -0.00798 | -| std | 0.0231 | -| value_loss | 1.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11442 | -| time_elapsed | 63204 | -| total_timesteps | 1464576 | -| train/ | | -| approx_kl | 0.035836063 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | 0.00653 | -| n_updates | 114410 | -| policy_gradient_loss | -0.00134 | -| std | 0.0231 | -| value_loss | 1.12e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11443 | -| time_elapsed | 63207 | -| total_timesteps | 1464704 | -| train/ | | -| approx_kl | 0.05391097 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -2.8 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 114420 | -| policy_gradient_loss | -0.000453 | -| std | 0.0232 | -| value_loss | 9.24e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11444 | -| time_elapsed | 63210 | -| total_timesteps | 1464832 | -| train/ | | -| approx_kl | 0.0036972547 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 114430 | -| policy_gradient_loss | -0.00108 | -| std | 0.0232 | -| value_loss | 1.79e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11445 | -| time_elapsed | 63213 | -| total_timesteps | 1464960 | -| train/ | | -| approx_kl | 0.0012471047 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.00696 | -| n_updates | 114440 | -| policy_gradient_loss | -0.00871 | -| std | 0.0231 | -| value_loss | 9.49e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11446 | -| time_elapsed | 63217 | -| total_timesteps | 1465088 | -| train/ | | -| approx_kl | 0.0014673756 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -0.357 | -| learning_rate | 0.0003 | -| loss | -0.000905 | -| n_updates | 114450 | -| policy_gradient_loss | 0.000532 | -| std | 0.0231 | -| value_loss | 4.12e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11447 | -| time_elapsed | 63224 | -| total_timesteps | 1465216 | -| train/ | | -| approx_kl | 0.07365139 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 114460 | -| policy_gradient_loss | -0.0188 | -| std | 0.023 | -| value_loss | 0.000702 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11448 | -| time_elapsed | 63226 | -| total_timesteps | 1465344 | -| train/ | | -| approx_kl | 0.0005983999 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.35 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | 0.00387 | -| n_updates | 114470 | -| policy_gradient_loss | 0.00136 | -| std | 0.023 | -| value_loss | 5.92e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11449 | -| time_elapsed | 63229 | -| total_timesteps | 1465472 | -| train/ | | -| approx_kl | 0.0020159981 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -8.44 | -| learning_rate | 0.0003 | -| loss | -2.8e-06 | -| n_updates | 114480 | -| policy_gradient_loss | 0.000387 | -| std | 0.0229 | -| value_loss | 7.91e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11450 | -| time_elapsed | 63233 | -| total_timesteps | 1465600 | -| train/ | | -| approx_kl | 0.0070378645 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.0878 | -| learning_rate | 0.0003 | -| loss | -0.0044 | -| n_updates | 114490 | -| policy_gradient_loss | -0.000765 | -| std | 0.0229 | -| value_loss | 0.00099 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11451 | -| time_elapsed | 63237 | -| total_timesteps | 1465728 | -| train/ | | -| approx_kl | 0.034319676 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 114500 | -| policy_gradient_loss | 0.00383 | -| std | 0.0229 | -| value_loss | 0.00171 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11452 | -| time_elapsed | 63241 | -| total_timesteps | 1465856 | -| train/ | | -| approx_kl | 0.0511854 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.00727 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 114510 | -| policy_gradient_loss | 0.00184 | -| std | 0.0229 | -| value_loss | 7.84e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 11453 | -| time_elapsed | 63244 | -| total_timesteps | 1465984 | -| train/ | | -| approx_kl | 0.0012314492 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 114520 | -| policy_gradient_loss | -0.00399 | -| std | 0.0229 | -| value_loss | 6.02e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11454 | -| time_elapsed | 63249 | -| total_timesteps | 1466112 | -| train/ | | -| approx_kl | 0.007637729 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 114530 | -| policy_gradient_loss | 1.66e-05 | -| std | 0.0229 | -| value_loss | 3.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11455 | -| time_elapsed | 63257 | -| total_timesteps | 1466240 | -| train/ | | -| approx_kl | 0.019668035 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 114540 | -| policy_gradient_loss | -0.00796 | -| std | 0.0229 | -| value_loss | 0.00191 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11456 | -| time_elapsed | 63260 | -| total_timesteps | 1466368 | -| train/ | | -| approx_kl | 0.008056261 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.000806 | -| n_updates | 114550 | -| policy_gradient_loss | 0.00126 | -| std | 0.0229 | -| value_loss | 1e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11457 | -| time_elapsed | 63263 | -| total_timesteps | 1466496 | -| train/ | | -| approx_kl | 0.0043835156 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 114560 | -| policy_gradient_loss | -0.0132 | -| std | 0.0229 | -| value_loss | 7.3e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11458 | -| time_elapsed | 63266 | -| total_timesteps | 1466624 | -| train/ | | -| approx_kl | 0.011314765 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 114570 | -| policy_gradient_loss | -0.0105 | -| std | 0.0229 | -| value_loss | 4.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11459 | -| time_elapsed | 63270 | -| total_timesteps | 1466752 | -| train/ | | -| approx_kl | 0.0009186696 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 114580 | -| policy_gradient_loss | -0.00303 | -| std | 0.0228 | -| value_loss | 6.94e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11460 | -| time_elapsed | 63272 | -| total_timesteps | 1466880 | -| train/ | | -| approx_kl | 0.03424914 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 114590 | -| policy_gradient_loss | -0.00558 | -| std | 0.0228 | -| value_loss | 1.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11461 | -| time_elapsed | 63276 | -| total_timesteps | 1467008 | -| train/ | | -| approx_kl | 0.018212717 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 114600 | -| policy_gradient_loss | -0.00192 | -| std | 0.0228 | -| value_loss | 4.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11462 | -| time_elapsed | 63285 | -| total_timesteps | 1467136 | -| train/ | | -| approx_kl | 0.041161153 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | 0.857 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 114610 | -| policy_gradient_loss | -0.0201 | -| std | 0.0228 | -| value_loss | 0.000961 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11463 | -| time_elapsed | 63288 | -| total_timesteps | 1467264 | -| train/ | | -| approx_kl | 0.0047479817 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | 0.0615 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 114620 | -| policy_gradient_loss | 0.00593 | -| std | 0.0228 | -| value_loss | 8.98e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11464 | -| time_elapsed | 63291 | -| total_timesteps | 1467392 | -| train/ | | -| approx_kl | 0.0002660309 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 2.36 | -| explained_variance | -280 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 114630 | -| policy_gradient_loss | 0.00168 | -| std | 0.0227 | -| value_loss | 0.00011 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11465 | -| time_elapsed | 63295 | -| total_timesteps | 1467520 | -| train/ | | -| approx_kl | 0.000735268 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.408 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 114640 | -| policy_gradient_loss | 0.00548 | -| std | 0.0227 | -| value_loss | 0.00111 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11466 | -| time_elapsed | 63299 | -| total_timesteps | 1467648 | -| train/ | | -| approx_kl | 0.005423094 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 114650 | -| policy_gradient_loss | -0.000392 | -| std | 0.0227 | -| value_loss | 2.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11467 | -| time_elapsed | 63302 | -| total_timesteps | 1467776 | -| train/ | | -| approx_kl | 0.007463872 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0969 | -| learning_rate | 0.0003 | -| loss | 0.00975 | -| n_updates | 114660 | -| policy_gradient_loss | 0.012 | -| std | 0.0227 | -| value_loss | 1.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11468 | -| time_elapsed | 63305 | -| total_timesteps | 1467904 | -| train/ | | -| approx_kl | 0.008728024 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.00804 | -| n_updates | 114670 | -| policy_gradient_loss | 0.0135 | -| std | 0.0227 | -| value_loss | 6.54e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11469 | -| time_elapsed | 63309 | -| total_timesteps | 1468032 | -| train/ | | -| approx_kl | 0.01690026 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0561 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 114680 | -| policy_gradient_loss | -0.00537 | -| std | 0.0227 | -| value_loss | 4.82e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11470 | -| time_elapsed | 63317 | -| total_timesteps | 1468160 | -| train/ | | -| approx_kl | 0.009706715 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.0274 | -| n_updates | 114690 | -| policy_gradient_loss | -0.0127 | -| std | 0.0227 | -| value_loss | 0.000353 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11471 | -| time_elapsed | 63321 | -| total_timesteps | 1468288 | -| train/ | | -| approx_kl | 0.0014126184 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.33 | -| learning_rate | 0.0003 | -| loss | 0.000767 | -| n_updates | 114700 | -| policy_gradient_loss | 0.0171 | -| std | 0.0227 | -| value_loss | 7.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11472 | -| time_elapsed | 63324 | -| total_timesteps | 1468416 | -| train/ | | -| approx_kl | 0.007075112 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 114710 | -| policy_gradient_loss | 0.0118 | -| std | 0.0227 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11473 | -| time_elapsed | 63327 | -| total_timesteps | 1468544 | -| train/ | | -| approx_kl | 0.0065320674 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 114720 | -| policy_gradient_loss | 0.00489 | -| std | 0.0227 | -| value_loss | 3.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11474 | -| time_elapsed | 63330 | -| total_timesteps | 1468672 | -| train/ | | -| approx_kl | 0.02102003 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 114730 | -| policy_gradient_loss | -0.00258 | -| std | 0.0227 | -| value_loss | 2.29e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11475 | -| time_elapsed | 63335 | -| total_timesteps | 1468800 | -| train/ | | -| approx_kl | 0.02483423 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | 0.00842 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 114740 | -| policy_gradient_loss | 0.00382 | -| std | 0.0227 | -| value_loss | 2.76e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 11476 | -| time_elapsed | 63339 | -| total_timesteps | 1468928 | -| train/ | | -| approx_kl | 0.00031954097 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 114750 | -| policy_gradient_loss | -0.0102 | -| std | 0.0227 | -| value_loss | 2.04e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11477 | -| time_elapsed | 63344 | -| total_timesteps | 1469056 | -| train/ | | -| approx_kl | 0.03187271 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 114760 | -| policy_gradient_loss | -0.00343 | -| std | 0.0227 | -| value_loss | 8.9e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11478 | -| time_elapsed | 63351 | -| total_timesteps | 1469184 | -| train/ | | -| approx_kl | 0.0062966864 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 114770 | -| policy_gradient_loss | -0.00927 | -| std | 0.0226 | -| value_loss | 0.000705 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11479 | -| time_elapsed | 63355 | -| total_timesteps | 1469312 | -| train/ | | -| approx_kl | 0.01694671 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.00159 | -| n_updates | 114780 | -| policy_gradient_loss | 0.00803 | -| std | 0.0226 | -| value_loss | 6.2e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11480 | -| time_elapsed | 63359 | -| total_timesteps | 1469440 | -| train/ | | -| approx_kl | 0.02843767 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0964 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 114790 | -| policy_gradient_loss | 0.00527 | -| std | 0.0226 | -| value_loss | 1.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11481 | -| time_elapsed | 63362 | -| total_timesteps | 1469568 | -| train/ | | -| approx_kl | 0.01172491 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.00526 | -| n_updates | 114800 | -| policy_gradient_loss | 0.0026 | -| std | 0.0226 | -| value_loss | 9.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11482 | -| time_elapsed | 63364 | -| total_timesteps | 1469696 | -| train/ | | -| approx_kl | 0.024542574 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 114810 | -| policy_gradient_loss | 0.00691 | -| std | 0.0226 | -| value_loss | 6.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11483 | -| time_elapsed | 63367 | -| total_timesteps | 1469824 | -| train/ | | -| approx_kl | 0.018031681 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 114820 | -| policy_gradient_loss | -0.000287 | -| std | 0.0226 | -| value_loss | 4.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11484 | -| time_elapsed | 63371 | -| total_timesteps | 1469952 | -| train/ | | -| approx_kl | 0.007847371 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.000833 | -| n_updates | 114830 | -| policy_gradient_loss | 0.000691 | -| std | 0.0226 | -| value_loss | 2.96e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11485 | -| time_elapsed | 63374 | -| total_timesteps | 1470080 | -| train/ | | -| approx_kl | 0.0022566505 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -0.0737 | -| learning_rate | 0.0003 | -| loss | -7.76e-05 | -| n_updates | 114840 | -| policy_gradient_loss | 0.000908 | -| std | 0.0226 | -| value_loss | 3.1e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11486 | -| time_elapsed | 63380 | -| total_timesteps | 1470208 | -| train/ | | -| approx_kl | 0.16085654 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | 0.576 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 114850 | -| policy_gradient_loss | -0.0188 | -| std | 0.0226 | -| value_loss | 0.00146 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11487 | -| time_elapsed | 63384 | -| total_timesteps | 1470336 | -| train/ | | -| approx_kl | 0.02879019 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -8.84 | -| learning_rate | 0.0003 | -| loss | 0.000858 | -| n_updates | 114860 | -| policy_gradient_loss | -0.00234 | -| std | 0.0225 | -| value_loss | 1.27e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11488 | -| time_elapsed | 63388 | -| total_timesteps | 1470464 | -| train/ | | -| approx_kl | 6.0563907e-06 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.37 | -| explained_variance | -18.5 | -| learning_rate | 0.0003 | -| loss | -0.0001 | -| n_updates | 114870 | -| policy_gradient_loss | 0.000414 | -| std | 0.0225 | -| value_loss | 1.1e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11489 | -| time_elapsed | 63391 | -| total_timesteps | 1470592 | -| train/ | | -| approx_kl | 0.005712333 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 114880 | -| policy_gradient_loss | 0.00295 | -| std | 0.0225 | -| value_loss | 3.87e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11490 | -| time_elapsed | 63394 | -| total_timesteps | 1470720 | -| train/ | | -| approx_kl | 0.0030984646 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.00708 | -| n_updates | 114890 | -| policy_gradient_loss | 0.0033 | -| std | 0.0225 | -| value_loss | 1.42e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11491 | -| time_elapsed | 63397 | -| total_timesteps | 1470848 | -| train/ | | -| approx_kl | 0.0062847803 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -0.00464 | -| learning_rate | 0.0003 | -| loss | 0.00336 | -| n_updates | 114900 | -| policy_gradient_loss | 0.00889 | -| std | 0.0224 | -| value_loss | 1.5e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11492 | -| time_elapsed | 63400 | -| total_timesteps | 1470976 | -| train/ | | -| approx_kl | 2.6798807e-06 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -0.07 | -| learning_rate | 0.0003 | -| loss | 4.51e-05 | -| n_updates | 114910 | -| policy_gradient_loss | 0.0104 | -| std | 0.0224 | -| value_loss | 1.05e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11493 | -| time_elapsed | 63403 | -| total_timesteps | 1471104 | -| train/ | | -| approx_kl | 0.008619113 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | -0.000239 | -| n_updates | 114920 | -| policy_gradient_loss | 0.00259 | -| std | 0.0224 | -| value_loss | 2.75e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11494 | -| time_elapsed | 63411 | -| total_timesteps | 1471232 | -| train/ | | -| approx_kl | 0.047252536 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | 0.925 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 114930 | -| policy_gradient_loss | -0.00961 | -| std | 0.0224 | -| value_loss | 0.000816 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11495 | -| time_elapsed | 63414 | -| total_timesteps | 1471360 | -| train/ | | -| approx_kl | 0.0036269934 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -39.9 | -| learning_rate | 0.0003 | -| loss | -0.000814 | -| n_updates | 114940 | -| policy_gradient_loss | 0.000185 | -| std | 0.0224 | -| value_loss | 3.04e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11496 | -| time_elapsed | 63417 | -| total_timesteps | 1471488 | -| train/ | | -| approx_kl | 0.0055782525 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -21.5 | -| learning_rate | 0.0003 | -| loss | -0.000923 | -| n_updates | 114950 | -| policy_gradient_loss | -0.000334 | -| std | 0.0224 | -| value_loss | 8.86e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11497 | -| time_elapsed | 63420 | -| total_timesteps | 1471616 | -| train/ | | -| approx_kl | 0.05877144 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -4.05 | -| learning_rate | 0.0003 | -| loss | -0.00879 | -| n_updates | 114960 | -| policy_gradient_loss | -0.00863 | -| std | 0.0223 | -| value_loss | 1.03e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11498 | -| time_elapsed | 63424 | -| total_timesteps | 1471744 | -| train/ | | -| approx_kl | 0.040756833 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -1.77 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 114970 | -| policy_gradient_loss | -0.0119 | -| std | 0.0223 | -| value_loss | 1.38e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 11499 | -| time_elapsed | 63425 | -| total_timesteps | 1471872 | -| train/ | | -| approx_kl | 0.01852651 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.38 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | 0.00612 | -| n_updates | 114980 | -| policy_gradient_loss | 0.0032 | -| std | 0.0223 | -| value_loss | 1.18e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11500 | -| time_elapsed | 63429 | -| total_timesteps | 1472000 | -| train/ | | -| approx_kl | 0.016932957 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.756 | -| learning_rate | 0.0003 | -| loss | 0.00383 | -| n_updates | 114990 | -| policy_gradient_loss | 0.00122 | -| std | 0.0223 | -| value_loss | 1.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11501 | -| time_elapsed | 63431 | -| total_timesteps | 1472128 | -| train/ | | -| approx_kl | 0.021889996 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.00665 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 115000 | -| policy_gradient_loss | -0.00144 | -| std | 0.0223 | -| value_loss | 1.81e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11502 | -| time_elapsed | 63438 | -| total_timesteps | 1472256 | -| train/ | | -| approx_kl | 0.12122247 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 115010 | -| policy_gradient_loss | -0.0156 | -| std | 0.0223 | -| value_loss | 0.0053 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11503 | -| time_elapsed | 63442 | -| total_timesteps | 1472384 | -| train/ | | -| approx_kl | 0.020506503 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 115020 | -| policy_gradient_loss | 0.0162 | -| std | 0.0223 | -| value_loss | 2.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11504 | -| time_elapsed | 63446 | -| total_timesteps | 1472512 | -| train/ | | -| approx_kl | 0.0029811761 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.85 | -| learning_rate | 0.0003 | -| loss | 4.01e-05 | -| n_updates | 115030 | -| policy_gradient_loss | 0.000713 | -| std | 0.0223 | -| value_loss | 1.14e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11505 | -| time_elapsed | 63450 | -| total_timesteps | 1472640 | -| train/ | | -| approx_kl | 0.045289494 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -6.27 | -| learning_rate | 0.0003 | -| loss | 0.0063 | -| n_updates | 115040 | -| policy_gradient_loss | 0.00105 | -| std | 0.0222 | -| value_loss | 2.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11506 | -| time_elapsed | 63453 | -| total_timesteps | 1472768 | -| train/ | | -| approx_kl | 0.027813412 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 115050 | -| policy_gradient_loss | -0.000819 | -| std | 0.0222 | -| value_loss | 4.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11507 | -| time_elapsed | 63456 | -| total_timesteps | 1472896 | -| train/ | | -| approx_kl | 0.006840165 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 115060 | -| policy_gradient_loss | 0.00884 | -| std | 0.0222 | -| value_loss | 8.58e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11508 | -| time_elapsed | 63461 | -| total_timesteps | 1473024 | -| train/ | | -| approx_kl | 0.0009496929 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.00353 | -| n_updates | 115070 | -| policy_gradient_loss | 0.0052 | -| std | 0.0222 | -| value_loss | 3.68e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11509 | -| time_elapsed | 63468 | -| total_timesteps | 1473152 | -| train/ | | -| approx_kl | 0.06353333 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 115080 | -| policy_gradient_loss | -0.0173 | -| std | 0.0222 | -| value_loss | 0.0015 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11510 | -| time_elapsed | 63473 | -| total_timesteps | 1473280 | -| train/ | | -| approx_kl | 0.010755948 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.00635 | -| learning_rate | 0.0003 | -| loss | 0.00481 | -| n_updates | 115090 | -| policy_gradient_loss | 0.00607 | -| std | 0.0222 | -| value_loss | 7.04e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11511 | -| time_elapsed | 63477 | -| total_timesteps | 1473408 | -| train/ | | -| approx_kl | 0.0075186123 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -27.3 | -| learning_rate | 0.0003 | -| loss | -0.00526 | -| n_updates | 115100 | -| policy_gradient_loss | -0.000657 | -| std | 0.0223 | -| value_loss | 2.1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11512 | -| time_elapsed | 63481 | -| total_timesteps | 1473536 | -| train/ | | -| approx_kl | 0.004815357 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 115110 | -| policy_gradient_loss | -0.000503 | -| std | 0.0223 | -| value_loss | 1.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11513 | -| time_elapsed | 63485 | -| total_timesteps | 1473664 | -| train/ | | -| approx_kl | 0.007859201 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.000183 | -| n_updates | 115120 | -| policy_gradient_loss | 0.00173 | -| std | 0.0222 | -| value_loss | 9.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11514 | -| time_elapsed | 63488 | -| total_timesteps | 1473792 | -| train/ | | -| approx_kl | 0.012836287 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00638 | -| n_updates | 115130 | -| policy_gradient_loss | 0.0205 | -| std | 0.0222 | -| value_loss | 1.37e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11515 | -| time_elapsed | 63490 | -| total_timesteps | 1473920 | -| train/ | | -| approx_kl | 0.0058804234 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 115140 | -| policy_gradient_loss | 0.00444 | -| std | 0.0222 | -| value_loss | 3.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11516 | -| time_elapsed | 63493 | -| total_timesteps | 1474048 | -| train/ | | -| approx_kl | 0.0087205265 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 115150 | -| policy_gradient_loss | 0.00406 | -| std | 0.0221 | -| value_loss | 1.28e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11517 | -| time_elapsed | 63499 | -| total_timesteps | 1474176 | -| train/ | | -| approx_kl | 0.0180063 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.834 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 115160 | -| policy_gradient_loss | -0.00606 | -| std | 0.0221 | -| value_loss | 0.00332 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11518 | -| time_elapsed | 63502 | -| total_timesteps | 1474304 | -| train/ | | -| approx_kl | 0.018272843 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 115170 | -| policy_gradient_loss | -0.000514 | -| std | 0.0221 | -| value_loss | 1.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11519 | -| time_elapsed | 63505 | -| total_timesteps | 1474432 | -| train/ | | -| approx_kl | 0.004711573 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 115180 | -| policy_gradient_loss | -0.017 | -| std | 0.0221 | -| value_loss | 3.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11520 | -| time_elapsed | 63508 | -| total_timesteps | 1474560 | -| train/ | | -| approx_kl | 0.008178528 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.00709 | -| n_updates | 115190 | -| policy_gradient_loss | -0.00488 | -| std | 0.0221 | -| value_loss | 1.69e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11521 | -| time_elapsed | 63512 | -| total_timesteps | 1474688 | -| train/ | | -| approx_kl | 0.0005561183 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 115200 | -| policy_gradient_loss | 0.000166 | -| std | 0.0221 | -| value_loss | 1.63e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11522 | -| time_elapsed | 63515 | -| total_timesteps | 1474816 | -| train/ | | -| approx_kl | 0.0048426753 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -18.4 | -| learning_rate | 0.0003 | -| loss | 0.00056 | -| n_updates | 115210 | -| policy_gradient_loss | 0.00217 | -| std | 0.0221 | -| value_loss | 1.33e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11523 | -| time_elapsed | 63519 | -| total_timesteps | 1474944 | -| train/ | | -| approx_kl | 0.006182789 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 115220 | -| policy_gradient_loss | 0.00681 | -| std | 0.0221 | -| value_loss | 1.66e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11524 | -| time_elapsed | 63522 | -| total_timesteps | 1475072 | -| train/ | | -| approx_kl | 2.5937334e-06 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -5.84e-05 | -| n_updates | 115230 | -| policy_gradient_loss | 0.00842 | -| std | 0.0221 | -| value_loss | 3.4e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11525 | -| time_elapsed | 63528 | -| total_timesteps | 1475200 | -| train/ | | -| approx_kl | 0.05617376 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -14.4 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 115240 | -| policy_gradient_loss | -0.0178 | -| std | 0.0221 | -| value_loss | 0.00532 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11526 | -| time_elapsed | 63532 | -| total_timesteps | 1475328 | -| train/ | | -| approx_kl | 0.0005799411 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 115250 | -| policy_gradient_loss | 0.0051 | -| std | 0.0221 | -| value_loss | 1.47e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11527 | -| time_elapsed | 63535 | -| total_timesteps | 1475456 | -| train/ | | -| approx_kl | 0.0070561958 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -9.06 | -| learning_rate | 0.0003 | -| loss | 0.000611 | -| n_updates | 115260 | -| policy_gradient_loss | 0.00584 | -| std | 0.022 | -| value_loss | 2.2e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11528 | -| time_elapsed | 63538 | -| total_timesteps | 1475584 | -| train/ | | -| approx_kl | 0.0066382815 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 115270 | -| policy_gradient_loss | 0.00714 | -| std | 0.022 | -| value_loss | 4.51e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11529 | -| time_elapsed | 63542 | -| total_timesteps | 1475712 | -| train/ | | -| approx_kl | 0.024509417 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.00314 | -| learning_rate | 0.0003 | -| loss | 0.00296 | -| n_updates | 115280 | -| policy_gradient_loss | -0.000529 | -| std | 0.022 | -| value_loss | 3.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11530 | -| time_elapsed | 63545 | -| total_timesteps | 1475840 | -| train/ | | -| approx_kl | 0.025521837 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 115290 | -| policy_gradient_loss | -0.00703 | -| std | 0.022 | -| value_loss | 1.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11531 | -| time_elapsed | 63549 | -| total_timesteps | 1475968 | -| train/ | | -| approx_kl | 0.047748063 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 115300 | -| policy_gradient_loss | 0.00219 | -| std | 0.022 | -| value_loss | 9.33e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11532 | -| time_elapsed | 63552 | -| total_timesteps | 1476096 | -| train/ | | -| approx_kl | 0.011573529 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 115310 | -| policy_gradient_loss | -0.000304 | -| std | 0.022 | -| value_loss | 7.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11533 | -| time_elapsed | 63560 | -| total_timesteps | 1476224 | -| train/ | | -| approx_kl | 0.018090006 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 115320 | -| policy_gradient_loss | -0.0148 | -| std | 0.022 | -| value_loss | 0.000381 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11534 | -| time_elapsed | 63563 | -| total_timesteps | 1476352 | -| train/ | | -| approx_kl | 2.440717e-05 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.000453 | -| n_updates | 115330 | -| policy_gradient_loss | 0.0063 | -| std | 0.022 | -| value_loss | 2.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11535 | -| time_elapsed | 63566 | -| total_timesteps | 1476480 | -| train/ | | -| approx_kl | 0.000557038 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00415 | -| n_updates | 115340 | -| policy_gradient_loss | 0.00812 | -| std | 0.022 | -| value_loss | 2.89e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11536 | -| time_elapsed | 63569 | -| total_timesteps | 1476608 | -| train/ | | -| approx_kl | 0.00083626295 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 115350 | -| policy_gradient_loss | 0.00661 | -| std | 0.022 | -| value_loss | 1.21e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11537 | -| time_elapsed | 63573 | -| total_timesteps | 1476736 | -| train/ | | -| approx_kl | 0.008045873 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 115360 | -| policy_gradient_loss | 0.00152 | -| std | 0.022 | -| value_loss | 8.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11538 | -| time_elapsed | 63577 | -| total_timesteps | 1476864 | -| train/ | | -| approx_kl | 0.022560786 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.000123 | -| n_updates | 115370 | -| policy_gradient_loss | -0.00122 | -| std | 0.022 | -| value_loss | 2.1e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11539 | -| time_elapsed | 63581 | -| total_timesteps | 1476992 | -| train/ | | -| approx_kl | 5.6487974e-05 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -5.51 | -| learning_rate | 0.0003 | -| loss | -0.000343 | -| n_updates | 115380 | -| policy_gradient_loss | 0.000513 | -| std | 0.0221 | -| value_loss | 2.61e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11540 | -| time_elapsed | 63584 | -| total_timesteps | 1477120 | -| train/ | | -| approx_kl | 0.012520706 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -313 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 115390 | -| policy_gradient_loss | 0.00274 | -| std | 0.0221 | -| value_loss | 6.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11541 | -| time_elapsed | 63594 | -| total_timesteps | 1477248 | -| train/ | | -| approx_kl | 0.025784137 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 115400 | -| policy_gradient_loss | -0.00692 | -| std | 0.0221 | -| value_loss | 0.000702 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11542 | -| time_elapsed | 63598 | -| total_timesteps | 1477376 | -| train/ | | -| approx_kl | 0.014769668 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.334 | -| learning_rate | 0.0003 | -| loss | 0.000965 | -| n_updates | 115410 | -| policy_gradient_loss | -0.000438 | -| std | 0.0221 | -| value_loss | 4.51e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11543 | -| time_elapsed | 63602 | -| total_timesteps | 1477504 | -| train/ | | -| approx_kl | 0.0190573 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.367 | -| learning_rate | 0.0003 | -| loss | 0.00864 | -| n_updates | 115420 | -| policy_gradient_loss | 0.000783 | -| std | 0.0221 | -| value_loss | 2.2e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11544 | -| time_elapsed | 63606 | -| total_timesteps | 1477632 | -| train/ | | -| approx_kl | 7.602852e-06 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.000279 | -| n_updates | 115430 | -| policy_gradient_loss | 0.00434 | -| std | 0.0221 | -| value_loss | 7.44e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11545 | -| time_elapsed | 63610 | -| total_timesteps | 1477760 | -| train/ | | -| approx_kl | 0.00087654823 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0772 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 115440 | -| policy_gradient_loss | 0.00595 | -| std | 0.0221 | -| value_loss | 4.87e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11546 | -| time_elapsed | 63614 | -| total_timesteps | 1477888 | -| train/ | | -| approx_kl | 0.018317891 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | 0.00317 | -| n_updates | 115450 | -| policy_gradient_loss | -0.00176 | -| std | 0.0221 | -| value_loss | 2.74e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11547 | -| time_elapsed | 63619 | -| total_timesteps | 1478016 | -| train/ | | -| approx_kl | 8.895528e-06 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0516 | -| learning_rate | 0.0003 | -| loss | -0.000292 | -| n_updates | 115460 | -| policy_gradient_loss | 0.00417 | -| std | 0.0221 | -| value_loss | 1.81e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11548 | -| time_elapsed | 63627 | -| total_timesteps | 1478144 | -| train/ | | -| approx_kl | 0.010019733 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 115470 | -| policy_gradient_loss | -0.0117 | -| std | 0.0221 | -| value_loss | 0.000282 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11549 | -| time_elapsed | 63630 | -| total_timesteps | 1478272 | -| train/ | | -| approx_kl | 0.006940025 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.00097 | -| n_updates | 115480 | -| policy_gradient_loss | 0.00162 | -| std | 0.0221 | -| value_loss | 9.13e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11550 | -| time_elapsed | 63633 | -| total_timesteps | 1478400 | -| train/ | | -| approx_kl | 0.010855766 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.517 | -| learning_rate | 0.0003 | -| loss | 0.00188 | -| n_updates | 115490 | -| policy_gradient_loss | 0.00222 | -| std | 0.0221 | -| value_loss | 2.41e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11551 | -| time_elapsed | 63637 | -| total_timesteps | 1478528 | -| train/ | | -| approx_kl | 0.004183961 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 115500 | -| policy_gradient_loss | 0.000975 | -| std | 0.0222 | -| value_loss | 8.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11552 | -| time_elapsed | 63640 | -| total_timesteps | 1478656 | -| train/ | | -| approx_kl | 0.024534486 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 115510 | -| policy_gradient_loss | -0.00901 | -| std | 0.0222 | -| value_loss | 3.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11553 | -| time_elapsed | 63644 | -| total_timesteps | 1478784 | -| train/ | | -| approx_kl | 0.012450315 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 115520 | -| policy_gradient_loss | -0.00743 | -| std | 0.0222 | -| value_loss | 9.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11554 | -| time_elapsed | 63648 | -| total_timesteps | 1478912 | -| train/ | | -| approx_kl | 0.024238734 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -591 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 115530 | -| policy_gradient_loss | -0.00658 | -| std | 0.0222 | -| value_loss | 8.67e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11555 | -| time_elapsed | 63651 | -| total_timesteps | 1479040 | -| train/ | | -| approx_kl | 0.0016610054 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.00651 | -| n_updates | 115540 | -| policy_gradient_loss | -0.000514 | -| std | 0.0222 | -| value_loss | 4.83e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11556 | -| time_elapsed | 63659 | -| total_timesteps | 1479168 | -| train/ | | -| approx_kl | 0.10795797 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.00184 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 115550 | -| policy_gradient_loss | -0.0176 | -| std | 0.0222 | -| value_loss | 0.00206 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11557 | -| time_elapsed | 63663 | -| total_timesteps | 1479296 | -| train/ | | -| approx_kl | 0.016670862 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.00271 | -| n_updates | 115560 | -| policy_gradient_loss | 0.00164 | -| std | 0.0222 | -| value_loss | 6.8e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11558 | -| time_elapsed | 63667 | -| total_timesteps | 1479424 | -| train/ | | -| approx_kl | 0.0011903327 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | 0.0066 | -| n_updates | 115570 | -| policy_gradient_loss | -0.00236 | -| std | 0.0221 | -| value_loss | 0.000268 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11559 | -| time_elapsed | 63671 | -| total_timesteps | 1479552 | -| train/ | | -| approx_kl | 0.0055485573 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.000993 | -| n_updates | 115580 | -| policy_gradient_loss | -0.000824 | -| std | 0.0221 | -| value_loss | 1.21e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11560 | -| time_elapsed | 63674 | -| total_timesteps | 1479680 | -| train/ | | -| approx_kl | 0.0001831213 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0929 | -| learning_rate | 0.0003 | -| loss | 0.00249 | -| n_updates | 115590 | -| policy_gradient_loss | -2.37e-05 | -| std | 0.0221 | -| value_loss | 9.66e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11561 | -| time_elapsed | 63678 | -| total_timesteps | 1479808 | -| train/ | | -| approx_kl | 0.0005933973 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 115600 | -| policy_gradient_loss | -0.0026 | -| std | 0.0221 | -| value_loss | 1.88e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11562 | -| time_elapsed | 63682 | -| total_timesteps | 1479936 | -| train/ | | -| approx_kl | 0.019227866 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | 0.00527 | -| n_updates | 115610 | -| policy_gradient_loss | -0.000635 | -| std | 0.0221 | -| value_loss | 1.29e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11563 | -| time_elapsed | 63686 | -| total_timesteps | 1480064 | -| train/ | | -| approx_kl | 2.7136877e-05 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.00107 | -| n_updates | 115620 | -| policy_gradient_loss | 0.00295 | -| std | 0.0221 | -| value_loss | 1.1e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11564 | -| time_elapsed | 63692 | -| total_timesteps | 1480192 | -| train/ | | -| approx_kl | 0.06334675 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 115630 | -| policy_gradient_loss | -0.0138 | -| std | 0.0221 | -| value_loss | 0.00274 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11565 | -| time_elapsed | 63697 | -| total_timesteps | 1480320 | -| train/ | | -| approx_kl | 0.00023906585 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | 0.0026 | -| n_updates | 115640 | -| policy_gradient_loss | -0.00714 | -| std | 0.0221 | -| value_loss | 6.42e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11566 | -| time_elapsed | 63700 | -| total_timesteps | 1480448 | -| train/ | | -| approx_kl | 0.05668132 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 115650 | -| policy_gradient_loss | -0.00752 | -| std | 0.0221 | -| value_loss | 2.49e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11567 | -| time_elapsed | 63703 | -| total_timesteps | 1480576 | -| train/ | | -| approx_kl | 0.0012808363 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | -0.000405 | -| n_updates | 115660 | -| policy_gradient_loss | -0.00026 | -| std | 0.0221 | -| value_loss | 5.71e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11568 | -| time_elapsed | 63706 | -| total_timesteps | 1480704 | -| train/ | | -| approx_kl | 0.009440562 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 115670 | -| policy_gradient_loss | 0.0037 | -| std | 0.0221 | -| value_loss | 4.88e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11569 | -| time_elapsed | 63709 | -| total_timesteps | 1480832 | -| train/ | | -| approx_kl | 0.0021812213 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.00202 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 115680 | -| policy_gradient_loss | -0.0004 | -| std | 0.0222 | -| value_loss | 9.13e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11570 | -| time_elapsed | 63711 | -| total_timesteps | 1480960 | -| train/ | | -| approx_kl | 0.0114376675 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.00271 | -| n_updates | 115690 | -| policy_gradient_loss | 0.00357 | -| std | 0.0222 | -| value_loss | 3.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11571 | -| time_elapsed | 63714 | -| total_timesteps | 1481088 | -| train/ | | -| approx_kl | 0.022631349 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.00291 | -| n_updates | 115700 | -| policy_gradient_loss | 0.00701 | -| std | 0.0222 | -| value_loss | 1.87e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11572 | -| time_elapsed | 63720 | -| total_timesteps | 1481216 | -| train/ | | -| approx_kl | 0.07977359 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.0272 | -| n_updates | 115710 | -| policy_gradient_loss | -0.0197 | -| std | 0.0222 | -| value_loss | 0.000215 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11573 | -| time_elapsed | 63723 | -| total_timesteps | 1481344 | -| train/ | | -| approx_kl | 0.0012531928 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -2.39 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 115720 | -| policy_gradient_loss | -0.00187 | -| std | 0.0222 | -| value_loss | 5.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11574 | -| time_elapsed | 63726 | -| total_timesteps | 1481472 | -| train/ | | -| approx_kl | 0.001331897 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -9.83 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 115730 | -| policy_gradient_loss | 0.00164 | -| std | 0.0222 | -| value_loss | 5.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11575 | -| time_elapsed | 63730 | -| total_timesteps | 1481600 | -| train/ | | -| approx_kl | 0.013594936 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -2.36 | -| learning_rate | 0.0003 | -| loss | 0.000968 | -| n_updates | 115740 | -| policy_gradient_loss | 0.003 | -| std | 0.0221 | -| value_loss | 2.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11576 | -| time_elapsed | 63734 | -| total_timesteps | 1481728 | -| train/ | | -| approx_kl | 0.022561532 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.584 | -| learning_rate | 0.0003 | -| loss | -0.00813 | -| n_updates | 115750 | -| policy_gradient_loss | -0.00579 | -| std | 0.0221 | -| value_loss | 6.81e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11577 | -| time_elapsed | 63738 | -| total_timesteps | 1481856 | -| train/ | | -| approx_kl | 0.0071280417 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.000178 | -| n_updates | 115760 | -| policy_gradient_loss | 0.00338 | -| std | 0.0221 | -| value_loss | 2.13e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 11578 | -| time_elapsed | 63741 | -| total_timesteps | 1481984 | -| train/ | | -| approx_kl | 0.018168688 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.39 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.00919 | -| n_updates | 115770 | -| policy_gradient_loss | 0.0111 | -| std | 0.0221 | -| value_loss | 1.06e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11579 | -| time_elapsed | 63745 | -| total_timesteps | 1482112 | -| train/ | | -| approx_kl | 0.0011971709 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.000811 | -| n_updates | 115780 | -| policy_gradient_loss | -0.000172 | -| std | 0.022 | -| value_loss | 9.55e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11580 | -| time_elapsed | 63756 | -| total_timesteps | 1482240 | -| train/ | | -| approx_kl | 0.021760505 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.865 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 115790 | -| policy_gradient_loss | -0.00922 | -| std | 0.0221 | -| value_loss | 0.00183 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11581 | -| time_elapsed | 63759 | -| total_timesteps | 1482368 | -| train/ | | -| approx_kl | 0.04682521 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.00305 | -| n_updates | 115800 | -| policy_gradient_loss | -0.00604 | -| std | 0.0221 | -| value_loss | 1.9e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11582 | -| time_elapsed | 63763 | -| total_timesteps | 1482496 | -| train/ | | -| approx_kl | 0.06766671 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.00233 | -| learning_rate | 0.0003 | -| loss | 0.0319 | -| n_updates | 115810 | -| policy_gradient_loss | 0.00211 | -| std | 0.022 | -| value_loss | 7.61e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11583 | -| time_elapsed | 63766 | -| total_timesteps | 1482624 | -| train/ | | -| approx_kl | 0.0016122647 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 115820 | -| policy_gradient_loss | -0.00523 | -| std | 0.022 | -| value_loss | 2.72e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11584 | -| time_elapsed | 63770 | -| total_timesteps | 1482752 | -| train/ | | -| approx_kl | 0.008628298 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.00573 | -| learning_rate | 0.0003 | -| loss | -0.00969 | -| n_updates | 115830 | -| policy_gradient_loss | -0.00695 | -| std | 0.022 | -| value_loss | 2.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 11585 | -| time_elapsed | 63773 | -| total_timesteps | 1482880 | -| train/ | | -| approx_kl | 0.006123553 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00808 | -| n_updates | 115840 | -| policy_gradient_loss | -0.00138 | -| std | 0.022 | -| value_loss | 4.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11586 | -| time_elapsed | 63777 | -| total_timesteps | 1483008 | -| train/ | | -| approx_kl | 0.008512311 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 115850 | -| policy_gradient_loss | -0.00495 | -| std | 0.022 | -| value_loss | 1.23e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11587 | -| time_elapsed | 63785 | -| total_timesteps | 1483136 | -| train/ | | -| approx_kl | 0.07763032 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.754 | -| learning_rate | 0.0003 | -| loss | -0.0274 | -| n_updates | 115860 | -| policy_gradient_loss | -0.0222 | -| std | 0.022 | -| value_loss | 0.000749 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11588 | -| time_elapsed | 63789 | -| total_timesteps | 1483264 | -| train/ | | -| approx_kl | 0.006510787 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.0578 | -| learning_rate | 0.0003 | -| loss | -0.00993 | -| n_updates | 115870 | -| policy_gradient_loss | 0.00183 | -| std | 0.022 | -| value_loss | 4.28e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11589 | -| time_elapsed | 63792 | -| total_timesteps | 1483392 | -| train/ | | -| approx_kl | 1.4134217e-05 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -1.57 | -| learning_rate | 0.0003 | -| loss | -0.00098 | -| n_updates | 115880 | -| policy_gradient_loss | -0.00143 | -| std | 0.022 | -| value_loss | 1.27e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11590 | -| time_elapsed | 63796 | -| total_timesteps | 1483520 | -| train/ | | -| approx_kl | 0.00043348502 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.00554 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 115890 | -| policy_gradient_loss | 0.000363 | -| std | 0.022 | -| value_loss | 6.91e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11591 | -| time_elapsed | 63799 | -| total_timesteps | 1483648 | -| train/ | | -| approx_kl | 0.009947964 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.00476 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 115900 | -| policy_gradient_loss | 0.00146 | -| std | 0.022 | -| value_loss | 3.86e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11592 | -| time_elapsed | 63802 | -| total_timesteps | 1483776 | -| train/ | | -| approx_kl | 0.0014962964 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 115910 | -| policy_gradient_loss | 0.00551 | -| std | 0.022 | -| value_loss | 2.58e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11593 | -| time_elapsed | 63805 | -| total_timesteps | 1483904 | -| train/ | | -| approx_kl | 0.0015162956 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 115920 | -| policy_gradient_loss | 0.00682 | -| std | 0.022 | -| value_loss | 2.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11594 | -| time_elapsed | 63808 | -| total_timesteps | 1484032 | -| train/ | | -| approx_kl | 0.016417246 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.00449 | -| n_updates | 115930 | -| policy_gradient_loss | -0.000281 | -| std | 0.022 | -| value_loss | 1.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11595 | -| time_elapsed | 63816 | -| total_timesteps | 1484160 | -| train/ | | -| approx_kl | 0.02931082 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 115940 | -| policy_gradient_loss | -0.0158 | -| std | 0.022 | -| value_loss | 0.00218 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11596 | -| time_elapsed | 63820 | -| total_timesteps | 1484288 | -| train/ | | -| approx_kl | 0.10045358 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | 0.0674 | -| n_updates | 115950 | -| policy_gradient_loss | 0.0121 | -| std | 0.0219 | -| value_loss | 3.58e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11597 | -| time_elapsed | 63823 | -| total_timesteps | 1484416 | -| train/ | | -| approx_kl | 1.7105136e-05 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 2.54e-05 | -| n_updates | 115960 | -| policy_gradient_loss | 0.00793 | -| std | 0.0219 | -| value_loss | 9.31e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11598 | -| time_elapsed | 63827 | -| total_timesteps | 1484544 | -| train/ | | -| approx_kl | 0.0010354519 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.00412 | -| n_updates | 115970 | -| policy_gradient_loss | 0.00675 | -| std | 0.0219 | -| value_loss | 6.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11599 | -| time_elapsed | 63831 | -| total_timesteps | 1484672 | -| train/ | | -| approx_kl | 0.021702114 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 115980 | -| policy_gradient_loss | -0.00797 | -| std | 0.0219 | -| value_loss | 6.29e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11600 | -| time_elapsed | 63835 | -| total_timesteps | 1484800 | -| train/ | | -| approx_kl | 8.529518e-06 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.000193 | -| n_updates | 115990 | -| policy_gradient_loss | 0.000337 | -| std | 0.022 | -| value_loss | 6.54e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 11601 | -| time_elapsed | 63839 | -| total_timesteps | 1484928 | -| train/ | | -| approx_kl | 5.7005323e-05 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.00242 | -| learning_rate | 0.0003 | -| loss | 0.00075 | -| n_updates | 116000 | -| policy_gradient_loss | 0.00559 | -| std | 0.022 | -| value_loss | 1.55e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11602 | -| time_elapsed | 63842 | -| total_timesteps | 1485056 | -| train/ | | -| approx_kl | 0.0008259136 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.00489 | -| n_updates | 116010 | -| policy_gradient_loss | 0.0138 | -| std | 0.022 | -| value_loss | 9.93e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11603 | -| time_elapsed | 63848 | -| total_timesteps | 1485184 | -| train/ | | -| approx_kl | 0.018752651 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.815 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 116020 | -| policy_gradient_loss | -0.0107 | -| std | 0.022 | -| value_loss | 0.00341 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11604 | -| time_elapsed | 63851 | -| total_timesteps | 1485312 | -| train/ | | -| approx_kl | 0.00052542426 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 116030 | -| policy_gradient_loss | 0.00977 | -| std | 0.022 | -| value_loss | 1.05e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11605 | -| time_elapsed | 63856 | -| total_timesteps | 1485440 | -| train/ | | -| approx_kl | 0.0011348454 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.6 | -| learning_rate | 0.0003 | -| loss | 0.0003 | -| n_updates | 116040 | -| policy_gradient_loss | 0.014 | -| std | 0.022 | -| value_loss | 2.21e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11606 | -| time_elapsed | 63859 | -| total_timesteps | 1485568 | -| train/ | | -| approx_kl | 0.0074957674 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 116050 | -| policy_gradient_loss | 0.00451 | -| std | 0.022 | -| value_loss | 1.66e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11607 | -| time_elapsed | 63861 | -| total_timesteps | 1485696 | -| train/ | | -| approx_kl | 0.0026051686 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -5.84 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 116060 | -| policy_gradient_loss | 0.00303 | -| std | 0.022 | -| value_loss | 2.59e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11608 | -| time_elapsed | 63864 | -| total_timesteps | 1485824 | -| train/ | | -| approx_kl | 0.039018653 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00648 | -| n_updates | 116070 | -| policy_gradient_loss | -0.00294 | -| std | 0.022 | -| value_loss | 6.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11609 | -| time_elapsed | 63866 | -| total_timesteps | 1485952 | -| train/ | | -| approx_kl | 0.035414226 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.751 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 116080 | -| policy_gradient_loss | -0.0161 | -| std | 0.022 | -| value_loss | 3.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11610 | -| time_elapsed | 63869 | -| total_timesteps | 1486080 | -| train/ | | -| approx_kl | 0.027275834 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 116090 | -| policy_gradient_loss | 0.00544 | -| std | 0.022 | -| value_loss | 1.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11611 | -| time_elapsed | 63875 | -| total_timesteps | 1486208 | -| train/ | | -| approx_kl | 0.021768223 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 116100 | -| policy_gradient_loss | -0.0167 | -| std | 0.022 | -| value_loss | 0.00196 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11612 | -| time_elapsed | 63878 | -| total_timesteps | 1486336 | -| train/ | | -| approx_kl | 0.0005630539 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | -0.000728 | -| n_updates | 116110 | -| policy_gradient_loss | -0.000414 | -| std | 0.0219 | -| value_loss | 2.7e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11613 | -| time_elapsed | 63880 | -| total_timesteps | 1486464 | -| train/ | | -| approx_kl | 0.0036992915 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.00711 | -| n_updates | 116120 | -| policy_gradient_loss | 0.00734 | -| std | 0.0219 | -| value_loss | 1.42e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11614 | -| time_elapsed | 63884 | -| total_timesteps | 1486592 | -| train/ | | -| approx_kl | 0.011183285 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 116130 | -| policy_gradient_loss | 0.00507 | -| std | 0.0219 | -| value_loss | 5.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11615 | -| time_elapsed | 63886 | -| total_timesteps | 1486720 | -| train/ | | -| approx_kl | 0.0010156711 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.4 | -| explained_variance | -0.09 | -| learning_rate | 0.0003 | -| loss | -0.000398 | -| n_updates | 116140 | -| policy_gradient_loss | 0.00227 | -| std | 0.0219 | -| value_loss | 6.05e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11616 | -| time_elapsed | 63890 | -| total_timesteps | 1486848 | -| train/ | | -| approx_kl | 0.041589312 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | 0.00698 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 116150 | -| policy_gradient_loss | 0.00336 | -| std | 0.0218 | -| value_loss | 5.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11617 | -| time_elapsed | 63893 | -| total_timesteps | 1486976 | -| train/ | | -| approx_kl | 0.006804377 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -0.00101 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 116160 | -| policy_gradient_loss | 0.00411 | -| std | 0.0217 | -| value_loss | 4.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11618 | -| time_elapsed | 63895 | -| total_timesteps | 1487104 | -| train/ | | -| approx_kl | 0.02620731 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -0.772 | -| learning_rate | 0.0003 | -| loss | 0.00388 | -| n_updates | 116170 | -| policy_gradient_loss | 0.00176 | -| std | 0.0217 | -| value_loss | 6.06e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11619 | -| time_elapsed | 63903 | -| total_timesteps | 1487232 | -| train/ | | -| approx_kl | 0.06576163 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 116180 | -| policy_gradient_loss | -0.0135 | -| std | 0.0217 | -| value_loss | 0.0044 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11620 | -| time_elapsed | 63907 | -| total_timesteps | 1487360 | -| train/ | | -| approx_kl | 0.028164975 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -49 | -| learning_rate | 0.0003 | -| loss | -0.00977 | -| n_updates | 116190 | -| policy_gradient_loss | -0.00648 | -| std | 0.0217 | -| value_loss | 8.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11621 | -| time_elapsed | 63911 | -| total_timesteps | 1487488 | -| train/ | | -| approx_kl | 0.015840467 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -32.1 | -| learning_rate | 0.0003 | -| loss | 0.00975 | -| n_updates | 116200 | -| policy_gradient_loss | 0.00535 | -| std | 0.0217 | -| value_loss | 3.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11622 | -| time_elapsed | 63914 | -| total_timesteps | 1487616 | -| train/ | | -| approx_kl | 0.006941316 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -5.11 | -| learning_rate | 0.0003 | -| loss | 0.00889 | -| n_updates | 116210 | -| policy_gradient_loss | 0.0105 | -| std | 0.0217 | -| value_loss | 4.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11623 | -| time_elapsed | 63918 | -| total_timesteps | 1487744 | -| train/ | | -| approx_kl | 0.007913491 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -0.7 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 116220 | -| policy_gradient_loss | -0.00724 | -| std | 0.0217 | -| value_loss | 3.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 11624 | -| time_elapsed | 63922 | -| total_timesteps | 1487872 | -| train/ | | -| approx_kl | 0.0063652084 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.00554 | -| n_updates | 116230 | -| policy_gradient_loss | 0.0088 | -| std | 0.0217 | -| value_loss | 2.46e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11625 | -| time_elapsed | 63926 | -| total_timesteps | 1488000 | -| train/ | | -| approx_kl | 0.0013759076 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -0.00127 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 116240 | -| policy_gradient_loss | 0.000664 | -| std | 0.0217 | -| value_loss | 4.74e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11626 | -| time_elapsed | 63930 | -| total_timesteps | 1488128 | -| train/ | | -| approx_kl | 0.002088516 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | 0.00141 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 116250 | -| policy_gradient_loss | -0.0022 | -| std | 0.0216 | -| value_loss | 3.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11627 | -| time_elapsed | 63939 | -| total_timesteps | 1488256 | -| train/ | | -| approx_kl | 0.059573542 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | 0.477 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 116260 | -| policy_gradient_loss | -0.0198 | -| std | 0.0216 | -| value_loss | 0.00107 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11628 | -| time_elapsed | 63944 | -| total_timesteps | 1488384 | -| train/ | | -| approx_kl | 0.017061556 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 116270 | -| policy_gradient_loss | -0.0126 | -| std | 0.0216 | -| value_loss | 4.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11629 | -| time_elapsed | 63948 | -| total_timesteps | 1488512 | -| train/ | | -| approx_kl | 0.05994189 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -212 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 116280 | -| policy_gradient_loss | -0.0121 | -| std | 0.0216 | -| value_loss | 1.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11630 | -| time_elapsed | 63951 | -| total_timesteps | 1488640 | -| train/ | | -| approx_kl | 0.017461441 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -193 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 116290 | -| policy_gradient_loss | -0.0128 | -| std | 0.0216 | -| value_loss | 1.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11631 | -| time_elapsed | 63955 | -| total_timesteps | 1488768 | -| train/ | | -| approx_kl | 0.016696876 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -41.4 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 116300 | -| policy_gradient_loss | 0.00053 | -| std | 0.0216 | -| value_loss | 1.56e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11632 | -| time_elapsed | 63959 | -| total_timesteps | 1488896 | -| train/ | | -| approx_kl | 0.009319179 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.41 | -| explained_variance | -9.97 | -| learning_rate | 0.0003 | -| loss | 0.00013 | -| n_updates | 116310 | -| policy_gradient_loss | 0.000641 | -| std | 0.0216 | -| value_loss | 3.82e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11633 | -| time_elapsed | 63963 | -| total_timesteps | 1489024 | -| train/ | | -| approx_kl | 0.040297695 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.789 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 116320 | -| policy_gradient_loss | 0.00194 | -| std | 0.0216 | -| value_loss | 4.2e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11634 | -| time_elapsed | 63969 | -| total_timesteps | 1489152 | -| train/ | | -| approx_kl | 0.016820837 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0267 | -| n_updates | 116330 | -| policy_gradient_loss | -0.0153 | -| std | 0.0216 | -| value_loss | 9.04e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11635 | -| time_elapsed | 63973 | -| total_timesteps | 1489280 | -| train/ | | -| approx_kl | 0.03325667 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | 0.00738 | -| n_updates | 116340 | -| policy_gradient_loss | 7.68e-05 | -| std | 0.0216 | -| value_loss | 5.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11636 | -| time_elapsed | 63976 | -| total_timesteps | 1489408 | -| train/ | | -| approx_kl | 0.017499696 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -27.7 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 116350 | -| policy_gradient_loss | 0.00134 | -| std | 0.0216 | -| value_loss | 1.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11637 | -| time_elapsed | 63980 | -| total_timesteps | 1489536 | -| train/ | | -| approx_kl | 0.03472158 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0632 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 116360 | -| policy_gradient_loss | 0.00415 | -| std | 0.0215 | -| value_loss | 2.51e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11638 | -| time_elapsed | 63984 | -| total_timesteps | 1489664 | -| train/ | | -| approx_kl | 0.0024100523 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 116370 | -| policy_gradient_loss | -0.00759 | -| std | 0.0215 | -| value_loss | 1.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11639 | -| time_elapsed | 63986 | -| total_timesteps | 1489792 | -| train/ | | -| approx_kl | 0.020049954 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 116380 | -| policy_gradient_loss | -0.0106 | -| std | 0.0215 | -| value_loss | 6.69e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 11640 | -| time_elapsed | 63990 | -| total_timesteps | 1489920 | -| train/ | | -| approx_kl | 0.022048546 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.395 | -| learning_rate | 0.0003 | -| loss | 0.00328 | -| n_updates | 116390 | -| policy_gradient_loss | 0.00294 | -| std | 0.0215 | -| value_loss | 4.39e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11641 | -| time_elapsed | 63993 | -| total_timesteps | 1490048 | -| train/ | | -| approx_kl | 0.034287892 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.399 | -| learning_rate | 0.0003 | -| loss | 0.00975 | -| n_updates | 116400 | -| policy_gradient_loss | 0.00202 | -| std | 0.0215 | -| value_loss | 3.09e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11642 | -| time_elapsed | 63997 | -| total_timesteps | 1490176 | -| train/ | | -| approx_kl | 0.00522016 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 116410 | -| policy_gradient_loss | -0.0134 | -| std | 0.0215 | -| value_loss | 9.46e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11643 | -| time_elapsed | 64000 | -| total_timesteps | 1490304 | -| train/ | | -| approx_kl | 0.0003272267 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 116420 | -| policy_gradient_loss | -0.00436 | -| std | 0.0215 | -| value_loss | 3.87e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11644 | -| time_elapsed | 64003 | -| total_timesteps | 1490432 | -| train/ | | -| approx_kl | 0.008708073 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.464 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 116430 | -| policy_gradient_loss | -0.00596 | -| std | 0.0215 | -| value_loss | 2.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11645 | -| time_elapsed | 64007 | -| total_timesteps | 1490560 | -| train/ | | -| approx_kl | 0.012776364 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.00639 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 116440 | -| policy_gradient_loss | -0.00105 | -| std | 0.0215 | -| value_loss | 2.49e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11646 | -| time_elapsed | 64009 | -| total_timesteps | 1490688 | -| train/ | | -| approx_kl | 0.0070107975 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0725 | -| learning_rate | 0.0003 | -| loss | -0.00363 | -| n_updates | 116450 | -| policy_gradient_loss | -0.00215 | -| std | 0.0215 | -| value_loss | 1.33e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11647 | -| time_elapsed | 64012 | -| total_timesteps | 1490816 | -| train/ | | -| approx_kl | 0.024300514 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 116460 | -| policy_gradient_loss | 0.00101 | -| std | 0.0215 | -| value_loss | 7.89e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11648 | -| time_elapsed | 64014 | -| total_timesteps | 1490944 | -| train/ | | -| approx_kl | 0.0041994336 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.00462 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 116470 | -| policy_gradient_loss | 0.00307 | -| std | 0.0215 | -| value_loss | 9.09e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11649 | -| time_elapsed | 64017 | -| total_timesteps | 1491072 | -| train/ | | -| approx_kl | 0.0029943357 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.00636 | -| learning_rate | 0.0003 | -| loss | 0.00474 | -| n_updates | 116480 | -| policy_gradient_loss | 0.00788 | -| std | 0.0215 | -| value_loss | 1.92e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11650 | -| time_elapsed | 64021 | -| total_timesteps | 1491200 | -| train/ | | -| approx_kl | 0.008076391 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 116490 | -| policy_gradient_loss | -0.0108 | -| std | 0.0215 | -| value_loss | 0.00116 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11651 | -| time_elapsed | 64024 | -| total_timesteps | 1491328 | -| train/ | | -| approx_kl | 0.009178229 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | 0.00414 | -| n_updates | 116500 | -| policy_gradient_loss | 0.00839 | -| std | 0.0216 | -| value_loss | 3.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11652 | -| time_elapsed | 64027 | -| total_timesteps | 1491456 | -| train/ | | -| approx_kl | 0.029379409 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.00321 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 116510 | -| policy_gradient_loss | 0.00249 | -| std | 0.0216 | -| value_loss | 8.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11653 | -| time_elapsed | 64030 | -| total_timesteps | 1491584 | -| train/ | | -| approx_kl | 0.035004746 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 116520 | -| policy_gradient_loss | -0.00882 | -| std | 0.0216 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11654 | -| time_elapsed | 64034 | -| total_timesteps | 1491712 | -| train/ | | -| approx_kl | 0.0063762665 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 116530 | -| policy_gradient_loss | -0.00594 | -| std | 0.0216 | -| value_loss | 1.49e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11655 | -| time_elapsed | 64038 | -| total_timesteps | 1491840 | -| train/ | | -| approx_kl | 0.0051262532 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.00328 | -| n_updates | 116540 | -| policy_gradient_loss | 0.00719 | -| std | 0.0216 | -| value_loss | 1.64e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11656 | -| time_elapsed | 64042 | -| total_timesteps | 1491968 | -| train/ | | -| approx_kl | 0.0106782615 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 116550 | -| policy_gradient_loss | 0.00653 | -| std | 0.0216 | -| value_loss | 7.33e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11657 | -| time_elapsed | 64046 | -| total_timesteps | 1492096 | -| train/ | | -| approx_kl | 0.0020244704 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.00383 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 116560 | -| policy_gradient_loss | 0.000855 | -| std | 0.0216 | -| value_loss | 9.55e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11658 | -| time_elapsed | 64053 | -| total_timesteps | 1492224 | -| train/ | | -| approx_kl | 0.00661363 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 116570 | -| policy_gradient_loss | -0.00425 | -| std | 0.0216 | -| value_loss | 0.00165 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11659 | -| time_elapsed | 64057 | -| total_timesteps | 1492352 | -| train/ | | -| approx_kl | 0.027886948 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | 0.00968 | -| n_updates | 116580 | -| policy_gradient_loss | 0.00413 | -| std | 0.0215 | -| value_loss | 7.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11660 | -| time_elapsed | 64061 | -| total_timesteps | 1492480 | -| train/ | | -| approx_kl | 0.02523506 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.786 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 116590 | -| policy_gradient_loss | -0.000898 | -| std | 0.0215 | -| value_loss | 4.49e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11661 | -| time_elapsed | 64064 | -| total_timesteps | 1492608 | -| train/ | | -| approx_kl | 0.0016172384 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.00355 | -| n_updates | 116600 | -| policy_gradient_loss | -0.00233 | -| std | 0.0215 | -| value_loss | 5.24e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11662 | -| time_elapsed | 64066 | -| total_timesteps | 1492736 | -| train/ | | -| approx_kl | 0.0011273674 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 116610 | -| policy_gradient_loss | 0.000842 | -| std | 0.0215 | -| value_loss | 3.02e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11663 | -| time_elapsed | 64068 | -| total_timesteps | 1492864 | -| train/ | | -| approx_kl | 0.025313752 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00656 | -| n_updates | 116620 | -| policy_gradient_loss | -0.00441 | -| std | 0.0215 | -| value_loss | 1.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 11664 | -| time_elapsed | 64071 | -| total_timesteps | 1492992 | -| train/ | | -| approx_kl | 0.007510596 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 116630 | -| policy_gradient_loss | -0.000823 | -| std | 0.0215 | -| value_loss | 3.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11665 | -| time_elapsed | 64073 | -| total_timesteps | 1493120 | -| train/ | | -| approx_kl | 0.037663296 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 116640 | -| policy_gradient_loss | 0.00223 | -| std | 0.0215 | -| value_loss | 3.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11666 | -| time_elapsed | 64081 | -| total_timesteps | 1493248 | -| train/ | | -| approx_kl | 0.017772892 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -8.63 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 116650 | -| policy_gradient_loss | -0.0141 | -| std | 0.0215 | -| value_loss | 0.00336 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11667 | -| time_elapsed | 64084 | -| total_timesteps | 1493376 | -| train/ | | -| approx_kl | 0.023841448 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -42.6 | -| learning_rate | 0.0003 | -| loss | 0.000757 | -| n_updates | 116660 | -| policy_gradient_loss | 0.00509 | -| std | 0.0215 | -| value_loss | 4.47e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11668 | -| time_elapsed | 64087 | -| total_timesteps | 1493504 | -| train/ | | -| approx_kl | 0.02699988 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 116670 | -| policy_gradient_loss | 0.0318 | -| std | 0.0215 | -| value_loss | 2.02e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11669 | -| time_elapsed | 64091 | -| total_timesteps | 1493632 | -| train/ | | -| approx_kl | 0.037420116 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 116680 | -| policy_gradient_loss | 0.0415 | -| std | 0.0215 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11670 | -| time_elapsed | 64094 | -| total_timesteps | 1493760 | -| train/ | | -| approx_kl | 0.0067802756 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 116690 | -| policy_gradient_loss | -0.00222 | -| std | 0.0215 | -| value_loss | 6.82e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 11671 | -| time_elapsed | 64096 | -| total_timesteps | 1493888 | -| train/ | | -| approx_kl | 0.021585576 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 116700 | -| policy_gradient_loss | 0.0131 | -| std | 0.0215 | -| value_loss | 3.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11672 | -| time_elapsed | 64100 | -| total_timesteps | 1494016 | -| train/ | | -| approx_kl | 0.0018306933 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.00372 | -| n_updates | 116710 | -| policy_gradient_loss | 0.000512 | -| std | 0.0214 | -| value_loss | 1.31e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11673 | -| time_elapsed | 64110 | -| total_timesteps | 1494144 | -| train/ | | -| approx_kl | 0.015733967 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.918 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 116720 | -| policy_gradient_loss | -0.017 | -| std | 0.0214 | -| value_loss | 0.00162 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11674 | -| time_elapsed | 64114 | -| total_timesteps | 1494272 | -| train/ | | -| approx_kl | 0.0002057585 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.000337 | -| n_updates | 116730 | -| policy_gradient_loss | 0.00177 | -| std | 0.0214 | -| value_loss | 1.59e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11675 | -| time_elapsed | 64117 | -| total_timesteps | 1494400 | -| train/ | | -| approx_kl | 0.10088116 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -12.7 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 116740 | -| policy_gradient_loss | -0.0191 | -| std | 0.0214 | -| value_loss | 1.11e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11676 | -| time_elapsed | 64120 | -| total_timesteps | 1494528 | -| train/ | | -| approx_kl | 0.0072683385 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 116750 | -| policy_gradient_loss | -0.000155 | -| std | 0.0214 | -| value_loss | 6.79e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11677 | -| time_elapsed | 64124 | -| total_timesteps | 1494656 | -| train/ | | -| approx_kl | 0.007383453 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 116760 | -| policy_gradient_loss | -0.00729 | -| std | 0.0214 | -| value_loss | 2.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11678 | -| time_elapsed | 64129 | -| total_timesteps | 1494784 | -| train/ | | -| approx_kl | 0.045325212 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 116770 | -| policy_gradient_loss | -0.00637 | -| std | 0.0214 | -| value_loss | 4.06e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11679 | -| time_elapsed | 64132 | -| total_timesteps | 1494912 | -| train/ | | -| approx_kl | 0.00017057778 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.42 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.000971 | -| n_updates | 116780 | -| policy_gradient_loss | -0.000624 | -| std | 0.0214 | -| value_loss | 1.04e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11680 | -| time_elapsed | 64137 | -| total_timesteps | 1495040 | -| train/ | | -| approx_kl | 0.03123288 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 116790 | -| policy_gradient_loss | 0.000311 | -| std | 0.0214 | -| value_loss | 6.24e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11681 | -| time_elapsed | 64145 | -| total_timesteps | 1495168 | -| train/ | | -| approx_kl | 0.03232079 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.694 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 116800 | -| policy_gradient_loss | 0.00602 | -| std | 0.0213 | -| value_loss | 0.0063 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11682 | -| time_elapsed | 64148 | -| total_timesteps | 1495296 | -| train/ | | -| approx_kl | 0.00073119486 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.00451 | -| learning_rate | 0.0003 | -| loss | 0.00847 | -| n_updates | 116810 | -| policy_gradient_loss | 0.00542 | -| std | 0.0213 | -| value_loss | 2.35e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11683 | -| time_elapsed | 64152 | -| total_timesteps | 1495424 | -| train/ | | -| approx_kl | 0.039943136 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 116820 | -| policy_gradient_loss | 0.00957 | -| std | 0.0213 | -| value_loss | 8.16e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11684 | -| time_elapsed | 64155 | -| total_timesteps | 1495552 | -| train/ | | -| approx_kl | 0.00035569398 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 116830 | -| policy_gradient_loss | -0.000599 | -| std | 0.0213 | -| value_loss | 1.8e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11685 | -| time_elapsed | 64158 | -| total_timesteps | 1495680 | -| train/ | | -| approx_kl | 0.004458659 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | 0.00683 | -| n_updates | 116840 | -| policy_gradient_loss | -0.00104 | -| std | 0.0213 | -| value_loss | 1.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11686 | -| time_elapsed | 64161 | -| total_timesteps | 1495808 | -| train/ | | -| approx_kl | 0.010385994 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 116850 | -| policy_gradient_loss | -0.000715 | -| std | 0.0213 | -| value_loss | 9.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11687 | -| time_elapsed | 64164 | -| total_timesteps | 1495936 | -| train/ | | -| approx_kl | 0.01786099 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.00699 | -| n_updates | 116860 | -| policy_gradient_loss | 0.0109 | -| std | 0.0213 | -| value_loss | 6.41e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11688 | -| time_elapsed | 64167 | -| total_timesteps | 1496064 | -| train/ | | -| approx_kl | 0.0016669668 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.00605 | -| learning_rate | 0.0003 | -| loss | 0.00603 | -| n_updates | 116870 | -| policy_gradient_loss | -0.00415 | -| std | 0.0213 | -| value_loss | 1.86e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11689 | -| time_elapsed | 64173 | -| total_timesteps | 1496192 | -| train/ | | -| approx_kl | 0.008337595 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.715 | -| learning_rate | 0.0003 | -| loss | 0.00482 | -| n_updates | 116880 | -| policy_gradient_loss | -0.00151 | -| std | 0.0213 | -| value_loss | 0.00588 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11690 | -| time_elapsed | 64176 | -| total_timesteps | 1496320 | -| train/ | | -| approx_kl | 0.02345353 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.0059 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 116890 | -| policy_gradient_loss | 0.00272 | -| std | 0.0213 | -| value_loss | 0.000111 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11691 | -| time_elapsed | 64180 | -| total_timesteps | 1496448 | -| train/ | | -| approx_kl | 4.663132e-06 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.494 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 116900 | -| policy_gradient_loss | 0.0123 | -| std | 0.0212 | -| value_loss | 3.31e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11692 | -| time_elapsed | 64183 | -| total_timesteps | 1496576 | -| train/ | | -| approx_kl | 0.01854249 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.84 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 116910 | -| policy_gradient_loss | 0.0013 | -| std | 0.0212 | -| value_loss | 3.58e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11693 | -| time_elapsed | 64186 | -| total_timesteps | 1496704 | -| train/ | | -| approx_kl | 0.0042553945 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 116920 | -| policy_gradient_loss | 8.39e-05 | -| std | 0.0212 | -| value_loss | 6.89e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11694 | -| time_elapsed | 64188 | -| total_timesteps | 1496832 | -| train/ | | -| approx_kl | 0.042132255 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 116930 | -| policy_gradient_loss | -0.016 | -| std | 0.0212 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11695 | -| time_elapsed | 64191 | -| total_timesteps | 1496960 | -| train/ | | -| approx_kl | 0.019409645 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.00501 | -| learning_rate | 0.0003 | -| loss | 0.00863 | -| n_updates | 116940 | -| policy_gradient_loss | 0.00348 | -| std | 0.0212 | -| value_loss | 2.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11696 | -| time_elapsed | 64195 | -| total_timesteps | 1497088 | -| train/ | | -| approx_kl | 0.008995674 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.000852 | -| learning_rate | 0.0003 | -| loss | 0.000343 | -| n_updates | 116950 | -| policy_gradient_loss | 0.00141 | -| std | 0.0213 | -| value_loss | 5.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11697 | -| time_elapsed | 64201 | -| total_timesteps | 1497216 | -| train/ | | -| approx_kl | 0.016186796 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | 0.716 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 116960 | -| policy_gradient_loss | -0.0125 | -| std | 0.0213 | -| value_loss | 0.00802 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11698 | -| time_elapsed | 64205 | -| total_timesteps | 1497344 | -| train/ | | -| approx_kl | 0.041883994 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.00176 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 116970 | -| policy_gradient_loss | -0.00568 | -| std | 0.0213 | -| value_loss | 0.00138 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11699 | -| time_elapsed | 64209 | -| total_timesteps | 1497472 | -| train/ | | -| approx_kl | 0.0071511935 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -5.28 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 116980 | -| policy_gradient_loss | -0.00126 | -| std | 0.0213 | -| value_loss | 8.09e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11700 | -| time_elapsed | 64211 | -| total_timesteps | 1497600 | -| train/ | | -| approx_kl | 0.008281972 | -| clip_fraction | 0.018 | -| clip_range | 0.2 | -| entropy_loss | 2.43 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | 0.000553 | -| n_updates | 116990 | -| policy_gradient_loss | -4.25e-05 | -| std | 0.0212 | -| value_loss | 2.11e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11701 | -| time_elapsed | 64215 | -| total_timesteps | 1497728 | -| train/ | | -| approx_kl | 9.949785e-06 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | 0.000234 | -| n_updates | 117000 | -| policy_gradient_loss | 0.00256 | -| std | 0.0211 | -| value_loss | 7.5e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11702 | -| time_elapsed | 64218 | -| total_timesteps | 1497856 | -| train/ | | -| approx_kl | 0.0006844527 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | 0.000835 | -| n_updates | 117010 | -| policy_gradient_loss | 0.0168 | -| std | 0.0211 | -| value_loss | 5.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 11703 | -| time_elapsed | 64222 | -| total_timesteps | 1497984 | -| train/ | | -| approx_kl | 0.008019324 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | 0.00639 | -| n_updates | 117020 | -| policy_gradient_loss | 0.014 | -| std | 0.0211 | -| value_loss | 7.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11704 | -| time_elapsed | 64226 | -| total_timesteps | 1498112 | -| train/ | | -| approx_kl | 0.013831479 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 117030 | -| policy_gradient_loss | 0.000519 | -| std | 0.0211 | -| value_loss | 4.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11705 | -| time_elapsed | 64236 | -| total_timesteps | 1498240 | -| train/ | | -| approx_kl | 0.10476572 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 117040 | -| policy_gradient_loss | -0.0173 | -| std | 0.0211 | -| value_loss | 0.00389 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11706 | -| time_elapsed | 64239 | -| total_timesteps | 1498368 | -| train/ | | -| approx_kl | 1.7274171e-05 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.000567 | -| n_updates | 117050 | -| policy_gradient_loss | -0.000398 | -| std | 0.0211 | -| value_loss | 3.64e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11707 | -| time_elapsed | 64243 | -| total_timesteps | 1498496 | -| train/ | | -| approx_kl | 0.01774364 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -3.66 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 117060 | -| policy_gradient_loss | 0.000404 | -| std | 0.0211 | -| value_loss | 1.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11708 | -| time_elapsed | 64246 | -| total_timesteps | 1498624 | -| train/ | | -| approx_kl | 0.029118828 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.936 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 117070 | -| policy_gradient_loss | -0.0101 | -| std | 0.0211 | -| value_loss | 3.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11709 | -| time_elapsed | 64249 | -| total_timesteps | 1498752 | -| train/ | | -| approx_kl | 0.028363226 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 117080 | -| policy_gradient_loss | 0.00456 | -| std | 0.0211 | -| value_loss | 2.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11710 | -| time_elapsed | 64251 | -| total_timesteps | 1498880 | -| train/ | | -| approx_kl | 0.009119037 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0937 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 117090 | -| policy_gradient_loss | 0.000106 | -| std | 0.0211 | -| value_loss | 4.56e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11711 | -| time_elapsed | 64255 | -| total_timesteps | 1499008 | -| train/ | | -| approx_kl | 0.01339235 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0954 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 117100 | -| policy_gradient_loss | 0.0142 | -| std | 0.0211 | -| value_loss | 1.68e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11712 | -| time_elapsed | 64264 | -| total_timesteps | 1499136 | -| train/ | | -| approx_kl | 0.31966996 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 117110 | -| policy_gradient_loss | -0.0087 | -| std | 0.021 | -| value_loss | 0.000116 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11713 | -| time_elapsed | 64269 | -| total_timesteps | 1499264 | -| train/ | | -| approx_kl | 0.0107471775 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.0566 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 117120 | -| policy_gradient_loss | -0.0014 | -| std | 0.021 | -| value_loss | 2.35e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11714 | -| time_elapsed | 64272 | -| total_timesteps | 1499392 | -| train/ | | -| approx_kl | 0.020409752 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -33 | -| learning_rate | 0.0003 | -| loss | -0.00915 | -| n_updates | 117130 | -| policy_gradient_loss | -0.00621 | -| std | 0.021 | -| value_loss | 2.71e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11715 | -| time_elapsed | 64275 | -| total_timesteps | 1499520 | -| train/ | | -| approx_kl | 0.00083867647 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -7.04 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 117140 | -| policy_gradient_loss | -0.00441 | -| std | 0.021 | -| value_loss | 5.52e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11716 | -| time_elapsed | 64278 | -| total_timesteps | 1499648 | -| train/ | | -| approx_kl | 0.052283384 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -4.17e-06 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 117150 | -| policy_gradient_loss | -0.00335 | -| std | 0.021 | -| value_loss | 2.82e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11717 | -| time_elapsed | 64282 | -| total_timesteps | 1499776 | -| train/ | | -| approx_kl | 0.0024775122 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 117160 | -| policy_gradient_loss | -0.00181 | -| std | 0.021 | -| value_loss | 1.07e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 11718 | -| time_elapsed | 64285 | -| total_timesteps | 1499904 | -| train/ | | -| approx_kl | 0.00018305983 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.000248 | -| n_updates | 117170 | -| policy_gradient_loss | -0.000517 | -| std | 0.021 | -| value_loss | 6.98e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11719 | -| time_elapsed | 64290 | -| total_timesteps | 1500032 | -| train/ | | -| approx_kl | 9.559095e-05 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.000554 | -| n_updates | 117180 | -| policy_gradient_loss | 0.00261 | -| std | 0.021 | -| value_loss | 1.72e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11720 | -| time_elapsed | 64298 | -| total_timesteps | 1500160 | -| train/ | | -| approx_kl | 0.0055893413 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.00927 | -| n_updates | 117190 | -| policy_gradient_loss | -0.00515 | -| std | 0.021 | -| value_loss | 8.25e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11721 | -| time_elapsed | 64302 | -| total_timesteps | 1500288 | -| train/ | | -| approx_kl | 0.025803488 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.00133 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 117200 | -| policy_gradient_loss | -0.00338 | -| std | 0.0211 | -| value_loss | 1.48e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11722 | -| time_elapsed | 64306 | -| total_timesteps | 1500416 | -| train/ | | -| approx_kl | 0.0036550146 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.00599 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 117210 | -| policy_gradient_loss | -0.00218 | -| std | 0.0211 | -| value_loss | 2.04e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11723 | -| time_elapsed | 64310 | -| total_timesteps | 1500544 | -| train/ | | -| approx_kl | 0.13145235 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 117220 | -| policy_gradient_loss | 0.0309 | -| std | 0.0211 | -| value_loss | 7.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11724 | -| time_elapsed | 64314 | -| total_timesteps | 1500672 | -| train/ | | -| approx_kl | 0.021394739 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 117230 | -| policy_gradient_loss | -0.00274 | -| std | 0.0211 | -| value_loss | 7.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11725 | -| time_elapsed | 64318 | -| total_timesteps | 1500800 | -| train/ | | -| approx_kl | 0.030330662 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.00604 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 117240 | -| policy_gradient_loss | 0.00471 | -| std | 0.0211 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 11726 | -| time_elapsed | 64321 | -| total_timesteps | 1500928 | -| train/ | | -| approx_kl | 0.056856923 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 117250 | -| policy_gradient_loss | 0.00231 | -| std | 0.0211 | -| value_loss | 8.81e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11727 | -| time_elapsed | 64324 | -| total_timesteps | 1501056 | -| train/ | | -| approx_kl | 0.0048060166 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.00989 | -| n_updates | 117260 | -| policy_gradient_loss | 0.00477 | -| std | 0.0211 | -| value_loss | 3.43e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11728 | -| time_elapsed | 64331 | -| total_timesteps | 1501184 | -| train/ | | -| approx_kl | 0.03833506 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | 0.152 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 117270 | -| policy_gradient_loss | -0.0169 | -| std | 0.0211 | -| value_loss | 0.00133 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11729 | -| time_elapsed | 64335 | -| total_timesteps | 1501312 | -| train/ | | -| approx_kl | 0.00017416338 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.44 | -| explained_variance | -16.5 | -| learning_rate | 0.0003 | -| loss | -0.000111 | -| n_updates | 117280 | -| policy_gradient_loss | -0.000705 | -| std | 0.0209 | -| value_loss | 2.12e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11730 | -| time_elapsed | 64339 | -| total_timesteps | 1501440 | -| train/ | | -| approx_kl | 1.9355211e-05 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -15.9 | -| learning_rate | 0.0003 | -| loss | -0.000217 | -| n_updates | 117290 | -| policy_gradient_loss | -0.000741 | -| std | 0.0208 | -| value_loss | 1.09e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11731 | -| time_elapsed | 64343 | -| total_timesteps | 1501568 | -| train/ | | -| approx_kl | 3.0783005e-05 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | 0.00058 | -| n_updates | 117300 | -| policy_gradient_loss | 0.000374 | -| std | 0.0208 | -| value_loss | 5.92e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11732 | -| time_elapsed | 64347 | -| total_timesteps | 1501696 | -| train/ | | -| approx_kl | 0.004973638 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.00598 | -| n_updates | 117310 | -| policy_gradient_loss | 0.00925 | -| std | 0.0208 | -| value_loss | 1.79e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11733 | -| time_elapsed | 64350 | -| total_timesteps | 1501824 | -| train/ | | -| approx_kl | 0.0025538118 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -0.00706 | -| learning_rate | 0.0003 | -| loss | 0.00497 | -| n_updates | 117320 | -| policy_gradient_loss | 0.0169 | -| std | 0.0208 | -| value_loss | 6.12e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 11734 | -| time_elapsed | 64352 | -| total_timesteps | 1501952 | -| train/ | | -| approx_kl | 0.013702222 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | 0.000848 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 117330 | -| policy_gradient_loss | 0.00138 | -| std | 0.0208 | -| value_loss | 6.99e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11735 | -| time_elapsed | 64355 | -| total_timesteps | 1502080 | -| train/ | | -| approx_kl | 0.0034269518 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 117340 | -| policy_gradient_loss | -0.00879 | -| std | 0.0208 | -| value_loss | 2.25e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11736 | -| time_elapsed | 64360 | -| total_timesteps | 1502208 | -| train/ | | -| approx_kl | 0.027068172 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 117350 | -| policy_gradient_loss | -0.00254 | -| std | 0.0208 | -| value_loss | 0.000471 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11737 | -| time_elapsed | 64364 | -| total_timesteps | 1502336 | -| train/ | | -| approx_kl | 0.025286224 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -0.000129 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 117360 | -| policy_gradient_loss | -0.00734 | -| std | 0.0208 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11738 | -| time_elapsed | 64367 | -| total_timesteps | 1502464 | -| train/ | | -| approx_kl | 0.027574636 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 117370 | -| policy_gradient_loss | -0.00453 | -| std | 0.0208 | -| value_loss | 9.86e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11739 | -| time_elapsed | 64370 | -| total_timesteps | 1502592 | -| train/ | | -| approx_kl | 0.00013441592 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 2.45 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 117380 | -| policy_gradient_loss | 0.000909 | -| std | 0.0207 | -| value_loss | 6.35e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11740 | -| time_elapsed | 64373 | -| total_timesteps | 1502720 | -| train/ | | -| approx_kl | 0.050413888 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.000863 | -| n_updates | 117390 | -| policy_gradient_loss | -0.0071 | -| std | 0.0207 | -| value_loss | 3.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11741 | -| time_elapsed | 64376 | -| total_timesteps | 1502848 | -| train/ | | -| approx_kl | 0.011683546 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 117400 | -| policy_gradient_loss | -0.000689 | -| std | 0.0207 | -| value_loss | 7.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 11742 | -| time_elapsed | 64379 | -| total_timesteps | 1502976 | -| train/ | | -| approx_kl | 0.04194864 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 117410 | -| policy_gradient_loss | 0.00317 | -| std | 0.0207 | -| value_loss | 4e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11743 | -| time_elapsed | 64384 | -| total_timesteps | 1503104 | -| train/ | | -| approx_kl | 0.0005693147 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.00642 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 117420 | -| policy_gradient_loss | -0.00413 | -| std | 0.0207 | -| value_loss | 8.82e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11744 | -| time_elapsed | 64392 | -| total_timesteps | 1503232 | -| train/ | | -| approx_kl | 0.021658609 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.923 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 117430 | -| policy_gradient_loss | -0.0127 | -| std | 0.0207 | -| value_loss | 0.00075 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11745 | -| time_elapsed | 64395 | -| total_timesteps | 1503360 | -| train/ | | -| approx_kl | 0.006367105 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.00679 | -| learning_rate | 0.0003 | -| loss | -0.000292 | -| n_updates | 117440 | -| policy_gradient_loss | 0.00226 | -| std | 0.0207 | -| value_loss | 9.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11746 | -| time_elapsed | 64399 | -| total_timesteps | 1503488 | -| train/ | | -| approx_kl | 9.774789e-05 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.00271 | -| n_updates | 117450 | -| policy_gradient_loss | -0.0147 | -| std | 0.0207 | -| value_loss | 4.65e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11747 | -| time_elapsed | 64402 | -| total_timesteps | 1503616 | -| train/ | | -| approx_kl | 0.009214448 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0761 | -| learning_rate | 0.0003 | -| loss | -0.00832 | -| n_updates | 117460 | -| policy_gradient_loss | -0.0031 | -| std | 0.0207 | -| value_loss | 2.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11748 | -| time_elapsed | 64404 | -| total_timesteps | 1503744 | -| train/ | | -| approx_kl | 0.020822179 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 117470 | -| policy_gradient_loss | -0.00385 | -| std | 0.0207 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 11749 | -| time_elapsed | 64408 | -| total_timesteps | 1503872 | -| train/ | | -| approx_kl | 0.022176672 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 117480 | -| policy_gradient_loss | -0.00799 | -| std | 0.0207 | -| value_loss | 9.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11750 | -| time_elapsed | 64410 | -| total_timesteps | 1504000 | -| train/ | | -| approx_kl | 0.020140657 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 117490 | -| policy_gradient_loss | -0.00305 | -| std | 0.0207 | -| value_loss | 6.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11751 | -| time_elapsed | 64413 | -| total_timesteps | 1504128 | -| train/ | | -| approx_kl | 0.023936193 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.00287 | -| learning_rate | 0.0003 | -| loss | -0.00373 | -| n_updates | 117500 | -| policy_gradient_loss | 0.00724 | -| std | 0.0207 | -| value_loss | 2.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11752 | -| time_elapsed | 64419 | -| total_timesteps | 1504256 | -| train/ | | -| approx_kl | 0.004352262 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.774 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 117510 | -| policy_gradient_loss | -0.0168 | -| std | 0.0207 | -| value_loss | 0.00431 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11753 | -| time_elapsed | 64423 | -| total_timesteps | 1504384 | -| train/ | | -| approx_kl | 0.0038363175 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -15.3 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 117520 | -| policy_gradient_loss | -0.00526 | -| std | 0.0206 | -| value_loss | 8.89e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11754 | -| time_elapsed | 64426 | -| total_timesteps | 1504512 | -| train/ | | -| approx_kl | 7.762108e-06 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -15.6 | -| learning_rate | 0.0003 | -| loss | 0.000407 | -| n_updates | 117530 | -| policy_gradient_loss | -0.00124 | -| std | 0.0206 | -| value_loss | 6.33e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11755 | -| time_elapsed | 64429 | -| total_timesteps | 1504640 | -| train/ | | -| approx_kl | 0.0060896664 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -3.44 | -| learning_rate | 0.0003 | -| loss | 0.00316 | -| n_updates | 117540 | -| policy_gradient_loss | 0.00847 | -| std | 0.0206 | -| value_loss | 4.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11756 | -| time_elapsed | 64433 | -| total_timesteps | 1504768 | -| train/ | | -| approx_kl | 0.009664381 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.66 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 117550 | -| policy_gradient_loss | 0.0214 | -| std | 0.0206 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 11757 | -| time_elapsed | 64438 | -| total_timesteps | 1504896 | -| train/ | | -| approx_kl | 0.012564215 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.00934 | -| n_updates | 117560 | -| policy_gradient_loss | -0.00475 | -| std | 0.0206 | -| value_loss | 9.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11758 | -| time_elapsed | 64442 | -| total_timesteps | 1505024 | -| train/ | | -| approx_kl | 0.013426188 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -286 | -| learning_rate | 0.0003 | -| loss | -3.54e-05 | -| n_updates | 117570 | -| policy_gradient_loss | 0.00231 | -| std | 0.0206 | -| value_loss | 1.34e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11759 | -| time_elapsed | 64450 | -| total_timesteps | 1505152 | -| train/ | | -| approx_kl | 0.05624067 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 117580 | -| policy_gradient_loss | -0.0182 | -| std | 0.0206 | -| value_loss | 0.00293 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11760 | -| time_elapsed | 64454 | -| total_timesteps | 1505280 | -| train/ | | -| approx_kl | 0.047221046 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 117590 | -| policy_gradient_loss | -0.00672 | -| std | 0.0206 | -| value_loss | 0.000319 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11761 | -| time_elapsed | 64458 | -| total_timesteps | 1505408 | -| train/ | | -| approx_kl | 0.0018305187 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -70.7 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 117600 | -| policy_gradient_loss | -0.00674 | -| std | 0.0205 | -| value_loss | 1.02e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11762 | -| time_elapsed | 64462 | -| total_timesteps | 1505536 | -| train/ | | -| approx_kl | 0.008760552 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | -0.000901 | -| n_updates | 117610 | -| policy_gradient_loss | 0.00328 | -| std | 0.0205 | -| value_loss | 6.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11763 | -| time_elapsed | 64466 | -| total_timesteps | 1505664 | -| train/ | | -| approx_kl | 0.032070406 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.00496 | -| n_updates | 117620 | -| policy_gradient_loss | 0.000426 | -| std | 0.0205 | -| value_loss | 6.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11764 | -| time_elapsed | 64470 | -| total_timesteps | 1505792 | -| train/ | | -| approx_kl | 0.021520793 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.000322 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 117630 | -| policy_gradient_loss | -0.00133 | -| std | 0.0205 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11765 | -| time_elapsed | 64473 | -| total_timesteps | 1505920 | -| train/ | | -| approx_kl | 0.028819887 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.00472 | -| n_updates | 117640 | -| policy_gradient_loss | 7.41e-05 | -| std | 0.0205 | -| value_loss | 8.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11766 | -| time_elapsed | 64477 | -| total_timesteps | 1506048 | -| train/ | | -| approx_kl | 0.008804728 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 117650 | -| policy_gradient_loss | -0.000392 | -| std | 0.0205 | -| value_loss | 5.26e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11767 | -| time_elapsed | 64482 | -| total_timesteps | 1506176 | -| train/ | | -| approx_kl | 0.00084283063 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.765 | -| learning_rate | 0.0003 | -| loss | 0.000669 | -| n_updates | 117660 | -| policy_gradient_loss | 0.00182 | -| std | 0.0205 | -| value_loss | 0.00395 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11768 | -| time_elapsed | 64486 | -| total_timesteps | 1506304 | -| train/ | | -| approx_kl | 0.0025257175 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.244 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 117670 | -| policy_gradient_loss | 0.0173 | -| std | 0.0205 | -| value_loss | 5.81e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11769 | -| time_elapsed | 64489 | -| total_timesteps | 1506432 | -| train/ | | -| approx_kl | 0.010816166 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 117680 | -| policy_gradient_loss | 0.0212 | -| std | 0.0205 | -| value_loss | 1.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11770 | -| time_elapsed | 64491 | -| total_timesteps | 1506560 | -| train/ | | -| approx_kl | 0.020142984 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.00434 | -| n_updates | 117690 | -| policy_gradient_loss | -0.00161 | -| std | 0.0205 | -| value_loss | 9.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11771 | -| time_elapsed | 64495 | -| total_timesteps | 1506688 | -| train/ | | -| approx_kl | 0.0043750755 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.00479 | -| n_updates | 117700 | -| policy_gradient_loss | 0.00768 | -| std | 0.0205 | -| value_loss | 5.22e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11772 | -| time_elapsed | 64497 | -| total_timesteps | 1506816 | -| train/ | | -| approx_kl | 0.0024570748 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.000447 | -| n_updates | 117710 | -| policy_gradient_loss | 0.0215 | -| std | 0.0205 | -| value_loss | 1.77e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 11773 | -| time_elapsed | 64500 | -| total_timesteps | 1506944 | -| train/ | | -| approx_kl | 0.009932404 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.0042 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 117720 | -| policy_gradient_loss | 0.0143 | -| std | 0.0205 | -| value_loss | 7.21e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11774 | -| time_elapsed | 64503 | -| total_timesteps | 1507072 | -| train/ | | -| approx_kl | 0.019760486 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.0061 | -| learning_rate | 0.0003 | -| loss | 0.00923 | -| n_updates | 117730 | -| policy_gradient_loss | 0.000587 | -| std | 0.0205 | -| value_loss | 7.36e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11775 | -| time_elapsed | 64508 | -| total_timesteps | 1507200 | -| train/ | | -| approx_kl | 0.07575151 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 117740 | -| policy_gradient_loss | -0.0142 | -| std | 0.0205 | -| value_loss | 0.00163 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11776 | -| time_elapsed | 64512 | -| total_timesteps | 1507328 | -| train/ | | -| approx_kl | 0.021741346 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.0091 | -| n_updates | 117750 | -| policy_gradient_loss | 0.0105 | -| std | 0.0205 | -| value_loss | 0.000159 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11777 | -| time_elapsed | 64515 | -| total_timesteps | 1507456 | -| train/ | | -| approx_kl | 0.032056008 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0999 | -| learning_rate | 0.0003 | -| loss | 0.00569 | -| n_updates | 117760 | -| policy_gradient_loss | 0.00112 | -| std | 0.0205 | -| value_loss | 1.26e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11778 | -| time_elapsed | 64519 | -| total_timesteps | 1507584 | -| train/ | | -| approx_kl | 0.07253948 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 117770 | -| policy_gradient_loss | 0.0239 | -| std | 0.0206 | -| value_loss | 1.03e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11779 | -| time_elapsed | 64521 | -| total_timesteps | 1507712 | -| train/ | | -| approx_kl | 0.011853075 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.00512 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 117780 | -| policy_gradient_loss | 0.0137 | -| std | 0.0206 | -| value_loss | 2.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11780 | -| time_elapsed | 64524 | -| total_timesteps | 1507840 | -| train/ | | -| approx_kl | 0.012211688 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 117790 | -| policy_gradient_loss | 0.0165 | -| std | 0.0206 | -| value_loss | 1.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11781 | -| time_elapsed | 64527 | -| total_timesteps | 1507968 | -| train/ | | -| approx_kl | 0.02581447 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.000417 | -| n_updates | 117800 | -| policy_gradient_loss | -0.0043 | -| std | 0.0206 | -| value_loss | 6.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11782 | -| time_elapsed | 64530 | -| total_timesteps | 1508096 | -| train/ | | -| approx_kl | 0.020344151 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 117810 | -| policy_gradient_loss | -0.0101 | -| std | 0.0206 | -| value_loss | 3.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11783 | -| time_elapsed | 64538 | -| total_timesteps | 1508224 | -| train/ | | -| approx_kl | 0.005334468 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.723 | -| learning_rate | 0.0003 | -| loss | 0.000381 | -| n_updates | 117820 | -| policy_gradient_loss | 0.00461 | -| std | 0.0206 | -| value_loss | 0.00231 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11784 | -| time_elapsed | 64541 | -| total_timesteps | 1508352 | -| train/ | | -| approx_kl | 0.0022652512 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | 0.00478 | -| n_updates | 117830 | -| policy_gradient_loss | -0.00146 | -| std | 0.0206 | -| value_loss | 0.000116 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11785 | -| time_elapsed | 64545 | -| total_timesteps | 1508480 | -| train/ | | -| approx_kl | 0.03597161 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.582 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 117840 | -| policy_gradient_loss | 0.0118 | -| std | 0.0206 | -| value_loss | 2.27e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11786 | -| time_elapsed | 64547 | -| total_timesteps | 1508608 | -| train/ | | -| approx_kl | 0.012121558 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 117850 | -| policy_gradient_loss | -0.00605 | -| std | 0.0207 | -| value_loss | 1.4e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11787 | -| time_elapsed | 64550 | -| total_timesteps | 1508736 | -| train/ | | -| approx_kl | 0.022301968 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.0039 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 117860 | -| policy_gradient_loss | 0.0028 | -| std | 0.0207 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11788 | -| time_elapsed | 64552 | -| total_timesteps | 1508864 | -| train/ | | -| approx_kl | 0.0012823446 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 117870 | -| policy_gradient_loss | -0.00445 | -| std | 0.0207 | -| value_loss | 9.34e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 11789 | -| time_elapsed | 64555 | -| total_timesteps | 1508992 | -| train/ | | -| approx_kl | 0.004997839 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00846 | -| n_updates | 117880 | -| policy_gradient_loss | -0.0071 | -| std | 0.0206 | -| value_loss | 5.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11790 | -| time_elapsed | 64558 | -| total_timesteps | 1509120 | -| train/ | | -| approx_kl | 0.003272112 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.000458 | -| n_updates | 117890 | -| policy_gradient_loss | 0.0076 | -| std | 0.0206 | -| value_loss | 6.84e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11791 | -| time_elapsed | 64566 | -| total_timesteps | 1509248 | -| train/ | | -| approx_kl | 0.0022845562 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.7 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 117900 | -| policy_gradient_loss | -0.00494 | -| std | 0.0206 | -| value_loss | 0.00572 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11792 | -| time_elapsed | 64569 | -| total_timesteps | 1509376 | -| train/ | | -| approx_kl | 1.8223654e-05 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0746 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 117910 | -| policy_gradient_loss | -9.05e-05 | -| std | 0.0205 | -| value_loss | 4.76e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11793 | -| time_elapsed | 64572 | -| total_timesteps | 1509504 | -| train/ | | -| approx_kl | 0.006065326 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.00859 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 117920 | -| policy_gradient_loss | 0.0069 | -| std | 0.0204 | -| value_loss | 3.42e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11794 | -| time_elapsed | 64576 | -| total_timesteps | 1509632 | -| train/ | | -| approx_kl | 0.027254762 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 117930 | -| policy_gradient_loss | -0.000409 | -| std | 0.0204 | -| value_loss | 7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11795 | -| time_elapsed | 64579 | -| total_timesteps | 1509760 | -| train/ | | -| approx_kl | 0.015375922 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.000453 | -| learning_rate | 0.0003 | -| loss | -0.00827 | -| n_updates | 117940 | -| policy_gradient_loss | 0.00162 | -| std | 0.0204 | -| value_loss | 1.38e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 11796 | -| time_elapsed | 64584 | -| total_timesteps | 1509888 | -| train/ | | -| approx_kl | 0.022773571 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.00411 | -| n_updates | 117950 | -| policy_gradient_loss | 0.000976 | -| std | 0.0204 | -| value_loss | 9.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11797 | -| time_elapsed | 64588 | -| total_timesteps | 1510016 | -| train/ | | -| approx_kl | 0.013272294 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 117960 | -| policy_gradient_loss | 0.00247 | -| std | 0.0204 | -| value_loss | 5.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11798 | -| time_elapsed | 64597 | -| total_timesteps | 1510144 | -| train/ | | -| approx_kl | 0.013729944 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 117970 | -| policy_gradient_loss | -0.0131 | -| std | 0.0204 | -| value_loss | 0.00224 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11799 | -| time_elapsed | 64600 | -| total_timesteps | 1510272 | -| train/ | | -| approx_kl | 0.0023416872 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 117980 | -| policy_gradient_loss | 0.00325 | -| std | 0.0204 | -| value_loss | 2.09e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11800 | -| time_elapsed | 64603 | -| total_timesteps | 1510400 | -| train/ | | -| approx_kl | 0.025391426 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 117990 | -| policy_gradient_loss | 0.00782 | -| std | 0.0204 | -| value_loss | 1.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11801 | -| time_elapsed | 64607 | -| total_timesteps | 1510528 | -| train/ | | -| approx_kl | 0.014928181 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 118000 | -| policy_gradient_loss | -0.0019 | -| std | 0.0204 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11802 | -| time_elapsed | 64610 | -| total_timesteps | 1510656 | -| train/ | | -| approx_kl | 0.009087295 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 118010 | -| policy_gradient_loss | 0.00439 | -| std | 0.0204 | -| value_loss | 3.18e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11803 | -| time_elapsed | 64613 | -| total_timesteps | 1510784 | -| train/ | | -| approx_kl | 0.0025335317 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.00518 | -| learning_rate | 0.0003 | -| loss | 0.00607 | -| n_updates | 118020 | -| policy_gradient_loss | -0.00277 | -| std | 0.0204 | -| value_loss | 2.01e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 11804 | -| time_elapsed | 64617 | -| total_timesteps | 1510912 | -| train/ | | -| approx_kl | 0.012942718 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.00751 | -| learning_rate | 0.0003 | -| loss | 0.00783 | -| n_updates | 118030 | -| policy_gradient_loss | 0.00688 | -| std | 0.0204 | -| value_loss | 9.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11805 | -| time_elapsed | 64621 | -| total_timesteps | 1511040 | -| train/ | | -| approx_kl | 0.022807866 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.00249 | -| learning_rate | 0.0003 | -| loss | 0.00853 | -| n_updates | 118040 | -| policy_gradient_loss | 0.0115 | -| std | 0.0204 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11806 | -| time_elapsed | 64627 | -| total_timesteps | 1511168 | -| train/ | | -| approx_kl | 0.023997795 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 118050 | -| policy_gradient_loss | -0.0167 | -| std | 0.0203 | -| value_loss | 0.000511 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11807 | -| time_elapsed | 64631 | -| total_timesteps | 1511296 | -| train/ | | -| approx_kl | 0.004714462 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -9.65 | -| learning_rate | 0.0003 | -| loss | 0.00865 | -| n_updates | 118060 | -| policy_gradient_loss | 0.000851 | -| std | 0.0203 | -| value_loss | 1.87e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11808 | -| time_elapsed | 64635 | -| total_timesteps | 1511424 | -| train/ | | -| approx_kl | 0.0066539585 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 118070 | -| policy_gradient_loss | -0.0029 | -| std | 0.0203 | -| value_loss | 1.03e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11809 | -| time_elapsed | 64639 | -| total_timesteps | 1511552 | -| train/ | | -| approx_kl | 0.0060511986 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -2.32 | -| learning_rate | 0.0003 | -| loss | 0.00667 | -| n_updates | 118080 | -| policy_gradient_loss | 0.00571 | -| std | 0.0203 | -| value_loss | 5.41e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11810 | -| time_elapsed | 64644 | -| total_timesteps | 1511680 | -| train/ | | -| approx_kl | 0.008466469 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | -0.000634 | -| n_updates | 118090 | -| policy_gradient_loss | 0.000382 | -| std | 0.0203 | -| value_loss | 8.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11811 | -| time_elapsed | 64647 | -| total_timesteps | 1511808 | -| train/ | | -| approx_kl | 0.015464662 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 118100 | -| policy_gradient_loss | 0.00419 | -| std | 0.0203 | -| value_loss | 5.53e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 11812 | -| time_elapsed | 64651 | -| total_timesteps | 1511936 | -| train/ | | -| approx_kl | 0.03937867 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -4.3e-05 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 118110 | -| policy_gradient_loss | 0.0119 | -| std | 0.0203 | -| value_loss | 2.21e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11813 | -| time_elapsed | 64654 | -| total_timesteps | 1512064 | -| train/ | | -| approx_kl | 0.015768405 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.00976 | -| learning_rate | 0.0003 | -| loss | 0.000773 | -| n_updates | 118120 | -| policy_gradient_loss | 0.00837 | -| std | 0.0203 | -| value_loss | 1.45e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11814 | -| time_elapsed | 64660 | -| total_timesteps | 1512192 | -| train/ | | -| approx_kl | 0.0236415 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.462 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 118130 | -| policy_gradient_loss | -0.00816 | -| std | 0.0203 | -| value_loss | 0.0139 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11815 | -| time_elapsed | 64663 | -| total_timesteps | 1512320 | -| train/ | | -| approx_kl | 0.018881926 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.000257 | -| n_updates | 118140 | -| policy_gradient_loss | -0.000251 | -| std | 0.0203 | -| value_loss | 0.000282 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11816 | -| time_elapsed | 64667 | -| total_timesteps | 1512448 | -| train/ | | -| approx_kl | 0.073797286 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.00233 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 118150 | -| policy_gradient_loss | 0.00778 | -| std | 0.0203 | -| value_loss | 1.84e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11817 | -| time_elapsed | 64670 | -| total_timesteps | 1512576 | -| train/ | | -| approx_kl | 0.0035962136 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.00942 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 118160 | -| policy_gradient_loss | -0.000227 | -| std | 0.0203 | -| value_loss | 2.06e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11818 | -| time_elapsed | 64673 | -| total_timesteps | 1512704 | -| train/ | | -| approx_kl | 0.0006362372 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 118170 | -| policy_gradient_loss | 0.00359 | -| std | 0.0203 | -| value_loss | 2.45e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11819 | -| time_elapsed | 64676 | -| total_timesteps | 1512832 | -| train/ | | -| approx_kl | 0.0006037145 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0041 | -| n_updates | 118180 | -| policy_gradient_loss | 0.00689 | -| std | 0.0203 | -| value_loss | 7.66e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11820 | -| time_elapsed | 64678 | -| total_timesteps | 1512960 | -| train/ | | -| approx_kl | 0.06515042 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.00786 | -| n_updates | 118190 | -| policy_gradient_loss | -0.00499 | -| std | 0.0203 | -| value_loss | 5.71e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11821 | -| time_elapsed | 64682 | -| total_timesteps | 1513088 | -| train/ | | -| approx_kl | 0.06603389 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 118200 | -| policy_gradient_loss | -0.00222 | -| std | 0.0203 | -| value_loss | 3.67e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11822 | -| time_elapsed | 64688 | -| total_timesteps | 1513216 | -| train/ | | -| approx_kl | 0.0033865655 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.733 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 118210 | -| policy_gradient_loss | -0.0123 | -| std | 0.0203 | -| value_loss | 0.00441 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11823 | -| time_elapsed | 64691 | -| total_timesteps | 1513344 | -| train/ | | -| approx_kl | 0.011680966 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 118220 | -| policy_gradient_loss | -0.000577 | -| std | 0.0203 | -| value_loss | 0.000214 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11824 | -| time_elapsed | 64695 | -| total_timesteps | 1513472 | -| train/ | | -| approx_kl | 0.006146122 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -2.7e+03 | -| learning_rate | 0.0003 | -| loss | 0.00451 | -| n_updates | 118230 | -| policy_gradient_loss | -0.000464 | -| std | 0.0203 | -| value_loss | 2.9e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11825 | -| time_elapsed | 64698 | -| total_timesteps | 1513600 | -| train/ | | -| approx_kl | 0.012072295 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -6.44 | -| learning_rate | 0.0003 | -| loss | -0.00947 | -| n_updates | 118240 | -| policy_gradient_loss | -0.0068 | -| std | 0.0203 | -| value_loss | 1.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11826 | -| time_elapsed | 64702 | -| total_timesteps | 1513728 | -| train/ | | -| approx_kl | 0.040406093 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 118250 | -| policy_gradient_loss | 0.00397 | -| std | 0.0203 | -| value_loss | 9.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11827 | -| time_elapsed | 64706 | -| total_timesteps | 1513856 | -| train/ | | -| approx_kl | 0.040367506 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 118260 | -| policy_gradient_loss | 0.00575 | -| std | 0.0203 | -| value_loss | 0.000106 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11828 | -| time_elapsed | 64711 | -| total_timesteps | 1513984 | -| train/ | | -| approx_kl | 0.057407495 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 118270 | -| policy_gradient_loss | -0.0193 | -| std | 0.0203 | -| value_loss | 0.0027 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11829 | -| time_elapsed | 64714 | -| total_timesteps | 1514112 | -| train/ | | -| approx_kl | 0.07877899 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.000131 | -| n_updates | 118280 | -| policy_gradient_loss | -0.00746 | -| std | 0.0203 | -| value_loss | 0.000104 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11830 | -| time_elapsed | 64724 | -| total_timesteps | 1514240 | -| train/ | | -| approx_kl | 0.00073894765 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.707 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 118290 | -| policy_gradient_loss | -0.00837 | -| std | 0.0203 | -| value_loss | 0.00613 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11831 | -| time_elapsed | 64729 | -| total_timesteps | 1514368 | -| train/ | | -| approx_kl | 0.03617471 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.00797 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 118300 | -| policy_gradient_loss | -0.0104 | -| std | 0.0204 | -| value_loss | 0.00258 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11832 | -| time_elapsed | 64731 | -| total_timesteps | 1514496 | -| train/ | | -| approx_kl | 0.06264248 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.00709 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 118310 | -| policy_gradient_loss | 0.000628 | -| std | 0.0204 | -| value_loss | 0.000228 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11833 | -| time_elapsed | 64734 | -| total_timesteps | 1514624 | -| train/ | | -| approx_kl | 0.00046771765 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 118320 | -| policy_gradient_loss | 0.00487 | -| std | 0.0204 | -| value_loss | 0.000204 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11834 | -| time_elapsed | 64737 | -| total_timesteps | 1514752 | -| train/ | | -| approx_kl | 0.009004675 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 118330 | -| policy_gradient_loss | 0.000506 | -| std | 0.0204 | -| value_loss | 5.98e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 11835 | -| time_elapsed | 64742 | -| total_timesteps | 1514880 | -| train/ | | -| approx_kl | 0.0003841133 | -| clip_fraction | 0.0102 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | -0.000289 | -| n_updates | 118340 | -| policy_gradient_loss | -0.000342 | -| std | 0.0203 | -| value_loss | 9.63e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11836 | -| time_elapsed | 64745 | -| total_timesteps | 1515008 | -| train/ | | -| approx_kl | 0.029451335 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.00613 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 118350 | -| policy_gradient_loss | -0.00106 | -| std | 0.0203 | -| value_loss | 0.000914 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11837 | -| time_elapsed | 64754 | -| total_timesteps | 1515136 | -| train/ | | -| approx_kl | 0.057888143 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 118360 | -| policy_gradient_loss | -0.012 | -| std | 0.0203 | -| value_loss | 0.00324 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11838 | -| time_elapsed | 64757 | -| total_timesteps | 1515264 | -| train/ | | -| approx_kl | 0.030853719 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.112 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 118370 | -| policy_gradient_loss | 0.005 | -| std | 0.0203 | -| value_loss | 2.81e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11839 | -| time_elapsed | 64760 | -| total_timesteps | 1515392 | -| train/ | | -| approx_kl | 0.047301047 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.00684 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 118380 | -| policy_gradient_loss | -0.000958 | -| std | 0.0203 | -| value_loss | 2.85e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11840 | -| time_elapsed | 64763 | -| total_timesteps | 1515520 | -| train/ | | -| approx_kl | 0.0052245418 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.00475 | -| n_updates | 118390 | -| policy_gradient_loss | 0.00995 | -| std | 0.0203 | -| value_loss | 3.63e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11841 | -| time_elapsed | 64767 | -| total_timesteps | 1515648 | -| train/ | | -| approx_kl | 0.002049998 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 118400 | -| policy_gradient_loss | -0.0107 | -| std | 0.0203 | -| value_loss | 7.07e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11842 | -| time_elapsed | 64771 | -| total_timesteps | 1515776 | -| train/ | | -| approx_kl | 0.00019630417 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 118410 | -| policy_gradient_loss | 0.00199 | -| std | 0.0203 | -| value_loss | 1.14e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 11843 | -| time_elapsed | 64775 | -| total_timesteps | 1515904 | -| train/ | | -| approx_kl | 0.010872437 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | 0.00573 | -| n_updates | 118420 | -| policy_gradient_loss | 0.00642 | -| std | 0.0203 | -| value_loss | 3.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11844 | -| time_elapsed | 64779 | -| total_timesteps | 1516032 | -| train/ | | -| approx_kl | 0.009705666 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 118430 | -| policy_gradient_loss | -0.00284 | -| std | 0.0203 | -| value_loss | 8.01e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11845 | -| time_elapsed | 64785 | -| total_timesteps | 1516160 | -| train/ | | -| approx_kl | 0.0045024264 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 118440 | -| policy_gradient_loss | -0.00219 | -| std | 0.0204 | -| value_loss | 0.00011 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11846 | -| time_elapsed | 64789 | -| total_timesteps | 1516288 | -| train/ | | -| approx_kl | 0.0058423537 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 118450 | -| policy_gradient_loss | 0.0016 | -| std | 0.0204 | -| value_loss | 4.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11847 | -| time_elapsed | 64792 | -| total_timesteps | 1516416 | -| train/ | | -| approx_kl | 0.007111789 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 118460 | -| policy_gradient_loss | -0.00627 | -| std | 0.0204 | -| value_loss | 2.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11848 | -| time_elapsed | 64795 | -| total_timesteps | 1516544 | -| train/ | | -| approx_kl | 0.022998305 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 118470 | -| policy_gradient_loss | 0.0129 | -| std | 0.0205 | -| value_loss | 4.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11849 | -| time_elapsed | 64800 | -| total_timesteps | 1516672 | -| train/ | | -| approx_kl | 0.007213534 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.00487 | -| n_updates | 118480 | -| policy_gradient_loss | 0.00912 | -| std | 0.0205 | -| value_loss | 4.71e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11850 | -| time_elapsed | 64804 | -| total_timesteps | 1516800 | -| train/ | | -| approx_kl | 0.0023373412 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.00397 | -| learning_rate | 0.0003 | -| loss | -0.000151 | -| n_updates | 118490 | -| policy_gradient_loss | 0.0044 | -| std | 0.0205 | -| value_loss | 1.24e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 11851 | -| time_elapsed | 64807 | -| total_timesteps | 1516928 | -| train/ | | -| approx_kl | 0.005211235 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.00179 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 118500 | -| policy_gradient_loss | 0.00329 | -| std | 0.0205 | -| value_loss | 6.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11852 | -| time_elapsed | 64810 | -| total_timesteps | 1517056 | -| train/ | | -| approx_kl | 0.012831965 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.64 | -| learning_rate | 0.0003 | -| loss | 0.000813 | -| n_updates | 118510 | -| policy_gradient_loss | 0.00228 | -| std | 0.0205 | -| value_loss | 8.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11853 | -| time_elapsed | 64818 | -| total_timesteps | 1517184 | -| train/ | | -| approx_kl | 0.009813045 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 118520 | -| policy_gradient_loss | -0.0196 | -| std | 0.0205 | -| value_loss | 0.00304 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11854 | -| time_elapsed | 64822 | -| total_timesteps | 1517312 | -| train/ | | -| approx_kl | 0.00094116013 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -2.72 | -| learning_rate | 0.0003 | -| loss | -0.000744 | -| n_updates | 118530 | -| policy_gradient_loss | -0.000441 | -| std | 0.0205 | -| value_loss | 8.66e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11855 | -| time_elapsed | 64826 | -| total_timesteps | 1517440 | -| train/ | | -| approx_kl | 0.0037345407 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -3.11 | -| learning_rate | 0.0003 | -| loss | 0.000935 | -| n_updates | 118540 | -| policy_gradient_loss | 0.00485 | -| std | 0.0206 | -| value_loss | 1.95e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11856 | -| time_elapsed | 64830 | -| total_timesteps | 1517568 | -| train/ | | -| approx_kl | 0.120075166 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.889 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 118550 | -| policy_gradient_loss | 0.022 | -| std | 0.0206 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11857 | -| time_elapsed | 64834 | -| total_timesteps | 1517696 | -| train/ | | -| approx_kl | 0.017197508 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.00698 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 118560 | -| policy_gradient_loss | -0.00127 | -| std | 0.0206 | -| value_loss | 3.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11858 | -| time_elapsed | 64837 | -| total_timesteps | 1517824 | -| train/ | | -| approx_kl | 0.028323032 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | 0.00678 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 118570 | -| policy_gradient_loss | -0.0078 | -| std | 0.0206 | -| value_loss | 2.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11859 | -| time_elapsed | 64840 | -| total_timesteps | 1517952 | -| train/ | | -| approx_kl | 0.002662248 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0557 | -| learning_rate | 0.0003 | -| loss | 0.00476 | -| n_updates | 118580 | -| policy_gradient_loss | 0.00769 | -| std | 0.0206 | -| value_loss | 1.56e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11860 | -| time_elapsed | 64845 | -| total_timesteps | 1518080 | -| train/ | | -| approx_kl | 0.0017647021 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.00562 | -| n_updates | 118590 | -| policy_gradient_loss | 0.00937 | -| std | 0.0206 | -| value_loss | 9.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11861 | -| time_elapsed | 64853 | -| total_timesteps | 1518208 | -| train/ | | -| approx_kl | 0.039169904 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 118600 | -| policy_gradient_loss | -0.0145 | -| std | 0.0206 | -| value_loss | 0.00174 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11862 | -| time_elapsed | 64857 | -| total_timesteps | 1518336 | -| train/ | | -| approx_kl | 0.014784254 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -151 | -| learning_rate | 0.0003 | -| loss | 0.00466 | -| n_updates | 118610 | -| policy_gradient_loss | 0.00204 | -| std | 0.0206 | -| value_loss | 7.92e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11863 | -| time_elapsed | 64860 | -| total_timesteps | 1518464 | -| train/ | | -| approx_kl | 0.021329703 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -426 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 118620 | -| policy_gradient_loss | -0.0094 | -| std | 0.0205 | -| value_loss | 7.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11864 | -| time_elapsed | 64863 | -| total_timesteps | 1518592 | -| train/ | | -| approx_kl | 0.01180508 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -52.8 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 118630 | -| policy_gradient_loss | -0.00893 | -| std | 0.0205 | -| value_loss | 7.87e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11865 | -| time_elapsed | 64866 | -| total_timesteps | 1518720 | -| train/ | | -| approx_kl | 0.0008280659 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -7.92 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 118640 | -| policy_gradient_loss | -0.00121 | -| std | 0.0205 | -| value_loss | 1.33e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11866 | -| time_elapsed | 64870 | -| total_timesteps | 1518848 | -| train/ | | -| approx_kl | 0.036191486 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 118650 | -| policy_gradient_loss | 0.00203 | -| std | 0.0206 | -| value_loss | 6.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 11867 | -| time_elapsed | 64873 | -| total_timesteps | 1518976 | -| train/ | | -| approx_kl | 0.023164365 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.084 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 118660 | -| policy_gradient_loss | -0.00505 | -| std | 0.0206 | -| value_loss | 3.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11868 | -| time_elapsed | 64876 | -| total_timesteps | 1519104 | -| train/ | | -| approx_kl | 0.050986864 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.061 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 118670 | -| policy_gradient_loss | 0.00157 | -| std | 0.0206 | -| value_loss | 1.76e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11869 | -| time_elapsed | 64884 | -| total_timesteps | 1519232 | -| train/ | | -| approx_kl | 0.06111945 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.455 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 118680 | -| policy_gradient_loss | -0.0184 | -| std | 0.0206 | -| value_loss | 0.00158 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11870 | -| time_elapsed | 64888 | -| total_timesteps | 1519360 | -| train/ | | -| approx_kl | 0.012408813 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | 0.000511 | -| n_updates | 118690 | -| policy_gradient_loss | 0.00101 | -| std | 0.0205 | -| value_loss | 9.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11871 | -| time_elapsed | 64891 | -| total_timesteps | 1519488 | -| train/ | | -| approx_kl | 0.075363666 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -4.91 | -| learning_rate | 0.0003 | -| loss | 0.00372 | -| n_updates | 118700 | -| policy_gradient_loss | -0.00119 | -| std | 0.0205 | -| value_loss | 4.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11872 | -| time_elapsed | 64894 | -| total_timesteps | 1519616 | -| train/ | | -| approx_kl | 0.012465985 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 118710 | -| policy_gradient_loss | -0.00701 | -| std | 0.0205 | -| value_loss | 5.61e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11873 | -| time_elapsed | 64899 | -| total_timesteps | 1519744 | -| train/ | | -| approx_kl | 0.03378873 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 118720 | -| policy_gradient_loss | 0.00823 | -| std | 0.0205 | -| value_loss | 2.39e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11874 | -| time_elapsed | 64903 | -| total_timesteps | 1519872 | -| train/ | | -| approx_kl | 0.041717093 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 118730 | -| policy_gradient_loss | -0.00026 | -| std | 0.0205 | -| value_loss | 7.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11875 | -| time_elapsed | 64906 | -| total_timesteps | 1520000 | -| train/ | | -| approx_kl | 0.011290846 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 118740 | -| policy_gradient_loss | 0.00161 | -| std | 0.0205 | -| value_loss | 2.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11876 | -| time_elapsed | 64911 | -| total_timesteps | 1520128 | -| train/ | | -| approx_kl | 0.025701458 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.00313 | -| learning_rate | 0.0003 | -| loss | 0.00967 | -| n_updates | 118750 | -| policy_gradient_loss | 0.00475 | -| std | 0.0205 | -| value_loss | 1.26e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11877 | -| time_elapsed | 64917 | -| total_timesteps | 1520256 | -| train/ | | -| approx_kl | 0.08334592 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 118760 | -| policy_gradient_loss | -0.015 | -| std | 0.0206 | -| value_loss | 0.000556 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11878 | -| time_elapsed | 64920 | -| total_timesteps | 1520384 | -| train/ | | -| approx_kl | 0.0076857726 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | -0.00569 | -| n_updates | 118770 | -| policy_gradient_loss | -0.00197 | -| std | 0.0206 | -| value_loss | 1.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11879 | -| time_elapsed | 64923 | -| total_timesteps | 1520512 | -| train/ | | -| approx_kl | 0.018409193 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.00109 | -| n_updates | 118780 | -| policy_gradient_loss | 0.0025 | -| std | 0.0206 | -| value_loss | 6.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11880 | -| time_elapsed | 64927 | -| total_timesteps | 1520640 | -| train/ | | -| approx_kl | 0.021010805 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.626 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 118790 | -| policy_gradient_loss | -0.00389 | -| std | 0.0206 | -| value_loss | 5.78e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11881 | -| time_elapsed | 64930 | -| total_timesteps | 1520768 | -| train/ | | -| approx_kl | 0.01774041 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.46 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 118800 | -| policy_gradient_loss | -0.0061 | -| std | 0.0206 | -| value_loss | 3.32e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 11882 | -| time_elapsed | 64933 | -| total_timesteps | 1520896 | -| train/ | | -| approx_kl | 0.05124668 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 118810 | -| policy_gradient_loss | -1.47e-05 | -| std | 0.0205 | -| value_loss | 3.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11883 | -| time_elapsed | 64936 | -| total_timesteps | 1521024 | -| train/ | | -| approx_kl | 0.05965569 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -9.52 | -| learning_rate | 0.0003 | -| loss | 0.00349 | -| n_updates | 118820 | -| policy_gradient_loss | -0.00185 | -| std | 0.0205 | -| value_loss | 9.45e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11884 | -| time_elapsed | 64943 | -| total_timesteps | 1521152 | -| train/ | | -| approx_kl | 0.0706875 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.000153 | -| n_updates | 118830 | -| policy_gradient_loss | -0.00256 | -| std | 0.0205 | -| value_loss | 0.00166 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11885 | -| time_elapsed | 64947 | -| total_timesteps | 1521280 | -| train/ | | -| approx_kl | 0.0060763126 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.000821 | -| n_updates | 118840 | -| policy_gradient_loss | 0.00741 | -| std | 0.0205 | -| value_loss | 9.11e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11886 | -| time_elapsed | 64950 | -| total_timesteps | 1521408 | -| train/ | | -| approx_kl | 0.038250517 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.542 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 118850 | -| policy_gradient_loss | 0.00305 | -| std | 0.0205 | -| value_loss | 1.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11887 | -| time_elapsed | 64954 | -| total_timesteps | 1521536 | -| train/ | | -| approx_kl | 0.019763906 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.444 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 118860 | -| policy_gradient_loss | -0.00414 | -| std | 0.0205 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11888 | -| time_elapsed | 64957 | -| total_timesteps | 1521664 | -| train/ | | -| approx_kl | 0.030113187 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 118870 | -| policy_gradient_loss | 0.00371 | -| std | 0.0205 | -| value_loss | 2.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11889 | -| time_elapsed | 64961 | -| total_timesteps | 1521792 | -| train/ | | -| approx_kl | 0.008570073 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0668 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 118880 | -| policy_gradient_loss | 0.00342 | -| std | 0.0204 | -| value_loss | 3.12e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11890 | -| time_elapsed | 64964 | -| total_timesteps | 1521920 | -| train/ | | -| approx_kl | 0.04844047 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 118890 | -| policy_gradient_loss | 0.0048 | -| std | 0.0204 | -| value_loss | 2.13e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11891 | -| time_elapsed | 64967 | -| total_timesteps | 1522048 | -| train/ | | -| approx_kl | 0.008992294 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 118900 | -| policy_gradient_loss | 0.0058 | -| std | 0.0204 | -| value_loss | 2.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11892 | -| time_elapsed | 64975 | -| total_timesteps | 1522176 | -| train/ | | -| approx_kl | 0.42458695 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -0.919 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 118910 | -| policy_gradient_loss | -0.0154 | -| std | 0.0204 | -| value_loss | 0.0019 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11893 | -| time_elapsed | 64978 | -| total_timesteps | 1522304 | -| train/ | | -| approx_kl | 0.00020145858 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.47 | -| explained_variance | -69.1 | -| learning_rate | 0.0003 | -| loss | -0.000233 | -| n_updates | 118920 | -| policy_gradient_loss | 0.000454 | -| std | 0.0203 | -| value_loss | 2.84e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11894 | -| time_elapsed | 64982 | -| total_timesteps | 1522432 | -| train/ | | -| approx_kl | 0.04785463 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -37.1 | -| learning_rate | 0.0003 | -| loss | -0.00942 | -| n_updates | 118930 | -| policy_gradient_loss | -0.00913 | -| std | 0.0203 | -| value_loss | 0.0011 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11895 | -| time_elapsed | 64985 | -| total_timesteps | 1522560 | -| train/ | | -| approx_kl | 0.019620799 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 118940 | -| policy_gradient_loss | -0.00175 | -| std | 0.0202 | -| value_loss | 6.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11896 | -| time_elapsed | 64988 | -| total_timesteps | 1522688 | -| train/ | | -| approx_kl | 0.0072713727 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.00335 | -| learning_rate | 0.0003 | -| loss | -0.000512 | -| n_updates | 118950 | -| policy_gradient_loss | 0.00352 | -| std | 0.0202 | -| value_loss | 0.00124 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11897 | -| time_elapsed | 64991 | -| total_timesteps | 1522816 | -| train/ | | -| approx_kl | 0.024517644 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | -0.00631 | -| n_updates | 118960 | -| policy_gradient_loss | -0.00729 | -| std | 0.0202 | -| value_loss | 0.00243 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 11898 | -| time_elapsed | 64994 | -| total_timesteps | 1522944 | -| train/ | | -| approx_kl | 0.010972815 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 118970 | -| policy_gradient_loss | 0.00201 | -| std | 0.0202 | -| value_loss | 1.26e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11899 | -| time_elapsed | 64997 | -| total_timesteps | 1523072 | -| train/ | | -| approx_kl | 0.014874947 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.00357 | -| n_updates | 118980 | -| policy_gradient_loss | 0.00189 | -| std | 0.0202 | -| value_loss | 8.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11900 | -| time_elapsed | 65004 | -| total_timesteps | 1523200 | -| train/ | | -| approx_kl | 0.021712666 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 118990 | -| policy_gradient_loss | -0.0101 | -| std | 0.0202 | -| value_loss | 0.000207 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11901 | -| time_elapsed | 65007 | -| total_timesteps | 1523328 | -| train/ | | -| approx_kl | 0.011245564 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0782 | -| learning_rate | 0.0003 | -| loss | 0.00386 | -| n_updates | 119000 | -| policy_gradient_loss | 0.0085 | -| std | 0.0202 | -| value_loss | 2.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11902 | -| time_elapsed | 65010 | -| total_timesteps | 1523456 | -| train/ | | -| approx_kl | 0.008221412 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 119010 | -| policy_gradient_loss | -0.00286 | -| std | 0.0202 | -| value_loss | 3.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11903 | -| time_elapsed | 65014 | -| total_timesteps | 1523584 | -| train/ | | -| approx_kl | 0.047586635 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.00403 | -| n_updates | 119020 | -| policy_gradient_loss | -0.000942 | -| std | 0.0202 | -| value_loss | 2.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11904 | -| time_elapsed | 65018 | -| total_timesteps | 1523712 | -| train/ | | -| approx_kl | 0.025569854 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.0072 | -| n_updates | 119030 | -| policy_gradient_loss | 0.00174 | -| std | 0.0202 | -| value_loss | 3.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11905 | -| time_elapsed | 65021 | -| total_timesteps | 1523840 | -| train/ | | -| approx_kl | 0.024027023 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 119040 | -| policy_gradient_loss | -0.00415 | -| std | 0.0202 | -| value_loss | 2.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11906 | -| time_elapsed | 65025 | -| total_timesteps | 1523968 | -| train/ | | -| approx_kl | 0.06196789 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 119050 | -| policy_gradient_loss | -4.11e-05 | -| std | 0.0202 | -| value_loss | 1.57e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11907 | -| time_elapsed | 65029 | -| total_timesteps | 1524096 | -| train/ | | -| approx_kl | 0.0010495442 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 119060 | -| policy_gradient_loss | -0.00951 | -| std | 0.0202 | -| value_loss | 1.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11908 | -| time_elapsed | 65035 | -| total_timesteps | 1524224 | -| train/ | | -| approx_kl | 0.009984326 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.48 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 119070 | -| policy_gradient_loss | -0.000707 | -| std | 0.0202 | -| value_loss | 0.00312 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11909 | -| time_elapsed | 65039 | -| total_timesteps | 1524352 | -| train/ | | -| approx_kl | 0.020782355 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | 0.0083 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 119080 | -| policy_gradient_loss | 0.00582 | -| std | 0.0201 | -| value_loss | 4.96e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11910 | -| time_elapsed | 65042 | -| total_timesteps | 1524480 | -| train/ | | -| approx_kl | 0.009098262 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 119090 | -| policy_gradient_loss | 0.00776 | -| std | 0.0201 | -| value_loss | 1.98e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11911 | -| time_elapsed | 65044 | -| total_timesteps | 1524608 | -| train/ | | -| approx_kl | 0.0016415371 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 119100 | -| policy_gradient_loss | -0.000674 | -| std | 0.0201 | -| value_loss | 4.11e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11912 | -| time_elapsed | 65048 | -| total_timesteps | 1524736 | -| train/ | | -| approx_kl | 0.022141047 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | 0.00372 | -| n_updates | 119110 | -| policy_gradient_loss | -0.000326 | -| std | 0.0201 | -| value_loss | 2.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11913 | -| time_elapsed | 65052 | -| total_timesteps | 1524864 | -| train/ | | -| approx_kl | 0.004894614 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | -0.0077 | -| n_updates | 119120 | -| policy_gradient_loss | -0.00524 | -| std | 0.0201 | -| value_loss | 5.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11914 | -| time_elapsed | 65055 | -| total_timesteps | 1524992 | -| train/ | | -| approx_kl | 0.002429822 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 119130 | -| policy_gradient_loss | -0.00901 | -| std | 0.0201 | -| value_loss | 3.64e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11915 | -| time_elapsed | 65058 | -| total_timesteps | 1525120 | -| train/ | | -| approx_kl | 0.00062024686 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.00177 | -| n_updates | 119140 | -| policy_gradient_loss | 0.0018 | -| std | 0.02 | -| value_loss | 2.18e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11916 | -| time_elapsed | 65067 | -| total_timesteps | 1525248 | -| train/ | | -| approx_kl | 0.015002774 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | 0.649 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 119150 | -| policy_gradient_loss | -0.0164 | -| std | 0.02 | -| value_loss | 0.000976 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11917 | -| time_elapsed | 65070 | -| total_timesteps | 1525376 | -| train/ | | -| approx_kl | 0.019682286 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.00771 | -| n_updates | 119160 | -| policy_gradient_loss | 0.00356 | -| std | 0.02 | -| value_loss | 3.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11918 | -| time_elapsed | 65074 | -| total_timesteps | 1525504 | -| train/ | | -| approx_kl | 0.013191274 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.00192 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 119170 | -| policy_gradient_loss | -0.0041 | -| std | 0.02 | -| value_loss | 1.14e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11919 | -| time_elapsed | 65078 | -| total_timesteps | 1525632 | -| train/ | | -| approx_kl | 0.01966989 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 119180 | -| policy_gradient_loss | -0.00432 | -| std | 0.02 | -| value_loss | 6.08e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11920 | -| time_elapsed | 65081 | -| total_timesteps | 1525760 | -| train/ | | -| approx_kl | 0.0033577043 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.49 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.00555 | -| n_updates | 119190 | -| policy_gradient_loss | -0.000266 | -| std | 0.02 | -| value_loss | 6.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11921 | -| time_elapsed | 65085 | -| total_timesteps | 1525888 | -| train/ | | -| approx_kl | 0.008851744 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.000268 | -| n_updates | 119200 | -| policy_gradient_loss | 0.00137 | -| std | 0.0199 | -| value_loss | 1.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11922 | -| time_elapsed | 65088 | -| total_timesteps | 1526016 | -| train/ | | -| approx_kl | 0.03770565 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.005 | -| n_updates | 119210 | -| policy_gradient_loss | 0.00175 | -| std | 0.0199 | -| value_loss | 4.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11923 | -| time_elapsed | 65097 | -| total_timesteps | 1526144 | -| train/ | | -| approx_kl | 0.016789082 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | 0.204 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 119220 | -| policy_gradient_loss | -0.0169 | -| std | 0.0199 | -| value_loss | 0.00106 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11924 | -| time_elapsed | 65099 | -| total_timesteps | 1526272 | -| train/ | | -| approx_kl | 0.014576407 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.0264 | -| n_updates | 119230 | -| policy_gradient_loss | -0.0221 | -| std | 0.0199 | -| value_loss | 2.52e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11925 | -| time_elapsed | 65103 | -| total_timesteps | 1526400 | -| train/ | | -| approx_kl | 0.019683974 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 119240 | -| policy_gradient_loss | 0.00596 | -| std | 0.0199 | -| value_loss | 9.52e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11926 | -| time_elapsed | 65107 | -| total_timesteps | 1526528 | -| train/ | | -| approx_kl | 0.00033294968 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0878 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 119250 | -| policy_gradient_loss | -0.00559 | -| std | 0.0199 | -| value_loss | 1.47e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11927 | -| time_elapsed | 65110 | -| total_timesteps | 1526656 | -| train/ | | -| approx_kl | 0.0028112791 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 119260 | -| policy_gradient_loss | -0.000892 | -| std | 0.0199 | -| value_loss | 6.65e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11928 | -| time_elapsed | 65114 | -| total_timesteps | 1526784 | -| train/ | | -| approx_kl | 0.008531789 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.00319 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 119270 | -| policy_gradient_loss | 0.0014 | -| std | 0.0199 | -| value_loss | 1.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 11929 | -| time_elapsed | 65119 | -| total_timesteps | 1526912 | -| train/ | | -| approx_kl | 0.023304936 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 119280 | -| policy_gradient_loss | 0.00862 | -| std | 0.0199 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11930 | -| time_elapsed | 65123 | -| total_timesteps | 1527040 | -| train/ | | -| approx_kl | 0.002826728 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 119290 | -| policy_gradient_loss | -0.00236 | -| std | 0.0199 | -| value_loss | 1.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11931 | -| time_elapsed | 65131 | -| total_timesteps | 1527168 | -| train/ | | -| approx_kl | 0.18012398 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | 0.856 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 119300 | -| policy_gradient_loss | -0.0117 | -| std | 0.0199 | -| value_loss | 0.000334 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11932 | -| time_elapsed | 65135 | -| total_timesteps | 1527296 | -| train/ | | -| approx_kl | 0.051897403 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -33.6 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 119310 | -| policy_gradient_loss | -0.0158 | -| std | 0.0199 | -| value_loss | 1.37e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11933 | -| time_elapsed | 65139 | -| total_timesteps | 1527424 | -| train/ | | -| approx_kl | 0.0002592071 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -45.3 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 119320 | -| policy_gradient_loss | -0.0106 | -| std | 0.0199 | -| value_loss | 6.43e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11934 | -| time_elapsed | 65142 | -| total_timesteps | 1527552 | -| train/ | | -| approx_kl | 0.0037367572 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -5.96 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 119330 | -| policy_gradient_loss | -0.00391 | -| std | 0.0199 | -| value_loss | 1.17e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11935 | -| time_elapsed | 65145 | -| total_timesteps | 1527680 | -| train/ | | -| approx_kl | 0.0013656807 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.802 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 119340 | -| policy_gradient_loss | -9.52e-06 | -| std | 0.0199 | -| value_loss | 1.03e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11936 | -| time_elapsed | 65148 | -| total_timesteps | 1527808 | -| train/ | | -| approx_kl | 0.0004815599 | -| clip_fraction | 0.0234 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0749 | -| learning_rate | 0.0003 | -| loss | 0.00097 | -| n_updates | 119350 | -| policy_gradient_loss | 0.00041 | -| std | 0.0199 | -| value_loss | 2.93e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 11937 | -| time_elapsed | 65153 | -| total_timesteps | 1527936 | -| train/ | | -| approx_kl | 0.021191116 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.00441 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 119360 | -| policy_gradient_loss | 0.0232 | -| std | 0.0199 | -| value_loss | 1.41e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11938 | -| time_elapsed | 65157 | -| total_timesteps | 1528064 | -| train/ | | -| approx_kl | 0.025033765 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.00193 | -| learning_rate | 0.0003 | -| loss | 0.00924 | -| n_updates | 119370 | -| policy_gradient_loss | 0.000188 | -| std | 0.0199 | -| value_loss | 8.14e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11939 | -| time_elapsed | 65163 | -| total_timesteps | 1528192 | -| train/ | | -| approx_kl | 0.004487268 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 119380 | -| policy_gradient_loss | 0.00636 | -| std | 0.0198 | -| value_loss | 0.000208 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11940 | -| time_elapsed | 65166 | -| total_timesteps | 1528320 | -| train/ | | -| approx_kl | 0.004598974 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 2.5 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 119390 | -| policy_gradient_loss | -0.000472 | -| std | 0.0197 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11941 | -| time_elapsed | 65169 | -| total_timesteps | 1528448 | -| train/ | | -| approx_kl | 0.0054691033 | -| clip_fraction | 0.0211 | -| clip_range | 0.2 | -| entropy_loss | 2.51 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.000766 | -| n_updates | 119400 | -| policy_gradient_loss | -0.000484 | -| std | 0.0197 | -| value_loss | 4.67e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11942 | -| time_elapsed | 65172 | -| total_timesteps | 1528576 | -| train/ | | -| approx_kl | 0.012992704 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.51 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.000211 | -| n_updates | 119410 | -| policy_gradient_loss | 0.00682 | -| std | 0.0197 | -| value_loss | 2.06e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11943 | -| time_elapsed | 65175 | -| total_timesteps | 1528704 | -| train/ | | -| approx_kl | 0.04416368 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 2.51 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 119420 | -| policy_gradient_loss | 0.0283 | -| std | 0.0196 | -| value_loss | 6.4e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11944 | -| time_elapsed | 65178 | -| total_timesteps | 1528832 | -| train/ | | -| approx_kl | 0.0075235344 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.51 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 119430 | -| policy_gradient_loss | 0.00618 | -| std | 0.0196 | -| value_loss | 4.61e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11945 | -| time_elapsed | 65181 | -| total_timesteps | 1528960 | -| train/ | | -| approx_kl | 0.027821403 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.51 | -| explained_variance | -0.00286 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 119440 | -| policy_gradient_loss | -0.00188 | -| std | 0.0195 | -| value_loss | 1.56e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11946 | -| time_elapsed | 65183 | -| total_timesteps | 1529088 | -| train/ | | -| approx_kl | 0.004290487 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.00439 | -| learning_rate | 0.0003 | -| loss | 0.00486 | -| n_updates | 119450 | -| policy_gradient_loss | -0.000136 | -| std | 0.0194 | -| value_loss | 0.000346 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11947 | -| time_elapsed | 65190 | -| total_timesteps | 1529216 | -| train/ | | -| approx_kl | 0.2700217 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.384 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 119460 | -| policy_gradient_loss | -0.00989 | -| std | 0.0194 | -| value_loss | 0.00223 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11948 | -| time_elapsed | 65194 | -| total_timesteps | 1529344 | -| train/ | | -| approx_kl | 0.030236723 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.00597 | -| learning_rate | 0.0003 | -| loss | 0.00388 | -| n_updates | 119470 | -| policy_gradient_loss | 0.00744 | -| std | 0.0194 | -| value_loss | 0.000141 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11949 | -| time_elapsed | 65198 | -| total_timesteps | 1529472 | -| train/ | | -| approx_kl | 0.025851658 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.00529 | -| learning_rate | 0.0003 | -| loss | 0.00892 | -| n_updates | 119480 | -| policy_gradient_loss | 0.00518 | -| std | 0.0194 | -| value_loss | 1.85e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11950 | -| time_elapsed | 65201 | -| total_timesteps | 1529600 | -| train/ | | -| approx_kl | 0.0291891 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.00911 | -| n_updates | 119490 | -| policy_gradient_loss | -0.00474 | -| std | 0.0194 | -| value_loss | 1.29e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11951 | -| time_elapsed | 65206 | -| total_timesteps | 1529728 | -| train/ | | -| approx_kl | 0.0024945554 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.00385 | -| n_updates | 119500 | -| policy_gradient_loss | 0.00106 | -| std | 0.0194 | -| value_loss | 1.32e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11952 | -| time_elapsed | 65211 | -| total_timesteps | 1529856 | -| train/ | | -| approx_kl | 0.037987754 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 119510 | -| policy_gradient_loss | 0.0243 | -| std | 0.0194 | -| value_loss | 1.71e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 11953 | -| time_elapsed | 65214 | -| total_timesteps | 1529984 | -| train/ | | -| approx_kl | 0.016048258 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 119520 | -| policy_gradient_loss | -0.00385 | -| std | 0.0194 | -| value_loss | 1.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11954 | -| time_elapsed | 65218 | -| total_timesteps | 1530112 | -| train/ | | -| approx_kl | 0.05630597 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 119530 | -| policy_gradient_loss | 0.0345 | -| std | 0.0194 | -| value_loss | 6.44e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11955 | -| time_elapsed | 65229 | -| total_timesteps | 1530240 | -| train/ | | -| approx_kl | 0.0055965655 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | 0.0098 | -| n_updates | 119540 | -| policy_gradient_loss | -0.00114 | -| std | 0.0194 | -| value_loss | 0.00175 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11956 | -| time_elapsed | 65232 | -| total_timesteps | 1530368 | -| train/ | | -| approx_kl | 0.03364937 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.00611 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 119550 | -| policy_gradient_loss | 0.00829 | -| std | 0.0194 | -| value_loss | 3.77e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11957 | -| time_elapsed | 65235 | -| total_timesteps | 1530496 | -| train/ | | -| approx_kl | 0.0030569695 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.000815 | -| n_updates | 119560 | -| policy_gradient_loss | 0.00635 | -| std | 0.0194 | -| value_loss | 5.57e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11958 | -| time_elapsed | 65239 | -| total_timesteps | 1530624 | -| train/ | | -| approx_kl | 0.016771097 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 119570 | -| policy_gradient_loss | -0.0021 | -| std | 0.0193 | -| value_loss | 7.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11959 | -| time_elapsed | 65242 | -| total_timesteps | 1530752 | -| train/ | | -| approx_kl | 0.015479211 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.00609 | -| n_updates | 119580 | -| policy_gradient_loss | 0.00598 | -| std | 0.0193 | -| value_loss | 4.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 11960 | -| time_elapsed | 65245 | -| total_timesteps | 1530880 | -| train/ | | -| approx_kl | 0.01224975 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 119590 | -| policy_gradient_loss | -0.00601 | -| std | 0.0193 | -| value_loss | 2.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11961 | -| time_elapsed | 65248 | -| total_timesteps | 1531008 | -| train/ | | -| approx_kl | 0.034358375 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 119600 | -| policy_gradient_loss | 0.00743 | -| std | 0.0193 | -| value_loss | 2.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11962 | -| time_elapsed | 65257 | -| total_timesteps | 1531136 | -| train/ | | -| approx_kl | 0.33899686 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 119610 | -| policy_gradient_loss | -0.0149 | -| std | 0.0193 | -| value_loss | 0.000693 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11963 | -| time_elapsed | 65260 | -| total_timesteps | 1531264 | -| train/ | | -| approx_kl | 5.145557e-07 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.0635 | -| learning_rate | 0.0003 | -| loss | 1.35e-05 | -| n_updates | 119620 | -| policy_gradient_loss | -0.00422 | -| std | 0.0193 | -| value_loss | 2.24e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11964 | -| time_elapsed | 65263 | -| total_timesteps | 1531392 | -| train/ | | -| approx_kl | 0.034184046 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -1.37e+03 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 119630 | -| policy_gradient_loss | 0.000261 | -| std | 0.0193 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11965 | -| time_elapsed | 65266 | -| total_timesteps | 1531520 | -| train/ | | -| approx_kl | 0.022949746 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.643 | -| learning_rate | 0.0003 | -| loss | -0.00892 | -| n_updates | 119640 | -| policy_gradient_loss | -0.00832 | -| std | 0.0194 | -| value_loss | 2.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11966 | -| time_elapsed | 65269 | -| total_timesteps | 1531648 | -| train/ | | -| approx_kl | 0.028321955 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.00476 | -| n_updates | 119650 | -| policy_gradient_loss | -0.0022 | -| std | 0.0194 | -| value_loss | 1.57e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11967 | -| time_elapsed | 65272 | -| total_timesteps | 1531776 | -| train/ | | -| approx_kl | 2.1164306e-06 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 2.52 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | -0.000178 | -| n_updates | 119660 | -| policy_gradient_loss | 6.72e-05 | -| std | 0.0194 | -| value_loss | 4.57e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 11968 | -| time_elapsed | 65274 | -| total_timesteps | 1531904 | -| train/ | | -| approx_kl | 0.012990111 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | -0.00719 | -| n_updates | 119670 | -| policy_gradient_loss | -0.00279 | -| std | 0.0193 | -| value_loss | 0.000122 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11969 | -| time_elapsed | 65278 | -| total_timesteps | 1532032 | -| train/ | | -| approx_kl | 0.008130675 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.00366 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 119680 | -| policy_gradient_loss | -0.00137 | -| std | 0.0193 | -| value_loss | 3.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11970 | -| time_elapsed | 65286 | -| total_timesteps | 1532160 | -| train/ | | -| approx_kl | 0.15579945 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -6.94 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 119690 | -| policy_gradient_loss | -0.0139 | -| std | 0.0193 | -| value_loss | 0.00239 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11971 | -| time_elapsed | 65290 | -| total_timesteps | 1532288 | -| train/ | | -| approx_kl | 0.027598217 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.326 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 119700 | -| policy_gradient_loss | 0.00579 | -| std | 0.0193 | -| value_loss | 5.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11972 | -| time_elapsed | 65295 | -| total_timesteps | 1532416 | -| train/ | | -| approx_kl | 0.017614141 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.867 | -| learning_rate | 0.0003 | -| loss | -0.00889 | -| n_updates | 119710 | -| policy_gradient_loss | -0.0015 | -| std | 0.0193 | -| value_loss | 3.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11973 | -| time_elapsed | 65299 | -| total_timesteps | 1532544 | -| train/ | | -| approx_kl | 0.031913273 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 119720 | -| policy_gradient_loss | -0.00101 | -| std | 0.0193 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11974 | -| time_elapsed | 65303 | -| total_timesteps | 1532672 | -| train/ | | -| approx_kl | 0.028207865 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0757 | -| learning_rate | 0.0003 | -| loss | -0.000787 | -| n_updates | 119730 | -| policy_gradient_loss | -0.00144 | -| std | 0.0193 | -| value_loss | 1.49e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11975 | -| time_elapsed | 65307 | -| total_timesteps | 1532800 | -| train/ | | -| approx_kl | 0.0021435618 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.00657 | -| n_updates | 119740 | -| policy_gradient_loss | -0.00123 | -| std | 0.0193 | -| value_loss | 1.22e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 11976 | -| time_elapsed | 65310 | -| total_timesteps | 1532928 | -| train/ | | -| approx_kl | 0.0008031423 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | -0.000408 | -| n_updates | 119750 | -| policy_gradient_loss | 0.00117 | -| std | 0.0193 | -| value_loss | 4.68e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11977 | -| time_elapsed | 65314 | -| total_timesteps | 1533056 | -| train/ | | -| approx_kl | 0.04603118 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.0029 | -| n_updates | 119760 | -| policy_gradient_loss | -0.0039 | -| std | 0.0193 | -| value_loss | 2.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11978 | -| time_elapsed | 65318 | -| total_timesteps | 1533184 | -| train/ | | -| approx_kl | 0.010290738 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | 0.066 | -| n_updates | 119770 | -| policy_gradient_loss | 0.022 | -| std | 0.0193 | -| value_loss | 0.00015 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11979 | -| time_elapsed | 65321 | -| total_timesteps | 1533312 | -| train/ | | -| approx_kl | 0.046788704 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -8.54 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 119780 | -| policy_gradient_loss | -0.00293 | -| std | 0.0193 | -| value_loss | 3.73e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11980 | -| time_elapsed | 65324 | -| total_timesteps | 1533440 | -| train/ | | -| approx_kl | 0.0033017108 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.00982 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 119790 | -| policy_gradient_loss | 0.000496 | -| std | 0.0193 | -| value_loss | 8.55e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11981 | -| time_elapsed | 65327 | -| total_timesteps | 1533568 | -| train/ | | -| approx_kl | 0.0130633935 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 119800 | -| policy_gradient_loss | 0.00931 | -| std | 0.0193 | -| value_loss | 9.55e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11982 | -| time_elapsed | 65331 | -| total_timesteps | 1533696 | -| train/ | | -| approx_kl | 0.003565595 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.00633 | -| learning_rate | 0.0003 | -| loss | -0.000286 | -| n_updates | 119810 | -| policy_gradient_loss | 0.00334 | -| std | 0.0192 | -| value_loss | 1.43e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11983 | -| time_elapsed | 65334 | -| total_timesteps | 1533824 | -| train/ | | -| approx_kl | 0.04964295 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.00431 | -| n_updates | 119820 | -| policy_gradient_loss | -0.00412 | -| std | 0.0192 | -| value_loss | 1.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 11984 | -| time_elapsed | 65337 | -| total_timesteps | 1533952 | -| train/ | | -| approx_kl | 0.017314425 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.00158 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 119830 | -| policy_gradient_loss | -0.0037 | -| std | 0.0192 | -| value_loss | 3.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11985 | -| time_elapsed | 65340 | -| total_timesteps | 1534080 | -| train/ | | -| approx_kl | 0.04598652 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.00758 | -| n_updates | 119840 | -| policy_gradient_loss | 0.00505 | -| std | 0.0192 | -| value_loss | 2.47e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11986 | -| time_elapsed | 65346 | -| total_timesteps | 1534208 | -| train/ | | -| approx_kl | 0.0073853564 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.792 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 119850 | -| policy_gradient_loss | -0.00549 | -| std | 0.0192 | -| value_loss | 0.00292 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11987 | -| time_elapsed | 65350 | -| total_timesteps | 1534336 | -| train/ | | -| approx_kl | 0.062489197 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.000252 | -| n_updates | 119860 | -| policy_gradient_loss | -0.00827 | -| std | 0.0192 | -| value_loss | 0.000157 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11988 | -| time_elapsed | 65353 | -| total_timesteps | 1534464 | -| train/ | | -| approx_kl | 0.007297351 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 119870 | -| policy_gradient_loss | -0.00375 | -| std | 0.0192 | -| value_loss | 1.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11989 | -| time_elapsed | 65358 | -| total_timesteps | 1534592 | -| train/ | | -| approx_kl | 0.011986217 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 119880 | -| policy_gradient_loss | -0.00106 | -| std | 0.0192 | -| value_loss | 8.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11990 | -| time_elapsed | 65362 | -| total_timesteps | 1534720 | -| train/ | | -| approx_kl | 0.029598203 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.00104 | -| learning_rate | 0.0003 | -| loss | 0.00255 | -| n_updates | 119890 | -| policy_gradient_loss | -0.00151 | -| std | 0.0192 | -| value_loss | 4.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11991 | -| time_elapsed | 65367 | -| total_timesteps | 1534848 | -| train/ | | -| approx_kl | 0.003046013 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 119900 | -| policy_gradient_loss | -0.0015 | -| std | 0.0193 | -| value_loss | 5.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11992 | -| time_elapsed | 65370 | -| total_timesteps | 1534976 | -| train/ | | -| approx_kl | 0.040400743 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.000747 | -| learning_rate | 0.0003 | -| loss | 0.0576 | -| n_updates | 119910 | -| policy_gradient_loss | 0.0143 | -| std | 0.0193 | -| value_loss | 9.12e-07 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11993 | -| time_elapsed | 65373 | -| total_timesteps | 1535104 | -| train/ | | -| approx_kl | 1.17812306e-07 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.00399 | -| learning_rate | 0.0003 | -| loss | -4.1e-05 | -| n_updates | 119920 | -| policy_gradient_loss | -0.0029 | -| std | 0.0193 | -| value_loss | 5.84e-08 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11994 | -| time_elapsed | 65380 | -| total_timesteps | 1535232 | -| train/ | | -| approx_kl | 0.029684067 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | 0.0785 | -| n_updates | 119930 | -| policy_gradient_loss | 0.0283 | -| std | 0.0193 | -| value_loss | 0.00106 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11995 | -| time_elapsed | 65387 | -| total_timesteps | 1535360 | -| train/ | | -| approx_kl | 0.020750381 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 119940 | -| policy_gradient_loss | 0.000222 | -| std | 0.0193 | -| value_loss | 1.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11996 | -| time_elapsed | 65391 | -| total_timesteps | 1535488 | -| train/ | | -| approx_kl | 0.065175004 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | 0.0032 | -| n_updates | 119950 | -| policy_gradient_loss | -0.00185 | -| std | 0.0193 | -| value_loss | 2.67e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11997 | -| time_elapsed | 65395 | -| total_timesteps | 1535616 | -| train/ | | -| approx_kl | 8.888217e-05 | -| clip_fraction | 0.0172 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | 0.000441 | -| n_updates | 119960 | -| policy_gradient_loss | -0.000182 | -| std | 0.0193 | -| value_loss | 6.38e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11998 | -| time_elapsed | 65399 | -| total_timesteps | 1535744 | -| train/ | | -| approx_kl | 0.00015422609 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.000364 | -| n_updates | 119970 | -| policy_gradient_loss | 0.00358 | -| std | 0.0193 | -| value_loss | 3.39e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 11999 | -| time_elapsed | 65403 | -| total_timesteps | 1535872 | -| train/ | | -| approx_kl | 0.0038298112 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 119980 | -| policy_gradient_loss | 0.00136 | -| std | 0.0193 | -| value_loss | 5.63e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12000 | -| time_elapsed | 65405 | -| total_timesteps | 1536000 | -| train/ | | -| approx_kl | 0.012705052 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 119990 | -| policy_gradient_loss | 0.00567 | -| std | 0.0193 | -| value_loss | 1.15e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12001 | -| time_elapsed | 65410 | -| total_timesteps | 1536128 | -| train/ | | -| approx_kl | 0.0067564836 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.00121 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 120000 | -| policy_gradient_loss | -0.00242 | -| std | 0.0194 | -| value_loss | 1.13e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12002 | -| time_elapsed | 65417 | -| total_timesteps | 1536256 | -| train/ | | -| approx_kl | 0.54585654 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | 0.00691 | -| n_updates | 120010 | -| policy_gradient_loss | 0.0161 | -| std | 0.0193 | -| value_loss | 0.00325 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12003 | -| time_elapsed | 65421 | -| total_timesteps | 1536384 | -| train/ | | -| approx_kl | 0.024145864 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 120020 | -| policy_gradient_loss | -0.0169 | -| std | 0.0193 | -| value_loss | 2.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12004 | -| time_elapsed | 65425 | -| total_timesteps | 1536512 | -| train/ | | -| approx_kl | 0.027895384 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.00929 | -| n_updates | 120030 | -| policy_gradient_loss | -2.32e-05 | -| std | 0.0193 | -| value_loss | 2.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12005 | -| time_elapsed | 65428 | -| total_timesteps | 1536640 | -| train/ | | -| approx_kl | 0.022014245 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.00391 | -| n_updates | 120040 | -| policy_gradient_loss | -0.00178 | -| std | 0.0193 | -| value_loss | 7.58e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12006 | -| time_elapsed | 65431 | -| total_timesteps | 1536768 | -| train/ | | -| approx_kl | 1.9464642e-07 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 8.65e-06 | -| n_updates | 120050 | -| policy_gradient_loss | 0.00747 | -| std | 0.0193 | -| value_loss | 1.08e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12007 | -| time_elapsed | 65434 | -| total_timesteps | 1536896 | -| train/ | | -| approx_kl | 0.000811371 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00353 | -| n_updates | 120060 | -| policy_gradient_loss | 0.00183 | -| std | 0.0193 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12008 | -| time_elapsed | 65436 | -| total_timesteps | 1537024 | -| train/ | | -| approx_kl | 0.060865846 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | 0.000847 | -| n_updates | 120070 | -| policy_gradient_loss | -0.00904 | -| std | 0.0194 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12009 | -| time_elapsed | 65444 | -| total_timesteps | 1537152 | -| train/ | | -| approx_kl | 0.008420676 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.772 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 120080 | -| policy_gradient_loss | -0.00463 | -| std | 0.0194 | -| value_loss | 0.00455 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12010 | -| time_elapsed | 65447 | -| total_timesteps | 1537280 | -| train/ | | -| approx_kl | 0.016848592 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | 0.0653 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 120090 | -| policy_gradient_loss | 0.00326 | -| std | 0.0194 | -| value_loss | 1.43e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12011 | -| time_elapsed | 65449 | -| total_timesteps | 1537408 | -| train/ | | -| approx_kl | 0.0009116316 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | 0.00541 | -| n_updates | 120100 | -| policy_gradient_loss | 0.00148 | -| std | 0.0194 | -| value_loss | 2.66e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12012 | -| time_elapsed | 65452 | -| total_timesteps | 1537536 | -| train/ | | -| approx_kl | 0.00509313 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 120110 | -| policy_gradient_loss | -0.00497 | -| std | 0.0194 | -| value_loss | 5.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12013 | -| time_elapsed | 65455 | -| total_timesteps | 1537664 | -| train/ | | -| approx_kl | 0.015827077 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | 0.00084 | -| n_updates | 120120 | -| policy_gradient_loss | 0.00825 | -| std | 0.0194 | -| value_loss | 8.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12014 | -| time_elapsed | 65459 | -| total_timesteps | 1537792 | -| train/ | | -| approx_kl | 0.00829547 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 120130 | -| policy_gradient_loss | -0.000124 | -| std | 0.0193 | -| value_loss | 2.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 12015 | -| time_elapsed | 65463 | -| total_timesteps | 1537920 | -| train/ | | -| approx_kl | 0.007363797 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.00661 | -| n_updates | 120140 | -| policy_gradient_loss | -0.00323 | -| std | 0.0193 | -| value_loss | 8.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12016 | -| time_elapsed | 65466 | -| total_timesteps | 1538048 | -| train/ | | -| approx_kl | 0.04154697 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | 0.00887 | -| n_updates | 120150 | -| policy_gradient_loss | 0.0046 | -| std | 0.0193 | -| value_loss | 3.14e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12017 | -| time_elapsed | 65473 | -| total_timesteps | 1538176 | -| train/ | | -| approx_kl | 0.18616559 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 120160 | -| policy_gradient_loss | -0.0154 | -| std | 0.0193 | -| value_loss | 0.00147 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12018 | -| time_elapsed | 65477 | -| total_timesteps | 1538304 | -| train/ | | -| approx_kl | 0.07969151 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -22.5 | -| learning_rate | 0.0003 | -| loss | 0.00228 | -| n_updates | 120170 | -| policy_gradient_loss | -0.00112 | -| std | 0.0193 | -| value_loss | 1.29e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12019 | -| time_elapsed | 65481 | -| total_timesteps | 1538432 | -| train/ | | -| approx_kl | 0.009740301 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 2.53 | -| explained_variance | -4.78 | -| learning_rate | 0.0003 | -| loss | 0.00159 | -| n_updates | 120180 | -| policy_gradient_loss | 0.000816 | -| std | 0.0192 | -| value_loss | 2.59e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12020 | -| time_elapsed | 65483 | -| total_timesteps | 1538560 | -| train/ | | -| approx_kl | 0.027286513 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.00933 | -| n_updates | 120190 | -| policy_gradient_loss | 0.00326 | -| std | 0.0191 | -| value_loss | 3.58e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12021 | -| time_elapsed | 65487 | -| total_timesteps | 1538688 | -| train/ | | -| approx_kl | 0.016950024 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -30.7 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 120200 | -| policy_gradient_loss | -0.000174 | -| std | 0.0191 | -| value_loss | 4.96e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12022 | -| time_elapsed | 65491 | -| total_timesteps | 1538816 | -| train/ | | -| approx_kl | 0.02387295 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0967 | -| learning_rate | 0.0003 | -| loss | 0.00742 | -| n_updates | 120210 | -| policy_gradient_loss | 0.00431 | -| std | 0.0191 | -| value_loss | 3.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12023 | -| time_elapsed | 65495 | -| total_timesteps | 1538944 | -| train/ | | -| approx_kl | 0.017611567 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.00714 | -| n_updates | 120220 | -| policy_gradient_loss | 0.0122 | -| std | 0.0191 | -| value_loss | 3.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12024 | -| time_elapsed | 65498 | -| total_timesteps | 1539072 | -| train/ | | -| approx_kl | 0.019310085 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.00296 | -| n_updates | 120230 | -| policy_gradient_loss | -0.000396 | -| std | 0.0191 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12025 | -| time_elapsed | 65504 | -| total_timesteps | 1539200 | -| train/ | | -| approx_kl | 0.0033199391 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 120240 | -| policy_gradient_loss | 0.00874 | -| std | 0.0191 | -| value_loss | 0.00451 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12026 | -| time_elapsed | 65508 | -| total_timesteps | 1539328 | -| train/ | | -| approx_kl | 0.0021848981 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 120250 | -| policy_gradient_loss | 0.000124 | -| std | 0.0191 | -| value_loss | 4.39e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12027 | -| time_elapsed | 65512 | -| total_timesteps | 1539456 | -| train/ | | -| approx_kl | 0.020746103 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -3.07 | -| learning_rate | 0.0003 | -| loss | -0.0059 | -| n_updates | 120260 | -| policy_gradient_loss | -0.0022 | -| std | 0.0191 | -| value_loss | 1.93e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12028 | -| time_elapsed | 65515 | -| total_timesteps | 1539584 | -| train/ | | -| approx_kl | 0.0035543065 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.00479 | -| n_updates | 120270 | -| policy_gradient_loss | 0.0114 | -| std | 0.0191 | -| value_loss | 7.42e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12029 | -| time_elapsed | 65518 | -| total_timesteps | 1539712 | -| train/ | | -| approx_kl | 0.0022031702 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.00592 | -| learning_rate | 0.0003 | -| loss | 0.00266 | -| n_updates | 120280 | -| policy_gradient_loss | 0.0219 | -| std | 0.0191 | -| value_loss | 3.88e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12030 | -| time_elapsed | 65521 | -| total_timesteps | 1539840 | -| train/ | | -| approx_kl | 0.014523057 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.000373 | -| n_updates | 120290 | -| policy_gradient_loss | 0.00177 | -| std | 0.0191 | -| value_loss | 2.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 12031 | -| time_elapsed | 65525 | -| total_timesteps | 1539968 | -| train/ | | -| approx_kl | 0.013538154 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 120300 | -| policy_gradient_loss | 0.0203 | -| std | 0.0191 | -| value_loss | 1.6e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12032 | -| time_elapsed | 65529 | -| total_timesteps | 1540096 | -| train/ | | -| approx_kl | 0.006810292 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 120310 | -| policy_gradient_loss | 0.00949 | -| std | 0.0191 | -| value_loss | 1.23e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12033 | -| time_elapsed | 65537 | -| total_timesteps | 1540224 | -| train/ | | -| approx_kl | 0.1678045 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 120320 | -| policy_gradient_loss | -0.0124 | -| std | 0.0191 | -| value_loss | 0.000124 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12034 | -| time_elapsed | 65539 | -| total_timesteps | 1540352 | -| train/ | | -| approx_kl | 0.023339478 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.00446 | -| learning_rate | 0.0003 | -| loss | 0.0052 | -| n_updates | 120330 | -| policy_gradient_loss | -0.00146 | -| std | 0.0191 | -| value_loss | 1.07e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12035 | -| time_elapsed | 65542 | -| total_timesteps | 1540480 | -| train/ | | -| approx_kl | 0.00656433 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 120340 | -| policy_gradient_loss | 0.00099 | -| std | 0.0191 | -| value_loss | 3.97e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12036 | -| time_elapsed | 65545 | -| total_timesteps | 1540608 | -| train/ | | -| approx_kl | 2.9052608e-06 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 120350 | -| policy_gradient_loss | 0.0259 | -| std | 0.0191 | -| value_loss | 2.13e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12037 | -| time_elapsed | 65549 | -| total_timesteps | 1540736 | -| train/ | | -| approx_kl | 0.006721019 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.00306 | -| n_updates | 120360 | -| policy_gradient_loss | 0.0183 | -| std | 0.0191 | -| value_loss | 1.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12038 | -| time_elapsed | 65553 | -| total_timesteps | 1540864 | -| train/ | | -| approx_kl | 0.01062851 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 120370 | -| policy_gradient_loss | 0.0171 | -| std | 0.0191 | -| value_loss | 1.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12039 | -| time_elapsed | 65555 | -| total_timesteps | 1540992 | -| train/ | | -| approx_kl | 0.002978691 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.000394 | -| n_updates | 120380 | -| policy_gradient_loss | 0.00213 | -| std | 0.0191 | -| value_loss | 1.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12040 | -| time_elapsed | 65559 | -| total_timesteps | 1541120 | -| train/ | | -| approx_kl | 0.020327015 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.00478 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 120390 | -| policy_gradient_loss | -0.00663 | -| std | 0.019 | -| value_loss | 1.02e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12041 | -| time_elapsed | 65569 | -| total_timesteps | 1541248 | -| train/ | | -| approx_kl | 0.37132397 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 120400 | -| policy_gradient_loss | -0.0112 | -| std | 0.019 | -| value_loss | 0.000112 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12042 | -| time_elapsed | 65573 | -| total_timesteps | 1541376 | -| train/ | | -| approx_kl | 0.018414833 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 120410 | -| policy_gradient_loss | 0.00364 | -| std | 0.019 | -| value_loss | 1.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12043 | -| time_elapsed | 65576 | -| total_timesteps | 1541504 | -| train/ | | -| approx_kl | 0.025615681 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.00106 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 120420 | -| policy_gradient_loss | 0.00177 | -| std | 0.019 | -| value_loss | 5.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12044 | -| time_elapsed | 65579 | -| total_timesteps | 1541632 | -| train/ | | -| approx_kl | 0.033279695 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 120430 | -| policy_gradient_loss | 0.00796 | -| std | 0.019 | -| value_loss | 3.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12045 | -| time_elapsed | 65582 | -| total_timesteps | 1541760 | -| train/ | | -| approx_kl | 0.025215765 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 120440 | -| policy_gradient_loss | -0.000502 | -| std | 0.019 | -| value_loss | 2.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12046 | -| time_elapsed | 65586 | -| total_timesteps | 1541888 | -| train/ | | -| approx_kl | 0.031716686 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 120450 | -| policy_gradient_loss | 0.00391 | -| std | 0.019 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12047 | -| time_elapsed | 65589 | -| total_timesteps | 1542016 | -| train/ | | -| approx_kl | 0.008870159 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 120460 | -| policy_gradient_loss | -0.000234 | -| std | 0.019 | -| value_loss | 9.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12048 | -| time_elapsed | 65598 | -| total_timesteps | 1542144 | -| train/ | | -| approx_kl | 0.007293613 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 120470 | -| policy_gradient_loss | -0.016 | -| std | 0.019 | -| value_loss | 0.00124 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12049 | -| time_elapsed | 65602 | -| total_timesteps | 1542272 | -| train/ | | -| approx_kl | 0.05034024 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.104 | -| learning_rate | 0.0003 | -| loss | 0.00389 | -| n_updates | 120480 | -| policy_gradient_loss | 0.0026 | -| std | 0.019 | -| value_loss | 1.48e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12050 | -| time_elapsed | 65606 | -| total_timesteps | 1542400 | -| train/ | | -| approx_kl | 0.004366785 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -86 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 120490 | -| policy_gradient_loss | -0.00701 | -| std | 0.019 | -| value_loss | 1.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12051 | -| time_elapsed | 65610 | -| total_timesteps | 1542528 | -| train/ | | -| approx_kl | 0.008097719 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -21.3 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 120500 | -| policy_gradient_loss | -0.00268 | -| std | 0.019 | -| value_loss | 4.11e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12052 | -| time_elapsed | 65613 | -| total_timesteps | 1542656 | -| train/ | | -| approx_kl | 0.07312149 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 120510 | -| policy_gradient_loss | -0.00378 | -| std | 0.019 | -| value_loss | 7.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12053 | -| time_elapsed | 65616 | -| total_timesteps | 1542784 | -| train/ | | -| approx_kl | 0.031288926 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -4.64 | -| learning_rate | 0.0003 | -| loss | 6.39e-05 | -| n_updates | 120520 | -| policy_gradient_loss | -0.00153 | -| std | 0.019 | -| value_loss | 4.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12054 | -| time_elapsed | 65620 | -| total_timesteps | 1542912 | -| train/ | | -| approx_kl | 0.035294555 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 120530 | -| policy_gradient_loss | 0.00859 | -| std | 0.019 | -| value_loss | 1.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12055 | -| time_elapsed | 65623 | -| total_timesteps | 1543040 | -| train/ | | -| approx_kl | 0.013521507 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 120540 | -| policy_gradient_loss | -0.005 | -| std | 0.019 | -| value_loss | 1.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12056 | -| time_elapsed | 65630 | -| total_timesteps | 1543168 | -| train/ | | -| approx_kl | 0.02845683 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 120550 | -| policy_gradient_loss | -0.0151 | -| std | 0.019 | -| value_loss | 0.0022 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12057 | -| time_elapsed | 65634 | -| total_timesteps | 1543296 | -| train/ | | -| approx_kl | 0.04605512 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 120560 | -| policy_gradient_loss | -0.00953 | -| std | 0.019 | -| value_loss | 0.000276 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12058 | -| time_elapsed | 65637 | -| total_timesteps | 1543424 | -| train/ | | -| approx_kl | 0.018665282 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.606 | -| learning_rate | 0.0003 | -| loss | 0.00452 | -| n_updates | 120570 | -| policy_gradient_loss | 0.000731 | -| std | 0.019 | -| value_loss | 3.38e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12059 | -| time_elapsed | 65639 | -| total_timesteps | 1543552 | -| train/ | | -| approx_kl | 0.0046663694 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 120580 | -| policy_gradient_loss | -0.0121 | -| std | 0.019 | -| value_loss | 1.48e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12060 | -| time_elapsed | 65641 | -| total_timesteps | 1543680 | -| train/ | | -| approx_kl | 0.0073165195 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 120590 | -| policy_gradient_loss | 0.00582 | -| std | 0.019 | -| value_loss | 4.36e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12061 | -| time_elapsed | 65644 | -| total_timesteps | 1543808 | -| train/ | | -| approx_kl | 0.01442316 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 120600 | -| policy_gradient_loss | 0.0045 | -| std | 0.019 | -| value_loss | 5.71e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12062 | -| time_elapsed | 65648 | -| total_timesteps | 1543936 | -| train/ | | -| approx_kl | 0.00474873 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 120610 | -| policy_gradient_loss | 0.00348 | -| std | 0.019 | -| value_loss | 3.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12063 | -| time_elapsed | 65653 | -| total_timesteps | 1544064 | -| train/ | | -| approx_kl | 0.04254263 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 120620 | -| policy_gradient_loss | 0.0116 | -| std | 0.019 | -| value_loss | 1.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12064 | -| time_elapsed | 65659 | -| total_timesteps | 1544192 | -| train/ | | -| approx_kl | 0.031424467 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.0255 | -| n_updates | 120630 | -| policy_gradient_loss | -0.018 | -| std | 0.019 | -| value_loss | 8.69e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12065 | -| time_elapsed | 65662 | -| total_timesteps | 1544320 | -| train/ | | -| approx_kl | 0.054388467 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 2.54 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 120640 | -| policy_gradient_loss | 0.00443 | -| std | 0.019 | -| value_loss | 3.99e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12066 | -| time_elapsed | 65666 | -| total_timesteps | 1544448 | -| train/ | | -| approx_kl | 0.015743392 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 120650 | -| policy_gradient_loss | -0.00628 | -| std | 0.0189 | -| value_loss | 0.000222 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12067 | -| time_elapsed | 65669 | -| total_timesteps | 1544576 | -| train/ | | -| approx_kl | 0.030859131 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.00847 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 120660 | -| policy_gradient_loss | -0.00295 | -| std | 0.0189 | -| value_loss | 0.000544 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12068 | -| time_elapsed | 65672 | -| total_timesteps | 1544704 | -| train/ | | -| approx_kl | 0.016814422 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 120670 | -| policy_gradient_loss | 0.00676 | -| std | 0.0189 | -| value_loss | 3.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12069 | -| time_elapsed | 65676 | -| total_timesteps | 1544832 | -| train/ | | -| approx_kl | 0.035487458 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 120680 | -| policy_gradient_loss | 0.00573 | -| std | 0.0189 | -| value_loss | 3.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12070 | -| time_elapsed | 65680 | -| total_timesteps | 1544960 | -| train/ | | -| approx_kl | 0.013270422 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | -0.0043 | -| n_updates | 120690 | -| policy_gradient_loss | 0.00255 | -| std | 0.0189 | -| value_loss | 8.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12071 | -| time_elapsed | 65684 | -| total_timesteps | 1545088 | -| train/ | | -| approx_kl | 0.027000215 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 120700 | -| policy_gradient_loss | 0.00464 | -| std | 0.0189 | -| value_loss | 6.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12072 | -| time_elapsed | 65691 | -| total_timesteps | 1545216 | -| train/ | | -| approx_kl | 0.023511872 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 120710 | -| policy_gradient_loss | -0.00253 | -| std | 0.0189 | -| value_loss | 0.000472 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12073 | -| time_elapsed | 65695 | -| total_timesteps | 1545344 | -| train/ | | -| approx_kl | 0.0025423653 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | 0.000978 | -| n_updates | 120720 | -| policy_gradient_loss | 0.00078 | -| std | 0.0189 | -| value_loss | 1.87e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12074 | -| time_elapsed | 65698 | -| total_timesteps | 1545472 | -| train/ | | -| approx_kl | 0.0153587395 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.61 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 120730 | -| policy_gradient_loss | 0.00124 | -| std | 0.0189 | -| value_loss | 6.27e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12075 | -| time_elapsed | 65702 | -| total_timesteps | 1545600 | -| train/ | | -| approx_kl | 0.0066847014 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.512 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 120740 | -| policy_gradient_loss | -0.000482 | -| std | 0.0189 | -| value_loss | 3.95e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12076 | -| time_elapsed | 65706 | -| total_timesteps | 1545728 | -| train/ | | -| approx_kl | 0.009038677 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 120750 | -| policy_gradient_loss | -0.0133 | -| std | 0.0189 | -| value_loss | 0.000373 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12077 | -| time_elapsed | 65709 | -| total_timesteps | 1545856 | -| train/ | | -| approx_kl | 0.007609294 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 120760 | -| policy_gradient_loss | 0.00653 | -| std | 0.0189 | -| value_loss | 0.000147 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12078 | -| time_elapsed | 65713 | -| total_timesteps | 1545984 | -| train/ | | -| approx_kl | 0.032848224 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -9.61 | -| learning_rate | 0.0003 | -| loss | -0.00752 | -| n_updates | 120770 | -| policy_gradient_loss | -0.00668 | -| std | 0.0189 | -| value_loss | 2.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12079 | -| time_elapsed | 65717 | -| total_timesteps | 1546112 | -| train/ | | -| approx_kl | 0.024312913 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.00593 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 120780 | -| policy_gradient_loss | 0.00134 | -| std | 0.0189 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12080 | -| time_elapsed | 65726 | -| total_timesteps | 1546240 | -| train/ | | -| approx_kl | 0.0027701706 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 120790 | -| policy_gradient_loss | -0.00263 | -| std | 0.0189 | -| value_loss | 0.000781 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12081 | -| time_elapsed | 65730 | -| total_timesteps | 1546368 | -| train/ | | -| approx_kl | 0.0034078243 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.00694 | -| n_updates | 120800 | -| policy_gradient_loss | 0.0074 | -| std | 0.0189 | -| value_loss | 4.55e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12082 | -| time_elapsed | 65733 | -| total_timesteps | 1546496 | -| train/ | | -| approx_kl | 0.009035645 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.647 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 120810 | -| policy_gradient_loss | -0.00114 | -| std | 0.0189 | -| value_loss | 5.33e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12083 | -| time_elapsed | 65736 | -| total_timesteps | 1546624 | -| train/ | | -| approx_kl | 0.0515541 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 120820 | -| policy_gradient_loss | 0.00763 | -| std | 0.0189 | -| value_loss | 6.59e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12084 | -| time_elapsed | 65739 | -| total_timesteps | 1546752 | -| train/ | | -| approx_kl | 0.0069328346 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.00718 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 120830 | -| policy_gradient_loss | -0.0048 | -| std | 0.0189 | -| value_loss | 2.36e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12085 | -| time_elapsed | 65741 | -| total_timesteps | 1546880 | -| train/ | | -| approx_kl | 0.056081507 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.00149 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 120840 | -| policy_gradient_loss | 0.0065 | -| std | 0.0189 | -| value_loss | 6.06e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12086 | -| time_elapsed | 65744 | -| total_timesteps | 1547008 | -| train/ | | -| approx_kl | 2.2668391e-05 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.000357 | -| n_updates | 120850 | -| policy_gradient_loss | -0.00167 | -| std | 0.0189 | -| value_loss | 8.11e-07 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12087 | -| time_elapsed | 65750 | -| total_timesteps | 1547136 | -| train/ | | -| approx_kl | 1.735917 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | -0.0261 | -| n_updates | 120860 | -| policy_gradient_loss | -0.0207 | -| std | 0.0189 | -| value_loss | 0.000785 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12088 | -| time_elapsed | 65754 | -| total_timesteps | 1547264 | -| train/ | | -| approx_kl | 0.011900511 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.194 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 120870 | -| policy_gradient_loss | 0.0664 | -| std | 0.019 | -| value_loss | 2.68e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12089 | -| time_elapsed | 65757 | -| total_timesteps | 1547392 | -| train/ | | -| approx_kl | 0.0035407166 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -8.94 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 120880 | -| policy_gradient_loss | -0.00362 | -| std | 0.019 | -| value_loss | 1.43e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12090 | -| time_elapsed | 65760 | -| total_timesteps | 1547520 | -| train/ | | -| approx_kl | 1.1241063e-06 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -3.63 | -| learning_rate | 0.0003 | -| loss | -5.76e-05 | -| n_updates | 120890 | -| policy_gradient_loss | 0.00506 | -| std | 0.019 | -| value_loss | 5.19e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12091 | -| time_elapsed | 65763 | -| total_timesteps | 1547648 | -| train/ | | -| approx_kl | 0.00037510414 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 120900 | -| policy_gradient_loss | -0.0116 | -| std | 0.019 | -| value_loss | 3.16e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12092 | -| time_elapsed | 65766 | -| total_timesteps | 1547776 | -| train/ | | -| approx_kl | 0.010731772 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 120910 | -| policy_gradient_loss | 0.0211 | -| std | 0.019 | -| value_loss | 9.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12093 | -| time_elapsed | 65769 | -| total_timesteps | 1547904 | -| train/ | | -| approx_kl | 0.003043599 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.00805 | -| n_updates | 120920 | -| policy_gradient_loss | 0.0139 | -| std | 0.019 | -| value_loss | 4.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12094 | -| time_elapsed | 65773 | -| total_timesteps | 1548032 | -| train/ | | -| approx_kl | 0.073771976 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 120930 | -| policy_gradient_loss | -0.00919 | -| std | 0.019 | -| value_loss | 3.41e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12095 | -| time_elapsed | 65779 | -| total_timesteps | 1548160 | -| train/ | | -| approx_kl | 0.06301315 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -4.43 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 120940 | -| policy_gradient_loss | -0.0164 | -| std | 0.019 | -| value_loss | 0.00583 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12096 | -| time_elapsed | 65782 | -| total_timesteps | 1548288 | -| train/ | | -| approx_kl | 0.060439542 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -20.7 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 120950 | -| policy_gradient_loss | -0.00507 | -| std | 0.019 | -| value_loss | 2.3e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12097 | -| time_elapsed | 65785 | -| total_timesteps | 1548416 | -| train/ | | -| approx_kl | 0.005150072 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -139 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 120960 | -| policy_gradient_loss | 0.00198 | -| std | 0.019 | -| value_loss | 5.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12098 | -| time_elapsed | 65788 | -| total_timesteps | 1548544 | -| train/ | | -| approx_kl | 0.023514912 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -21.5 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 120970 | -| policy_gradient_loss | -0.0148 | -| std | 0.019 | -| value_loss | 2.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12099 | -| time_elapsed | 65791 | -| total_timesteps | 1548672 | -| train/ | | -| approx_kl | 0.0072367303 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -45.6 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 120980 | -| policy_gradient_loss | -0.00199 | -| std | 0.019 | -| value_loss | 7.4e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12100 | -| time_elapsed | 65795 | -| total_timesteps | 1548800 | -| train/ | | -| approx_kl | 0.010540411 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 120990 | -| policy_gradient_loss | -0.00538 | -| std | 0.019 | -| value_loss | 8.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12101 | -| time_elapsed | 65798 | -| total_timesteps | 1548928 | -| train/ | | -| approx_kl | 0.008832099 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 121000 | -| policy_gradient_loss | 0.00513 | -| std | 0.019 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12102 | -| time_elapsed | 65802 | -| total_timesteps | 1549056 | -| train/ | | -| approx_kl | 0.012483634 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 121010 | -| policy_gradient_loss | 0.0134 | -| std | 0.019 | -| value_loss | 4.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12103 | -| time_elapsed | 65810 | -| total_timesteps | 1549184 | -| train/ | | -| approx_kl | 0.12323804 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 121020 | -| policy_gradient_loss | -0.0157 | -| std | 0.019 | -| value_loss | 0.00285 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12104 | -| time_elapsed | 65814 | -| total_timesteps | 1549312 | -| train/ | | -| approx_kl | 0.037744887 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -6.04 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 121030 | -| policy_gradient_loss | 0.00495 | -| std | 0.0189 | -| value_loss | 4.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12105 | -| time_elapsed | 65818 | -| total_timesteps | 1549440 | -| train/ | | -| approx_kl | 0.009608236 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -68.2 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 121040 | -| policy_gradient_loss | -0.00642 | -| std | 0.0189 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12106 | -| time_elapsed | 65821 | -| total_timesteps | 1549568 | -| train/ | | -| approx_kl | 0.006368024 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -14.4 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 121050 | -| policy_gradient_loss | -0.00785 | -| std | 0.019 | -| value_loss | 2.74e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12107 | -| time_elapsed | 65824 | -| total_timesteps | 1549696 | -| train/ | | -| approx_kl | 0.01383407 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -4.2 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 121060 | -| policy_gradient_loss | 5.74e-05 | -| std | 0.0189 | -| value_loss | 4.61e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12108 | -| time_elapsed | 65827 | -| total_timesteps | 1549824 | -| train/ | | -| approx_kl | 0.003964721 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | -0.00473 | -| n_updates | 121070 | -| policy_gradient_loss | -0.00268 | -| std | 0.0189 | -| value_loss | 3.85e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12109 | -| time_elapsed | 65831 | -| total_timesteps | 1549952 | -| train/ | | -| approx_kl | 0.016908843 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.000713 | -| n_updates | 121080 | -| policy_gradient_loss | 0.00816 | -| std | 0.0189 | -| value_loss | 1.03e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12110 | -| time_elapsed | 65834 | -| total_timesteps | 1550080 | -| train/ | | -| approx_kl | 0.035530273 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.00279 | -| n_updates | 121090 | -| policy_gradient_loss | -0.0016 | -| std | 0.0189 | -| value_loss | 7.58e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12111 | -| time_elapsed | 65840 | -| total_timesteps | 1550208 | -| train/ | | -| approx_kl | 0.09136764 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.942 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 121100 | -| policy_gradient_loss | -0.00928 | -| std | 0.0189 | -| value_loss | 0.000272 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12112 | -| time_elapsed | 65844 | -| total_timesteps | 1550336 | -| train/ | | -| approx_kl | 0.011949047 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -6.22e+03 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 121110 | -| policy_gradient_loss | -0.00912 | -| std | 0.0189 | -| value_loss | 1.91e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12113 | -| time_elapsed | 65848 | -| total_timesteps | 1550464 | -| train/ | | -| approx_kl | 0.03296122 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.74e+04 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 121120 | -| policy_gradient_loss | -0.00529 | -| std | 0.0189 | -| value_loss | 7.81e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12114 | -| time_elapsed | 65851 | -| total_timesteps | 1550592 | -| train/ | | -| approx_kl | 0.0015750639 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -248 | -| learning_rate | 0.0003 | -| loss | 0.000633 | -| n_updates | 121130 | -| policy_gradient_loss | 0.000506 | -| std | 0.0189 | -| value_loss | 8.32e-10 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12115 | -| time_elapsed | 65855 | -| total_timesteps | 1550720 | -| train/ | | -| approx_kl | 0.00023982488 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -75.8 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 121140 | -| policy_gradient_loss | -0.00273 | -| std | 0.0189 | -| value_loss | 2.08e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12116 | -| time_elapsed | 65858 | -| total_timesteps | 1550848 | -| train/ | | -| approx_kl | 0.0073183347 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 121150 | -| policy_gradient_loss | -0.0112 | -| std | 0.0189 | -| value_loss | 2.54e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12117 | -| time_elapsed | 65861 | -| total_timesteps | 1550976 | -| train/ | | -| approx_kl | 0.000595334 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -3.5 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 121160 | -| policy_gradient_loss | 0.00268 | -| std | 0.0189 | -| value_loss | 1.45e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12118 | -| time_elapsed | 65865 | -| total_timesteps | 1551104 | -| train/ | | -| approx_kl | 0.006003949 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 121170 | -| policy_gradient_loss | -0.000549 | -| std | 0.0189 | -| value_loss | 4.67e-12 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12119 | -| time_elapsed | 65873 | -| total_timesteps | 1551232 | -| train/ | | -| approx_kl | 0.04218252 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 121180 | -| policy_gradient_loss | -0.0115 | -| std | 0.0189 | -| value_loss | 0.000155 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12120 | -| time_elapsed | 65875 | -| total_timesteps | 1551360 | -| train/ | | -| approx_kl | 0.02701621 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -6.69 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 121190 | -| policy_gradient_loss | 0.0227 | -| std | 0.0189 | -| value_loss | 6.89e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12121 | -| time_elapsed | 65878 | -| total_timesteps | 1551488 | -| train/ | | -| approx_kl | 0.027658507 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -5.4 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 121200 | -| policy_gradient_loss | -0.00757 | -| std | 0.0188 | -| value_loss | 3.86e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12122 | -| time_elapsed | 65881 | -| total_timesteps | 1551616 | -| train/ | | -| approx_kl | 0.03666593 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.55 | -| explained_variance | -0.894 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 121210 | -| policy_gradient_loss | 0.00166 | -| std | 0.0188 | -| value_loss | 1.87e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12123 | -| time_elapsed | 65885 | -| total_timesteps | 1551744 | -| train/ | | -| approx_kl | 0.0013399385 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0634 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 121220 | -| policy_gradient_loss | 0.00122 | -| std | 0.0187 | -| value_loss | 3.6e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12124 | -| time_elapsed | 65888 | -| total_timesteps | 1551872 | -| train/ | | -| approx_kl | 0.0071065514 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.0014 | -| learning_rate | 0.0003 | -| loss | -0.000777 | -| n_updates | 121230 | -| policy_gradient_loss | 0.00169 | -| std | 0.0187 | -| value_loss | 8.67e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12125 | -| time_elapsed | 65893 | -| total_timesteps | 1552000 | -| train/ | | -| approx_kl | 0.015258799 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 121240 | -| policy_gradient_loss | 0.0254 | -| std | 0.0187 | -| value_loss | 7.27e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12126 | -| time_elapsed | 65895 | -| total_timesteps | 1552128 | -| train/ | | -| approx_kl | 0.014207282 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.000128 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 121250 | -| policy_gradient_loss | 0.0148 | -| std | 0.0187 | -| value_loss | 2.24e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12127 | -| time_elapsed | 65904 | -| total_timesteps | 1552256 | -| train/ | | -| approx_kl | 0.019166581 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 121260 | -| policy_gradient_loss | 0.0232 | -| std | 0.0187 | -| value_loss | 6.95e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12128 | -| time_elapsed | 65908 | -| total_timesteps | 1552384 | -| train/ | | -| approx_kl | 0.02348786 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | 0.00481 | -| n_updates | 121270 | -| policy_gradient_loss | -0.000967 | -| std | 0.0187 | -| value_loss | 8.91e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12129 | -| time_elapsed | 65912 | -| total_timesteps | 1552512 | -| train/ | | -| approx_kl | 0.0059838505 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.000353 | -| learning_rate | 0.0003 | -| loss | 0.00596 | -| n_updates | 121280 | -| policy_gradient_loss | 0.00941 | -| std | 0.0187 | -| value_loss | 1.74e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12130 | -| time_elapsed | 65915 | -| total_timesteps | 1552640 | -| train/ | | -| approx_kl | 0.0041538244 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | -0.000874 | -| n_updates | 121290 | -| policy_gradient_loss | 0.00122 | -| std | 0.0188 | -| value_loss | 1.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12131 | -| time_elapsed | 65918 | -| total_timesteps | 1552768 | -| train/ | | -| approx_kl | 0.009282068 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 121300 | -| policy_gradient_loss | 0.0139 | -| std | 0.0188 | -| value_loss | 7.77e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12132 | -| time_elapsed | 65922 | -| total_timesteps | 1552896 | -| train/ | | -| approx_kl | 0.0021168413 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.000506 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 121310 | -| policy_gradient_loss | 0.00176 | -| std | 0.0188 | -| value_loss | 1.84e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12133 | -| time_elapsed | 65924 | -| total_timesteps | 1553024 | -| train/ | | -| approx_kl | 0.011076469 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 121320 | -| policy_gradient_loss | 0.0014 | -| std | 0.0188 | -| value_loss | 1.1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12134 | -| time_elapsed | 65933 | -| total_timesteps | 1553152 | -| train/ | | -| approx_kl | 0.03946829 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.674 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 121330 | -| policy_gradient_loss | -0.0144 | -| std | 0.0188 | -| value_loss | 0.000888 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12135 | -| time_elapsed | 65937 | -| total_timesteps | 1553280 | -| train/ | | -| approx_kl | 0.0012994302 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -122 | -| learning_rate | 0.0003 | -| loss | 0.00836 | -| n_updates | 121340 | -| policy_gradient_loss | 0.000251 | -| std | 0.0188 | -| value_loss | 5.66e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12136 | -| time_elapsed | 65941 | -| total_timesteps | 1553408 | -| train/ | | -| approx_kl | 0.00048440788 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -443 | -| learning_rate | 0.0003 | -| loss | 0.00287 | -| n_updates | 121350 | -| policy_gradient_loss | -0.00381 | -| std | 0.0188 | -| value_loss | 2.55e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12137 | -| time_elapsed | 65945 | -| total_timesteps | 1553536 | -| train/ | | -| approx_kl | 0.011050528 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -68.1 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 121360 | -| policy_gradient_loss | 0.00633 | -| std | 0.0188 | -| value_loss | 3.05e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12138 | -| time_elapsed | 65949 | -| total_timesteps | 1553664 | -| train/ | | -| approx_kl | 1.2206845e-05 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.000407 | -| n_updates | 121370 | -| policy_gradient_loss | -0.0012 | -| std | 0.0188 | -| value_loss | 4.09e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12139 | -| time_elapsed | 65953 | -| total_timesteps | 1553792 | -| train/ | | -| approx_kl | 0.057231758 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 121380 | -| policy_gradient_loss | -0.0218 | -| std | 0.0188 | -| value_loss | 1.11e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 12140 | -| time_elapsed | 65956 | -| total_timesteps | 1553920 | -| train/ | | -| approx_kl | 0.005784009 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 121390 | -| policy_gradient_loss | -0.000952 | -| std | 0.0188 | -| value_loss | 4.91e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12141 | -| time_elapsed | 65959 | -| total_timesteps | 1554048 | -| train/ | | -| approx_kl | 0.043160543 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 121400 | -| policy_gradient_loss | 0.0279 | -| std | 0.0188 | -| value_loss | 3.37e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12142 | -| time_elapsed | 65966 | -| total_timesteps | 1554176 | -| train/ | | -| approx_kl | 0.040231254 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.59 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 121410 | -| policy_gradient_loss | -0.0159 | -| std | 0.0188 | -| value_loss | 0.000916 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12143 | -| time_elapsed | 65969 | -| total_timesteps | 1554304 | -| train/ | | -| approx_kl | 0.021468837 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -11 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 121420 | -| policy_gradient_loss | 0.00117 | -| std | 0.0188 | -| value_loss | 3.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12144 | -| time_elapsed | 65974 | -| total_timesteps | 1554432 | -| train/ | | -| approx_kl | 0.021429498 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -13.1 | -| learning_rate | 0.0003 | -| loss | -0.00826 | -| n_updates | 121430 | -| policy_gradient_loss | -0.00218 | -| std | 0.0188 | -| value_loss | 1.79e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12145 | -| time_elapsed | 65978 | -| total_timesteps | 1554560 | -| train/ | | -| approx_kl | 0.030601358 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 121440 | -| policy_gradient_loss | 0.00705 | -| std | 0.0188 | -| value_loss | 3.7e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12146 | -| time_elapsed | 65981 | -| total_timesteps | 1554688 | -| train/ | | -| approx_kl | 0.019874977 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 121450 | -| policy_gradient_loss | 0.00508 | -| std | 0.0187 | -| value_loss | 1.43e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12147 | -| time_elapsed | 65984 | -| total_timesteps | 1554816 | -| train/ | | -| approx_kl | 0.0025866218 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.00638 | -| n_updates | 121460 | -| policy_gradient_loss | -0.00263 | -| std | 0.0187 | -| value_loss | 2.75e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 12148 | -| time_elapsed | 65987 | -| total_timesteps | 1554944 | -| train/ | | -| approx_kl | 0.013562984 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.00714 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 121470 | -| policy_gradient_loss | 0.000303 | -| std | 0.0187 | -| value_loss | 2.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12149 | -| time_elapsed | 65990 | -| total_timesteps | 1555072 | -| train/ | | -| approx_kl | 0.018273095 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 121480 | -| policy_gradient_loss | -0.000495 | -| std | 0.0187 | -| value_loss | 1.16e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12150 | -| time_elapsed | 65997 | -| total_timesteps | 1555200 | -| train/ | | -| approx_kl | 0.007007862 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.00985 | -| n_updates | 121490 | -| policy_gradient_loss | -0.0148 | -| std | 0.0187 | -| value_loss | 0.00123 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12151 | -| time_elapsed | 66000 | -| total_timesteps | 1555328 | -| train/ | | -| approx_kl | 0.014049415 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 121500 | -| policy_gradient_loss | -0.00503 | -| std | 0.0187 | -| value_loss | 1.58e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12152 | -| time_elapsed | 66003 | -| total_timesteps | 1555456 | -| train/ | | -| approx_kl | 0.022578469 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 121510 | -| policy_gradient_loss | -0.00307 | -| std | 0.0187 | -| value_loss | 1.71e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12153 | -| time_elapsed | 66007 | -| total_timesteps | 1555584 | -| train/ | | -| approx_kl | 0.02700643 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 121520 | -| policy_gradient_loss | 0.0085 | -| std | 0.0187 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12154 | -| time_elapsed | 66010 | -| total_timesteps | 1555712 | -| train/ | | -| approx_kl | 0.028360121 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.000286 | -| n_updates | 121530 | -| policy_gradient_loss | -0.000879 | -| std | 0.0187 | -| value_loss | 7.81e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12155 | -| time_elapsed | 66014 | -| total_timesteps | 1555840 | -| train/ | | -| approx_kl | 0.0026155617 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.0098 | -| n_updates | 121540 | -| policy_gradient_loss | -0.00604 | -| std | 0.0187 | -| value_loss | 5.25e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 12156 | -| time_elapsed | 66019 | -| total_timesteps | 1555968 | -| train/ | | -| approx_kl | 0.006301823 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 121550 | -| policy_gradient_loss | 0.00177 | -| std | 0.0187 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12157 | -| time_elapsed | 66023 | -| total_timesteps | 1556096 | -| train/ | | -| approx_kl | 0.016235981 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 121560 | -| policy_gradient_loss | -0.00614 | -| std | 0.0187 | -| value_loss | 1.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12158 | -| time_elapsed | 66031 | -| total_timesteps | 1556224 | -| train/ | | -| approx_kl | 0.16340744 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | -0.00456 | -| n_updates | 121570 | -| policy_gradient_loss | -0.00484 | -| std | 0.0187 | -| value_loss | 0.000434 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12159 | -| time_elapsed | 66035 | -| total_timesteps | 1556352 | -| train/ | | -| approx_kl | 0.007188163 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | -0.000834 | -| n_updates | 121580 | -| policy_gradient_loss | 0.000893 | -| std | 0.0187 | -| value_loss | 1.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12160 | -| time_elapsed | 66039 | -| total_timesteps | 1556480 | -| train/ | | -| approx_kl | 0.050651465 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -3.28 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 121590 | -| policy_gradient_loss | -0.0068 | -| std | 0.0187 | -| value_loss | 5.74e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12161 | -| time_elapsed | 66043 | -| total_timesteps | 1556608 | -| train/ | | -| approx_kl | 0.0004322622 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.61 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 121600 | -| policy_gradient_loss | -0.00191 | -| std | 0.0187 | -| value_loss | 1.16e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12162 | -| time_elapsed | 66048 | -| total_timesteps | 1556736 | -| train/ | | -| approx_kl | 0.025276646 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 121610 | -| policy_gradient_loss | -0.00504 | -| std | 0.0188 | -| value_loss | 2.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12163 | -| time_elapsed | 66052 | -| total_timesteps | 1556864 | -| train/ | | -| approx_kl | 0.012775259 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.00053 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 121620 | -| policy_gradient_loss | -0.00442 | -| std | 0.0188 | -| value_loss | 4.02e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 12164 | -| time_elapsed | 66055 | -| total_timesteps | 1556992 | -| train/ | | -| approx_kl | 0.02502074 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 121630 | -| policy_gradient_loss | -0.00675 | -| std | 0.0188 | -| value_loss | 2.46e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12165 | -| time_elapsed | 66058 | -| total_timesteps | 1557120 | -| train/ | | -| approx_kl | 0.02511324 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | 0.00591 | -| n_updates | 121640 | -| policy_gradient_loss | 0.00213 | -| std | 0.0188 | -| value_loss | 1.58e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12166 | -| time_elapsed | 66068 | -| total_timesteps | 1557248 | -| train/ | | -| approx_kl | 0.02686825 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 121650 | -| policy_gradient_loss | -0.00395 | -| std | 0.0188 | -| value_loss | 0.000147 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12167 | -| time_elapsed | 66071 | -| total_timesteps | 1557376 | -| train/ | | -| approx_kl | 0.02847657 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.00267 | -| learning_rate | 0.0003 | -| loss | -0.00099 | -| n_updates | 121660 | -| policy_gradient_loss | -0.00276 | -| std | 0.0188 | -| value_loss | 6.83e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12168 | -| time_elapsed | 66075 | -| total_timesteps | 1557504 | -| train/ | | -| approx_kl | 0.0179539 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0888 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 121670 | -| policy_gradient_loss | 0.00455 | -| std | 0.0188 | -| value_loss | 5.97e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12169 | -| time_elapsed | 66078 | -| total_timesteps | 1557632 | -| train/ | | -| approx_kl | 0.04277017 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 121680 | -| policy_gradient_loss | 0.0051 | -| std | 0.0188 | -| value_loss | 2.67e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12170 | -| time_elapsed | 66081 | -| total_timesteps | 1557760 | -| train/ | | -| approx_kl | 0.0032067993 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.00949 | -| learning_rate | 0.0003 | -| loss | 0.00887 | -| n_updates | 121690 | -| policy_gradient_loss | 0.00674 | -| std | 0.0188 | -| value_loss | 3.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 12171 | -| time_elapsed | 66084 | -| total_timesteps | 1557888 | -| train/ | | -| approx_kl | 0.014272359 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 121700 | -| policy_gradient_loss | 0.0039 | -| std | 0.0188 | -| value_loss | 2.24e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12172 | -| time_elapsed | 66086 | -| total_timesteps | 1558016 | -| train/ | | -| approx_kl | 0.0066022403 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.00796 | -| n_updates | 121710 | -| policy_gradient_loss | -0.00436 | -| std | 0.0188 | -| value_loss | 1.13e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12173 | -| time_elapsed | 66095 | -| total_timesteps | 1558144 | -| train/ | | -| approx_kl | 0.08414178 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | 0.637 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 121720 | -| policy_gradient_loss | -0.0161 | -| std | 0.0188 | -| value_loss | 0.000796 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12174 | -| time_elapsed | 66099 | -| total_timesteps | 1558272 | -| train/ | | -| approx_kl | 0.018548042 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.000748 | -| n_updates | 121730 | -| policy_gradient_loss | -0.00369 | -| std | 0.0188 | -| value_loss | 6.09e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12175 | -| time_elapsed | 66104 | -| total_timesteps | 1558400 | -| train/ | | -| approx_kl | 0.0015140143 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -496 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 121740 | -| policy_gradient_loss | -0.00069 | -| std | 0.0188 | -| value_loss | 6.69e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12176 | -| time_elapsed | 66107 | -| total_timesteps | 1558528 | -| train/ | | -| approx_kl | 0.022231787 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -139 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 121750 | -| policy_gradient_loss | -4.72e-05 | -| std | 0.0187 | -| value_loss | 6.61e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12177 | -| time_elapsed | 66110 | -| total_timesteps | 1558656 | -| train/ | | -| approx_kl | 0.00811632 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 2.56 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | 0.000229 | -| n_updates | 121760 | -| policy_gradient_loss | 7.84e-05 | -| std | 0.0186 | -| value_loss | 1.17e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12178 | -| time_elapsed | 66114 | -| total_timesteps | 1558784 | -| train/ | | -| approx_kl | 0.014785286 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.57 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | -0.000465 | -| n_updates | 121770 | -| policy_gradient_loss | 0.000895 | -| std | 0.0185 | -| value_loss | 6.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 12179 | -| time_elapsed | 66118 | -| total_timesteps | 1558912 | -| train/ | | -| approx_kl | 0.04169532 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.57 | -| explained_variance | 0.0015 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 121780 | -| policy_gradient_loss | -0.0163 | -| std | 0.0185 | -| value_loss | 4.98e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12180 | -| time_elapsed | 66122 | -| total_timesteps | 1559040 | -| train/ | | -| approx_kl | 0.010394889 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.57 | -| explained_variance | -462 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 121790 | -| policy_gradient_loss | -0.00627 | -| std | 0.0185 | -| value_loss | 2.12e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12181 | -| time_elapsed | 66128 | -| total_timesteps | 1559168 | -| train/ | | -| approx_kl | 0.020464307 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.57 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 121800 | -| policy_gradient_loss | -0.0173 | -| std | 0.0185 | -| value_loss | 0.000961 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12182 | -| time_elapsed | 66132 | -| total_timesteps | 1559296 | -| train/ | | -| approx_kl | 0.031995535 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.57 | -| explained_variance | -0.39 | -| learning_rate | 0.0003 | -| loss | 0.00828 | -| n_updates | 121810 | -| policy_gradient_loss | -5.27e-05 | -| std | 0.0185 | -| value_loss | 1.69e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12183 | -| time_elapsed | 66135 | -| total_timesteps | 1559424 | -| train/ | | -| approx_kl | 0.0004078606 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.57 | -| explained_variance | -15.7 | -| learning_rate | 0.0003 | -| loss | 0.000673 | -| n_updates | 121820 | -| policy_gradient_loss | 0.00302 | -| std | 0.0184 | -| value_loss | 0.000713 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12184 | -| time_elapsed | 66138 | -| total_timesteps | 1559552 | -| train/ | | -| approx_kl | 0.13429178 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0895 | -| learning_rate | 0.0003 | -| loss | 0.0989 | -| n_updates | 121830 | -| policy_gradient_loss | 0.0552 | -| std | 0.0184 | -| value_loss | 0.000827 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12185 | -| time_elapsed | 66141 | -| total_timesteps | 1559680 | -| train/ | | -| approx_kl | 0.047217093 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.00386 | -| learning_rate | 0.0003 | -| loss | 0.0764 | -| n_updates | 121840 | -| policy_gradient_loss | 0.0167 | -| std | 0.0184 | -| value_loss | 0.000176 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12186 | -| time_elapsed | 66145 | -| total_timesteps | 1559808 | -| train/ | | -| approx_kl | 0.058426566 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 121850 | -| policy_gradient_loss | 0.00534 | -| std | 0.0184 | -| value_loss | 1.4e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 12187 | -| time_elapsed | 66148 | -| total_timesteps | 1559936 | -| train/ | | -| approx_kl | 1.590047e-05 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 121860 | -| policy_gradient_loss | -0.00646 | -| std | 0.0184 | -| value_loss | 8.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12188 | -| time_elapsed | 66151 | -| total_timesteps | 1560064 | -| train/ | | -| approx_kl | 0.008946127 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 121870 | -| policy_gradient_loss | 0.00876 | -| std | 0.0183 | -| value_loss | 4.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12189 | -| time_elapsed | 66158 | -| total_timesteps | 1560192 | -| train/ | | -| approx_kl | 0.0032221125 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | 0.039 | -| n_updates | 121880 | -| policy_gradient_loss | 0.0045 | -| std | 0.0183 | -| value_loss | 9.21e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12190 | -| time_elapsed | 66161 | -| total_timesteps | 1560320 | -| train/ | | -| approx_kl | 0.009445125 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 121890 | -| policy_gradient_loss | 0.00398 | -| std | 0.0183 | -| value_loss | 2.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12191 | -| time_elapsed | 66165 | -| total_timesteps | 1560448 | -| train/ | | -| approx_kl | 0.013318075 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 121900 | -| policy_gradient_loss | 0.00587 | -| std | 0.0183 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12192 | -| time_elapsed | 66169 | -| total_timesteps | 1560576 | -| train/ | | -| approx_kl | 0.016283417 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.00626 | -| n_updates | 121910 | -| policy_gradient_loss | 0.00517 | -| std | 0.0184 | -| value_loss | 1.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12193 | -| time_elapsed | 66172 | -| total_timesteps | 1560704 | -| train/ | | -| approx_kl | 0.00952539 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0017 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 121920 | -| policy_gradient_loss | 0.0113 | -| std | 0.0184 | -| value_loss | 4.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12194 | -| time_elapsed | 66174 | -| total_timesteps | 1560832 | -| train/ | | -| approx_kl | 0.003968415 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.00266 | -| learning_rate | 0.0003 | -| loss | 0.00217 | -| n_updates | 121930 | -| policy_gradient_loss | 0.0292 | -| std | 0.0184 | -| value_loss | 1.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 12195 | -| time_elapsed | 66178 | -| total_timesteps | 1560960 | -| train/ | | -| approx_kl | 0.014437175 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 121940 | -| policy_gradient_loss | 0.0298 | -| std | 0.0184 | -| value_loss | 7.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12196 | -| time_elapsed | 66181 | -| total_timesteps | 1561088 | -| train/ | | -| approx_kl | 0.0021393364 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.00319 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 121950 | -| policy_gradient_loss | 0.000926 | -| std | 0.0184 | -| value_loss | 3.09e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12197 | -| time_elapsed | 66189 | -| total_timesteps | 1561216 | -| train/ | | -| approx_kl | 0.0042421133 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 121960 | -| policy_gradient_loss | -0.0126 | -| std | 0.0184 | -| value_loss | 0.00466 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12198 | -| time_elapsed | 66192 | -| total_timesteps | 1561344 | -| train/ | | -| approx_kl | 1.03376806e-07 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.888 | -| learning_rate | 0.0003 | -| loss | -6.69e-06 | -| n_updates | 121970 | -| policy_gradient_loss | 0.00032 | -| std | 0.0184 | -| value_loss | 1.84e-06 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12199 | -| time_elapsed | 66195 | -| total_timesteps | 1561472 | -| train/ | | -| approx_kl | 7.115258e-05 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -3.5 | -| learning_rate | 0.0003 | -| loss | 0.000425 | -| n_updates | 121980 | -| policy_gradient_loss | 0.00207 | -| std | 0.0184 | -| value_loss | 1.61e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12200 | -| time_elapsed | 66198 | -| total_timesteps | 1561600 | -| train/ | | -| approx_kl | 0.0009108912 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.614 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 121990 | -| policy_gradient_loss | 0.0139 | -| std | 0.0184 | -| value_loss | 3.2e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12201 | -| time_elapsed | 66201 | -| total_timesteps | 1561728 | -| train/ | | -| approx_kl | 0.015269193 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 122000 | -| policy_gradient_loss | -0.000609 | -| std | 0.0184 | -| value_loss | 1.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12202 | -| time_elapsed | 66205 | -| total_timesteps | 1561856 | -| train/ | | -| approx_kl | 0.018135374 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0892 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 122010 | -| policy_gradient_loss | 0.0289 | -| std | 0.0184 | -| value_loss | 8.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 12203 | -| time_elapsed | 66209 | -| total_timesteps | 1561984 | -| train/ | | -| approx_kl | 0.015763106 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0099 | -| n_updates | 122020 | -| policy_gradient_loss | 0.0218 | -| std | 0.0183 | -| value_loss | 8.62e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12204 | -| time_elapsed | 66213 | -| total_timesteps | 1562112 | -| train/ | | -| approx_kl | 0.016752528 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0728 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 122030 | -| policy_gradient_loss | 0.0213 | -| std | 0.0183 | -| value_loss | 3.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12205 | -| time_elapsed | 66221 | -| total_timesteps | 1562240 | -| train/ | | -| approx_kl | 0.0067046406 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 122040 | -| policy_gradient_loss | 0.0102 | -| std | 0.0183 | -| value_loss | 1.73e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12206 | -| time_elapsed | 66225 | -| total_timesteps | 1562368 | -| train/ | | -| approx_kl | 0.006221997 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.00568 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 122050 | -| policy_gradient_loss | 0.00179 | -| std | 0.0183 | -| value_loss | 8.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12207 | -| time_elapsed | 66227 | -| total_timesteps | 1562496 | -| train/ | | -| approx_kl | 0.016164523 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.00854 | -| n_updates | 122060 | -| policy_gradient_loss | 0.0043 | -| std | 0.0183 | -| value_loss | 3.67e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12208 | -| time_elapsed | 66231 | -| total_timesteps | 1562624 | -| train/ | | -| approx_kl | 0.00925627 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 122070 | -| policy_gradient_loss | 0.000463 | -| std | 0.0183 | -| value_loss | 1.86e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12209 | -| time_elapsed | 66234 | -| total_timesteps | 1562752 | -| train/ | | -| approx_kl | 0.024171423 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.00935 | -| n_updates | 122080 | -| policy_gradient_loss | 0.000342 | -| std | 0.0183 | -| value_loss | 1.05e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12210 | -| time_elapsed | 66237 | -| total_timesteps | 1562880 | -| train/ | | -| approx_kl | 0.0030797962 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.000428 | -| n_updates | 122090 | -| policy_gradient_loss | 0.00554 | -| std | 0.0183 | -| value_loss | 4.44e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12211 | -| time_elapsed | 66240 | -| total_timesteps | 1563008 | -| train/ | | -| approx_kl | 0.0070048906 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 122100 | -| policy_gradient_loss | 0.018 | -| std | 0.0183 | -| value_loss | 1.65e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12212 | -| time_elapsed | 66248 | -| total_timesteps | 1563136 | -| train/ | | -| approx_kl | 0.02614431 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 122110 | -| policy_gradient_loss | -0.00208 | -| std | 0.0183 | -| value_loss | 0.00259 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12213 | -| time_elapsed | 66252 | -| total_timesteps | 1563264 | -| train/ | | -| approx_kl | 0.029758964 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.0429 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 122120 | -| policy_gradient_loss | 0.00844 | -| std | 0.0183 | -| value_loss | 0.000158 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12214 | -| time_elapsed | 66256 | -| total_timesteps | 1563392 | -| train/ | | -| approx_kl | 0.01841153 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.00854 | -| n_updates | 122130 | -| policy_gradient_loss | 0.0131 | -| std | 0.0183 | -| value_loss | 1.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12215 | -| time_elapsed | 66260 | -| total_timesteps | 1563520 | -| train/ | | -| approx_kl | 0.031273406 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.00414 | -| n_updates | 122140 | -| policy_gradient_loss | 0.000749 | -| std | 0.0183 | -| value_loss | 9.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12216 | -| time_elapsed | 66263 | -| total_timesteps | 1563648 | -| train/ | | -| approx_kl | 0.016155122 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.302 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 122150 | -| policy_gradient_loss | -0.00201 | -| std | 0.0183 | -| value_loss | 1.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12217 | -| time_elapsed | 66266 | -| total_timesteps | 1563776 | -| train/ | | -| approx_kl | 0.038222637 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 122160 | -| policy_gradient_loss | 0.00442 | -| std | 0.0183 | -| value_loss | 6.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12218 | -| time_elapsed | 66270 | -| total_timesteps | 1563904 | -| train/ | | -| approx_kl | 0.016774282 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 122170 | -| policy_gradient_loss | 0.0108 | -| std | 0.0183 | -| value_loss | 3.79e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12219 | -| time_elapsed | 66275 | -| total_timesteps | 1564032 | -| train/ | | -| approx_kl | 0.003435074 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 122180 | -| policy_gradient_loss | -0.00275 | -| std | 0.0183 | -| value_loss | 2.81e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12220 | -| time_elapsed | 66283 | -| total_timesteps | 1564160 | -| train/ | | -| approx_kl | 0.0024269572 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 122190 | -| policy_gradient_loss | -0.00527 | -| std | 0.0183 | -| value_loss | 0.000307 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12221 | -| time_elapsed | 66286 | -| total_timesteps | 1564288 | -| train/ | | -| approx_kl | 0.012282249 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.976 | -| learning_rate | 0.0003 | -| loss | -0.00763 | -| n_updates | 122200 | -| policy_gradient_loss | -0.00667 | -| std | 0.0182 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12222 | -| time_elapsed | 66289 | -| total_timesteps | 1564416 | -| train/ | | -| approx_kl | 0.004837194 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -78.4 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 122210 | -| policy_gradient_loss | -0.00427 | -| std | 0.0182 | -| value_loss | 1.01e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12223 | -| time_elapsed | 66292 | -| total_timesteps | 1564544 | -| train/ | | -| approx_kl | 0.0040886546 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | -0.000223 | -| n_updates | 122220 | -| policy_gradient_loss | 0.00281 | -| std | 0.0182 | -| value_loss | 8.77e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12224 | -| time_elapsed | 66297 | -| total_timesteps | 1564672 | -| train/ | | -| approx_kl | 0.05482891 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.00771 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 122230 | -| policy_gradient_loss | 0.0121 | -| std | 0.0182 | -| value_loss | 6.59e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12225 | -| time_elapsed | 66301 | -| total_timesteps | 1564800 | -| train/ | | -| approx_kl | 0.009970193 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | 0.00231 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 122240 | -| policy_gradient_loss | -0.00191 | -| std | 0.0182 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12226 | -| time_elapsed | 66304 | -| total_timesteps | 1564928 | -| train/ | | -| approx_kl | 0.028966911 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 122250 | -| policy_gradient_loss | 0.0114 | -| std | 0.0183 | -| value_loss | 8.39e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12227 | -| time_elapsed | 66307 | -| total_timesteps | 1565056 | -| train/ | | -| approx_kl | 4.4095796e-05 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | -0.000559 | -| n_updates | 122260 | -| policy_gradient_loss | -0.00249 | -| std | 0.0183 | -| value_loss | 5.15e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12228 | -| time_elapsed | 66313 | -| total_timesteps | 1565184 | -| train/ | | -| approx_kl | 0.19470583 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.58 | -| explained_variance | 0.673 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 122270 | -| policy_gradient_loss | -0.0171 | -| std | 0.0182 | -| value_loss | 0.000835 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12229 | -| time_elapsed | 66317 | -| total_timesteps | 1565312 | -| train/ | | -| approx_kl | 2.341345e-05 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -32 | -| learning_rate | 0.0003 | -| loss | 0.000244 | -| n_updates | 122280 | -| policy_gradient_loss | -0.00328 | -| std | 0.0182 | -| value_loss | 4.95e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12230 | -| time_elapsed | 66320 | -| total_timesteps | 1565440 | -| train/ | | -| approx_kl | 0.029717531 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -35.8 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 122290 | -| policy_gradient_loss | -0.00808 | -| std | 0.0182 | -| value_loss | 6.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12231 | -| time_elapsed | 66324 | -| total_timesteps | 1565568 | -| train/ | | -| approx_kl | 0.003914256 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -5.33 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 122300 | -| policy_gradient_loss | -0.0054 | -| std | 0.0182 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12232 | -| time_elapsed | 66327 | -| total_timesteps | 1565696 | -| train/ | | -| approx_kl | 0.0118831545 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | 0.0066 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 122310 | -| policy_gradient_loss | -0.00209 | -| std | 0.0181 | -| value_loss | 2.19e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12233 | -| time_elapsed | 66331 | -| total_timesteps | 1565824 | -| train/ | | -| approx_kl | 0.00019744178 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 122320 | -| policy_gradient_loss | -0.00667 | -| std | 0.0181 | -| value_loss | 5.5e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12234 | -| time_elapsed | 66335 | -| total_timesteps | 1565952 | -| train/ | | -| approx_kl | 0.00044226833 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.00313 | -| n_updates | 122330 | -| policy_gradient_loss | 0.0112 | -| std | 0.0181 | -| value_loss | 3.28e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12235 | -| time_elapsed | 66338 | -| total_timesteps | 1566080 | -| train/ | | -| approx_kl | 0.007869745 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 122340 | -| policy_gradient_loss | 0.0215 | -| std | 0.0181 | -| value_loss | 2.49e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12236 | -| time_elapsed | 66344 | -| total_timesteps | 1566208 | -| train/ | | -| approx_kl | 0.0039461073 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 122350 | -| policy_gradient_loss | -0.015 | -| std | 0.0181 | -| value_loss | 0.00313 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12237 | -| time_elapsed | 66348 | -| total_timesteps | 1566336 | -| train/ | | -| approx_kl | 0.020880362 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -54.3 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 122360 | -| policy_gradient_loss | -0.000343 | -| std | 0.0181 | -| value_loss | 4.52e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12238 | -| time_elapsed | 66351 | -| total_timesteps | 1566464 | -| train/ | | -| approx_kl | 0.00063544745 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -419 | -| learning_rate | 0.0003 | -| loss | -0.00426 | -| n_updates | 122370 | -| policy_gradient_loss | -0.00239 | -| std | 0.0181 | -| value_loss | 4.42e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12239 | -| time_elapsed | 66355 | -| total_timesteps | 1566592 | -| train/ | | -| approx_kl | 0.00029610144 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -56.9 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 122380 | -| policy_gradient_loss | -0.00513 | -| std | 0.0181 | -| value_loss | 4.82e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12240 | -| time_elapsed | 66359 | -| total_timesteps | 1566720 | -| train/ | | -| approx_kl | 0.012584833 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -17.5 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 122390 | -| policy_gradient_loss | -0.00521 | -| std | 0.0181 | -| value_loss | 8.53e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12241 | -| time_elapsed | 66363 | -| total_timesteps | 1566848 | -| train/ | | -| approx_kl | 0.00021172268 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -3.09 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 122400 | -| policy_gradient_loss | 0.00636 | -| std | 0.0181 | -| value_loss | 1.57e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12242 | -| time_elapsed | 66366 | -| total_timesteps | 1566976 | -| train/ | | -| approx_kl | 0.0075116213 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.937 | -| learning_rate | 0.0003 | -| loss | 0.00634 | -| n_updates | 122410 | -| policy_gradient_loss | 0.0159 | -| std | 0.0181 | -| value_loss | 6.14e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12243 | -| time_elapsed | 66370 | -| total_timesteps | 1567104 | -| train/ | | -| approx_kl | 0.011576528 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 122420 | -| policy_gradient_loss | 0.0116 | -| std | 0.0181 | -| value_loss | 4.04e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12244 | -| time_elapsed | 66378 | -| total_timesteps | 1567232 | -| train/ | | -| approx_kl | 0.04220868 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | 0.914 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 122430 | -| policy_gradient_loss | -0.0131 | -| std | 0.0181 | -| value_loss | 0.00154 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12245 | -| time_elapsed | 66382 | -| total_timesteps | 1567360 | -| train/ | | -| approx_kl | 0.02890637 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 122440 | -| policy_gradient_loss | 0.00412 | -| std | 0.0181 | -| value_loss | 6.64e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12246 | -| time_elapsed | 66386 | -| total_timesteps | 1567488 | -| train/ | | -| approx_kl | 0.012633739 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.0852 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 122450 | -| policy_gradient_loss | 0.00265 | -| std | 0.0181 | -| value_loss | 0.00018 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12247 | -| time_elapsed | 66390 | -| total_timesteps | 1567616 | -| train/ | | -| approx_kl | 0.019415064 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | 0.00198 | -| learning_rate | 0.0003 | -| loss | 0.00518 | -| n_updates | 122460 | -| policy_gradient_loss | 0.00434 | -| std | 0.0181 | -| value_loss | 9.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12248 | -| time_elapsed | 66394 | -| total_timesteps | 1567744 | -| train/ | | -| approx_kl | 0.024210917 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00766 | -| n_updates | 122470 | -| policy_gradient_loss | 0.00304 | -| std | 0.0181 | -| value_loss | 2.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12249 | -| time_elapsed | 66398 | -| total_timesteps | 1567872 | -| train/ | | -| approx_kl | 0.10420493 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.0722 | -| n_updates | 122480 | -| policy_gradient_loss | 0.0135 | -| std | 0.0181 | -| value_loss | 1.14e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12250 | -| time_elapsed | 66401 | -| total_timesteps | 1568000 | -| train/ | | -| approx_kl | 0.018167794 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.00273 | -| learning_rate | 0.0003 | -| loss | 0.00742 | -| n_updates | 122490 | -| policy_gradient_loss | 0.0117 | -| std | 0.0181 | -| value_loss | 1.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12251 | -| time_elapsed | 66404 | -| total_timesteps | 1568128 | -| train/ | | -| approx_kl | 0.002750469 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.00028 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 122500 | -| policy_gradient_loss | 0.0132 | -| std | 0.0181 | -| value_loss | 2.42e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12252 | -| time_elapsed | 66411 | -| total_timesteps | 1568256 | -| train/ | | -| approx_kl | 0.22310509 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.676 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 122510 | -| policy_gradient_loss | -0.0152 | -| std | 0.0181 | -| value_loss | 0.00298 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12253 | -| time_elapsed | 66415 | -| total_timesteps | 1568384 | -| train/ | | -| approx_kl | 0.0024571368 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -4.7 | -| learning_rate | 0.0003 | -| loss | 0.00477 | -| n_updates | 122520 | -| policy_gradient_loss | -0.00253 | -| std | 0.0181 | -| value_loss | 6.1e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12254 | -| time_elapsed | 66419 | -| total_timesteps | 1568512 | -| train/ | | -| approx_kl | 0.08698873 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | 0.00556 | -| n_updates | 122530 | -| policy_gradient_loss | -0.00151 | -| std | 0.0181 | -| value_loss | 1.03e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12255 | -| time_elapsed | 66422 | -| total_timesteps | 1568640 | -| train/ | | -| approx_kl | 8.729333e-05 | -| clip_fraction | 0.0227 | -| clip_range | 0.2 | -| entropy_loss | 2.59 | -| explained_variance | -0.825 | -| learning_rate | 0.0003 | -| loss | -0.000146 | -| n_updates | 122540 | -| policy_gradient_loss | 3.4e-05 | -| std | 0.018 | -| value_loss | 1.02e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12256 | -| time_elapsed | 66427 | -| total_timesteps | 1568768 | -| train/ | | -| approx_kl | 0.0031638057 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.0092 | -| n_updates | 122550 | -| policy_gradient_loss | 0.00768 | -| std | 0.018 | -| value_loss | 1.92e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12257 | -| time_elapsed | 66430 | -| total_timesteps | 1568896 | -| train/ | | -| approx_kl | 0.00039890455 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.00254 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 122560 | -| policy_gradient_loss | -0.00165 | -| std | 0.018 | -| value_loss | 7.78e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12258 | -| time_elapsed | 66433 | -| total_timesteps | 1569024 | -| train/ | | -| approx_kl | 0.028974045 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.00468 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 122570 | -| policy_gradient_loss | 0.0135 | -| std | 0.0179 | -| value_loss | 7.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12259 | -| time_elapsed | 66438 | -| total_timesteps | 1569152 | -| train/ | | -| approx_kl | 0.084930085 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 122580 | -| policy_gradient_loss | -0.00167 | -| std | 0.0179 | -| value_loss | 9.65e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12260 | -| time_elapsed | 66442 | -| total_timesteps | 1569280 | -| train/ | | -| approx_kl | 0.02115289 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.025 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 122590 | -| policy_gradient_loss | 0.00906 | -| std | 0.0179 | -| value_loss | 1.8e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12261 | -| time_elapsed | 66446 | -| total_timesteps | 1569408 | -| train/ | | -| approx_kl | 0.034717694 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.000101 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 122600 | -| policy_gradient_loss | -0.000727 | -| std | 0.0179 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12262 | -| time_elapsed | 66450 | -| total_timesteps | 1569536 | -| train/ | | -| approx_kl | 0.032348327 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.00853 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 122610 | -| policy_gradient_loss | 0.00353 | -| std | 0.0179 | -| value_loss | 4.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12263 | -| time_elapsed | 66453 | -| total_timesteps | 1569664 | -| train/ | | -| approx_kl | 0.085261896 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.0604 | -| n_updates | 122620 | -| policy_gradient_loss | 0.0105 | -| std | 0.0179 | -| value_loss | 2.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12264 | -| time_elapsed | 66458 | -| total_timesteps | 1569792 | -| train/ | | -| approx_kl | 0.004632672 | -| clip_fraction | 0.0156 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 122630 | -| policy_gradient_loss | -0.000334 | -| std | 0.0179 | -| value_loss | 2.78e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 12265 | -| time_elapsed | 66462 | -| total_timesteps | 1569920 | -| train/ | | -| approx_kl | 0.0007987614 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.0061 | -| n_updates | 122640 | -| policy_gradient_loss | 0.00445 | -| std | 0.0179 | -| value_loss | 1.96e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12266 | -| time_elapsed | 66466 | -| total_timesteps | 1570048 | -| train/ | | -| approx_kl | 0.0007775235 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.00526 | -| learning_rate | 0.0003 | -| loss | 0.00154 | -| n_updates | 122650 | -| policy_gradient_loss | 0.0165 | -| std | 0.0179 | -| value_loss | 2.3e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12267 | -| time_elapsed | 66473 | -| total_timesteps | 1570176 | -| train/ | | -| approx_kl | 0.14405628 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -2.68 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 122660 | -| policy_gradient_loss | -0.0158 | -| std | 0.0179 | -| value_loss | 0.00325 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12268 | -| time_elapsed | 66475 | -| total_timesteps | 1570304 | -| train/ | | -| approx_kl | 0.033480406 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -70.3 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 122670 | -| policy_gradient_loss | -0.0157 | -| std | 0.0179 | -| value_loss | 3.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12269 | -| time_elapsed | 66479 | -| total_timesteps | 1570432 | -| train/ | | -| approx_kl | 0.016711287 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -69.1 | -| learning_rate | 0.0003 | -| loss | 0.00032 | -| n_updates | 122680 | -| policy_gradient_loss | 0.000356 | -| std | 0.0179 | -| value_loss | 7.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12270 | -| time_elapsed | 66482 | -| total_timesteps | 1570560 | -| train/ | | -| approx_kl | 0.01718207 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -2.98 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 122690 | -| policy_gradient_loss | 0.000434 | -| std | 0.0179 | -| value_loss | 4.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12271 | -| time_elapsed | 66485 | -| total_timesteps | 1570688 | -| train/ | | -| approx_kl | 0.020289045 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 122700 | -| policy_gradient_loss | -0.00362 | -| std | 0.0179 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12272 | -| time_elapsed | 66487 | -| total_timesteps | 1570816 | -| train/ | | -| approx_kl | 0.0034575765 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.00616 | -| n_updates | 122710 | -| policy_gradient_loss | -0.000199 | -| std | 0.0179 | -| value_loss | 1.46e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12273 | -| time_elapsed | 66489 | -| total_timesteps | 1570944 | -| train/ | | -| approx_kl | 0.012523564 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.000467 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 122720 | -| policy_gradient_loss | -0.00324 | -| std | 0.0179 | -| value_loss | 5.58e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12274 | -| time_elapsed | 66493 | -| total_timesteps | 1571072 | -| train/ | | -| approx_kl | 0.0043890025 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 122730 | -| policy_gradient_loss | 0.00169 | -| std | 0.0179 | -| value_loss | 2.75e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12275 | -| time_elapsed | 66499 | -| total_timesteps | 1571200 | -| train/ | | -| approx_kl | 0.043901965 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 122740 | -| policy_gradient_loss | 0.0152 | -| std | 0.0179 | -| value_loss | 0.0025 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12276 | -| time_elapsed | 66503 | -| total_timesteps | 1571328 | -| train/ | | -| approx_kl | 0.017308902 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 122750 | -| policy_gradient_loss | 0.00254 | -| std | 0.0179 | -| value_loss | 1.19e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12277 | -| time_elapsed | 66507 | -| total_timesteps | 1571456 | -| train/ | | -| approx_kl | 0.062965654 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0384 | -| n_updates | 122760 | -| policy_gradient_loss | 0.0066 | -| std | 0.0178 | -| value_loss | 2.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12278 | -| time_elapsed | 66509 | -| total_timesteps | 1571584 | -| train/ | | -| approx_kl | 0.012886003 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0971 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 122770 | -| policy_gradient_loss | 0.0129 | -| std | 0.0178 | -| value_loss | 7.74e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12279 | -| time_elapsed | 66512 | -| total_timesteps | 1571712 | -| train/ | | -| approx_kl | 0.0025472841 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.00519 | -| n_updates | 122780 | -| policy_gradient_loss | -0.00363 | -| std | 0.0179 | -| value_loss | 4.96e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12280 | -| time_elapsed | 66514 | -| total_timesteps | 1571840 | -| train/ | | -| approx_kl | 0.008472244 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.00124 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 122790 | -| policy_gradient_loss | 0.00258 | -| std | 0.0179 | -| value_loss | 8.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12281 | -| time_elapsed | 66518 | -| total_timesteps | 1571968 | -| train/ | | -| approx_kl | 0.016539328 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 122800 | -| policy_gradient_loss | 0.00265 | -| std | 0.0179 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12282 | -| time_elapsed | 66521 | -| total_timesteps | 1572096 | -| train/ | | -| approx_kl | 0.022803592 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | -0.00964 | -| n_updates | 122810 | -| policy_gradient_loss | -0.00402 | -| std | 0.0179 | -| value_loss | 4.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12283 | -| time_elapsed | 66529 | -| total_timesteps | 1572224 | -| train/ | | -| approx_kl | 0.12493329 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 122820 | -| policy_gradient_loss | -0.0161 | -| std | 0.0179 | -| value_loss | 0.000326 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12284 | -| time_elapsed | 66533 | -| total_timesteps | 1572352 | -| train/ | | -| approx_kl | 0.007504733 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -3 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 122830 | -| policy_gradient_loss | -0.00118 | -| std | 0.0179 | -| value_loss | 2.62e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12285 | -| time_elapsed | 66535 | -| total_timesteps | 1572480 | -| train/ | | -| approx_kl | 0.0062662 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -3.7 | -| learning_rate | 0.0003 | -| loss | 0.000284 | -| n_updates | 122840 | -| policy_gradient_loss | 0.00119 | -| std | 0.0179 | -| value_loss | 4.89e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12286 | -| time_elapsed | 66539 | -| total_timesteps | 1572608 | -| train/ | | -| approx_kl | 0.00718569 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | 0.00275 | -| n_updates | 122850 | -| policy_gradient_loss | 0.0244 | -| std | 0.0179 | -| value_loss | 8.38e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12287 | -| time_elapsed | 66542 | -| total_timesteps | 1572736 | -| train/ | | -| approx_kl | 0.020638904 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 122860 | -| policy_gradient_loss | 0.00742 | -| std | 0.0179 | -| value_loss | 0.000155 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12288 | -| time_elapsed | 66545 | -| total_timesteps | 1572864 | -| train/ | | -| approx_kl | 0.01514329 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.00451 | -| learning_rate | 0.0003 | -| loss | -0.000618 | -| n_updates | 122870 | -| policy_gradient_loss | -0.00287 | -| std | 0.0179 | -| value_loss | 1.34e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12289 | -| time_elapsed | 66549 | -| total_timesteps | 1572992 | -| train/ | | -| approx_kl | 0.0033565378 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0516 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 122880 | -| policy_gradient_loss | 0.00294 | -| std | 0.0179 | -| value_loss | 0.000863 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12290 | -| time_elapsed | 66553 | -| total_timesteps | 1573120 | -| train/ | | -| approx_kl | 0.02825494 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.928 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 122890 | -| policy_gradient_loss | 0.0244 | -| std | 0.0179 | -| value_loss | 0.00639 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12291 | -| time_elapsed | 66563 | -| total_timesteps | 1573248 | -| train/ | | -| approx_kl | 0.0537499 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 122900 | -| policy_gradient_loss | -0.00976 | -| std | 0.0179 | -| value_loss | 0.000397 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12292 | -| time_elapsed | 66566 | -| total_timesteps | 1573376 | -| train/ | | -| approx_kl | 0.03751633 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 122910 | -| policy_gradient_loss | 0.00551 | -| std | 0.0179 | -| value_loss | 4.21e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12293 | -| time_elapsed | 66568 | -| total_timesteps | 1573504 | -| train/ | | -| approx_kl | 0.0017786832 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 2.6 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 122920 | -| policy_gradient_loss | -0.00818 | -| std | 0.0179 | -| value_loss | 0.000214 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12294 | -| time_elapsed | 66571 | -| total_timesteps | 1573632 | -| train/ | | -| approx_kl | 0.013872424 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 122930 | -| policy_gradient_loss | 0.00568 | -| std | 0.0178 | -| value_loss | 6.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12295 | -| time_elapsed | 66574 | -| total_timesteps | 1573760 | -| train/ | | -| approx_kl | 0.03900621 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.00868 | -| n_updates | 122940 | -| policy_gradient_loss | 0.00194 | -| std | 0.0178 | -| value_loss | 4.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 12296 | -| time_elapsed | 66577 | -| total_timesteps | 1573888 | -| train/ | | -| approx_kl | 0.03267543 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 122950 | -| policy_gradient_loss | 0.00933 | -| std | 0.0178 | -| value_loss | 6.88e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12297 | -| time_elapsed | 66580 | -| total_timesteps | 1574016 | -| train/ | | -| approx_kl | 0.007028488 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.00191 | -| n_updates | 122960 | -| policy_gradient_loss | -0.000368 | -| std | 0.0178 | -| value_loss | 1.39e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12298 | -| time_elapsed | 66587 | -| total_timesteps | 1574144 | -| train/ | | -| approx_kl | 5.071843e-05 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | 0.00403 | -| n_updates | 122970 | -| policy_gradient_loss | 0.0165 | -| std | 0.0178 | -| value_loss | 0.00146 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12299 | -| time_elapsed | 66589 | -| total_timesteps | 1574272 | -| train/ | | -| approx_kl | 0.007492377 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.174 | -| learning_rate | 0.0003 | -| loss | -0.000245 | -| n_updates | 122980 | -| policy_gradient_loss | 0.00241 | -| std | 0.0178 | -| value_loss | 1.35e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12300 | -| time_elapsed | 66592 | -| total_timesteps | 1574400 | -| train/ | | -| approx_kl | 0.0070255366 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0853 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 122990 | -| policy_gradient_loss | -0.0085 | -| std | 0.0178 | -| value_loss | 8.61e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12301 | -| time_elapsed | 66596 | -| total_timesteps | 1574528 | -| train/ | | -| approx_kl | 0.0014949199 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | 0.00895 | -| n_updates | 123000 | -| policy_gradient_loss | -0.00816 | -| std | 0.0178 | -| value_loss | 5.34e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12302 | -| time_elapsed | 66599 | -| total_timesteps | 1574656 | -| train/ | | -| approx_kl | 0.03202334 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 123010 | -| policy_gradient_loss | -0.0114 | -| std | 0.0178 | -| value_loss | 2.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12303 | -| time_elapsed | 66601 | -| total_timesteps | 1574784 | -| train/ | | -| approx_kl | 0.011730965 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 123020 | -| policy_gradient_loss | -0.00155 | -| std | 0.0178 | -| value_loss | 2.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12304 | -| time_elapsed | 66605 | -| total_timesteps | 1574912 | -| train/ | | -| approx_kl | 0.048928533 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 123030 | -| policy_gradient_loss | 0.0336 | -| std | 0.0178 | -| value_loss | 1.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12305 | -| time_elapsed | 66608 | -| total_timesteps | 1575040 | -| train/ | | -| approx_kl | 0.027135488 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 123040 | -| policy_gradient_loss | 0.0241 | -| std | 0.0178 | -| value_loss | 7.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12306 | -| time_elapsed | 66615 | -| total_timesteps | 1575168 | -| train/ | | -| approx_kl | 0.010272385 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.0625 | -| n_updates | 123050 | -| policy_gradient_loss | 0.0305 | -| std | 0.0178 | -| value_loss | 0.000414 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12307 | -| time_elapsed | 66620 | -| total_timesteps | 1575296 | -| train/ | | -| approx_kl | 0.001204384 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.00487 | -| n_updates | 123060 | -| policy_gradient_loss | 0.0125 | -| std | 0.0178 | -| value_loss | 1.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12308 | -| time_elapsed | 66623 | -| total_timesteps | 1575424 | -| train/ | | -| approx_kl | 0.020414665 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.00572 | -| learning_rate | 0.0003 | -| loss | 0.00521 | -| n_updates | 123070 | -| policy_gradient_loss | 0.000348 | -| std | 0.0177 | -| value_loss | 9.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12309 | -| time_elapsed | 66626 | -| total_timesteps | 1575552 | -| train/ | | -| approx_kl | 0.00567021 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.00999 | -| n_updates | 123080 | -| policy_gradient_loss | 0.00436 | -| std | 0.0177 | -| value_loss | 5.91e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12310 | -| time_elapsed | 66630 | -| total_timesteps | 1575680 | -| train/ | | -| approx_kl | 0.00015290407 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | -0.000602 | -| n_updates | 123090 | -| policy_gradient_loss | 9.38e-05 | -| std | 0.0177 | -| value_loss | 4.45e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12311 | -| time_elapsed | 66634 | -| total_timesteps | 1575808 | -| train/ | | -| approx_kl | 0.0032970626 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | 0.00554 | -| n_updates | 123100 | -| policy_gradient_loss | 0.0112 | -| std | 0.0177 | -| value_loss | 1.96e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12312 | -| time_elapsed | 66638 | -| total_timesteps | 1575936 | -| train/ | | -| approx_kl | 0.00023670355 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 123110 | -| policy_gradient_loss | 0.0116 | -| std | 0.0177 | -| value_loss | 1.48e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12313 | -| time_elapsed | 66642 | -| total_timesteps | 1576064 | -| train/ | | -| approx_kl | 0.011695849 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 123120 | -| policy_gradient_loss | 0.0141 | -| std | 0.0177 | -| value_loss | 1e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12314 | -| time_elapsed | 66649 | -| total_timesteps | 1576192 | -| train/ | | -| approx_kl | 0.2823793 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | 0.00293 | -| n_updates | 123130 | -| policy_gradient_loss | -0.00822 | -| std | 0.0177 | -| value_loss | 0.000538 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12315 | -| time_elapsed | 66653 | -| total_timesteps | 1576320 | -| train/ | | -| approx_kl | 0.048213884 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.34 | -| learning_rate | 0.0003 | -| loss | 0.00565 | -| n_updates | 123140 | -| policy_gradient_loss | -0.00561 | -| std | 0.0177 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12316 | -| time_elapsed | 66657 | -| total_timesteps | 1576448 | -| train/ | | -| approx_kl | 0.013696985 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 123150 | -| policy_gradient_loss | -0.000666 | -| std | 0.0177 | -| value_loss | 5.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12317 | -| time_elapsed | 66660 | -| total_timesteps | 1576576 | -| train/ | | -| approx_kl | 0.045043223 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.000311 | -| learning_rate | 0.0003 | -| loss | 0.00545 | -| n_updates | 123160 | -| policy_gradient_loss | -0.00169 | -| std | 0.0177 | -| value_loss | 1.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12318 | -| time_elapsed | 66663 | -| total_timesteps | 1576704 | -| train/ | | -| approx_kl | 0.011764732 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.00376 | -| learning_rate | 0.0003 | -| loss | 0.00273 | -| n_updates | 123170 | -| policy_gradient_loss | 0.00277 | -| std | 0.0177 | -| value_loss | 5.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12319 | -| time_elapsed | 66665 | -| total_timesteps | 1576832 | -| train/ | | -| approx_kl | 0.017651154 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 123180 | -| policy_gradient_loss | -0.00124 | -| std | 0.0177 | -| value_loss | 1.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12320 | -| time_elapsed | 66667 | -| total_timesteps | 1576960 | -| train/ | | -| approx_kl | 0.022758529 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.00333 | -| learning_rate | 0.0003 | -| loss | 0.0095 | -| n_updates | 123190 | -| policy_gradient_loss | 0.0038 | -| std | 0.0177 | -| value_loss | 3.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12321 | -| time_elapsed | 66669 | -| total_timesteps | 1577088 | -| train/ | | -| approx_kl | 0.011243101 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.00567 | -| n_updates | 123200 | -| policy_gradient_loss | -0.00236 | -| std | 0.0177 | -| value_loss | 2.24e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12322 | -| time_elapsed | 66676 | -| total_timesteps | 1577216 | -| train/ | | -| approx_kl | 0.14270696 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.397 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 123210 | -| policy_gradient_loss | -0.0156 | -| std | 0.0177 | -| value_loss | 0.00121 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12323 | -| time_elapsed | 66679 | -| total_timesteps | 1577344 | -| train/ | | -| approx_kl | 0.007850042 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -5.06 | -| learning_rate | 0.0003 | -| loss | -0.00358 | -| n_updates | 123220 | -| policy_gradient_loss | 0.00439 | -| std | 0.0177 | -| value_loss | 4.08e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12324 | -| time_elapsed | 66681 | -| total_timesteps | 1577472 | -| train/ | | -| approx_kl | 1.2298115e-05 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.000688 | -| n_updates | 123230 | -| policy_gradient_loss | 0.00138 | -| std | 0.0177 | -| value_loss | 7.05e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12325 | -| time_elapsed | 66684 | -| total_timesteps | 1577600 | -| train/ | | -| approx_kl | 0.008815774 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.875 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 123240 | -| policy_gradient_loss | 0.0255 | -| std | 0.0177 | -| value_loss | 7.71e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12326 | -| time_elapsed | 66687 | -| total_timesteps | 1577728 | -| train/ | | -| approx_kl | 0.01659483 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 123250 | -| policy_gradient_loss | 0.0297 | -| std | 0.0177 | -| value_loss | 4.73e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12327 | -| time_elapsed | 66690 | -| total_timesteps | 1577856 | -| train/ | | -| approx_kl | 0.027100721 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | 0.000716 | -| learning_rate | 0.0003 | -| loss | 0.00893 | -| n_updates | 123260 | -| policy_gradient_loss | -3.28e-05 | -| std | 0.0177 | -| value_loss | 2.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12328 | -| time_elapsed | 66694 | -| total_timesteps | 1577984 | -| train/ | | -| approx_kl | 0.008432028 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.00902 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 123270 | -| policy_gradient_loss | 0.0154 | -| std | 0.0177 | -| value_loss | 1.72e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12329 | -| time_elapsed | 66696 | -| total_timesteps | 1578112 | -| train/ | | -| approx_kl | 0.003245533 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.00907 | -| n_updates | 123280 | -| policy_gradient_loss | 0.014 | -| std | 0.0177 | -| value_loss | 1.36e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12330 | -| time_elapsed | 66703 | -| total_timesteps | 1578240 | -| train/ | | -| approx_kl | 0.3297334 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -14.6 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 123290 | -| policy_gradient_loss | -0.0149 | -| std | 0.0177 | -| value_loss | 0.00379 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12331 | -| time_elapsed | 66706 | -| total_timesteps | 1578368 | -| train/ | | -| approx_kl | 0.04321135 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 2.61 | -| explained_variance | -3.56 | -| learning_rate | 0.0003 | -| loss | 0.0413 | -| n_updates | 123300 | -| policy_gradient_loss | 0.01 | -| std | 0.0177 | -| value_loss | 0.000204 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12332 | -| time_elapsed | 66709 | -| total_timesteps | 1578496 | -| train/ | | -| approx_kl | 4.6654604e-05 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | 0.00144 | -| n_updates | 123310 | -| policy_gradient_loss | -0.00915 | -| std | 0.0177 | -| value_loss | 4.32e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12333 | -| time_elapsed | 66711 | -| total_timesteps | 1578624 | -| train/ | | -| approx_kl | 0.08198795 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | 0.0493 | -| n_updates | 123320 | -| policy_gradient_loss | 0.00668 | -| std | 0.0177 | -| value_loss | 4.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12334 | -| time_elapsed | 66714 | -| total_timesteps | 1578752 | -| train/ | | -| approx_kl | 0.020361878 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | 0.00383 | -| n_updates | 123330 | -| policy_gradient_loss | -0.000348 | -| std | 0.0177 | -| value_loss | 3.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12335 | -| time_elapsed | 66717 | -| total_timesteps | 1578880 | -| train/ | | -| approx_kl | 0.021298103 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.000483 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 123340 | -| policy_gradient_loss | 0.0124 | -| std | 0.0177 | -| value_loss | 1.74e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12336 | -| time_elapsed | 66720 | -| total_timesteps | 1579008 | -| train/ | | -| approx_kl | 0.0054916926 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.00387 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 123350 | -| policy_gradient_loss | -0.00154 | -| std | 0.0177 | -| value_loss | 1.41e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12337 | -| time_elapsed | 66727 | -| total_timesteps | 1579136 | -| train/ | | -| approx_kl | 0.010207877 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 123360 | -| policy_gradient_loss | 0.0122 | -| std | 0.0177 | -| value_loss | 0.000192 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12338 | -| time_elapsed | 66731 | -| total_timesteps | 1579264 | -| train/ | | -| approx_kl | 0.0058453525 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.02 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 123370 | -| policy_gradient_loss | -0.0125 | -| std | 0.0176 | -| value_loss | 0.00149 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12339 | -| time_elapsed | 66735 | -| total_timesteps | 1579392 | -| train/ | | -| approx_kl | 0.025501486 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0628 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 123380 | -| policy_gradient_loss | -0.0101 | -| std | 0.0176 | -| value_loss | 8.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12340 | -| time_elapsed | 66738 | -| total_timesteps | 1579520 | -| train/ | | -| approx_kl | 0.014705857 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0006 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 123390 | -| policy_gradient_loss | 0.00472 | -| std | 0.0176 | -| value_loss | 1.02e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12341 | -| time_elapsed | 66743 | -| total_timesteps | 1579648 | -| train/ | | -| approx_kl | 0.0192355 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 123400 | -| policy_gradient_loss | 0.00187 | -| std | 0.0176 | -| value_loss | 4.14e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12342 | -| time_elapsed | 66746 | -| total_timesteps | 1579776 | -| train/ | | -| approx_kl | 0.011587352 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 123410 | -| policy_gradient_loss | -0.00228 | -| std | 0.0176 | -| value_loss | 3.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 12343 | -| time_elapsed | 66748 | -| total_timesteps | 1579904 | -| train/ | | -| approx_kl | 0.02131331 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 123420 | -| policy_gradient_loss | -0.000916 | -| std | 0.0176 | -| value_loss | 1.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12344 | -| time_elapsed | 66751 | -| total_timesteps | 1580032 | -| train/ | | -| approx_kl | 0.028415639 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 123430 | -| policy_gradient_loss | -0.00585 | -| std | 0.0176 | -| value_loss | 1.27e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12345 | -| time_elapsed | 66757 | -| total_timesteps | 1580160 | -| train/ | | -| approx_kl | 0.27800342 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.707 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 123440 | -| policy_gradient_loss | -0.0151 | -| std | 0.0176 | -| value_loss | 0.00064 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12346 | -| time_elapsed | 66760 | -| total_timesteps | 1580288 | -| train/ | | -| approx_kl | 0.04252058 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 123450 | -| policy_gradient_loss | 0.00733 | -| std | 0.0176 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12347 | -| time_elapsed | 66764 | -| total_timesteps | 1580416 | -| train/ | | -| approx_kl | 0.009736279 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0777 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 123460 | -| policy_gradient_loss | 0.000639 | -| std | 0.0176 | -| value_loss | 7.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12348 | -| time_elapsed | 66768 | -| total_timesteps | 1580544 | -| train/ | | -| approx_kl | 0.01745711 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.000443 | -| learning_rate | 0.0003 | -| loss | 0.00625 | -| n_updates | 123470 | -| policy_gradient_loss | 0.00332 | -| std | 0.0176 | -| value_loss | 4.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12349 | -| time_elapsed | 66771 | -| total_timesteps | 1580672 | -| train/ | | -| approx_kl | 0.096364744 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.00767 | -| learning_rate | 0.0003 | -| loss | 0.0512 | -| n_updates | 123480 | -| policy_gradient_loss | 0.00998 | -| std | 0.0176 | -| value_loss | 3.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12350 | -| time_elapsed | 66775 | -| total_timesteps | 1580800 | -| train/ | | -| approx_kl | 0.000541497 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 123490 | -| policy_gradient_loss | -0.00138 | -| std | 0.0176 | -| value_loss | 3.47e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12351 | -| time_elapsed | 66779 | -| total_timesteps | 1580928 | -| train/ | | -| approx_kl | 0.00023596035 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | 0.00627 | -| n_updates | 123500 | -| policy_gradient_loss | -0.00351 | -| std | 0.0175 | -| value_loss | 1.2e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12352 | -| time_elapsed | 66783 | -| total_timesteps | 1581056 | -| train/ | | -| approx_kl | 0.0013508201 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.00262 | -| n_updates | 123510 | -| policy_gradient_loss | 0.0271 | -| std | 0.0175 | -| value_loss | 4.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12353 | -| time_elapsed | 66788 | -| total_timesteps | 1581184 | -| train/ | | -| approx_kl | 0.011900527 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 123520 | -| policy_gradient_loss | 0.035 | -| std | 0.0175 | -| value_loss | 0.00101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12354 | -| time_elapsed | 66792 | -| total_timesteps | 1581312 | -| train/ | | -| approx_kl | 0.017139753 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.00836 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 123530 | -| policy_gradient_loss | 0.013 | -| std | 0.0175 | -| value_loss | 0.000343 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12355 | -| time_elapsed | 66795 | -| total_timesteps | 1581440 | -| train/ | | -| approx_kl | 0.032103196 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.62 | -| explained_variance | 0.000226 | -| learning_rate | 0.0003 | -| loss | 0.00854 | -| n_updates | 123540 | -| policy_gradient_loss | -0.001 | -| std | 0.0175 | -| value_loss | 6.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12356 | -| time_elapsed | 66799 | -| total_timesteps | 1581568 | -| train/ | | -| approx_kl | 0.0065269256 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 123550 | -| policy_gradient_loss | 0.00531 | -| std | 0.0175 | -| value_loss | 1.54e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12357 | -| time_elapsed | 66803 | -| total_timesteps | 1581696 | -| train/ | | -| approx_kl | 1.8994324e-06 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.000128 | -| n_updates | 123560 | -| policy_gradient_loss | 0.0229 | -| std | 0.0175 | -| value_loss | 1.05e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12358 | -| time_elapsed | 66805 | -| total_timesteps | 1581824 | -| train/ | | -| approx_kl | 0.007074569 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 123570 | -| policy_gradient_loss | 0.0173 | -| std | 0.0175 | -| value_loss | 8.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12359 | -| time_elapsed | 66808 | -| total_timesteps | 1581952 | -| train/ | | -| approx_kl | 0.002274502 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 123580 | -| policy_gradient_loss | 0.00244 | -| std | 0.0175 | -| value_loss | 5.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12360 | -| time_elapsed | 66812 | -| total_timesteps | 1582080 | -| train/ | | -| approx_kl | 0.09362742 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.088 | -| n_updates | 123590 | -| policy_gradient_loss | 0.0428 | -| std | 0.0175 | -| value_loss | 4.08e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12361 | -| time_elapsed | 66820 | -| total_timesteps | 1582208 | -| train/ | | -| approx_kl | 0.010101995 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | 0.923 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 123600 | -| policy_gradient_loss | -0.00954 | -| std | 0.0175 | -| value_loss | 0.000647 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12362 | -| time_elapsed | 66824 | -| total_timesteps | 1582336 | -| train/ | | -| approx_kl | 0.006144115 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | -0.000229 | -| n_updates | 123610 | -| policy_gradient_loss | 0.0121 | -| std | 0.0175 | -| value_loss | 1e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12363 | -| time_elapsed | 66827 | -| total_timesteps | 1582464 | -| train/ | | -| approx_kl | 0.03916147 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.00783 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 123620 | -| policy_gradient_loss | 0.0042 | -| std | 0.0175 | -| value_loss | 1.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12364 | -| time_elapsed | 66830 | -| total_timesteps | 1582592 | -| train/ | | -| approx_kl | 0.036085203 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.00907 | -| n_updates | 123630 | -| policy_gradient_loss | 0.00206 | -| std | 0.0175 | -| value_loss | 1.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12365 | -| time_elapsed | 66834 | -| total_timesteps | 1582720 | -| train/ | | -| approx_kl | 0.041104287 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.00808 | -| n_updates | 123640 | -| policy_gradient_loss | -0.00911 | -| std | 0.0175 | -| value_loss | 1.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12366 | -| time_elapsed | 66838 | -| total_timesteps | 1582848 | -| train/ | | -| approx_kl | 0.0107647255 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.000563 | -| n_updates | 123650 | -| policy_gradient_loss | 0.0013 | -| std | 0.0175 | -| value_loss | 6.42e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 12367 | -| time_elapsed | 66842 | -| total_timesteps | 1582976 | -| train/ | | -| approx_kl | 0.03135435 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 123660 | -| policy_gradient_loss | -0.00783 | -| std | 0.0175 | -| value_loss | 7.05e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12368 | -| time_elapsed | 66845 | -| total_timesteps | 1583104 | -| train/ | | -| approx_kl | 0.0056953067 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 123670 | -| policy_gradient_loss | 0.00314 | -| std | 0.0174 | -| value_loss | 2.66e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12369 | -| time_elapsed | 66853 | -| total_timesteps | 1583232 | -| train/ | | -| approx_kl | 0.17642678 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 123680 | -| policy_gradient_loss | -0.0146 | -| std | 0.0174 | -| value_loss | 0.00168 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12370 | -| time_elapsed | 66857 | -| total_timesteps | 1583360 | -| train/ | | -| approx_kl | 0.044392373 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -4.76 | -| learning_rate | 0.0003 | -| loss | 0.00989 | -| n_updates | 123690 | -| policy_gradient_loss | 0.00218 | -| std | 0.0174 | -| value_loss | 3.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12371 | -| time_elapsed | 66860 | -| total_timesteps | 1583488 | -| train/ | | -| approx_kl | 0.013725635 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -2.75 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 123700 | -| policy_gradient_loss | -0.00058 | -| std | 0.0174 | -| value_loss | 2.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12372 | -| time_elapsed | 66863 | -| total_timesteps | 1583616 | -| train/ | | -| approx_kl | 0.060477234 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.296 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 123710 | -| policy_gradient_loss | 0.00417 | -| std | 0.0174 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12373 | -| time_elapsed | 66866 | -| total_timesteps | 1583744 | -| train/ | | -| approx_kl | 0.014226768 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.00542 | -| n_updates | 123720 | -| policy_gradient_loss | 0.0151 | -| std | 0.0174 | -| value_loss | 5.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 12374 | -| time_elapsed | 66869 | -| total_timesteps | 1583872 | -| train/ | | -| approx_kl | 0.036381822 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.000233 | -| n_updates | 123730 | -| policy_gradient_loss | -0.00309 | -| std | 0.0174 | -| value_loss | 1.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12375 | -| time_elapsed | 66873 | -| total_timesteps | 1584000 | -| train/ | | -| approx_kl | 0.01874764 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | 0.00307 | -| learning_rate | 0.0003 | -| loss | -0.000825 | -| n_updates | 123740 | -| policy_gradient_loss | 0.00708 | -| std | 0.0174 | -| value_loss | 5.26e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12376 | -| time_elapsed | 66876 | -| total_timesteps | 1584128 | -| train/ | | -| approx_kl | 0.009605296 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | 0.000704 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 123750 | -| policy_gradient_loss | -0.00734 | -| std | 0.0174 | -| value_loss | 2.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12377 | -| time_elapsed | 66885 | -| total_timesteps | 1584256 | -| train/ | | -| approx_kl | 0.27630195 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 123760 | -| policy_gradient_loss | -0.0154 | -| std | 0.0174 | -| value_loss | 0.000254 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12378 | -| time_elapsed | 66889 | -| total_timesteps | 1584384 | -| train/ | | -| approx_kl | 0.03296684 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.642 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 123770 | -| policy_gradient_loss | -0.0133 | -| std | 0.0174 | -| value_loss | 1.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12379 | -| time_elapsed | 66893 | -| total_timesteps | 1584512 | -| train/ | | -| approx_kl | 0.023033248 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.315 | -| learning_rate | 0.0003 | -| loss | 0.00351 | -| n_updates | 123780 | -| policy_gradient_loss | -0.00192 | -| std | 0.0174 | -| value_loss | 5.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12380 | -| time_elapsed | 66896 | -| total_timesteps | 1584640 | -| train/ | | -| approx_kl | 0.003198673 | -| clip_fraction | 0.0164 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 123790 | -| policy_gradient_loss | -0.000901 | -| std | 0.0174 | -| value_loss | 1.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12381 | -| time_elapsed | 66899 | -| total_timesteps | 1584768 | -| train/ | | -| approx_kl | 0.007901851 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -8.17e-05 | -| learning_rate | 0.0003 | -| loss | 3.57e-05 | -| n_updates | 123800 | -| policy_gradient_loss | -0.000127 | -| std | 0.0174 | -| value_loss | 9.73e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 12382 | -| time_elapsed | 66902 | -| total_timesteps | 1584896 | -| train/ | | -| approx_kl | 0.00053445203 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.63 | -| explained_variance | -0.00898 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 123810 | -| policy_gradient_loss | 0.0117 | -| std | 0.0174 | -| value_loss | 1.36e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12383 | -| time_elapsed | 66906 | -| total_timesteps | 1585024 | -| train/ | | -| approx_kl | 0.0015806318 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.000192 | -| learning_rate | 0.0003 | -| loss | 0.00771 | -| n_updates | 123820 | -| policy_gradient_loss | 0.0204 | -| std | 0.0173 | -| value_loss | 6.58e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12384 | -| time_elapsed | 66916 | -| total_timesteps | 1585152 | -| train/ | | -| approx_kl | 0.002337629 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 123830 | -| policy_gradient_loss | 0.000682 | -| std | 0.0173 | -| value_loss | 6.36e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12385 | -| time_elapsed | 66920 | -| total_timesteps | 1585280 | -| train/ | | -| approx_kl | 0.010498796 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 123840 | -| policy_gradient_loss | 0.00159 | -| std | 0.0173 | -| value_loss | 1.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12386 | -| time_elapsed | 66923 | -| total_timesteps | 1585408 | -| train/ | | -| approx_kl | 0.05125613 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | 0.00357 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 123850 | -| policy_gradient_loss | 0.00588 | -| std | 0.0173 | -| value_loss | 1.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12387 | -| time_elapsed | 66926 | -| total_timesteps | 1585536 | -| train/ | | -| approx_kl | 0.07493534 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 123860 | -| policy_gradient_loss | 0.000393 | -| std | 0.0173 | -| value_loss | 7.69e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12388 | -| time_elapsed | 66930 | -| total_timesteps | 1585664 | -| train/ | | -| approx_kl | 0.013744505 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 123870 | -| policy_gradient_loss | 0.0087 | -| std | 0.0173 | -| value_loss | 4.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12389 | -| time_elapsed | 66933 | -| total_timesteps | 1585792 | -| train/ | | -| approx_kl | 0.035493884 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.00465 | -| n_updates | 123880 | -| policy_gradient_loss | 0.00101 | -| std | 0.0173 | -| value_loss | 3.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12390 | -| time_elapsed | 66937 | -| total_timesteps | 1585920 | -| train/ | | -| approx_kl | 0.029301679 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 123890 | -| policy_gradient_loss | 0.00655 | -| std | 0.0173 | -| value_loss | 2.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12391 | -| time_elapsed | 66940 | -| total_timesteps | 1586048 | -| train/ | | -| approx_kl | 0.098305054 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0563 | -| n_updates | 123900 | -| policy_gradient_loss | 0.01 | -| std | 0.0173 | -| value_loss | 1.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12392 | -| time_elapsed | 66946 | -| total_timesteps | 1586176 | -| train/ | | -| approx_kl | 0.020484451 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 123910 | -| policy_gradient_loss | 0.00641 | -| std | 0.0173 | -| value_loss | 0.000155 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12393 | -| time_elapsed | 66948 | -| total_timesteps | 1586304 | -| train/ | | -| approx_kl | 0.040607207 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | 0.00243 | -| learning_rate | 0.0003 | -| loss | 0.00971 | -| n_updates | 123920 | -| policy_gradient_loss | 0.00123 | -| std | 0.0173 | -| value_loss | 9.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12394 | -| time_elapsed | 66952 | -| total_timesteps | 1586432 | -| train/ | | -| approx_kl | 0.01611141 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 123930 | -| policy_gradient_loss | 0.000869 | -| std | 0.0173 | -| value_loss | 1.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12395 | -| time_elapsed | 66956 | -| total_timesteps | 1586560 | -| train/ | | -| approx_kl | 0.023560941 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 123940 | -| policy_gradient_loss | -0.000878 | -| std | 0.0173 | -| value_loss | 1.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12396 | -| time_elapsed | 66959 | -| total_timesteps | 1586688 | -| train/ | | -| approx_kl | 0.026699014 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.00955 | -| n_updates | 123950 | -| policy_gradient_loss | 0.0141 | -| std | 0.0172 | -| value_loss | 7.73e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12397 | -| time_elapsed | 66962 | -| total_timesteps | 1586816 | -| train/ | | -| approx_kl | 0.0024398812 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.00327 | -| n_updates | 123960 | -| policy_gradient_loss | 0.000201 | -| std | 0.0172 | -| value_loss | 4.78e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12398 | -| time_elapsed | 66964 | -| total_timesteps | 1586944 | -| train/ | | -| approx_kl | 0.013959356 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.000942 | -| n_updates | 123970 | -| policy_gradient_loss | 0.00148 | -| std | 0.0172 | -| value_loss | 3.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12399 | -| time_elapsed | 66967 | -| total_timesteps | 1587072 | -| train/ | | -| approx_kl | 0.031270623 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.000707 | -| n_updates | 123980 | -| policy_gradient_loss | 0.00748 | -| std | 0.0172 | -| value_loss | 2.58e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12400 | -| time_elapsed | 66973 | -| total_timesteps | 1587200 | -| train/ | | -| approx_kl | 0.10272018 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -8.99 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 123990 | -| policy_gradient_loss | -0.0157 | -| std | 0.0172 | -| value_loss | 0.0023 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12401 | -| time_elapsed | 66976 | -| total_timesteps | 1587328 | -| train/ | | -| approx_kl | 0.05116685 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -33.6 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 124000 | -| policy_gradient_loss | -0.00454 | -| std | 0.0172 | -| value_loss | 9.16e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12402 | -| time_elapsed | 66980 | -| total_timesteps | 1587456 | -| train/ | | -| approx_kl | 0.0066593206 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.64 | -| explained_variance | -18.5 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 124010 | -| policy_gradient_loss | 0.000227 | -| std | 0.0172 | -| value_loss | 2.07e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12403 | -| time_elapsed | 66983 | -| total_timesteps | 1587584 | -| train/ | | -| approx_kl | 0.027738431 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | 0.00016 | -| n_updates | 124020 | -| policy_gradient_loss | -0.00047 | -| std | 0.0171 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12404 | -| time_elapsed | 66985 | -| total_timesteps | 1587712 | -| train/ | | -| approx_kl | 0.015125349 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.00665 | -| n_updates | 124030 | -| policy_gradient_loss | 0.00663 | -| std | 0.0171 | -| value_loss | 2.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12405 | -| time_elapsed | 66988 | -| total_timesteps | 1587840 | -| train/ | | -| approx_kl | 0.023374643 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.00598 | -| learning_rate | 0.0003 | -| loss | 0.0089 | -| n_updates | 124040 | -| policy_gradient_loss | 0.00418 | -| std | 0.0171 | -| value_loss | 3.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12406 | -| time_elapsed | 66992 | -| total_timesteps | 1587968 | -| train/ | | -| approx_kl | 0.004620866 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.00477 | -| learning_rate | 0.0003 | -| loss | 0.00651 | -| n_updates | 124050 | -| policy_gradient_loss | 0.000739 | -| std | 0.0171 | -| value_loss | 2.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12407 | -| time_elapsed | 66996 | -| total_timesteps | 1588096 | -| train/ | | -| approx_kl | 0.03721147 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 124060 | -| policy_gradient_loss | 0.00719 | -| std | 0.0171 | -| value_loss | 9.81e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12408 | -| time_elapsed | 67003 | -| total_timesteps | 1588224 | -| train/ | | -| approx_kl | 0.036032468 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 124070 | -| policy_gradient_loss | -0.00832 | -| std | 0.0171 | -| value_loss | 0.00162 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12409 | -| time_elapsed | 67008 | -| total_timesteps | 1588352 | -| train/ | | -| approx_kl | 0.013736533 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 124080 | -| policy_gradient_loss | -0.00515 | -| std | 0.0171 | -| value_loss | 5.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12410 | -| time_elapsed | 67010 | -| total_timesteps | 1588480 | -| train/ | | -| approx_kl | 0.06311194 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -5.71 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 124090 | -| policy_gradient_loss | 0.00424 | -| std | 0.0171 | -| value_loss | 5.53e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12411 | -| time_elapsed | 67014 | -| total_timesteps | 1588608 | -| train/ | | -| approx_kl | 0.00019068317 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 124100 | -| policy_gradient_loss | 0.00522 | -| std | 0.0171 | -| value_loss | 4.51e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12412 | -| time_elapsed | 67017 | -| total_timesteps | 1588736 | -| train/ | | -| approx_kl | 0.02644249 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.511 | -| learning_rate | 0.0003 | -| loss | -0.00345 | -| n_updates | 124110 | -| policy_gradient_loss | 0.00743 | -| std | 0.0171 | -| value_loss | 1.1e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12413 | -| time_elapsed | 67020 | -| total_timesteps | 1588864 | -| train/ | | -| approx_kl | 0.0077430685 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 124120 | -| policy_gradient_loss | -0.00823 | -| std | 0.0171 | -| value_loss | 6.93e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12414 | -| time_elapsed | 67024 | -| total_timesteps | 1588992 | -| train/ | | -| approx_kl | 0.010265827 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 124130 | -| policy_gradient_loss | -0.000654 | -| std | 0.0171 | -| value_loss | 3.98e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12415 | -| time_elapsed | 67028 | -| total_timesteps | 1589120 | -| train/ | | -| approx_kl | 0.017397495 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 124140 | -| policy_gradient_loss | 0.0153 | -| std | 0.0171 | -| value_loss | 6.75e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12416 | -| time_elapsed | 67037 | -| total_timesteps | 1589248 | -| train/ | | -| approx_kl | 0.24424118 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.398 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 124150 | -| policy_gradient_loss | -0.017 | -| std | 0.0171 | -| value_loss | 0.00116 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12417 | -| time_elapsed | 67040 | -| total_timesteps | 1589376 | -| train/ | | -| approx_kl | 0.0032390445 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.486 | -| learning_rate | 0.0003 | -| loss | 0.00518 | -| n_updates | 124160 | -| policy_gradient_loss | -0.00027 | -| std | 0.017 | -| value_loss | 1.09e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12418 | -| time_elapsed | 67044 | -| total_timesteps | 1589504 | -| train/ | | -| approx_kl | 0.035016604 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.0089 | -| n_updates | 124170 | -| policy_gradient_loss | 0.00166 | -| std | 0.017 | -| value_loss | 7.4e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12419 | -| time_elapsed | 67048 | -| total_timesteps | 1589632 | -| train/ | | -| approx_kl | 0.0062097223 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -3.86 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 124180 | -| policy_gradient_loss | -0.0147 | -| std | 0.017 | -| value_loss | 1.2e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12420 | -| time_elapsed | 67051 | -| total_timesteps | 1589760 | -| train/ | | -| approx_kl | 0.0021493798 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 124190 | -| policy_gradient_loss | 0.00107 | -| std | 0.017 | -| value_loss | 6.48e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12421 | -| time_elapsed | 67055 | -| total_timesteps | 1589888 | -| train/ | | -| approx_kl | 0.056728277 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | 0.000211 | -| n_updates | 124200 | -| policy_gradient_loss | -0.00604 | -| std | 0.017 | -| value_loss | 1.02e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12422 | -| time_elapsed | 67058 | -| total_timesteps | 1590016 | -| train/ | | -| approx_kl | 0.08768862 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 124210 | -| policy_gradient_loss | -0.000884 | -| std | 0.017 | -| value_loss | 1.62e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12423 | -| time_elapsed | 67065 | -| total_timesteps | 1590144 | -| train/ | | -| approx_kl | 0.0038244054 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 124220 | -| policy_gradient_loss | -0.0107 | -| std | 0.017 | -| value_loss | 0.00231 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12424 | -| time_elapsed | 67068 | -| total_timesteps | 1590272 | -| train/ | | -| approx_kl | 0.02350793 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | 0.221 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 124230 | -| policy_gradient_loss | 0.0189 | -| std | 0.017 | -| value_loss | 1.47e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12425 | -| time_elapsed | 67071 | -| total_timesteps | 1590400 | -| train/ | | -| approx_kl | 0.03214804 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -4.09 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 124240 | -| policy_gradient_loss | -0.00971 | -| std | 0.017 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12426 | -| time_elapsed | 67075 | -| total_timesteps | 1590528 | -| train/ | | -| approx_kl | 0.008843908 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -0.936 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 124250 | -| policy_gradient_loss | 0.0146 | -| std | 0.017 | -| value_loss | 2.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12427 | -| time_elapsed | 67079 | -| total_timesteps | 1590656 | -| train/ | | -| approx_kl | 0.003640932 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | 0.00256 | -| n_updates | 124260 | -| policy_gradient_loss | 0.0205 | -| std | 0.017 | -| value_loss | 1.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12428 | -| time_elapsed | 67084 | -| total_timesteps | 1590784 | -| train/ | | -| approx_kl | 0.014109578 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0996 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 124270 | -| policy_gradient_loss | 0.0236 | -| std | 0.017 | -| value_loss | 1.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12429 | -| time_elapsed | 67088 | -| total_timesteps | 1590912 | -| train/ | | -| approx_kl | 0.017539036 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 124280 | -| policy_gradient_loss | 0.0274 | -| std | 0.017 | -| value_loss | 8.44e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12430 | -| time_elapsed | 67091 | -| total_timesteps | 1591040 | -| train/ | | -| approx_kl | 0.0220423 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 124290 | -| policy_gradient_loss | 0.036 | -| std | 0.017 | -| value_loss | 4.54e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12431 | -| time_elapsed | 67098 | -| total_timesteps | 1591168 | -| train/ | | -| approx_kl | 0.038591646 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 124300 | -| policy_gradient_loss | 0.0113 | -| std | 0.017 | -| value_loss | 5.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12432 | -| time_elapsed | 67101 | -| total_timesteps | 1591296 | -| train/ | | -| approx_kl | 0.006742699 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.65 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 124310 | -| policy_gradient_loss | 0.00241 | -| std | 0.017 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12433 | -| time_elapsed | 67104 | -| total_timesteps | 1591424 | -| train/ | | -| approx_kl | 0.070052564 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | 0.00264 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 124320 | -| policy_gradient_loss | 0.00552 | -| std | 0.017 | -| value_loss | 7.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12434 | -| time_elapsed | 67108 | -| total_timesteps | 1591552 | -| train/ | | -| approx_kl | 0.015406352 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.000189 | -| n_updates | 124330 | -| policy_gradient_loss | 0.00166 | -| std | 0.017 | -| value_loss | 5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12435 | -| time_elapsed | 67111 | -| total_timesteps | 1591680 | -| train/ | | -| approx_kl | 0.022994213 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 124340 | -| policy_gradient_loss | -0.00804 | -| std | 0.017 | -| value_loss | 3.93e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12436 | -| time_elapsed | 67114 | -| total_timesteps | 1591808 | -| train/ | | -| approx_kl | 0.024853764 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.000408 | -| n_updates | 124350 | -| policy_gradient_loss | 0.00027 | -| std | 0.017 | -| value_loss | 2.75e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12437 | -| time_elapsed | 67118 | -| total_timesteps | 1591936 | -| train/ | | -| approx_kl | 5.4479577e-05 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 2.66 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.000705 | -| n_updates | 124360 | -| policy_gradient_loss | -0.000254 | -| std | 0.0169 | -| value_loss | 2.74e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12438 | -| time_elapsed | 67121 | -| total_timesteps | 1592064 | -| train/ | | -| approx_kl | 0.020965183 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 124370 | -| policy_gradient_loss | 0.00468 | -| std | 0.0168 | -| value_loss | 1.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12439 | -| time_elapsed | 67127 | -| total_timesteps | 1592192 | -| train/ | | -| approx_kl | 0.12801717 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | 0.805 | -| learning_rate | 0.0003 | -| loss | 0.0752 | -| n_updates | 124380 | -| policy_gradient_loss | 0.0388 | -| std | 0.0168 | -| value_loss | 0.00214 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12440 | -| time_elapsed | 67130 | -| total_timesteps | 1592320 | -| train/ | | -| approx_kl | 0.0051673106 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 124390 | -| policy_gradient_loss | -0.00462 | -| std | 0.0167 | -| value_loss | 4.42e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12441 | -| time_elapsed | 67134 | -| total_timesteps | 1592448 | -| train/ | | -| approx_kl | 0.14359728 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.00175 | -| learning_rate | 0.0003 | -| loss | 0.065 | -| n_updates | 124400 | -| policy_gradient_loss | 0.0128 | -| std | 0.0167 | -| value_loss | 5.62e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12442 | -| time_elapsed | 67138 | -| total_timesteps | 1592576 | -| train/ | | -| approx_kl | 0.0015764134 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 124410 | -| policy_gradient_loss | -4.34e-05 | -| std | 0.0167 | -| value_loss | 3.72e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12443 | -| time_elapsed | 67141 | -| total_timesteps | 1592704 | -| train/ | | -| approx_kl | 0.0002276511 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 124420 | -| policy_gradient_loss | 0.0112 | -| std | 0.0168 | -| value_loss | 2.25e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12444 | -| time_elapsed | 67144 | -| total_timesteps | 1592832 | -| train/ | | -| approx_kl | 0.002309952 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 124430 | -| policy_gradient_loss | 0.000293 | -| std | 0.0168 | -| value_loss | 2.62e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12445 | -| time_elapsed | 67148 | -| total_timesteps | 1592960 | -| train/ | | -| approx_kl | 0.0048417267 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | 0.00758 | -| n_updates | 124440 | -| policy_gradient_loss | 0.0114 | -| std | 0.0167 | -| value_loss | 6.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12446 | -| time_elapsed | 67152 | -| total_timesteps | 1593088 | -| train/ | | -| approx_kl | 0.004599582 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 124450 | -| policy_gradient_loss | 0.000957 | -| std | 0.0167 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12447 | -| time_elapsed | 67158 | -| total_timesteps | 1593216 | -| train/ | | -| approx_kl | 0.009778447 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 124460 | -| policy_gradient_loss | 0.0119 | -| std | 0.0167 | -| value_loss | 0.00113 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12448 | -| time_elapsed | 67161 | -| total_timesteps | 1593344 | -| train/ | | -| approx_kl | 0.00019642338 | -| clip_fraction | 0.032 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | 0.00747 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 124470 | -| policy_gradient_loss | -0.000198 | -| std | 0.0167 | -| value_loss | 1.91e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12449 | -| time_elapsed | 67163 | -| total_timesteps | 1593472 | -| train/ | | -| approx_kl | 0.00010096561 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 2.67 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | -0.000153 | -| n_updates | 124480 | -| policy_gradient_loss | 0.000123 | -| std | 0.0167 | -| value_loss | 6.65e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12450 | -| time_elapsed | 67167 | -| total_timesteps | 1593600 | -| train/ | | -| approx_kl | 9.0426765e-06 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | -0.000201 | -| n_updates | 124490 | -| policy_gradient_loss | -0.00044 | -| std | 0.0167 | -| value_loss | 1.81e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12451 | -| time_elapsed | 67170 | -| total_timesteps | 1593728 | -| train/ | | -| approx_kl | 2.8960872e-05 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.00197 | -| learning_rate | 0.0003 | -| loss | -0.000887 | -| n_updates | 124500 | -| policy_gradient_loss | -0.00364 | -| std | 0.0167 | -| value_loss | 2.91e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12452 | -| time_elapsed | 67173 | -| total_timesteps | 1593856 | -| train/ | | -| approx_kl | 2.313964e-05 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | -0.000967 | -| n_updates | 124510 | -| policy_gradient_loss | -0.0056 | -| std | 0.0167 | -| value_loss | 2.18e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12453 | -| time_elapsed | 67177 | -| total_timesteps | 1593984 | -| train/ | | -| approx_kl | 0.0004002112 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 124520 | -| policy_gradient_loss | -0.0113 | -| std | 0.0167 | -| value_loss | 1.28e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12454 | -| time_elapsed | 67181 | -| total_timesteps | 1594112 | -| train/ | | -| approx_kl | 0.07469831 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.0294 | -| n_updates | 124530 | -| policy_gradient_loss | -0.0295 | -| std | 0.0167 | -| value_loss | 8.53e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12455 | -| time_elapsed | 67190 | -| total_timesteps | 1594240 | -| train/ | | -| approx_kl | 0.004750145 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 124540 | -| policy_gradient_loss | -0.00765 | -| std | 0.0167 | -| value_loss | 0.000921 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12456 | -| time_elapsed | 67194 | -| total_timesteps | 1594368 | -| train/ | | -| approx_kl | 0.0028242827 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.00519 | -| learning_rate | 0.0003 | -| loss | 6.71e-05 | -| n_updates | 124550 | -| policy_gradient_loss | 0.000677 | -| std | 0.0167 | -| value_loss | 8.88e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12457 | -| time_elapsed | 67198 | -| total_timesteps | 1594496 | -| train/ | | -| approx_kl | 0.01155895 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.00661 | -| learning_rate | 0.0003 | -| loss | 0.00261 | -| n_updates | 124560 | -| policy_gradient_loss | 0.00305 | -| std | 0.0166 | -| value_loss | 0.00238 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12458 | -| time_elapsed | 67201 | -| total_timesteps | 1594624 | -| train/ | | -| approx_kl | 0.030026443 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.0399 | -| n_updates | 124570 | -| policy_gradient_loss | -0.0247 | -| std | 0.0166 | -| value_loss | 6.91e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12459 | -| time_elapsed | 67204 | -| total_timesteps | 1594752 | -| train/ | | -| approx_kl | 0.020387061 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | 0.000243 | -| n_updates | 124580 | -| policy_gradient_loss | -0.00267 | -| std | 0.0166 | -| value_loss | 2.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12460 | -| time_elapsed | 67207 | -| total_timesteps | 1594880 | -| train/ | | -| approx_kl | 0.009319829 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 124590 | -| policy_gradient_loss | -0.00414 | -| std | 0.0166 | -| value_loss | 1.44e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12461 | -| time_elapsed | 67210 | -| total_timesteps | 1595008 | -| train/ | | -| approx_kl | 0.038052652 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 124600 | -| policy_gradient_loss | 0.0144 | -| std | 0.0166 | -| value_loss | 1.19e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12462 | -| time_elapsed | 67219 | -| total_timesteps | 1595136 | -| train/ | | -| approx_kl | 0.0031166598 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 124610 | -| policy_gradient_loss | 0.0144 | -| std | 0.0166 | -| value_loss | 0.00157 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12463 | -| time_elapsed | 67222 | -| total_timesteps | 1595264 | -| train/ | | -| approx_kl | 0.024627129 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0096 | -| n_updates | 124620 | -| policy_gradient_loss | 0.000971 | -| std | 0.0166 | -| value_loss | 0.000751 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12464 | -| time_elapsed | 67226 | -| total_timesteps | 1595392 | -| train/ | | -| approx_kl | 0.0048420574 | -| clip_fraction | 0.0367 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.00563 | -| learning_rate | 0.0003 | -| loss | 0.000382 | -| n_updates | 124630 | -| policy_gradient_loss | 0.000652 | -| std | 0.0166 | -| value_loss | 1.45e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12465 | -| time_elapsed | 67231 | -| total_timesteps | 1595520 | -| train/ | | -| approx_kl | 0.0089814095 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.000343 | -| n_updates | 124640 | -| policy_gradient_loss | -1.38e-06 | -| std | 0.0166 | -| value_loss | 6.14e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12466 | -| time_elapsed | 67235 | -| total_timesteps | 1595648 | -| train/ | | -| approx_kl | 0.0073430194 | -| clip_fraction | 0.0594 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.000114 | -| n_updates | 124650 | -| policy_gradient_loss | -4.15e-05 | -| std | 0.0166 | -| value_loss | 5.83e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12467 | -| time_elapsed | 67239 | -| total_timesteps | 1595776 | -| train/ | | -| approx_kl | 0.0029876856 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.00817 | -| n_updates | 124660 | -| policy_gradient_loss | 0.0115 | -| std | 0.0166 | -| value_loss | 7.34e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12468 | -| time_elapsed | 67243 | -| total_timesteps | 1595904 | -| train/ | | -| approx_kl | 0.00024188915 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -24.8 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 124670 | -| policy_gradient_loss | -0.00401 | -| std | 0.0166 | -| value_loss | 4.69e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12469 | -| time_elapsed | 67246 | -| total_timesteps | 1596032 | -| train/ | | -| approx_kl | 0.019524299 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 124680 | -| policy_gradient_loss | 0.00279 | -| std | 0.0166 | -| value_loss | 1.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12470 | -| time_elapsed | 67254 | -| total_timesteps | 1596160 | -| train/ | | -| approx_kl | 0.010007361 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.776 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 124690 | -| policy_gradient_loss | -0.00535 | -| std | 0.0166 | -| value_loss | 0.004 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12471 | -| time_elapsed | 67258 | -| total_timesteps | 1596288 | -| train/ | | -| approx_kl | 0.0018806243 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 124700 | -| policy_gradient_loss | 0.00841 | -| std | 0.0165 | -| value_loss | 1.03e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12472 | -| time_elapsed | 67260 | -| total_timesteps | 1596416 | -| train/ | | -| approx_kl | 0.0004737121 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.00485 | -| n_updates | 124710 | -| policy_gradient_loss | 0.0046 | -| std | 0.0165 | -| value_loss | 1.54e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12473 | -| time_elapsed | 67263 | -| total_timesteps | 1596544 | -| train/ | | -| approx_kl | 0.07455684 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0833 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 124720 | -| policy_gradient_loss | -0.0122 | -| std | 0.0165 | -| value_loss | 7.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12474 | -| time_elapsed | 67266 | -| total_timesteps | 1596672 | -| train/ | | -| approx_kl | 0.018087005 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.00589 | -| n_updates | 124730 | -| policy_gradient_loss | 0.00369 | -| std | 0.0165 | -| value_loss | 3.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12475 | -| time_elapsed | 67268 | -| total_timesteps | 1596800 | -| train/ | | -| approx_kl | 0.019786945 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | -0.0309 | -| n_updates | 124740 | -| policy_gradient_loss | -0.0169 | -| std | 0.0165 | -| value_loss | 2.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 12476 | -| time_elapsed | 67271 | -| total_timesteps | 1596928 | -| train/ | | -| approx_kl | 0.022500696 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 124750 | -| policy_gradient_loss | -0.00494 | -| std | 0.0165 | -| value_loss | 1.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12477 | -| time_elapsed | 67276 | -| total_timesteps | 1597056 | -| train/ | | -| approx_kl | 0.056889653 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 124760 | -| policy_gradient_loss | 0.0127 | -| std | 0.0165 | -| value_loss | 8.5e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12478 | -| time_elapsed | 67280 | -| total_timesteps | 1597184 | -| train/ | | -| approx_kl | 0.03600344 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0297 | -| n_updates | 124770 | -| policy_gradient_loss | -0.0171 | -| std | 0.0165 | -| value_loss | 6.57e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12479 | -| time_elapsed | 67282 | -| total_timesteps | 1597312 | -| train/ | | -| approx_kl | 0.022789668 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.68 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 124780 | -| policy_gradient_loss | -0.0187 | -| std | 0.0165 | -| value_loss | 2.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12480 | -| time_elapsed | 67286 | -| total_timesteps | 1597440 | -| train/ | | -| approx_kl | 0.050403118 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00929 | -| n_updates | 124790 | -| policy_gradient_loss | 0.0075 | -| std | 0.0165 | -| value_loss | 5.36e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12481 | -| time_elapsed | 67289 | -| total_timesteps | 1597568 | -| train/ | | -| approx_kl | 0.0051095174 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 124800 | -| policy_gradient_loss | -0.0132 | -| std | 0.0165 | -| value_loss | 4.19e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12482 | -| time_elapsed | 67292 | -| total_timesteps | 1597696 | -| train/ | | -| approx_kl | 0.00034995424 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.000133 | -| n_updates | 124810 | -| policy_gradient_loss | 9.76e-05 | -| std | 0.0165 | -| value_loss | 3.81e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12483 | -| time_elapsed | 67295 | -| total_timesteps | 1597824 | -| train/ | | -| approx_kl | 0.00019056769 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.00492 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 124820 | -| policy_gradient_loss | -0.0026 | -| std | 0.0165 | -| value_loss | 1.34e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 12484 | -| time_elapsed | 67298 | -| total_timesteps | 1597952 | -| train/ | | -| approx_kl | 0.015631286 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.00194 | -| learning_rate | 0.0003 | -| loss | 0.00538 | -| n_updates | 124830 | -| policy_gradient_loss | 0.0167 | -| std | 0.0164 | -| value_loss | 2e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12485 | -| time_elapsed | 67302 | -| total_timesteps | 1598080 | -| train/ | | -| approx_kl | 0.0037037875 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 124840 | -| policy_gradient_loss | -0.00466 | -| std | 0.0164 | -| value_loss | 1.87e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12486 | -| time_elapsed | 67309 | -| total_timesteps | 1598208 | -| train/ | | -| approx_kl | 0.1561359 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.418 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 124850 | -| policy_gradient_loss | -0.016 | -| std | 0.0164 | -| value_loss | 0.000915 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12487 | -| time_elapsed | 67312 | -| total_timesteps | 1598336 | -| train/ | | -| approx_kl | 0.115179345 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -158 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 124860 | -| policy_gradient_loss | -0.00883 | -| std | 0.0164 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12488 | -| time_elapsed | 67315 | -| total_timesteps | 1598464 | -| train/ | | -| approx_kl | 0.001026107 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -155 | -| learning_rate | 0.0003 | -| loss | -0.0076 | -| n_updates | 124870 | -| policy_gradient_loss | -0.00901 | -| std | 0.0164 | -| value_loss | 5.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12489 | -| time_elapsed | 67318 | -| total_timesteps | 1598592 | -| train/ | | -| approx_kl | 0.005352277 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -23.3 | -| learning_rate | 0.0003 | -| loss | 0.00429 | -| n_updates | 124880 | -| policy_gradient_loss | 0.00115 | -| std | 0.0164 | -| value_loss | 7.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12490 | -| time_elapsed | 67322 | -| total_timesteps | 1598720 | -| train/ | | -| approx_kl | 0.023164235 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -3.71 | -| learning_rate | 0.0003 | -| loss | 0.00441 | -| n_updates | 124890 | -| policy_gradient_loss | 0.0111 | -| std | 0.0164 | -| value_loss | 1.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12491 | -| time_elapsed | 67325 | -| total_timesteps | 1598848 | -| train/ | | -| approx_kl | 0.044698298 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.487 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 124900 | -| policy_gradient_loss | 0.00769 | -| std | 0.0164 | -| value_loss | 5.85e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12492 | -| time_elapsed | 67329 | -| total_timesteps | 1598976 | -| train/ | | -| approx_kl | 0.0071217474 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 124910 | -| policy_gradient_loss | 0.0107 | -| std | 0.0164 | -| value_loss | 3.54e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12493 | -| time_elapsed | 67333 | -| total_timesteps | 1599104 | -| train/ | | -| approx_kl | 0.0018053637 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.00155 | -| learning_rate | 0.0003 | -| loss | 0.00372 | -| n_updates | 124920 | -| policy_gradient_loss | -0.00135 | -| std | 0.0164 | -| value_loss | 2.55e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12494 | -| time_elapsed | 67342 | -| total_timesteps | 1599232 | -| train/ | | -| approx_kl | 0.009951232 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 124930 | -| policy_gradient_loss | 0.0321 | -| std | 0.0164 | -| value_loss | 0.000204 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12495 | -| time_elapsed | 67346 | -| total_timesteps | 1599360 | -| train/ | | -| approx_kl | 0.022043897 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.00669 | -| n_updates | 124940 | -| policy_gradient_loss | 0.013 | -| std | 0.0164 | -| value_loss | 5.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12496 | -| time_elapsed | 67348 | -| total_timesteps | 1599488 | -| train/ | | -| approx_kl | 0.044707526 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 124950 | -| policy_gradient_loss | 0.0106 | -| std | 0.0164 | -| value_loss | 1.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12497 | -| time_elapsed | 67350 | -| total_timesteps | 1599616 | -| train/ | | -| approx_kl | 0.026976755 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 124960 | -| policy_gradient_loss | 0.00012 | -| std | 0.0164 | -| value_loss | 1.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12498 | -| time_elapsed | 67354 | -| total_timesteps | 1599744 | -| train/ | | -| approx_kl | 0.015543742 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 124970 | -| policy_gradient_loss | -0.00102 | -| std | 0.0164 | -| value_loss | 7.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12499 | -| time_elapsed | 67358 | -| total_timesteps | 1599872 | -| train/ | | -| approx_kl | 0.019222569 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 124980 | -| policy_gradient_loss | 0.019 | -| std | 0.0164 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12500 | -| time_elapsed | 67362 | -| total_timesteps | 1600000 | -| train/ | | -| approx_kl | 0.019880185 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 124990 | -| policy_gradient_loss | 0.0244 | -| std | 0.0164 | -| value_loss | 4.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12501 | -| time_elapsed | 67367 | -| total_timesteps | 1600128 | -| train/ | | -| approx_kl | 0.02417599 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.00133 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 125000 | -| policy_gradient_loss | 0.0388 | -| std | 0.0164 | -| value_loss | 2.49e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12502 | -| time_elapsed | 67374 | -| total_timesteps | 1600256 | -| train/ | | -| approx_kl | 0.13796623 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 125010 | -| policy_gradient_loss | -0.0148 | -| std | 0.0164 | -| value_loss | 8.56e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12503 | -| time_elapsed | 67377 | -| total_timesteps | 1600384 | -| train/ | | -| approx_kl | 0.04109429 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | 0.00143 | -| learning_rate | 0.0003 | -| loss | 0.00691 | -| n_updates | 125020 | -| policy_gradient_loss | 0.00285 | -| std | 0.0164 | -| value_loss | 2.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12504 | -| time_elapsed | 67380 | -| total_timesteps | 1600512 | -| train/ | | -| approx_kl | 0.023982763 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.00744 | -| learning_rate | 0.0003 | -| loss | 0.00396 | -| n_updates | 125030 | -| policy_gradient_loss | 0.0104 | -| std | 0.0164 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12505 | -| time_elapsed | 67383 | -| total_timesteps | 1600640 | -| train/ | | -| approx_kl | 0.045309145 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.00161 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 125040 | -| policy_gradient_loss | 0.0119 | -| std | 0.0164 | -| value_loss | 6.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12506 | -| time_elapsed | 67386 | -| total_timesteps | 1600768 | -| train/ | | -| approx_kl | 0.027629932 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.00749 | -| n_updates | 125050 | -| policy_gradient_loss | 0.0186 | -| std | 0.0164 | -| value_loss | 5.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 12507 | -| time_elapsed | 67390 | -| total_timesteps | 1600896 | -| train/ | | -| approx_kl | 0.00414169 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.00948 | -| learning_rate | 0.0003 | -| loss | -0.000529 | -| n_updates | 125060 | -| policy_gradient_loss | 0.00424 | -| std | 0.0164 | -| value_loss | 2.73e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12508 | -| time_elapsed | 67394 | -| total_timesteps | 1601024 | -| train/ | | -| approx_kl | 0.0046537486 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.69 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 125070 | -| policy_gradient_loss | 0.0132 | -| std | 0.0163 | -| value_loss | 1.67e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12509 | -| time_elapsed | 67402 | -| total_timesteps | 1601152 | -| train/ | | -| approx_kl | 0.04709179 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.857 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 125080 | -| policy_gradient_loss | -0.0139 | -| std | 0.0163 | -| value_loss | 0.00151 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12510 | -| time_elapsed | 67406 | -| total_timesteps | 1601280 | -| train/ | | -| approx_kl | 0.13943216 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.0444 | -| learning_rate | 0.0003 | -| loss | 0.0781 | -| n_updates | 125090 | -| policy_gradient_loss | 0.0151 | -| std | 0.0163 | -| value_loss | 1.57e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12511 | -| time_elapsed | 67409 | -| total_timesteps | 1601408 | -| train/ | | -| approx_kl | 9.8936725e-05 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -10.7 | -| learning_rate | 0.0003 | -| loss | -0.000812 | -| n_updates | 125100 | -| policy_gradient_loss | 0.00576 | -| std | 0.0163 | -| value_loss | 1.97e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12512 | -| time_elapsed | 67413 | -| total_timesteps | 1601536 | -| train/ | | -| approx_kl | 0.0009784047 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 125110 | -| policy_gradient_loss | 0.018 | -| std | 0.0163 | -| value_loss | 4.18e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12513 | -| time_elapsed | 67416 | -| total_timesteps | 1601664 | -| train/ | | -| approx_kl | 0.01157525 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 125120 | -| policy_gradient_loss | 0.0178 | -| std | 0.0163 | -| value_loss | 2.72e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12514 | -| time_elapsed | 67419 | -| total_timesteps | 1601792 | -| train/ | | -| approx_kl | 0.018894162 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 125130 | -| policy_gradient_loss | 0.0304 | -| std | 0.0163 | -| value_loss | 1.96e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12515 | -| time_elapsed | 67423 | -| total_timesteps | 1601920 | -| train/ | | -| approx_kl | 0.0052400106 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 125140 | -| policy_gradient_loss | 0.00304 | -| std | 0.0163 | -| value_loss | 6.92e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12516 | -| time_elapsed | 67426 | -| total_timesteps | 1602048 | -| train/ | | -| approx_kl | 0.015652977 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 125150 | -| policy_gradient_loss | 0.00459 | -| std | 0.0163 | -| value_loss | 9.84e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12517 | -| time_elapsed | 67433 | -| total_timesteps | 1602176 | -| train/ | | -| approx_kl | 0.03660491 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 125160 | -| policy_gradient_loss | 0.00611 | -| std | 0.0163 | -| value_loss | 9.86e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12518 | -| time_elapsed | 67437 | -| total_timesteps | 1602304 | -| train/ | | -| approx_kl | 0.007559899 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.00488 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 125170 | -| policy_gradient_loss | -0.00898 | -| std | 0.0163 | -| value_loss | 2.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12519 | -| time_elapsed | 67441 | -| total_timesteps | 1602432 | -| train/ | | -| approx_kl | 0.050135504 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 125180 | -| policy_gradient_loss | 0.00229 | -| std | 0.0163 | -| value_loss | 8.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12520 | -| time_elapsed | 67445 | -| total_timesteps | 1602560 | -| train/ | | -| approx_kl | 0.012464486 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | -0.006 | -| n_updates | 125190 | -| policy_gradient_loss | -2.52e-06 | -| std | 0.0163 | -| value_loss | 6.55e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12521 | -| time_elapsed | 67449 | -| total_timesteps | 1602688 | -| train/ | | -| approx_kl | 0.0065738717 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.000351 | -| n_updates | 125200 | -| policy_gradient_loss | 0.00336 | -| std | 0.0163 | -| value_loss | 3.82e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12522 | -| time_elapsed | 67452 | -| total_timesteps | 1602816 | -| train/ | | -| approx_kl | 0.041383408 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 125210 | -| policy_gradient_loss | 0.00462 | -| std | 0.0163 | -| value_loss | 2.91e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12523 | -| time_elapsed | 67455 | -| total_timesteps | 1602944 | -| train/ | | -| approx_kl | 0.0050492976 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 125220 | -| policy_gradient_loss | 0.0049 | -| std | 0.0163 | -| value_loss | 3.12e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12524 | -| time_elapsed | 67459 | -| total_timesteps | 1603072 | -| train/ | | -| approx_kl | 0.01975831 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0075 | -| learning_rate | 0.0003 | -| loss | 0.00263 | -| n_updates | 125230 | -| policy_gradient_loss | 0.011 | -| std | 0.0163 | -| value_loss | 1.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12525 | -| time_elapsed | 67465 | -| total_timesteps | 1603200 | -| train/ | | -| approx_kl | 0.033770356 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 125240 | -| policy_gradient_loss | -0.0159 | -| std | 0.0163 | -| value_loss | 0.000496 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12526 | -| time_elapsed | 67470 | -| total_timesteps | 1603328 | -| train/ | | -| approx_kl | 0.028377108 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -2.26 | -| learning_rate | 0.0003 | -| loss | 0.00714 | -| n_updates | 125250 | -| policy_gradient_loss | 0.00353 | -| std | 0.0163 | -| value_loss | 5.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12527 | -| time_elapsed | 67473 | -| total_timesteps | 1603456 | -| train/ | | -| approx_kl | 0.04795631 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | 0.0506 | -| n_updates | 125260 | -| policy_gradient_loss | 0.00721 | -| std | 0.0163 | -| value_loss | 1.82e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12528 | -| time_elapsed | 67477 | -| total_timesteps | 1603584 | -| train/ | | -| approx_kl | 0.0070471135 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0764 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 125270 | -| policy_gradient_loss | 0.000375 | -| std | 0.0163 | -| value_loss | 4.82e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12529 | -| time_elapsed | 67481 | -| total_timesteps | 1603712 | -| train/ | | -| approx_kl | 0.016427293 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.453 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 125280 | -| policy_gradient_loss | 0.0257 | -| std | 0.0162 | -| value_loss | 1.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12530 | -| time_elapsed | 67485 | -| total_timesteps | 1603840 | -| train/ | | -| approx_kl | 0.046101585 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.272 | -| learning_rate | 0.0003 | -| loss | 0.00823 | -| n_updates | 125290 | -| policy_gradient_loss | -0.00426 | -| std | 0.0162 | -| value_loss | 8.43e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12531 | -| time_elapsed | 67489 | -| total_timesteps | 1603968 | -| train/ | | -| approx_kl | 0.00023344532 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.000943 | -| n_updates | 125300 | -| policy_gradient_loss | -0.000628 | -| std | 0.0162 | -| value_loss | 5.15e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12532 | -| time_elapsed | 67491 | -| total_timesteps | 1604096 | -| train/ | | -| approx_kl | 4.6705827e-07 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 8.67e-05 | -| n_updates | 125310 | -| policy_gradient_loss | 0.00137 | -| std | 0.0162 | -| value_loss | 8.82e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12533 | -| time_elapsed | 67499 | -| total_timesteps | 1604224 | -| train/ | | -| approx_kl | 0.0020380886 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 125320 | -| policy_gradient_loss | -0.00361 | -| std | 0.0162 | -| value_loss | 0.00539 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12534 | -| time_elapsed | 67503 | -| total_timesteps | 1604352 | -| train/ | | -| approx_kl | 0.07405722 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | 0.00905 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 125330 | -| policy_gradient_loss | 0.0068 | -| std | 0.0162 | -| value_loss | 1.13e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12535 | -| time_elapsed | 67506 | -| total_timesteps | 1604480 | -| train/ | | -| approx_kl | 8.752756e-05 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.0858 | -| learning_rate | 0.0003 | -| loss | 9.08e-05 | -| n_updates | 125340 | -| policy_gradient_loss | 0.000299 | -| std | 0.0162 | -| value_loss | 2.42e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12536 | -| time_elapsed | 67510 | -| total_timesteps | 1604608 | -| train/ | | -| approx_kl | 0.009860702 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.7 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 125350 | -| policy_gradient_loss | 0.0098 | -| std | 0.0162 | -| value_loss | 3.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12537 | -| time_elapsed | 67514 | -| total_timesteps | 1604736 | -| train/ | | -| approx_kl | 0.035577927 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.00337 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 125360 | -| policy_gradient_loss | 0.00728 | -| std | 0.0162 | -| value_loss | 5.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12538 | -| time_elapsed | 67517 | -| total_timesteps | 1604864 | -| train/ | | -| approx_kl | 0.035110444 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 125370 | -| policy_gradient_loss | 0.00315 | -| std | 0.0162 | -| value_loss | 3.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12539 | -| time_elapsed | 67520 | -| total_timesteps | 1604992 | -| train/ | | -| approx_kl | 0.10896626 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 125380 | -| policy_gradient_loss | 0.0109 | -| std | 0.0162 | -| value_loss | 2.86e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12540 | -| time_elapsed | 67523 | -| total_timesteps | 1605120 | -| train/ | | -| approx_kl | 0.021545056 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.000943 | -| n_updates | 125390 | -| policy_gradient_loss | 0.00629 | -| std | 0.0161 | -| value_loss | 1.88e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12541 | -| time_elapsed | 67532 | -| total_timesteps | 1605248 | -| train/ | | -| approx_kl | 0.1081846 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | 0.629 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 125400 | -| policy_gradient_loss | -0.0101 | -| std | 0.0161 | -| value_loss | 0.000726 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12542 | -| time_elapsed | 67536 | -| total_timesteps | 1605376 | -| train/ | | -| approx_kl | 0.02410457 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 125410 | -| policy_gradient_loss | 0.0353 | -| std | 0.0161 | -| value_loss | 4.42e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12543 | -| time_elapsed | 67539 | -| total_timesteps | 1605504 | -| train/ | | -| approx_kl | 0.0051757293 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.0621 | -| learning_rate | 0.0003 | -| loss | -3.55e-05 | -| n_updates | 125420 | -| policy_gradient_loss | 0.00378 | -| std | 0.0161 | -| value_loss | 1.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12544 | -| time_elapsed | 67541 | -| total_timesteps | 1605632 | -| train/ | | -| approx_kl | 0.008744201 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.00199 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 125430 | -| policy_gradient_loss | 0.00285 | -| std | 0.0161 | -| value_loss | 7.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12545 | -| time_elapsed | 67545 | -| total_timesteps | 1605760 | -| train/ | | -| approx_kl | 0.047026556 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.00528 | -| learning_rate | 0.0003 | -| loss | -0.00888 | -| n_updates | 125440 | -| policy_gradient_loss | -0.00971 | -| std | 0.0161 | -| value_loss | 6.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12546 | -| time_elapsed | 67547 | -| total_timesteps | 1605888 | -| train/ | | -| approx_kl | 0.012033547 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.00831 | -| learning_rate | 0.0003 | -| loss | 8.62e-06 | -| n_updates | 125450 | -| policy_gradient_loss | 0.00198 | -| std | 0.0161 | -| value_loss | 3.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12547 | -| time_elapsed | 67548 | -| total_timesteps | 1606016 | -| train/ | | -| approx_kl | 0.024788082 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 125460 | -| policy_gradient_loss | -0.000547 | -| std | 0.0161 | -| value_loss | 2.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12548 | -| time_elapsed | 67557 | -| total_timesteps | 1606144 | -| train/ | | -| approx_kl | 0.050126188 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 125470 | -| policy_gradient_loss | 0.00775 | -| std | 0.0161 | -| value_loss | 0.000992 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12549 | -| time_elapsed | 67561 | -| total_timesteps | 1606272 | -| train/ | | -| approx_kl | 2.9252376e-05 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | 0.169 | -| learning_rate | 0.0003 | -| loss | 0.000151 | -| n_updates | 125480 | -| policy_gradient_loss | 0.0249 | -| std | 0.0161 | -| value_loss | 8.97e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12550 | -| time_elapsed | 67564 | -| total_timesteps | 1606400 | -| train/ | | -| approx_kl | 0.019867783 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.735 | -| learning_rate | 0.0003 | -| loss | 0.00921 | -| n_updates | 125490 | -| policy_gradient_loss | 0.00156 | -| std | 0.0161 | -| value_loss | 3.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12551 | -| time_elapsed | 67568 | -| total_timesteps | 1606528 | -| train/ | | -| approx_kl | 0.02223654 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.295 | -| learning_rate | 0.0003 | -| loss | 0.00975 | -| n_updates | 125500 | -| policy_gradient_loss | 0.00186 | -| std | 0.0161 | -| value_loss | 2.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12552 | -| time_elapsed | 67572 | -| total_timesteps | 1606656 | -| train/ | | -| approx_kl | 0.0032788287 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 2.71 | -| explained_variance | -0.0708 | -| learning_rate | 0.0003 | -| loss | 0.00046 | -| n_updates | 125510 | -| policy_gradient_loss | 0.000974 | -| std | 0.016 | -| value_loss | 1.75e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12553 | -| time_elapsed | 67573 | -| total_timesteps | 1606784 | -| train/ | | -| approx_kl | 0.012759272 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.00623 | -| learning_rate | 0.0003 | -| loss | -0.00566 | -| n_updates | 125520 | -| policy_gradient_loss | -0.00356 | -| std | 0.016 | -| value_loss | 3.48e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12554 | -| time_elapsed | 67576 | -| total_timesteps | 1606912 | -| train/ | | -| approx_kl | 0.10562701 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -5.17 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 125530 | -| policy_gradient_loss | -0.0111 | -| std | 0.0159 | -| value_loss | 1.78e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12555 | -| time_elapsed | 67580 | -| total_timesteps | 1607040 | -| train/ | | -| approx_kl | 0.012935241 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 125540 | -| policy_gradient_loss | 0.0143 | -| std | 0.0159 | -| value_loss | 1.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12556 | -| time_elapsed | 67588 | -| total_timesteps | 1607168 | -| train/ | | -| approx_kl | 0.014552106 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | 0.00663 | -| n_updates | 125550 | -| policy_gradient_loss | 0.00341 | -| std | 0.0159 | -| value_loss | 0.00307 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12557 | -| time_elapsed | 67592 | -| total_timesteps | 1607296 | -| train/ | | -| approx_kl | 0.0061782603 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.00133 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 125560 | -| policy_gradient_loss | 0.00128 | -| std | 0.0159 | -| value_loss | 6.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12558 | -| time_elapsed | 67595 | -| total_timesteps | 1607424 | -| train/ | | -| approx_kl | 0.014870411 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.268 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 125570 | -| policy_gradient_loss | 0.0256 | -| std | 0.0159 | -| value_loss | 1.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12559 | -| time_elapsed | 67599 | -| total_timesteps | 1607552 | -| train/ | | -| approx_kl | 0.017662626 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.271 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 125580 | -| policy_gradient_loss | 0.0191 | -| std | 0.0159 | -| value_loss | 2.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12560 | -| time_elapsed | 67602 | -| total_timesteps | 1607680 | -| train/ | | -| approx_kl | 0.026586408 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 125590 | -| policy_gradient_loss | 0.0357 | -| std | 0.0159 | -| value_loss | 2.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12561 | -| time_elapsed | 67605 | -| total_timesteps | 1607808 | -| train/ | | -| approx_kl | 0.039638765 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 7.26e-05 | -| n_updates | 125600 | -| policy_gradient_loss | -0.00383 | -| std | 0.0159 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 12562 | -| time_elapsed | 67606 | -| total_timesteps | 1607936 | -| train/ | | -| approx_kl | 0.009679118 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 125610 | -| policy_gradient_loss | 0.018 | -| std | 0.0159 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12563 | -| time_elapsed | 67610 | -| total_timesteps | 1608064 | -| train/ | | -| approx_kl | 0.005396219 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 125620 | -| policy_gradient_loss | 0.000607 | -| std | 0.0159 | -| value_loss | 4.81e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12564 | -| time_elapsed | 67616 | -| total_timesteps | 1608192 | -| train/ | | -| approx_kl | 0.1683063 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -0.549 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 125630 | -| policy_gradient_loss | -0.0143 | -| std | 0.0159 | -| value_loss | 0.00169 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12565 | -| time_elapsed | 67620 | -| total_timesteps | 1608320 | -| train/ | | -| approx_kl | 0.002146671 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -6.71e+03 | -| learning_rate | 0.0003 | -| loss | -0.0043 | -| n_updates | 125640 | -| policy_gradient_loss | -0.00464 | -| std | 0.0159 | -| value_loss | 8.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12566 | -| time_elapsed | 67622 | -| total_timesteps | 1608448 | -| train/ | | -| approx_kl | 0.041383296 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -595 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 125650 | -| policy_gradient_loss | -0.00101 | -| std | 0.0159 | -| value_loss | 6.01e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12567 | -| time_elapsed | 67625 | -| total_timesteps | 1608576 | -| train/ | | -| approx_kl | 0.0006599743 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 2.72 | -| explained_variance | -112 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 125660 | -| policy_gradient_loss | -0.000903 | -| std | 0.0158 | -| value_loss | 6.97e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12568 | -| time_elapsed | 67629 | -| total_timesteps | 1608704 | -| train/ | | -| approx_kl | 0.004681298 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -6.56 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 125670 | -| policy_gradient_loss | -0.0184 | -| std | 0.0158 | -| value_loss | 6.88e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12569 | -| time_elapsed | 67632 | -| total_timesteps | 1608832 | -| train/ | | -| approx_kl | 0.0020205374 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -0.536 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 125680 | -| policy_gradient_loss | 0.00162 | -| std | 0.0157 | -| value_loss | 2.47e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 12570 | -| time_elapsed | 67636 | -| total_timesteps | 1608960 | -| train/ | | -| approx_kl | 0.048164356 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.00815 | -| n_updates | 125690 | -| policy_gradient_loss | -0.00115 | -| std | 0.0157 | -| value_loss | 3.03e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12571 | -| time_elapsed | 67639 | -| total_timesteps | 1609088 | -| train/ | | -| approx_kl | 0.01132351 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 125700 | -| policy_gradient_loss | 2.9e-05 | -| std | 0.0157 | -| value_loss | 1.36e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12572 | -| time_elapsed | 67646 | -| total_timesteps | 1609216 | -| train/ | | -| approx_kl | 0.10406846 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -2.67 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 125710 | -| policy_gradient_loss | -0.0156 | -| std | 0.0157 | -| value_loss | 0.00217 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12573 | -| time_elapsed | 67649 | -| total_timesteps | 1609344 | -| train/ | | -| approx_kl | 0.0022878936 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 125720 | -| policy_gradient_loss | -0.00197 | -| std | 0.0157 | -| value_loss | 1.11e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12574 | -| time_elapsed | 67652 | -| total_timesteps | 1609472 | -| train/ | | -| approx_kl | 0.09495476 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.656 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 125730 | -| policy_gradient_loss | 0.0013 | -| std | 0.0157 | -| value_loss | 0.000193 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12575 | -| time_elapsed | 67655 | -| total_timesteps | 1609600 | -| train/ | | -| approx_kl | 0.018422466 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.0076 | -| learning_rate | 0.0003 | -| loss | -0.00753 | -| n_updates | 125740 | -| policy_gradient_loss | -0.00381 | -| std | 0.0156 | -| value_loss | 4.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12576 | -| time_elapsed | 67659 | -| total_timesteps | 1609728 | -| train/ | | -| approx_kl | 0.047060788 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 125750 | -| policy_gradient_loss | 0.00451 | -| std | 0.0156 | -| value_loss | 5.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12577 | -| time_elapsed | 67662 | -| total_timesteps | 1609856 | -| train/ | | -| approx_kl | 0.012744714 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 125760 | -| policy_gradient_loss | -0.00483 | -| std | 0.0156 | -| value_loss | 2.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12578 | -| time_elapsed | 67666 | -| total_timesteps | 1609984 | -| train/ | | -| approx_kl | 0.036044884 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.00295 | -| learning_rate | 0.0003 | -| loss | 0.00452 | -| n_updates | 125770 | -| policy_gradient_loss | 0.0109 | -| std | 0.0156 | -| value_loss | 3.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12579 | -| time_elapsed | 67670 | -| total_timesteps | 1610112 | -| train/ | | -| approx_kl | 0.04267863 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 125780 | -| policy_gradient_loss | 0.00583 | -| std | 0.0156 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12580 | -| time_elapsed | 67678 | -| total_timesteps | 1610240 | -| train/ | | -| approx_kl | 0.0031323126 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.934 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 125790 | -| policy_gradient_loss | -0.00458 | -| std | 0.0156 | -| value_loss | 0.000564 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12581 | -| time_elapsed | 67682 | -| total_timesteps | 1610368 | -| train/ | | -| approx_kl | 0.03065319 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 125800 | -| policy_gradient_loss | 0.00367 | -| std | 0.0156 | -| value_loss | 0.00317 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12582 | -| time_elapsed | 67685 | -| total_timesteps | 1610496 | -| train/ | | -| approx_kl | 0.025655111 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 125810 | -| policy_gradient_loss | -0.0035 | -| std | 0.0156 | -| value_loss | 0.000152 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12583 | -| time_elapsed | 67688 | -| total_timesteps | 1610624 | -| train/ | | -| approx_kl | 0.065360464 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.00396 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 125820 | -| policy_gradient_loss | -0.00917 | -| std | 0.0156 | -| value_loss | 4.96e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12584 | -| time_elapsed | 67691 | -| total_timesteps | 1610752 | -| train/ | | -| approx_kl | 0.04412365 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 125830 | -| policy_gradient_loss | 0.00943 | -| std | 0.0156 | -| value_loss | 3.24e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12585 | -| time_elapsed | 67694 | -| total_timesteps | 1610880 | -| train/ | | -| approx_kl | 0.05310183 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 125840 | -| policy_gradient_loss | 0.0127 | -| std | 0.0156 | -| value_loss | 2.04e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12586 | -| time_elapsed | 67697 | -| total_timesteps | 1611008 | -| train/ | | -| approx_kl | 0.05699424 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 125850 | -| policy_gradient_loss | 0.00298 | -| std | 0.0156 | -| value_loss | 1.44e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12587 | -| time_elapsed | 67706 | -| total_timesteps | 1611136 | -| train/ | | -| approx_kl | 0.04189721 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 125860 | -| policy_gradient_loss | -0.00994 | -| std | 0.0156 | -| value_loss | 0.000461 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12588 | -| time_elapsed | 67708 | -| total_timesteps | 1611264 | -| train/ | | -| approx_kl | 0.05758959 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | 0.0499 | -| n_updates | 125870 | -| policy_gradient_loss | 0.00895 | -| std | 0.0156 | -| value_loss | 1.56e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12589 | -| time_elapsed | 67712 | -| total_timesteps | 1611392 | -| train/ | | -| approx_kl | 0.075188175 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 125880 | -| policy_gradient_loss | 0.00705 | -| std | 0.0156 | -| value_loss | 1.75e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12590 | -| time_elapsed | 67716 | -| total_timesteps | 1611520 | -| train/ | | -| approx_kl | 0.0053309384 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.00834 | -| n_updates | 125890 | -| policy_gradient_loss | 0.00802 | -| std | 0.0156 | -| value_loss | 1.25e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12591 | -| time_elapsed | 67720 | -| total_timesteps | 1611648 | -| train/ | | -| approx_kl | 0.012497235 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 125900 | -| policy_gradient_loss | 0.00779 | -| std | 0.0156 | -| value_loss | 8.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12592 | -| time_elapsed | 67724 | -| total_timesteps | 1611776 | -| train/ | | -| approx_kl | 0.019973613 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.00472 | -| n_updates | 125910 | -| policy_gradient_loss | 0.00082 | -| std | 0.0156 | -| value_loss | 6.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12593 | -| time_elapsed | 67728 | -| total_timesteps | 1611904 | -| train/ | | -| approx_kl | 0.026819404 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.00281 | -| learning_rate | 0.0003 | -| loss | 0.00481 | -| n_updates | 125920 | -| policy_gradient_loss | 0.0128 | -| std | 0.0156 | -| value_loss | 6.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12594 | -| time_elapsed | 67732 | -| total_timesteps | 1612032 | -| train/ | | -| approx_kl | 0.053876173 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.00516 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 125930 | -| policy_gradient_loss | -0.0198 | -| std | 0.0157 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12595 | -| time_elapsed | 67740 | -| total_timesteps | 1612160 | -| train/ | | -| approx_kl | 0.0054201335 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 125940 | -| policy_gradient_loss | -0.0052 | -| std | 0.0157 | -| value_loss | 0.00153 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12596 | -| time_elapsed | 67743 | -| total_timesteps | 1612288 | -| train/ | | -| approx_kl | 0.011506643 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.426 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 125950 | -| policy_gradient_loss | -0.000297 | -| std | 0.0157 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12597 | -| time_elapsed | 67747 | -| total_timesteps | 1612416 | -| train/ | | -| approx_kl | 0.012782585 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -4.36 | -| learning_rate | 0.0003 | -| loss | -0.00749 | -| n_updates | 125960 | -| policy_gradient_loss | -0.00032 | -| std | 0.0157 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12598 | -| time_elapsed | 67751 | -| total_timesteps | 1612544 | -| train/ | | -| approx_kl | 0.050405804 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.539 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 125970 | -| policy_gradient_loss | 0.00176 | -| std | 0.0157 | -| value_loss | 2.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12599 | -| time_elapsed | 67754 | -| total_timesteps | 1612672 | -| train/ | | -| approx_kl | 0.010114076 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.00703 | -| n_updates | 125980 | -| policy_gradient_loss | 0.00225 | -| std | 0.0157 | -| value_loss | 3.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12600 | -| time_elapsed | 67757 | -| total_timesteps | 1612800 | -| train/ | | -| approx_kl | 0.027518708 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.00957 | -| n_updates | 125990 | -| policy_gradient_loss | 0.0078 | -| std | 0.0157 | -| value_loss | 1.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 12601 | -| time_elapsed | 67760 | -| total_timesteps | 1612928 | -| train/ | | -| approx_kl | 0.028344372 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 126000 | -| policy_gradient_loss | 0.00947 | -| std | 0.0157 | -| value_loss | 3.57e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12602 | -| time_elapsed | 67764 | -| total_timesteps | 1613056 | -| train/ | | -| approx_kl | 0.048785377 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 126010 | -| policy_gradient_loss | 0.00504 | -| std | 0.0157 | -| value_loss | 2.72e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12603 | -| time_elapsed | 67770 | -| total_timesteps | 1613184 | -| train/ | | -| approx_kl | 0.1400422 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.386 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 126020 | -| policy_gradient_loss | -0.0145 | -| std | 0.0157 | -| value_loss | 0.000974 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12604 | -| time_elapsed | 67773 | -| total_timesteps | 1613312 | -| train/ | | -| approx_kl | 0.0035460666 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -3.85 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 126030 | -| policy_gradient_loss | 0.0139 | -| std | 0.0157 | -| value_loss | 5.83e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12605 | -| time_elapsed | 67777 | -| total_timesteps | 1613440 | -| train/ | | -| approx_kl | 4.9093273e-05 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -4.93 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 126040 | -| policy_gradient_loss | 0.00117 | -| std | 0.0157 | -| value_loss | 2.79e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12606 | -| time_elapsed | 67780 | -| total_timesteps | 1613568 | -| train/ | | -| approx_kl | 0.0026662517 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.624 | -| learning_rate | 0.0003 | -| loss | -0.000448 | -| n_updates | 126050 | -| policy_gradient_loss | 0.00322 | -| std | 0.0157 | -| value_loss | 1.3e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12607 | -| time_elapsed | 67784 | -| total_timesteps | 1613696 | -| train/ | | -| approx_kl | 0.009206578 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 126060 | -| policy_gradient_loss | 0.0142 | -| std | 0.0157 | -| value_loss | 2.39e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12608 | -| time_elapsed | 67787 | -| total_timesteps | 1613824 | -| train/ | | -| approx_kl | 0.0046316637 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -0.00974 | -| learning_rate | 0.0003 | -| loss | 0.00997 | -| n_updates | 126070 | -| policy_gradient_loss | 0.029 | -| std | 0.0157 | -| value_loss | 1.14e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12609 | -| time_elapsed | 67791 | -| total_timesteps | 1613952 | -| train/ | | -| approx_kl | 0.0011653141 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 2.73 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.000456 | -| n_updates | 126080 | -| policy_gradient_loss | 0.00239 | -| std | 0.0157 | -| value_loss | 1.13e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12610 | -| time_elapsed | 67795 | -| total_timesteps | 1614080 | -| train/ | | -| approx_kl | 0.010241879 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.00954 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 126090 | -| policy_gradient_loss | 0.00483 | -| std | 0.0157 | -| value_loss | 9.55e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12611 | -| time_elapsed | 67801 | -| total_timesteps | 1614208 | -| train/ | | -| approx_kl | 0.07220058 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.767 | -| learning_rate | 0.0003 | -| loss | 0.00612 | -| n_updates | 126100 | -| policy_gradient_loss | 0.00113 | -| std | 0.0156 | -| value_loss | 0.00422 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12612 | -| time_elapsed | 67805 | -| total_timesteps | 1614336 | -| train/ | | -| approx_kl | 0.03272684 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.000301 | -| n_updates | 126110 | -| policy_gradient_loss | -0.00542 | -| std | 0.0156 | -| value_loss | 4.48e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12613 | -| time_elapsed | 67809 | -| total_timesteps | 1614464 | -| train/ | | -| approx_kl | 0.0008210805 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | -0.000504 | -| n_updates | 126120 | -| policy_gradient_loss | 0.00024 | -| std | 0.0156 | -| value_loss | 1.38e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12614 | -| time_elapsed | 67811 | -| total_timesteps | 1614592 | -| train/ | | -| approx_kl | 0.00039331755 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00532 | -| n_updates | 126130 | -| policy_gradient_loss | 0.00163 | -| std | 0.0156 | -| value_loss | 2.37e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12615 | -| time_elapsed | 67814 | -| total_timesteps | 1614720 | -| train/ | | -| approx_kl | 0.0024739774 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.00916 | -| n_updates | 126140 | -| policy_gradient_loss | 0.0113 | -| std | 0.0156 | -| value_loss | 8.29e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12616 | -| time_elapsed | 67816 | -| total_timesteps | 1614848 | -| train/ | | -| approx_kl | 0.0013574501 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 126150 | -| policy_gradient_loss | 0.00246 | -| std | 0.0156 | -| value_loss | 4.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12617 | -| time_elapsed | 67819 | -| total_timesteps | 1614976 | -| train/ | | -| approx_kl | 0.006832921 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 126160 | -| policy_gradient_loss | 0.00568 | -| std | 0.0156 | -| value_loss | 3.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12618 | -| time_elapsed | 67822 | -| total_timesteps | 1615104 | -| train/ | | -| approx_kl | 0.004772033 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 126170 | -| policy_gradient_loss | 0.0158 | -| std | 0.0156 | -| value_loss | 1.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12619 | -| time_elapsed | 67831 | -| total_timesteps | 1615232 | -| train/ | | -| approx_kl | 0.07021471 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.942 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 126180 | -| policy_gradient_loss | -0.00996 | -| std | 0.0156 | -| value_loss | 0.000551 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12620 | -| time_elapsed | 67835 | -| total_timesteps | 1615360 | -| train/ | | -| approx_kl | 0.005293447 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 126190 | -| policy_gradient_loss | -0.00322 | -| std | 0.0156 | -| value_loss | 4.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12621 | -| time_elapsed | 67839 | -| total_timesteps | 1615488 | -| train/ | | -| approx_kl | 0.010234741 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.00954 | -| n_updates | 126200 | -| policy_gradient_loss | -0.00503 | -| std | 0.0155 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12622 | -| time_elapsed | 67842 | -| total_timesteps | 1615616 | -| train/ | | -| approx_kl | 0.0005695014 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.00695 | -| n_updates | 126210 | -| policy_gradient_loss | -0.000951 | -| std | 0.0155 | -| value_loss | 9.48e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12623 | -| time_elapsed | 67845 | -| total_timesteps | 1615744 | -| train/ | | -| approx_kl | 0.0011133016 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0858 | -| learning_rate | 0.0003 | -| loss | 0.00648 | -| n_updates | 126220 | -| policy_gradient_loss | 0.0104 | -| std | 0.0155 | -| value_loss | 4.08e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 12624 | -| time_elapsed | 67850 | -| total_timesteps | 1615872 | -| train/ | | -| approx_kl | 0.01165443 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | 0.00503 | -| n_updates | 126230 | -| policy_gradient_loss | 0.00201 | -| std | 0.0154 | -| value_loss | 1.08e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12625 | -| time_elapsed | 67853 | -| total_timesteps | 1616000 | -| train/ | | -| approx_kl | 0.009767412 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 126240 | -| policy_gradient_loss | 0.00219 | -| std | 0.0154 | -| value_loss | 2.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12626 | -| time_elapsed | 67857 | -| total_timesteps | 1616128 | -| train/ | | -| approx_kl | 0.023847697 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 126250 | -| policy_gradient_loss | 0.00741 | -| std | 0.0153 | -| value_loss | 6.01e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12627 | -| time_elapsed | 67865 | -| total_timesteps | 1616256 | -| train/ | | -| approx_kl | 0.1701027 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.949 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 126260 | -| policy_gradient_loss | -0.0157 | -| std | 0.0153 | -| value_loss | 0.00048 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12628 | -| time_elapsed | 67868 | -| total_timesteps | 1616384 | -| train/ | | -| approx_kl | 0.057730135 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 126270 | -| policy_gradient_loss | -0.00383 | -| std | 0.0153 | -| value_loss | 1.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12629 | -| time_elapsed | 67871 | -| total_timesteps | 1616512 | -| train/ | | -| approx_kl | 0.035858497 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 126280 | -| policy_gradient_loss | -0.00799 | -| std | 0.0153 | -| value_loss | 6.19e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12630 | -| time_elapsed | 67874 | -| total_timesteps | 1616640 | -| train/ | | -| approx_kl | 0.03414885 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 126290 | -| policy_gradient_loss | 0.00296 | -| std | 0.0153 | -| value_loss | 2.55e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12631 | -| time_elapsed | 67877 | -| total_timesteps | 1616768 | -| train/ | | -| approx_kl | 0.064238265 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 126300 | -| policy_gradient_loss | 0.00861 | -| std | 0.0153 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 12632 | -| time_elapsed | 67881 | -| total_timesteps | 1616896 | -| train/ | | -| approx_kl | 0.016641539 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.056 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 126310 | -| policy_gradient_loss | -0.00969 | -| std | 0.0153 | -| value_loss | 1.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12633 | -| time_elapsed | 67885 | -| total_timesteps | 1617024 | -| train/ | | -| approx_kl | 0.0009552515 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | 0.00159 | -| n_updates | 126320 | -| policy_gradient_loss | 0.0199 | -| std | 0.0153 | -| value_loss | 2.44e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12634 | -| time_elapsed | 67894 | -| total_timesteps | 1617152 | -| train/ | | -| approx_kl | 0.28836358 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 126330 | -| policy_gradient_loss | 0.0109 | -| std | 0.0153 | -| value_loss | 2.94e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12635 | -| time_elapsed | 67897 | -| total_timesteps | 1617280 | -| train/ | | -| approx_kl | 0.028136302 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 126340 | -| policy_gradient_loss | 0.0317 | -| std | 0.0153 | -| value_loss | 8.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12636 | -| time_elapsed | 67900 | -| total_timesteps | 1617408 | -| train/ | | -| approx_kl | 0.019076044 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.00953 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 126350 | -| policy_gradient_loss | 0.0232 | -| std | 0.0153 | -| value_loss | 9.06e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12637 | -| time_elapsed | 67904 | -| total_timesteps | 1617536 | -| train/ | | -| approx_kl | 0.0059303637 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 126360 | -| policy_gradient_loss | 0.00245 | -| std | 0.0153 | -| value_loss | 5.34e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12638 | -| time_elapsed | 67907 | -| total_timesteps | 1617664 | -| train/ | | -| approx_kl | 0.05075039 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.0388 | -| n_updates | 126370 | -| policy_gradient_loss | 0.0142 | -| std | 0.0153 | -| value_loss | 4.09e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12639 | -| time_elapsed | 67911 | -| total_timesteps | 1617792 | -| train/ | | -| approx_kl | 0.017080035 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 126380 | -| policy_gradient_loss | -0.00657 | -| std | 0.0153 | -| value_loss | 1.9e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 12640 | -| time_elapsed | 67914 | -| total_timesteps | 1617920 | -| train/ | | -| approx_kl | 0.0062086163 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.00018 | -| n_updates | 126390 | -| policy_gradient_loss | 0.000324 | -| std | 0.0153 | -| value_loss | 8.96e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12641 | -| time_elapsed | 67918 | -| total_timesteps | 1618048 | -| train/ | | -| approx_kl | 0.011443155 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.00904 | -| learning_rate | 0.0003 | -| loss | -0.00403 | -| n_updates | 126400 | -| policy_gradient_loss | -0.00228 | -| std | 0.0153 | -| value_loss | 5.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12642 | -| time_elapsed | 67924 | -| total_timesteps | 1618176 | -| train/ | | -| approx_kl | 0.042725567 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.778 | -| learning_rate | 0.0003 | -| loss | 0.000996 | -| n_updates | 126410 | -| policy_gradient_loss | -0.00864 | -| std | 0.0153 | -| value_loss | 0.0057 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12643 | -| time_elapsed | 67928 | -| total_timesteps | 1618304 | -| train/ | | -| approx_kl | 0.0010368736 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | 0.00573 | -| n_updates | 126420 | -| policy_gradient_loss | -0.00329 | -| std | 0.0153 | -| value_loss | 0.0137 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12644 | -| time_elapsed | 67931 | -| total_timesteps | 1618432 | -| train/ | | -| approx_kl | 0.028393049 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 126430 | -| policy_gradient_loss | 0.0132 | -| std | 0.0153 | -| value_loss | 0.00428 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12645 | -| time_elapsed | 67934 | -| total_timesteps | 1618560 | -| train/ | | -| approx_kl | 0.006464982 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.00182 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 126440 | -| policy_gradient_loss | 0.000191 | -| std | 0.0153 | -| value_loss | 0.018 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12646 | -| time_elapsed | 67938 | -| total_timesteps | 1618688 | -| train/ | | -| approx_kl | 0.040795654 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.00545 | -| learning_rate | 0.0003 | -| loss | -0.00769 | -| n_updates | 126450 | -| policy_gradient_loss | -0.0107 | -| std | 0.0153 | -| value_loss | 0.00156 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12647 | -| time_elapsed | 67941 | -| total_timesteps | 1618816 | -| train/ | | -| approx_kl | 0.006200751 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.00906 | -| n_updates | 126460 | -| policy_gradient_loss | -0.000125 | -| std | 0.0153 | -| value_loss | 0.000181 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12648 | -| time_elapsed | 67945 | -| total_timesteps | 1618944 | -| train/ | | -| approx_kl | 0.024801988 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.00717 | -| n_updates | 126470 | -| policy_gradient_loss | -0.00223 | -| std | 0.0153 | -| value_loss | 0.00018 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12649 | -| time_elapsed | 67948 | -| total_timesteps | 1619072 | -| train/ | | -| approx_kl | 0.032122247 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.000833 | -| n_updates | 126480 | -| policy_gradient_loss | 0.000601 | -| std | 0.0153 | -| value_loss | 0.000173 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12650 | -| time_elapsed | 67954 | -| total_timesteps | 1619200 | -| train/ | | -| approx_kl | 0.18590693 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.39 | -| learning_rate | 0.0003 | -| loss | 0.00279 | -| n_updates | 126490 | -| policy_gradient_loss | -0.0101 | -| std | 0.0153 | -| value_loss | 0.00193 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12651 | -| time_elapsed | 67959 | -| total_timesteps | 1619328 | -| train/ | | -| approx_kl | 0.018573176 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 126500 | -| policy_gradient_loss | 0.00848 | -| std | 0.0153 | -| value_loss | 6.02e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12652 | -| time_elapsed | 67963 | -| total_timesteps | 1619456 | -| train/ | | -| approx_kl | 0.001005949 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 126510 | -| policy_gradient_loss | 0.00375 | -| std | 0.0154 | -| value_loss | 3.62e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12653 | -| time_elapsed | 67966 | -| total_timesteps | 1619584 | -| train/ | | -| approx_kl | 0.0076417592 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 126520 | -| policy_gradient_loss | 0.00697 | -| std | 0.0155 | -| value_loss | 0.000144 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12654 | -| time_elapsed | 67970 | -| total_timesteps | 1619712 | -| train/ | | -| approx_kl | 0.022217315 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.00142 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 126530 | -| policy_gradient_loss | 0.00726 | -| std | 0.0155 | -| value_loss | 6.72e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12655 | -| time_elapsed | 67973 | -| total_timesteps | 1619840 | -| train/ | | -| approx_kl | 0.0057965433 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0064 | -| learning_rate | 0.0003 | -| loss | 0.00953 | -| n_updates | 126540 | -| policy_gradient_loss | -0.000148 | -| std | 0.0155 | -| value_loss | 5.23e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 12656 | -| time_elapsed | 67977 | -| total_timesteps | 1619968 | -| train/ | | -| approx_kl | 0.064556204 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.00972 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 126550 | -| policy_gradient_loss | 0.00039 | -| std | 0.0155 | -| value_loss | 3.41e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12657 | -| time_elapsed | 67981 | -| total_timesteps | 1620096 | -| train/ | | -| approx_kl | 5.480228e-05 | -| clip_fraction | 0.0266 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.000574 | -| n_updates | 126560 | -| policy_gradient_loss | -0.00184 | -| std | 0.0155 | -| value_loss | 2.03e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12658 | -| time_elapsed | 67988 | -| total_timesteps | 1620224 | -| train/ | | -| approx_kl | 0.13142876 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.751 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 126570 | -| policy_gradient_loss | -0.0188 | -| std | 0.0155 | -| value_loss | 0.00077 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12659 | -| time_elapsed | 67990 | -| total_timesteps | 1620352 | -| train/ | | -| approx_kl | 0.037984513 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00663 | -| n_updates | 126580 | -| policy_gradient_loss | 0.0112 | -| std | 0.0155 | -| value_loss | 7.19e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12660 | -| time_elapsed | 67992 | -| total_timesteps | 1620480 | -| train/ | | -| approx_kl | 0.0029496755 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.00887 | -| n_updates | 126590 | -| policy_gradient_loss | -0.00704 | -| std | 0.0155 | -| value_loss | 7.31e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12661 | -| time_elapsed | 67997 | -| total_timesteps | 1620608 | -| train/ | | -| approx_kl | 0.009836076 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 126600 | -| policy_gradient_loss | 0.00319 | -| std | 0.0155 | -| value_loss | 3.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12662 | -| time_elapsed | 68000 | -| total_timesteps | 1620736 | -| train/ | | -| approx_kl | 0.031044964 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.00652 | -| n_updates | 126610 | -| policy_gradient_loss | 0.00512 | -| std | 0.0155 | -| value_loss | 3.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12663 | -| time_elapsed | 68004 | -| total_timesteps | 1620864 | -| train/ | | -| approx_kl | 0.026515193 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 126620 | -| policy_gradient_loss | -0.00475 | -| std | 0.0156 | -| value_loss | 2.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 12664 | -| time_elapsed | 68007 | -| total_timesteps | 1620992 | -| train/ | | -| approx_kl | 0.05431807 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | 0.0257 | -| n_updates | 126630 | -| policy_gradient_loss | 0.00864 | -| std | 0.0156 | -| value_loss | 1.97e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12665 | -| time_elapsed | 68010 | -| total_timesteps | 1621120 | -| train/ | | -| approx_kl | 0.015553677 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 126640 | -| policy_gradient_loss | 0.0012 | -| std | 0.0156 | -| value_loss | 1.67e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12666 | -| time_elapsed | 68020 | -| total_timesteps | 1621248 | -| train/ | | -| approx_kl | 1.5468528 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.00963 | -| n_updates | 126650 | -| policy_gradient_loss | -0.00928 | -| std | 0.0156 | -| value_loss | 3.59e-05 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12667 | -| time_elapsed | 68023 | -| total_timesteps | 1621376 | -| train/ | | -| approx_kl | 0.00057459297 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0869 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 126660 | -| policy_gradient_loss | -0.00599 | -| std | 0.0155 | -| value_loss | 4.55e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12668 | -| time_elapsed | 68026 | -| total_timesteps | 1621504 | -| train/ | | -| approx_kl | 0.012022228 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.74 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 126670 | -| policy_gradient_loss | 0.00981 | -| std | 0.0155 | -| value_loss | 2.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12669 | -| time_elapsed | 68030 | -| total_timesteps | 1621632 | -| train/ | | -| approx_kl | 0.026668584 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.00198 | -| n_updates | 126680 | -| policy_gradient_loss | -0.00305 | -| std | 0.0155 | -| value_loss | 2.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12670 | -| time_elapsed | 68033 | -| total_timesteps | 1621760 | -| train/ | | -| approx_kl | 0.002637817 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 126690 | -| policy_gradient_loss | 0.0047 | -| std | 0.0155 | -| value_loss | 1.98e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 12671 | -| time_elapsed | 68037 | -| total_timesteps | 1621888 | -| train/ | | -| approx_kl | 0.0089426115 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | -0.00701 | -| n_updates | 126700 | -| policy_gradient_loss | -0.00362 | -| std | 0.0155 | -| value_loss | 1.02e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12672 | -| time_elapsed | 68040 | -| total_timesteps | 1622016 | -| train/ | | -| approx_kl | 0.00059471326 | -| clip_fraction | 0.0242 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.00176 | -| n_updates | 126710 | -| policy_gradient_loss | -0.000874 | -| std | 0.0155 | -| value_loss | 8.18e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12673 | -| time_elapsed | 68049 | -| total_timesteps | 1622144 | -| train/ | | -| approx_kl | 0.22448674 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.000506 | -| n_updates | 126720 | -| policy_gradient_loss | -0.00194 | -| std | 0.0155 | -| value_loss | 0.00275 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12674 | -| time_elapsed | 68052 | -| total_timesteps | 1622272 | -| train/ | | -| approx_kl | 0.0004930161 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.0503 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 126730 | -| policy_gradient_loss | -0.00191 | -| std | 0.0155 | -| value_loss | 6.06e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12675 | -| time_elapsed | 68056 | -| total_timesteps | 1622400 | -| train/ | | -| approx_kl | 0.018959057 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.431 | -| learning_rate | 0.0003 | -| loss | -0.0051 | -| n_updates | 126740 | -| policy_gradient_loss | -0.00351 | -| std | 0.0155 | -| value_loss | 4.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12676 | -| time_elapsed | 68059 | -| total_timesteps | 1622528 | -| train/ | | -| approx_kl | 0.020494614 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 126750 | -| policy_gradient_loss | 0.00855 | -| std | 0.0155 | -| value_loss | 1.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12677 | -| time_elapsed | 68062 | -| total_timesteps | 1622656 | -| train/ | | -| approx_kl | 0.004933639 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0733 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 126760 | -| policy_gradient_loss | -0.00359 | -| std | 0.0155 | -| value_loss | 1.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12678 | -| time_elapsed | 68065 | -| total_timesteps | 1622784 | -| train/ | | -| approx_kl | 0.024011236 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 126770 | -| policy_gradient_loss | 0.00177 | -| std | 0.0155 | -| value_loss | 1.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12679 | -| time_elapsed | 68067 | -| total_timesteps | 1622912 | -| train/ | | -| approx_kl | 0.030638106 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 126780 | -| policy_gradient_loss | -0.00149 | -| std | 0.0155 | -| value_loss | 1.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12680 | -| time_elapsed | 68070 | -| total_timesteps | 1623040 | -| train/ | | -| approx_kl | 0.05301988 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.00929 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 126790 | -| policy_gradient_loss | 0.000962 | -| std | 0.0155 | -| value_loss | 9.16e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12681 | -| time_elapsed | 68076 | -| total_timesteps | 1623168 | -| train/ | | -| approx_kl | 0.104952104 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.876 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 126800 | -| policy_gradient_loss | -0.0129 | -| std | 0.0155 | -| value_loss | 0.00179 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12682 | -| time_elapsed | 68081 | -| total_timesteps | 1623296 | -| train/ | | -| approx_kl | 0.060714155 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.0296 | -| n_updates | 126810 | -| policy_gradient_loss | 0.00461 | -| std | 0.0155 | -| value_loss | 1.09e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12683 | -| time_elapsed | 68085 | -| total_timesteps | 1623424 | -| train/ | | -| approx_kl | 0.00068283686 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.00868 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 126820 | -| policy_gradient_loss | -0.00666 | -| std | 0.0155 | -| value_loss | 4.01e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12684 | -| time_elapsed | 68088 | -| total_timesteps | 1623552 | -| train/ | | -| approx_kl | 0.012823941 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.00677 | -| n_updates | 126830 | -| policy_gradient_loss | 0.00589 | -| std | 0.0155 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12685 | -| time_elapsed | 68090 | -| total_timesteps | 1623680 | -| train/ | | -| approx_kl | 0.024542328 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | -0.00973 | -| n_updates | 126840 | -| policy_gradient_loss | -0.00481 | -| std | 0.0155 | -| value_loss | 7.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12686 | -| time_elapsed | 68094 | -| total_timesteps | 1623808 | -| train/ | | -| approx_kl | 0.068267755 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | 0.0481 | -| n_updates | 126850 | -| policy_gradient_loss | 0.0444 | -| std | 0.0155 | -| value_loss | 7.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 12687 | -| time_elapsed | 68098 | -| total_timesteps | 1623936 | -| train/ | | -| approx_kl | 0.03332439 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 126860 | -| policy_gradient_loss | 0.0324 | -| std | 0.0155 | -| value_loss | 4.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12688 | -| time_elapsed | 68102 | -| total_timesteps | 1624064 | -| train/ | | -| approx_kl | 0.030985147 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 126870 | -| policy_gradient_loss | 0.036 | -| std | 0.0155 | -| value_loss | 6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12689 | -| time_elapsed | 68108 | -| total_timesteps | 1624192 | -| train/ | | -| approx_kl | 0.45499793 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 126880 | -| policy_gradient_loss | 0.000337 | -| std | 0.0155 | -| value_loss | 0.00169 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12690 | -| time_elapsed | 68112 | -| total_timesteps | 1624320 | -| train/ | | -| approx_kl | 0.030285005 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.00545 | -| n_updates | 126890 | -| policy_gradient_loss | -0.00197 | -| std | 0.0155 | -| value_loss | 3.68e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12691 | -| time_elapsed | 68116 | -| total_timesteps | 1624448 | -| train/ | | -| approx_kl | 0.004510173 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 126900 | -| policy_gradient_loss | -0.000486 | -| std | 0.0155 | -| value_loss | 6.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12692 | -| time_elapsed | 68119 | -| total_timesteps | 1624576 | -| train/ | | -| approx_kl | 0.010931219 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.00437 | -| n_updates | 126910 | -| policy_gradient_loss | 0.00173 | -| std | 0.0155 | -| value_loss | 2.91e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12693 | -| time_elapsed | 68122 | -| total_timesteps | 1624704 | -| train/ | | -| approx_kl | 0.0004839413 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | 0.0046 | -| n_updates | 126920 | -| policy_gradient_loss | 0.00789 | -| std | 0.0155 | -| value_loss | 2.74e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12694 | -| time_elapsed | 68125 | -| total_timesteps | 1624832 | -| train/ | | -| approx_kl | 0.0024396214 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 126930 | -| policy_gradient_loss | 0.000575 | -| std | 0.0155 | -| value_loss | 1.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12695 | -| time_elapsed | 68128 | -| total_timesteps | 1624960 | -| train/ | | -| approx_kl | 0.020928916 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 126940 | -| policy_gradient_loss | -0.00951 | -| std | 0.0155 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12696 | -| time_elapsed | 68131 | -| total_timesteps | 1625088 | -| train/ | | -| approx_kl | 4.945323e-07 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.000114 | -| n_updates | 126950 | -| policy_gradient_loss | -0.006 | -| std | 0.0155 | -| value_loss | 9.99e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12697 | -| time_elapsed | 68139 | -| total_timesteps | 1625216 | -| train/ | | -| approx_kl | 0.14945233 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 126960 | -| policy_gradient_loss | -0.0175 | -| std | 0.0155 | -| value_loss | 0.000349 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12698 | -| time_elapsed | 68142 | -| total_timesteps | 1625344 | -| train/ | | -| approx_kl | 0.00035660015 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 126970 | -| policy_gradient_loss | -0.0037 | -| std | 0.0155 | -| value_loss | 2.82e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12699 | -| time_elapsed | 68145 | -| total_timesteps | 1625472 | -| train/ | | -| approx_kl | 0.016456703 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | 0.00245 | -| n_updates | 126980 | -| policy_gradient_loss | 0.0104 | -| std | 0.0155 | -| value_loss | 8.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12700 | -| time_elapsed | 68148 | -| total_timesteps | 1625600 | -| train/ | | -| approx_kl | 0.012504576 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.515 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 126990 | -| policy_gradient_loss | -0.00749 | -| std | 0.0155 | -| value_loss | 3.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12701 | -| time_elapsed | 68151 | -| total_timesteps | 1625728 | -| train/ | | -| approx_kl | 0.03275203 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.75 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 127000 | -| policy_gradient_loss | -7.43e-05 | -| std | 0.0154 | -| value_loss | 7.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12702 | -| time_elapsed | 68153 | -| total_timesteps | 1625856 | -| train/ | | -| approx_kl | 1.22278e-05 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | -0.000622 | -| n_updates | 127010 | -| policy_gradient_loss | -0.00125 | -| std | 0.0154 | -| value_loss | 7.22e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12703 | -| time_elapsed | 68157 | -| total_timesteps | 1625984 | -| train/ | | -| approx_kl | 0.072158776 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 127020 | -| policy_gradient_loss | 0.00643 | -| std | 0.0154 | -| value_loss | 6.06e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12704 | -| time_elapsed | 68160 | -| total_timesteps | 1626112 | -| train/ | | -| approx_kl | 0.037176922 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.000549 | -| n_updates | 127030 | -| policy_gradient_loss | -0.00313 | -| std | 0.0154 | -| value_loss | 5.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12705 | -| time_elapsed | 68168 | -| total_timesteps | 1626240 | -| train/ | | -| approx_kl | 0.020789146 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.427 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 127040 | -| policy_gradient_loss | -0.0097 | -| std | 0.0154 | -| value_loss | 0.00223 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12706 | -| time_elapsed | 68171 | -| total_timesteps | 1626368 | -| train/ | | -| approx_kl | 0.05889199 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 127050 | -| policy_gradient_loss | 0.0394 | -| std | 0.0153 | -| value_loss | 3.19e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12707 | -| time_elapsed | 68175 | -| total_timesteps | 1626496 | -| train/ | | -| approx_kl | 0.009511361 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 127060 | -| policy_gradient_loss | 0.000681 | -| std | 0.0153 | -| value_loss | 6.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12708 | -| time_elapsed | 68179 | -| total_timesteps | 1626624 | -| train/ | | -| approx_kl | 0.008843947 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0044 | -| learning_rate | 0.0003 | -| loss | 0.000683 | -| n_updates | 127070 | -| policy_gradient_loss | 0.00417 | -| std | 0.0153 | -| value_loss | 2.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12709 | -| time_elapsed | 68183 | -| total_timesteps | 1626752 | -| train/ | | -| approx_kl | 0.02154342 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 127080 | -| policy_gradient_loss | 0.03 | -| std | 0.0153 | -| value_loss | 1.52e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12710 | -| time_elapsed | 68186 | -| total_timesteps | 1626880 | -| train/ | | -| approx_kl | 0.0045353984 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.00823 | -| learning_rate | 0.0003 | -| loss | -0.000995 | -| n_updates | 127090 | -| policy_gradient_loss | 0.00309 | -| std | 0.0153 | -| value_loss | 8.85e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12711 | -| time_elapsed | 68191 | -| total_timesteps | 1627008 | -| train/ | | -| approx_kl | 0.0074946405 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 127100 | -| policy_gradient_loss | -0.00281 | -| std | 0.0153 | -| value_loss | 7.01e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12712 | -| time_elapsed | 68201 | -| total_timesteps | 1627136 | -| train/ | | -| approx_kl | 0.13697977 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 127110 | -| policy_gradient_loss | -0.0144 | -| std | 0.0153 | -| value_loss | 0.000581 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12713 | -| time_elapsed | 68206 | -| total_timesteps | 1627264 | -| train/ | | -| approx_kl | 0.0039876886 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | 0.0283 | -| learning_rate | 0.0003 | -| loss | 0.000241 | -| n_updates | 127120 | -| policy_gradient_loss | 0.00235 | -| std | 0.0153 | -| value_loss | 6.73e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12714 | -| time_elapsed | 68210 | -| total_timesteps | 1627392 | -| train/ | | -| approx_kl | 2.0661857e-05 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.000996 | -| n_updates | 127130 | -| policy_gradient_loss | -0.00145 | -| std | 0.0152 | -| value_loss | 8.63e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12715 | -| time_elapsed | 68214 | -| total_timesteps | 1627520 | -| train/ | | -| approx_kl | 0.009363272 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 127140 | -| policy_gradient_loss | 0.00287 | -| std | 0.0152 | -| value_loss | 4.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12716 | -| time_elapsed | 68217 | -| total_timesteps | 1627648 | -| train/ | | -| approx_kl | 0.009647524 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 127150 | -| policy_gradient_loss | 0.00149 | -| std | 0.0152 | -| value_loss | 5.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12717 | -| time_elapsed | 68221 | -| total_timesteps | 1627776 | -| train/ | | -| approx_kl | 0.0024847067 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 127160 | -| policy_gradient_loss | 0.0022 | -| std | 0.0152 | -| value_loss | 1.26e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12718 | -| time_elapsed | 68224 | -| total_timesteps | 1627904 | -| train/ | | -| approx_kl | 0.04318808 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.0374 | -| n_updates | 127170 | -| policy_gradient_loss | 0.0114 | -| std | 0.0152 | -| value_loss | 8.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12719 | -| time_elapsed | 68227 | -| total_timesteps | 1628032 | -| train/ | | -| approx_kl | 0.003773863 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 127180 | -| policy_gradient_loss | 0.0146 | -| std | 0.0152 | -| value_loss | 7.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12720 | -| time_elapsed | 68236 | -| total_timesteps | 1628160 | -| train/ | | -| approx_kl | 0.034639295 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.76 | -| explained_variance | -15.5 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 127190 | -| policy_gradient_loss | -0.0144 | -| std | 0.0152 | -| value_loss | 0.00414 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12721 | -| time_elapsed | 68240 | -| total_timesteps | 1628288 | -| train/ | | -| approx_kl | 0.0022830614 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | 0.00216 | -| n_updates | 127200 | -| policy_gradient_loss | 0.00375 | -| std | 0.0152 | -| value_loss | 3.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12722 | -| time_elapsed | 68244 | -| total_timesteps | 1628416 | -| train/ | | -| approx_kl | 0.007837932 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -3.73 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 127210 | -| policy_gradient_loss | -0.0118 | -| std | 0.0152 | -| value_loss | 3.67e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12723 | -| time_elapsed | 68247 | -| total_timesteps | 1628544 | -| train/ | | -| approx_kl | 0.0048514795 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -1.88 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 127220 | -| policy_gradient_loss | -0.000876 | -| std | 0.0152 | -| value_loss | 2.27e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12724 | -| time_elapsed | 68250 | -| total_timesteps | 1628672 | -| train/ | | -| approx_kl | 0.02208707 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 127230 | -| policy_gradient_loss | -0.00547 | -| std | 0.0152 | -| value_loss | 1.99e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12725 | -| time_elapsed | 68253 | -| total_timesteps | 1628800 | -| train/ | | -| approx_kl | 4.7274865e-05 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | -0.000295 | -| n_updates | 127240 | -| policy_gradient_loss | 0.00547 | -| std | 0.0152 | -| value_loss | 1.01e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12726 | -| time_elapsed | 68257 | -| total_timesteps | 1628928 | -| train/ | | -| approx_kl | 0.0019725617 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 127250 | -| policy_gradient_loss | 0.0157 | -| std | 0.0152 | -| value_loss | 8.17e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12727 | -| time_elapsed | 68261 | -| total_timesteps | 1629056 | -| train/ | | -| approx_kl | 0.036691748 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.00556 | -| n_updates | 127260 | -| policy_gradient_loss | -0.00295 | -| std | 0.0152 | -| value_loss | 6.38e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12728 | -| time_elapsed | 68267 | -| total_timesteps | 1629184 | -| train/ | | -| approx_kl | 0.013650366 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.00916 | -| n_updates | 127270 | -| policy_gradient_loss | -0.00827 | -| std | 0.0152 | -| value_loss | 0.00134 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12729 | -| time_elapsed | 68270 | -| total_timesteps | 1629312 | -| train/ | | -| approx_kl | 0.011190837 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | 0.00707 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 127280 | -| policy_gradient_loss | 0.00302 | -| std | 0.0152 | -| value_loss | 5.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12730 | -| time_elapsed | 68273 | -| total_timesteps | 1629440 | -| train/ | | -| approx_kl | 0.05868658 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0869 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 127290 | -| policy_gradient_loss | 0.04 | -| std | 0.0152 | -| value_loss | 1.29e-06 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12731 | -| time_elapsed | 68276 | -| total_timesteps | 1629568 | -| train/ | | -| approx_kl | 0.041157 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 127300 | -| policy_gradient_loss | 0.0294 | -| std | 0.0152 | -| value_loss | 7.2e-07 | --------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12732 | -| time_elapsed | 68279 | -| total_timesteps | 1629696 | -| train/ | | -| approx_kl | 0.0081703 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | 0.000964 | -| n_updates | 127310 | -| policy_gradient_loss | 0.0038 | -| std | 0.0152 | -| value_loss | 5.64e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12733 | -| time_elapsed | 68283 | -| total_timesteps | 1629824 | -| train/ | | -| approx_kl | 0.008444957 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 127320 | -| policy_gradient_loss | 0.00194 | -| std | 0.0152 | -| value_loss | 9.36e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 12734 | -| time_elapsed | 68286 | -| total_timesteps | 1629952 | -| train/ | | -| approx_kl | 0.0034608329 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.000224 | -| n_updates | 127330 | -| policy_gradient_loss | 0.00467 | -| std | 0.0152 | -| value_loss | 5.02e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12735 | -| time_elapsed | 68289 | -| total_timesteps | 1630080 | -| train/ | | -| approx_kl | 0.011058593 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 127340 | -| policy_gradient_loss | -0.00225 | -| std | 0.0151 | -| value_loss | 4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12736 | -| time_elapsed | 68294 | -| total_timesteps | 1630208 | -| train/ | | -| approx_kl | 0.024030397 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 127350 | -| policy_gradient_loss | -0.0112 | -| std | 0.0151 | -| value_loss | 2.57e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12737 | -| time_elapsed | 68297 | -| total_timesteps | 1630336 | -| train/ | | -| approx_kl | 0.06702658 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | 0.000639 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 127360 | -| policy_gradient_loss | 0.00176 | -| std | 0.0151 | -| value_loss | 2.71e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12738 | -| time_elapsed | 68300 | -| total_timesteps | 1630464 | -| train/ | | -| approx_kl | 0.010493123 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | 0.00663 | -| learning_rate | 0.0003 | -| loss | 0.00293 | -| n_updates | 127370 | -| policy_gradient_loss | 0.00658 | -| std | 0.0151 | -| value_loss | 4.43e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12739 | -| time_elapsed | 68303 | -| total_timesteps | 1630592 | -| train/ | | -| approx_kl | 0.04468661 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 127380 | -| policy_gradient_loss | 0.00175 | -| std | 0.0151 | -| value_loss | 1.16e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12740 | -| time_elapsed | 68306 | -| total_timesteps | 1630720 | -| train/ | | -| approx_kl | 0.0034584412 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | -0.000981 | -| n_updates | 127390 | -| policy_gradient_loss | 0.00445 | -| std | 0.0151 | -| value_loss | 3.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12741 | -| time_elapsed | 68309 | -| total_timesteps | 1630848 | -| train/ | | -| approx_kl | 0.007906221 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 127400 | -| policy_gradient_loss | 0.00304 | -| std | 0.0151 | -| value_loss | 1.42e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 12742 | -| time_elapsed | 68313 | -| total_timesteps | 1630976 | -| train/ | | -| approx_kl | 4.421547e-05 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 127410 | -| policy_gradient_loss | -0.0133 | -| std | 0.015 | -| value_loss | 1.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12743 | -| time_elapsed | 68316 | -| total_timesteps | 1631104 | -| train/ | | -| approx_kl | 0.012406781 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.00861 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 127420 | -| policy_gradient_loss | 0.00838 | -| std | 0.015 | -| value_loss | 7.74e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12744 | -| time_elapsed | 68324 | -| total_timesteps | 1631232 | -| train/ | | -| approx_kl | 0.123751745 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -1.45 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 127430 | -| policy_gradient_loss | -0.0105 | -| std | 0.015 | -| value_loss | 0.00227 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12745 | -| time_elapsed | 68328 | -| total_timesteps | 1631360 | -| train/ | | -| approx_kl | 0.01797944 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | 0.000943 | -| n_updates | 127440 | -| policy_gradient_loss | 0.0025 | -| std | 0.015 | -| value_loss | 5.36e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12746 | -| time_elapsed | 68332 | -| total_timesteps | 1631488 | -| train/ | | -| approx_kl | 0.0048496905 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -82.8 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 127450 | -| policy_gradient_loss | -0.0116 | -| std | 0.015 | -| value_loss | 2.11e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12747 | -| time_elapsed | 68335 | -| total_timesteps | 1631616 | -| train/ | | -| approx_kl | 0.07052923 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -7.1 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 127460 | -| policy_gradient_loss | -0.0148 | -| std | 0.015 | -| value_loss | 2.12e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12748 | -| time_elapsed | 68339 | -| total_timesteps | 1631744 | -| train/ | | -| approx_kl | 0.06508033 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 127470 | -| policy_gradient_loss | 0.0125 | -| std | 0.015 | -| value_loss | 6.34e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 12749 | -| time_elapsed | 68341 | -| total_timesteps | 1631872 | -| train/ | | -| approx_kl | 0.023420025 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.445 | -| learning_rate | 0.0003 | -| loss | 0.0085 | -| n_updates | 127480 | -| policy_gradient_loss | 0.00639 | -| std | 0.015 | -| value_loss | 3.33e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12750 | -| time_elapsed | 68345 | -| total_timesteps | 1632000 | -| train/ | | -| approx_kl | 0.031235516 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 127490 | -| policy_gradient_loss | 0.00481 | -| std | 0.015 | -| value_loss | 1.96e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12751 | -| time_elapsed | 68348 | -| total_timesteps | 1632128 | -| train/ | | -| approx_kl | 0.05127155 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.0033 | -| learning_rate | 0.0003 | -| loss | 0.000146 | -| n_updates | 127500 | -| policy_gradient_loss | -0.00587 | -| std | 0.015 | -| value_loss | 1.33e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12752 | -| time_elapsed | 68356 | -| total_timesteps | 1632256 | -| train/ | | -| approx_kl | 1.0998425 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 127510 | -| policy_gradient_loss | -0.0146 | -| std | 0.015 | -| value_loss | 0.000202 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12753 | -| time_elapsed | 68359 | -| total_timesteps | 1632384 | -| train/ | | -| approx_kl | 0.0917258 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 127520 | -| policy_gradient_loss | 0.0108 | -| std | 0.0151 | -| value_loss | 3.33e-06 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12754 | -| time_elapsed | 68361 | -| total_timesteps | 1632512 | -| train/ | | -| approx_kl | 1.5473459e-05 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -28 | -| learning_rate | 0.0003 | -| loss | 0.000141 | -| n_updates | 127530 | -| policy_gradient_loss | -0.00129 | -| std | 0.0151 | -| value_loss | 6.17e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12755 | -| time_elapsed | 68364 | -| total_timesteps | 1632640 | -| train/ | | -| approx_kl | 0.0037741666 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -2.07 | -| learning_rate | 0.0003 | -| loss | 0.00365 | -| n_updates | 127540 | -| policy_gradient_loss | 0.0129 | -| std | 0.0151 | -| value_loss | 1.89e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12756 | -| time_elapsed | 68367 | -| total_timesteps | 1632768 | -| train/ | | -| approx_kl | 0.021454312 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.318 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 127550 | -| policy_gradient_loss | 0.0173 | -| std | 0.0151 | -| value_loss | 7.28e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12757 | -| time_elapsed | 68369 | -| total_timesteps | 1632896 | -| train/ | | -| approx_kl | 0.006084535 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.00172 | -| n_updates | 127560 | -| policy_gradient_loss | 0.00574 | -| std | 0.0151 | -| value_loss | 6.72e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12758 | -| time_elapsed | 68373 | -| total_timesteps | 1633024 | -| train/ | | -| approx_kl | 6.583659e-05 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 127570 | -| policy_gradient_loss | -0.0137 | -| std | 0.0151 | -| value_loss | 1.9e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12759 | -| time_elapsed | 68381 | -| total_timesteps | 1633152 | -| train/ | | -| approx_kl | 0.12325282 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | 0.00245 | -| n_updates | 127580 | -| policy_gradient_loss | -0.000894 | -| std | 0.0151 | -| value_loss | 0.00193 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12760 | -| time_elapsed | 68385 | -| total_timesteps | 1633280 | -| train/ | | -| approx_kl | 0.026301501 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.0363 | -| learning_rate | 0.0003 | -| loss | 0.0048 | -| n_updates | 127590 | -| policy_gradient_loss | 0.000878 | -| std | 0.015 | -| value_loss | 4.88e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12761 | -| time_elapsed | 68389 | -| total_timesteps | 1633408 | -| train/ | | -| approx_kl | 0.0051969974 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.00761 | -| n_updates | 127600 | -| policy_gradient_loss | -0.00218 | -| std | 0.015 | -| value_loss | 3.89e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12762 | -| time_elapsed | 68393 | -| total_timesteps | 1633536 | -| train/ | | -| approx_kl | 0.00671417 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0901 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 127610 | -| policy_gradient_loss | -0.00173 | -| std | 0.015 | -| value_loss | 2.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12763 | -| time_elapsed | 68395 | -| total_timesteps | 1633664 | -| train/ | | -| approx_kl | 0.01173876 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.0337 | -| n_updates | 127620 | -| policy_gradient_loss | 0.00574 | -| std | 0.015 | -| value_loss | 1.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12764 | -| time_elapsed | 68398 | -| total_timesteps | 1633792 | -| train/ | | -| approx_kl | 0.026880968 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 127630 | -| policy_gradient_loss | 0.0182 | -| std | 0.015 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 12765 | -| time_elapsed | 68402 | -| total_timesteps | 1633920 | -| train/ | | -| approx_kl | 0.0070264223 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 127640 | -| policy_gradient_loss | 0.00549 | -| std | 0.015 | -| value_loss | 1.17e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12766 | -| time_elapsed | 68405 | -| total_timesteps | 1634048 | -| train/ | | -| approx_kl | 0.0062525133 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 127650 | -| policy_gradient_loss | 0.0143 | -| std | 0.015 | -| value_loss | 8.68e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12767 | -| time_elapsed | 68409 | -| total_timesteps | 1634176 | -| train/ | | -| approx_kl | 0.21582021 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.834 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 127660 | -| policy_gradient_loss | -0.00781 | -| std | 0.015 | -| value_loss | 0.0029 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12768 | -| time_elapsed | 68412 | -| total_timesteps | 1634304 | -| train/ | | -| approx_kl | 0.027351543 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0719 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 127670 | -| policy_gradient_loss | 0.00405 | -| std | 0.015 | -| value_loss | 3.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12769 | -| time_elapsed | 68416 | -| total_timesteps | 1634432 | -| train/ | | -| approx_kl | 0.007788813 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 127680 | -| policy_gradient_loss | -0.00383 | -| std | 0.015 | -| value_loss | 4.25e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12770 | -| time_elapsed | 68421 | -| total_timesteps | 1634560 | -| train/ | | -| approx_kl | 0.1346223 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 127690 | -| policy_gradient_loss | 0.0121 | -| std | 0.015 | -| value_loss | 3.72e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12771 | -| time_elapsed | 68425 | -| total_timesteps | 1634688 | -| train/ | | -| approx_kl | 4.001567e-05 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 127700 | -| policy_gradient_loss | 0.00518 | -| std | 0.015 | -| value_loss | 1.55e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12772 | -| time_elapsed | 68428 | -| total_timesteps | 1634816 | -| train/ | | -| approx_kl | 0.0018462599 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 127710 | -| policy_gradient_loss | 0.00253 | -| std | 0.015 | -| value_loss | 8.74e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 12773 | -| time_elapsed | 68432 | -| total_timesteps | 1634944 | -| train/ | | -| approx_kl | 0.012125811 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 127720 | -| policy_gradient_loss | 0.0356 | -| std | 0.015 | -| value_loss | 6.56e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12774 | -| time_elapsed | 68436 | -| total_timesteps | 1635072 | -| train/ | | -| approx_kl | 0.05523622 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 127730 | -| policy_gradient_loss | 0.032 | -| std | 0.0151 | -| value_loss | 4.76e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12775 | -| time_elapsed | 68442 | -| total_timesteps | 1635200 | -| train/ | | -| approx_kl | 0.33684212 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 127740 | -| policy_gradient_loss | -0.019 | -| std | 0.0151 | -| value_loss | 0.00309 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12776 | -| time_elapsed | 68444 | -| total_timesteps | 1635328 | -| train/ | | -| approx_kl | 0.03757143 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.009 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 127750 | -| policy_gradient_loss | 0.0104 | -| std | 0.0151 | -| value_loss | 3.89e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12777 | -| time_elapsed | 68447 | -| total_timesteps | 1635456 | -| train/ | | -| approx_kl | 0.16796339 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0769 | -| n_updates | 127760 | -| policy_gradient_loss | 0.0145 | -| std | 0.0151 | -| value_loss | 8.43e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12778 | -| time_elapsed | 68451 | -| total_timesteps | 1635584 | -| train/ | | -| approx_kl | 0.00024561072 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 2.77 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | -0.00019 | -| n_updates | 127770 | -| policy_gradient_loss | 0.000533 | -| std | 0.0151 | -| value_loss | 4.23e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12779 | -| time_elapsed | 68454 | -| total_timesteps | 1635712 | -| train/ | | -| approx_kl | 0.014137681 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.00546 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 127780 | -| policy_gradient_loss | -0.00249 | -| std | 0.015 | -| value_loss | 4.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12780 | -| time_elapsed | 68457 | -| total_timesteps | 1635840 | -| train/ | | -| approx_kl | 0.008016437 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | -0.00532 | -| n_updates | 127790 | -| policy_gradient_loss | -0.00235 | -| std | 0.015 | -| value_loss | 3.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 12781 | -| time_elapsed | 68460 | -| total_timesteps | 1635968 | -| train/ | | -| approx_kl | 0.010739768 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.00522 | -| n_updates | 127800 | -| policy_gradient_loss | 0.00231 | -| std | 0.015 | -| value_loss | 1.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12782 | -| time_elapsed | 68463 | -| total_timesteps | 1636096 | -| train/ | | -| approx_kl | 0.009719048 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 127810 | -| policy_gradient_loss | -0.00121 | -| std | 0.015 | -| value_loss | 1.76e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12783 | -| time_elapsed | 68471 | -| total_timesteps | 1636224 | -| train/ | | -| approx_kl | 0.2992135 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 127820 | -| policy_gradient_loss | -0.00223 | -| std | 0.015 | -| value_loss | 0.000144 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12784 | -| time_elapsed | 68475 | -| total_timesteps | 1636352 | -| train/ | | -| approx_kl | 0.008208869 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.00353 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 127830 | -| policy_gradient_loss | -0.00484 | -| std | 0.015 | -| value_loss | 1.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12785 | -| time_elapsed | 68479 | -| total_timesteps | 1636480 | -| train/ | | -| approx_kl | 0.05481657 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0019 | -| learning_rate | 0.0003 | -| loss | 0.0362 | -| n_updates | 127840 | -| policy_gradient_loss | 0.0139 | -| std | 0.015 | -| value_loss | 7.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12786 | -| time_elapsed | 68483 | -| total_timesteps | 1636608 | -| train/ | | -| approx_kl | 0.015251645 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.00584 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 127850 | -| policy_gradient_loss | 0.00272 | -| std | 0.015 | -| value_loss | 7.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12787 | -| time_elapsed | 68487 | -| total_timesteps | 1636736 | -| train/ | | -| approx_kl | 0.058397226 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.00164 | -| learning_rate | 0.0003 | -| loss | 0.0637 | -| n_updates | 127860 | -| policy_gradient_loss | 0.0351 | -| std | 0.015 | -| value_loss | 1.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12788 | -| time_elapsed | 68490 | -| total_timesteps | 1636864 | -| train/ | | -| approx_kl | 0.03714432 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.00543 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 127870 | -| policy_gradient_loss | 0.036 | -| std | 0.015 | -| value_loss | 6.78e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 12789 | -| time_elapsed | 68493 | -| total_timesteps | 1636992 | -| train/ | | -| approx_kl | 0.0322318 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 127880 | -| policy_gradient_loss | 0.031 | -| std | 0.015 | -| value_loss | 6.57e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12790 | -| time_elapsed | 68496 | -| total_timesteps | 1637120 | -| train/ | | -| approx_kl | 0.026442181 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.00867 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 127890 | -| policy_gradient_loss | 0.0278 | -| std | 0.015 | -| value_loss | 5.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12791 | -| time_elapsed | 68506 | -| total_timesteps | 1637248 | -| train/ | | -| approx_kl | 0.035349835 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -7.06 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 127900 | -| policy_gradient_loss | -0.0136 | -| std | 0.015 | -| value_loss | 0.00349 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12792 | -| time_elapsed | 68510 | -| total_timesteps | 1637376 | -| train/ | | -| approx_kl | 0.002686047 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -6.03 | -| learning_rate | 0.0003 | -| loss | -0.000418 | -| n_updates | 127910 | -| policy_gradient_loss | 0.00236 | -| std | 0.015 | -| value_loss | 8.42e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12793 | -| time_elapsed | 68514 | -| total_timesteps | 1637504 | -| train/ | | -| approx_kl | 0.0028233193 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -91.3 | -| learning_rate | 0.0003 | -| loss | 0.00328 | -| n_updates | 127920 | -| policy_gradient_loss | 0.00611 | -| std | 0.0149 | -| value_loss | 0.000107 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12794 | -| time_elapsed | 68516 | -| total_timesteps | 1637632 | -| train/ | | -| approx_kl | 0.034383252 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.00692 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 127930 | -| policy_gradient_loss | 0.00142 | -| std | 0.0149 | -| value_loss | 1.88e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12795 | -| time_elapsed | 68520 | -| total_timesteps | 1637760 | -| train/ | | -| approx_kl | 0.006942673 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0856 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 127940 | -| policy_gradient_loss | 0.0124 | -| std | 0.0149 | -| value_loss | 1.03e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 12796 | -| time_elapsed | 68523 | -| total_timesteps | 1637888 | -| train/ | | -| approx_kl | 0.0096591 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 127950 | -| policy_gradient_loss | 0.0146 | -| std | 0.0149 | -| value_loss | 8.42e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12797 | -| time_elapsed | 68525 | -| total_timesteps | 1638016 | -| train/ | | -| approx_kl | 0.0082198195 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.00473 | -| n_updates | 127960 | -| policy_gradient_loss | 0.00161 | -| std | 0.0149 | -| value_loss | 4.21e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12798 | -| time_elapsed | 68532 | -| total_timesteps | 1638144 | -| train/ | | -| approx_kl | 0.08788337 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 127970 | -| policy_gradient_loss | -0.0156 | -| std | 0.0149 | -| value_loss | 0.000119 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12799 | -| time_elapsed | 68535 | -| total_timesteps | 1638272 | -| train/ | | -| approx_kl | 0.0058488525 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.78 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 127980 | -| policy_gradient_loss | 0.000886 | -| std | 0.0149 | -| value_loss | 3.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12800 | -| time_elapsed | 68538 | -| total_timesteps | 1638400 | -| train/ | | -| approx_kl | 0.015732087 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 127990 | -| policy_gradient_loss | 0.0475 | -| std | 0.0149 | -| value_loss | 8.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12801 | -| time_elapsed | 68540 | -| total_timesteps | 1638528 | -| train/ | | -| approx_kl | 0.019566836 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | 0.0048 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 128000 | -| policy_gradient_loss | 0.0285 | -| std | 0.0149 | -| value_loss | 3.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12802 | -| time_elapsed | 68543 | -| total_timesteps | 1638656 | -| train/ | | -| approx_kl | 0.023533838 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00386 | -| learning_rate | 0.0003 | -| loss | 0.0405 | -| n_updates | 128010 | -| policy_gradient_loss | 0.0357 | -| std | 0.0149 | -| value_loss | 2.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12803 | -| time_elapsed | 68546 | -| total_timesteps | 1638784 | -| train/ | | -| approx_kl | 0.024208283 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00566 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 128020 | -| policy_gradient_loss | 0.0321 | -| std | 0.0149 | -| value_loss | 1.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 12804 | -| time_elapsed | 68549 | -| total_timesteps | 1638912 | -| train/ | | -| approx_kl | 0.008214812 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00619 | -| learning_rate | 0.0003 | -| loss | 0.0235 | -| n_updates | 128030 | -| policy_gradient_loss | 0.00236 | -| std | 0.0149 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12805 | -| time_elapsed | 68553 | -| total_timesteps | 1639040 | -| train/ | | -| approx_kl | 0.047537502 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00789 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 128040 | -| policy_gradient_loss | 0.00309 | -| std | 0.0149 | -| value_loss | 9.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12806 | -| time_elapsed | 68560 | -| total_timesteps | 1639168 | -| train/ | | -| approx_kl | 0.027097806 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 128050 | -| policy_gradient_loss | -0.00883 | -| std | 0.0149 | -| value_loss | 0.000375 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12807 | -| time_elapsed | 68564 | -| total_timesteps | 1639296 | -| train/ | | -| approx_kl | 0.004257089 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 128060 | -| policy_gradient_loss | -0.000199 | -| std | 0.0149 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12808 | -| time_elapsed | 68567 | -| total_timesteps | 1639424 | -| train/ | | -| approx_kl | 0.009331033 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 128070 | -| policy_gradient_loss | 0.00142 | -| std | 0.0149 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12809 | -| time_elapsed | 68571 | -| total_timesteps | 1639552 | -| train/ | | -| approx_kl | 0.007876543 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 128080 | -| policy_gradient_loss | -0.00463 | -| std | 0.0149 | -| value_loss | 4.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12810 | -| time_elapsed | 68575 | -| total_timesteps | 1639680 | -| train/ | | -| approx_kl | 0.016947825 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 128090 | -| policy_gradient_loss | 0.00107 | -| std | 0.0149 | -| value_loss | 2.71e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12811 | -| time_elapsed | 68579 | -| total_timesteps | 1639808 | -| train/ | | -| approx_kl | 0.02398367 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 128100 | -| policy_gradient_loss | 0.0332 | -| std | 0.0149 | -| value_loss | 1.44e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 12812 | -| time_elapsed | 68581 | -| total_timesteps | 1639936 | -| train/ | | -| approx_kl | 0.0048762723 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 128110 | -| policy_gradient_loss | 0.00382 | -| std | 0.0149 | -| value_loss | 1.02e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12813 | -| time_elapsed | 68584 | -| total_timesteps | 1640064 | -| train/ | | -| approx_kl | 0.1263563 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 128120 | -| policy_gradient_loss | 0.056 | -| std | 0.0149 | -| value_loss | 1.02e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12814 | -| time_elapsed | 68590 | -| total_timesteps | 1640192 | -| train/ | | -| approx_kl | 0.015462501 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | 0.787 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 128130 | -| policy_gradient_loss | -0.000215 | -| std | 0.0149 | -| value_loss | 0.00406 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12815 | -| time_elapsed | 68593 | -| total_timesteps | 1640320 | -| train/ | | -| approx_kl | 0.054758806 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00484 | -| learning_rate | 0.0003 | -| loss | 0.00569 | -| n_updates | 128140 | -| policy_gradient_loss | 0.00566 | -| std | 0.0149 | -| value_loss | 4.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12816 | -| time_elapsed | 68595 | -| total_timesteps | 1640448 | -| train/ | | -| approx_kl | 0.00687818 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00401 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 128150 | -| policy_gradient_loss | -0.00386 | -| std | 0.0149 | -| value_loss | 1.08e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12817 | -| time_elapsed | 68599 | -| total_timesteps | 1640576 | -| train/ | | -| approx_kl | 0.007548976 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 128160 | -| policy_gradient_loss | -0.0021 | -| std | 0.0149 | -| value_loss | 6.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12818 | -| time_elapsed | 68603 | -| total_timesteps | 1640704 | -| train/ | | -| approx_kl | 0.002060786 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 128170 | -| policy_gradient_loss | 0.00351 | -| std | 0.0149 | -| value_loss | 4.28e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12819 | -| time_elapsed | 68606 | -| total_timesteps | 1640832 | -| train/ | | -| approx_kl | 0.0098405555 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -7.32 | -| learning_rate | 0.0003 | -| loss | -0.000206 | -| n_updates | 128180 | -| policy_gradient_loss | 0.00158 | -| std | 0.0149 | -| value_loss | 1.4e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 12820 | -| time_elapsed | 68608 | -| total_timesteps | 1640960 | -| train/ | | -| approx_kl | 0.06352667 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00176 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 128190 | -| policy_gradient_loss | 0.0152 | -| std | 0.0149 | -| value_loss | 2.32e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12821 | -| time_elapsed | 68612 | -| total_timesteps | 1641088 | -| train/ | | -| approx_kl | 0.005213289 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 128200 | -| policy_gradient_loss | -0.0135 | -| std | 0.0149 | -| value_loss | 1.6e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12822 | -| time_elapsed | 68618 | -| total_timesteps | 1641216 | -| train/ | | -| approx_kl | 0.031461105 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | 0.535 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 128210 | -| policy_gradient_loss | -0.00534 | -| std | 0.0149 | -| value_loss | 0.00114 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12823 | -| time_elapsed | 68622 | -| total_timesteps | 1641344 | -| train/ | | -| approx_kl | 0.06154186 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.00956 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 128220 | -| policy_gradient_loss | 0.00415 | -| std | 0.0149 | -| value_loss | 6.71e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12824 | -| time_elapsed | 68624 | -| total_timesteps | 1641472 | -| train/ | | -| approx_kl | 0.03759776 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | 0.00322 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 128230 | -| policy_gradient_loss | 0.00714 | -| std | 0.0149 | -| value_loss | 1.41e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12825 | -| time_elapsed | 68627 | -| total_timesteps | 1641600 | -| train/ | | -| approx_kl | 0.022812864 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 128240 | -| policy_gradient_loss | 0.00222 | -| std | 0.0149 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12826 | -| time_elapsed | 68630 | -| total_timesteps | 1641728 | -| train/ | | -| approx_kl | 0.034327313 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 128250 | -| policy_gradient_loss | 0.00785 | -| std | 0.0149 | -| value_loss | 7.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12827 | -| time_elapsed | 68634 | -| total_timesteps | 1641856 | -| train/ | | -| approx_kl | 0.018119542 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 128260 | -| policy_gradient_loss | -0.00613 | -| std | 0.0149 | -| value_loss | 6.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 12828 | -| time_elapsed | 68637 | -| total_timesteps | 1641984 | -| train/ | | -| approx_kl | 0.028954454 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 128270 | -| policy_gradient_loss | 0.0397 | -| std | 0.0149 | -| value_loss | 1.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12829 | -| time_elapsed | 68640 | -| total_timesteps | 1642112 | -| train/ | | -| approx_kl | 0.006197194 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 128280 | -| policy_gradient_loss | 0.00356 | -| std | 0.0149 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12830 | -| time_elapsed | 68647 | -| total_timesteps | 1642240 | -| train/ | | -| approx_kl | 0.09873398 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 128290 | -| policy_gradient_loss | -0.0165 | -| std | 0.0149 | -| value_loss | 0.0035 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12831 | -| time_elapsed | 68650 | -| total_timesteps | 1642368 | -| train/ | | -| approx_kl | 0.0050403904 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -15.2 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 128300 | -| policy_gradient_loss | -0.00192 | -| std | 0.0148 | -| value_loss | 2.21e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12832 | -| time_elapsed | 68653 | -| total_timesteps | 1642496 | -| train/ | | -| approx_kl | 0.0068294085 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 2.79 | -| explained_variance | -179 | -| learning_rate | 0.0003 | -| loss | -0.00947 | -| n_updates | 128310 | -| policy_gradient_loss | -0.0033 | -| std | 0.0148 | -| value_loss | 1.97e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12833 | -| time_elapsed | 68656 | -| total_timesteps | 1642624 | -| train/ | | -| approx_kl | 0.00057117315 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | -28.3 | -| learning_rate | 0.0003 | -| loss | -0.000405 | -| n_updates | 128320 | -| policy_gradient_loss | 0.000198 | -| std | 0.0148 | -| value_loss | 2.64e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12834 | -| time_elapsed | 68660 | -| total_timesteps | 1642752 | -| train/ | | -| approx_kl | 0.004850723 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | -5.94 | -| learning_rate | 0.0003 | -| loss | 0.00517 | -| n_updates | 128330 | -| policy_gradient_loss | 0.00627 | -| std | 0.0147 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 12835 | -| time_elapsed | 68663 | -| total_timesteps | 1642880 | -| train/ | | -| approx_kl | 0.0032025836 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | -0.422 | -| learning_rate | 0.0003 | -| loss | 0.00416 | -| n_updates | 128340 | -| policy_gradient_loss | 0.0265 | -| std | 0.0147 | -| value_loss | 3.08e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12836 | -| time_elapsed | 68666 | -| total_timesteps | 1643008 | -| train/ | | -| approx_kl | 0.039755505 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 128350 | -| policy_gradient_loss | 0.00302 | -| std | 0.0147 | -| value_loss | 1.71e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12837 | -| time_elapsed | 68673 | -| total_timesteps | 1643136 | -| train/ | | -| approx_kl | 0.24066304 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | 0.458 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 128360 | -| policy_gradient_loss | -0.0164 | -| std | 0.0147 | -| value_loss | 0.0009 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12838 | -| time_elapsed | 68676 | -| total_timesteps | 1643264 | -| train/ | | -| approx_kl | 0.007939795 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 128370 | -| policy_gradient_loss | 0.000543 | -| std | 0.0147 | -| value_loss | 8.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12839 | -| time_elapsed | 68679 | -| total_timesteps | 1643392 | -| train/ | | -| approx_kl | 0.024679456 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.8 | -| explained_variance | -1.67e+03 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 128380 | -| policy_gradient_loss | -0.000725 | -| std | 0.0146 | -| value_loss | 1.62e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12840 | -| time_elapsed | 68682 | -| total_timesteps | 1643520 | -| train/ | | -| approx_kl | 3.140699e-05 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -172 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 128390 | -| policy_gradient_loss | 0.00133 | -| std | 0.0146 | -| value_loss | 1.54e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12841 | -| time_elapsed | 68686 | -| total_timesteps | 1643648 | -| train/ | | -| approx_kl | 0.0071205767 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -18.1 | -| learning_rate | 0.0003 | -| loss | 0.0091 | -| n_updates | 128400 | -| policy_gradient_loss | 0.00881 | -| std | 0.0146 | -| value_loss | 2.33e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12842 | -| time_elapsed | 68689 | -| total_timesteps | 1643776 | -| train/ | | -| approx_kl | 0.0029980643 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.601 | -| learning_rate | 0.0003 | -| loss | 0.00658 | -| n_updates | 128410 | -| policy_gradient_loss | 0.0164 | -| std | 0.0146 | -| value_loss | 3.8e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 12843 | -| time_elapsed | 68693 | -| total_timesteps | 1643904 | -| train/ | | -| approx_kl | 0.018277738 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 128420 | -| policy_gradient_loss | 0.035 | -| std | 0.0146 | -| value_loss | 2.12e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12844 | -| time_elapsed | 68696 | -| total_timesteps | 1644032 | -| train/ | | -| approx_kl | 0.02446646 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.00286 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 128430 | -| policy_gradient_loss | 0.0446 | -| std | 0.0146 | -| value_loss | 8.42e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12845 | -| time_elapsed | 68704 | -| total_timesteps | 1644160 | -| train/ | | -| approx_kl | 0.032674458 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 128440 | -| policy_gradient_loss | 0.0393 | -| std | 0.0146 | -| value_loss | 0.000122 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12846 | -| time_elapsed | 68708 | -| total_timesteps | 1644288 | -| train/ | | -| approx_kl | 0.0054156105 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.0084 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 128450 | -| policy_gradient_loss | 0.00251 | -| std | 0.0146 | -| value_loss | 1.28e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12847 | -| time_elapsed | 68711 | -| total_timesteps | 1644416 | -| train/ | | -| approx_kl | 0.15637869 | -| clip_fraction | 0.575 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0026 | -| learning_rate | 0.0003 | -| loss | 0.0902 | -| n_updates | 128460 | -| policy_gradient_loss | 0.0776 | -| std | 0.0146 | -| value_loss | 7.8e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12848 | -| time_elapsed | 68713 | -| total_timesteps | 1644544 | -| train/ | | -| approx_kl | 0.035926726 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.003 | -| learning_rate | 0.0003 | -| loss | 0.00931 | -| n_updates | 128470 | -| policy_gradient_loss | 0.00276 | -| std | 0.0146 | -| value_loss | 5.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12849 | -| time_elapsed | 68717 | -| total_timesteps | 1644672 | -| train/ | | -| approx_kl | 0.017876327 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00617 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 128480 | -| policy_gradient_loss | 0.00418 | -| std | 0.0146 | -| value_loss | 3.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12850 | -| time_elapsed | 68720 | -| total_timesteps | 1644800 | -| train/ | | -| approx_kl | 0.08460158 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | 0.0702 | -| n_updates | 128490 | -| policy_gradient_loss | 0.0505 | -| std | 0.0146 | -| value_loss | 2.04e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 12851 | -| time_elapsed | 68724 | -| total_timesteps | 1644928 | -| train/ | | -| approx_kl | 0.032761764 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 128500 | -| policy_gradient_loss | 0.0327 | -| std | 0.0146 | -| value_loss | 1.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12852 | -| time_elapsed | 68727 | -| total_timesteps | 1645056 | -| train/ | | -| approx_kl | 0.038463473 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00993 | -| learning_rate | 0.0003 | -| loss | 0.0572 | -| n_updates | 128510 | -| policy_gradient_loss | 0.0491 | -| std | 0.0146 | -| value_loss | 1.71e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12853 | -| time_elapsed | 68731 | -| total_timesteps | 1645184 | -| train/ | | -| approx_kl | 0.0703135 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | 0.00595 | -| n_updates | 128520 | -| policy_gradient_loss | 0.00551 | -| std | 0.0146 | -| value_loss | 8.07e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12854 | -| time_elapsed | 68734 | -| total_timesteps | 1645312 | -| train/ | | -| approx_kl | 0.060126312 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00242 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 128530 | -| policy_gradient_loss | 0.00288 | -| std | 0.0146 | -| value_loss | 2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12855 | -| time_elapsed | 68737 | -| total_timesteps | 1645440 | -| train/ | | -| approx_kl | 0.04242765 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.000953 | -| learning_rate | 0.0003 | -| loss | 0.00265 | -| n_updates | 128540 | -| policy_gradient_loss | -0.000837 | -| std | 0.0146 | -| value_loss | 2.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12856 | -| time_elapsed | 68740 | -| total_timesteps | 1645568 | -| train/ | | -| approx_kl | 0.013431134 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.000976 | -| n_updates | 128550 | -| policy_gradient_loss | 0.0029 | -| std | 0.0146 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12857 | -| time_elapsed | 68742 | -| total_timesteps | 1645696 | -| train/ | | -| approx_kl | 0.029470453 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 128560 | -| policy_gradient_loss | 0.0102 | -| std | 0.0146 | -| value_loss | 7.73e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12858 | -| time_elapsed | 68745 | -| total_timesteps | 1645824 | -| train/ | | -| approx_kl | 0.04063802 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 128570 | -| policy_gradient_loss | 0.00934 | -| std | 0.0146 | -| value_loss | 1e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12859 | -| time_elapsed | 68748 | -| total_timesteps | 1645952 | -| train/ | | -| approx_kl | 0.0136521235 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.00377 | -| n_updates | 128580 | -| policy_gradient_loss | -4.93e-05 | -| std | 0.0146 | -| value_loss | 2.97e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12860 | -| time_elapsed | 68751 | -| total_timesteps | 1646080 | -| train/ | | -| approx_kl | 0.0032242131 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.00327 | -| learning_rate | 0.0003 | -| loss | -0.00631 | -| n_updates | 128590 | -| policy_gradient_loss | 0.00269 | -| std | 0.0146 | -| value_loss | 4.09e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12861 | -| time_elapsed | 68756 | -| total_timesteps | 1646208 | -| train/ | | -| approx_kl | 0.024335464 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 128600 | -| policy_gradient_loss | -0.0167 | -| std | 0.0146 | -| value_loss | 8.89e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12862 | -| time_elapsed | 68759 | -| total_timesteps | 1646336 | -| train/ | | -| approx_kl | 0.1563705 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.0732 | -| n_updates | 128610 | -| policy_gradient_loss | 0.0134 | -| std | 0.0146 | -| value_loss | 8.62e-08 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12863 | -| time_elapsed | 68762 | -| total_timesteps | 1646464 | -| train/ | | -| approx_kl | 4.4624787e-05 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 128620 | -| policy_gradient_loss | 0.00851 | -| std | 0.0146 | -| value_loss | 3.21e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12864 | -| time_elapsed | 68766 | -| total_timesteps | 1646592 | -| train/ | | -| approx_kl | 0.0015420909 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.000773 | -| learning_rate | 0.0003 | -| loss | 0.00091 | -| n_updates | 128630 | -| policy_gradient_loss | 0.044 | -| std | 0.0146 | -| value_loss | 1.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12865 | -| time_elapsed | 68769 | -| total_timesteps | 1646720 | -| train/ | | -| approx_kl | 0.020978132 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0028 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 128640 | -| policy_gradient_loss | -0.00749 | -| std | 0.0146 | -| value_loss | 1.82e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12866 | -| time_elapsed | 68772 | -| total_timesteps | 1646848 | -| train/ | | -| approx_kl | 0.00023074774 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00648 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 128650 | -| policy_gradient_loss | 0.00342 | -| std | 0.0145 | -| value_loss | 1.1e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 12867 | -| time_elapsed | 68775 | -| total_timesteps | 1646976 | -| train/ | | -| approx_kl | 0.014143808 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00534 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 128660 | -| policy_gradient_loss | -0.00194 | -| std | 0.0145 | -| value_loss | 5.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12868 | -| time_elapsed | 68779 | -| total_timesteps | 1647104 | -| train/ | | -| approx_kl | 0.04974508 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00852 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 128670 | -| policy_gradient_loss | 0.00354 | -| std | 0.0145 | -| value_loss | 5.3e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12869 | -| time_elapsed | 68787 | -| total_timesteps | 1647232 | -| train/ | | -| approx_kl | 0.0064528883 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | 0.782 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 128680 | -| policy_gradient_loss | -0.0165 | -| std | 0.0145 | -| value_loss | 0.00354 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12870 | -| time_elapsed | 68791 | -| total_timesteps | 1647360 | -| train/ | | -| approx_kl | 0.046944983 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.00475 | -| n_updates | 128690 | -| policy_gradient_loss | -0.00377 | -| std | 0.0145 | -| value_loss | 1.16e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12871 | -| time_elapsed | 68794 | -| total_timesteps | 1647488 | -| train/ | | -| approx_kl | 0.0340124 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -29.1 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 128700 | -| policy_gradient_loss | -0.0118 | -| std | 0.0145 | -| value_loss | 6.5e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12872 | -| time_elapsed | 68799 | -| total_timesteps | 1647616 | -| train/ | | -| approx_kl | 0.14553852 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | 0.0397 | -| n_updates | 128710 | -| policy_gradient_loss | 0.00794 | -| std | 0.0145 | -| value_loss | 5.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12873 | -| time_elapsed | 68803 | -| total_timesteps | 1647744 | -| train/ | | -| approx_kl | 0.008639445 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.814 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 128720 | -| policy_gradient_loss | -0.00125 | -| std | 0.0145 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12874 | -| time_elapsed | 68807 | -| total_timesteps | 1647872 | -| train/ | | -| approx_kl | 0.011613256 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | 1.21e-06 | -| n_updates | 128730 | -| policy_gradient_loss | -0.000248 | -| std | 0.0145 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12875 | -| time_elapsed | 68810 | -| total_timesteps | 1648000 | -| train/ | | -| approx_kl | 0.0018596095 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 128740 | -| policy_gradient_loss | 0.0005 | -| std | 0.0145 | -| value_loss | 5.54e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12876 | -| time_elapsed | 68814 | -| total_timesteps | 1648128 | -| train/ | | -| approx_kl | 0.012187385 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.00335 | -| learning_rate | 0.0003 | -| loss | 0.0032 | -| n_updates | 128750 | -| policy_gradient_loss | 0.00911 | -| std | 0.0145 | -| value_loss | 2.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12877 | -| time_elapsed | 68820 | -| total_timesteps | 1648256 | -| train/ | | -| approx_kl | 0.043799996 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 128760 | -| policy_gradient_loss | 0.0108 | -| std | 0.0145 | -| value_loss | 0.00126 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12878 | -| time_elapsed | 68823 | -| total_timesteps | 1648384 | -| train/ | | -| approx_kl | 0.018009419 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | 0.00522 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 128770 | -| policy_gradient_loss | 0.0128 | -| std | 0.0145 | -| value_loss | 2.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12879 | -| time_elapsed | 68827 | -| total_timesteps | 1648512 | -| train/ | | -| approx_kl | 0.005084626 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.00621 | -| learning_rate | 0.0003 | -| loss | 5.21e-05 | -| n_updates | 128780 | -| policy_gradient_loss | 0.0075 | -| std | 0.0145 | -| value_loss | 2.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12880 | -| time_elapsed | 68828 | -| total_timesteps | 1648640 | -| train/ | | -| approx_kl | 0.03392373 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 128790 | -| policy_gradient_loss | 0.0018 | -| std | 0.0145 | -| value_loss | 1.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12881 | -| time_elapsed | 68831 | -| total_timesteps | 1648768 | -| train/ | | -| approx_kl | 0.023261523 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 128800 | -| policy_gradient_loss | -0.00446 | -| std | 0.0145 | -| value_loss | 8.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12882 | -| time_elapsed | 68832 | -| total_timesteps | 1648896 | -| train/ | | -| approx_kl | 0.025403494 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 2.81 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 128810 | -| policy_gradient_loss | 0.00986 | -| std | 0.0145 | -| value_loss | 3.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12883 | -| time_elapsed | 68835 | -| total_timesteps | 1649024 | -| train/ | | -| approx_kl | 0.028789524 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | 0.00724 | -| n_updates | 128820 | -| policy_gradient_loss | 0.0121 | -| std | 0.0145 | -| value_loss | 1.9e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12884 | -| time_elapsed | 68843 | -| total_timesteps | 1649152 | -| train/ | | -| approx_kl | 0.13790353 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.00736 | -| n_updates | 128830 | -| policy_gradient_loss | -0.00996 | -| std | 0.0145 | -| value_loss | 0.000479 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12885 | -| time_elapsed | 68847 | -| total_timesteps | 1649280 | -| train/ | | -| approx_kl | 0.023522098 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | 0.00971 | -| n_updates | 128840 | -| policy_gradient_loss | 0.0128 | -| std | 0.0145 | -| value_loss | 1.63e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12886 | -| time_elapsed | 68850 | -| total_timesteps | 1649408 | -| train/ | | -| approx_kl | 0.0055172886 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.00144 | -| learning_rate | 0.0003 | -| loss | -0.000226 | -| n_updates | 128850 | -| policy_gradient_loss | 0.00729 | -| std | 0.0145 | -| value_loss | 2.21e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12887 | -| time_elapsed | 68854 | -| total_timesteps | 1649536 | -| train/ | | -| approx_kl | 0.011974434 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 128860 | -| policy_gradient_loss | 0.000496 | -| std | 0.0145 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12888 | -| time_elapsed | 68857 | -| total_timesteps | 1649664 | -| train/ | | -| approx_kl | 0.063604474 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 128870 | -| policy_gradient_loss | 0.0095 | -| std | 0.0145 | -| value_loss | 1.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12889 | -| time_elapsed | 68860 | -| total_timesteps | 1649792 | -| train/ | | -| approx_kl | 0.01187196 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | 0.00504 | -| n_updates | 128880 | -| policy_gradient_loss | 0.00575 | -| std | 0.0145 | -| value_loss | 8.36e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12890 | -| time_elapsed | 68865 | -| total_timesteps | 1649920 | -| train/ | | -| approx_kl | 0.02155543 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 128890 | -| policy_gradient_loss | 0.00602 | -| std | 0.0145 | -| value_loss | 5.73e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12891 | -| time_elapsed | 68869 | -| total_timesteps | 1650048 | -| train/ | | -| approx_kl | 0.03644105 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 128900 | -| policy_gradient_loss | 0.0194 | -| std | 0.0145 | -| value_loss | 4.32e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12892 | -| time_elapsed | 68874 | -| total_timesteps | 1650176 | -| train/ | | -| approx_kl | 0.5065208 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | 0.526 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 128910 | -| policy_gradient_loss | -0.016 | -| std | 0.0145 | -| value_loss | 0.000937 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12893 | -| time_elapsed | 68878 | -| total_timesteps | 1650304 | -| train/ | | -| approx_kl | 0.011936637 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -9.07 | -| learning_rate | 0.0003 | -| loss | 0.000505 | -| n_updates | 128920 | -| policy_gradient_loss | 0.00562 | -| std | 0.0144 | -| value_loss | 3.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12894 | -| time_elapsed | 68882 | -| total_timesteps | 1650432 | -| train/ | | -| approx_kl | 0.009623153 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -40.8 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 128930 | -| policy_gradient_loss | -0.00364 | -| std | 0.0144 | -| value_loss | 2.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12895 | -| time_elapsed | 68885 | -| total_timesteps | 1650560 | -| train/ | | -| approx_kl | 0.010319401 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -481 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 128940 | -| policy_gradient_loss | 0.00238 | -| std | 0.0144 | -| value_loss | 1.82e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12896 | -| time_elapsed | 68887 | -| total_timesteps | 1650688 | -| train/ | | -| approx_kl | 0.00084049813 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | 0.00052 | -| n_updates | 128950 | -| policy_gradient_loss | 0.00027 | -| std | 0.0144 | -| value_loss | 9.04e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12897 | -| time_elapsed | 68892 | -| total_timesteps | 1650816 | -| train/ | | -| approx_kl | 0.00027106144 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | -0.000599 | -| n_updates | 128960 | -| policy_gradient_loss | -0.000478 | -| std | 0.0144 | -| value_loss | 4.93e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 12898 | -| time_elapsed | 68896 | -| total_timesteps | 1650944 | -| train/ | | -| approx_kl | 0.01986594 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.000546 | -| learning_rate | 0.0003 | -| loss | -0.00712 | -| n_updates | 128970 | -| policy_gradient_loss | -0.00568 | -| std | 0.0144 | -| value_loss | 1.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12899 | -| time_elapsed | 68899 | -| total_timesteps | 1651072 | -| train/ | | -| approx_kl | 0.022626515 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 128980 | -| policy_gradient_loss | 0.00896 | -| std | 0.0144 | -| value_loss | 3.27e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12900 | -| time_elapsed | 68905 | -| total_timesteps | 1651200 | -| train/ | | -| approx_kl | 0.7453322 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.52 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 128990 | -| policy_gradient_loss | -0.0158 | -| std | 0.0144 | -| value_loss | 0.00153 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12901 | -| time_elapsed | 68908 | -| total_timesteps | 1651328 | -| train/ | | -| approx_kl | 0.00050217565 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -3.48e+03 | -| learning_rate | 0.0003 | -| loss | 0.00286 | -| n_updates | 129000 | -| policy_gradient_loss | -0.000515 | -| std | 0.0144 | -| value_loss | 7.72e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12902 | -| time_elapsed | 68912 | -| total_timesteps | 1651456 | -| train/ | | -| approx_kl | 0.0021661106 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | 0.00567 | -| n_updates | 129010 | -| policy_gradient_loss | 0.00824 | -| std | 0.0144 | -| value_loss | 2.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12903 | -| time_elapsed | 68916 | -| total_timesteps | 1651584 | -| train/ | | -| approx_kl | 0.043703225 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 129020 | -| policy_gradient_loss | 0.00249 | -| std | 0.0144 | -| value_loss | 1.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12904 | -| time_elapsed | 68919 | -| total_timesteps | 1651712 | -| train/ | | -| approx_kl | 0.04206332 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 129030 | -| policy_gradient_loss | 0.0172 | -| std | 0.0144 | -| value_loss | 3.52e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12905 | -| time_elapsed | 68922 | -| total_timesteps | 1651840 | -| train/ | | -| approx_kl | 0.031352393 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.82 | -| explained_variance | -0.00512 | -| learning_rate | 0.0003 | -| loss | 0.000796 | -| n_updates | 129040 | -| policy_gradient_loss | -0.000245 | -| std | 0.0143 | -| value_loss | 1.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 12906 | -| time_elapsed | 68925 | -| total_timesteps | 1651968 | -| train/ | | -| approx_kl | 0.011361321 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.00193 | -| learning_rate | 0.0003 | -| loss | -0.000972 | -| n_updates | 129050 | -| policy_gradient_loss | -0.0017 | -| std | 0.0143 | -| value_loss | 1.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12907 | -| time_elapsed | 68929 | -| total_timesteps | 1652096 | -| train/ | | -| approx_kl | 0.039225392 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.00334 | -| n_updates | 129060 | -| policy_gradient_loss | -0.000402 | -| std | 0.0143 | -| value_loss | 7.47e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12908 | -| time_elapsed | 68937 | -| total_timesteps | 1652224 | -| train/ | | -| approx_kl | 0.29072213 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 129070 | -| policy_gradient_loss | -0.0133 | -| std | 0.0143 | -| value_loss | 0.000418 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12909 | -| time_elapsed | 68940 | -| total_timesteps | 1652352 | -| train/ | | -| approx_kl | 0.0113583235 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -22.6 | -| learning_rate | 0.0003 | -| loss | -0.00887 | -| n_updates | 129080 | -| policy_gradient_loss | -0.00357 | -| std | 0.0143 | -| value_loss | 1.25e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12910 | -| time_elapsed | 68943 | -| total_timesteps | 1652480 | -| train/ | | -| approx_kl | 0.0065784696 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -38.9 | -| learning_rate | 0.0003 | -| loss | 0.00824 | -| n_updates | 129090 | -| policy_gradient_loss | 0.000641 | -| std | 0.0143 | -| value_loss | 6.8e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12911 | -| time_elapsed | 68946 | -| total_timesteps | 1652608 | -| train/ | | -| approx_kl | 2.9788818e-05 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -8.24 | -| learning_rate | 0.0003 | -| loss | -0.000221 | -| n_updates | 129100 | -| policy_gradient_loss | -0.000467 | -| std | 0.0143 | -| value_loss | 1.16e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12912 | -| time_elapsed | 68948 | -| total_timesteps | 1652736 | -| train/ | | -| approx_kl | 0.019736432 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 129110 | -| policy_gradient_loss | 0.00484 | -| std | 0.0143 | -| value_loss | 5.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12913 | -| time_elapsed | 68952 | -| total_timesteps | 1652864 | -| train/ | | -| approx_kl | 0.018097121 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 129120 | -| policy_gradient_loss | -0.000967 | -| std | 0.0143 | -| value_loss | 7.13e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 12914 | -| time_elapsed | 68956 | -| total_timesteps | 1652992 | -| train/ | | -| approx_kl | 0.024903875 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 129130 | -| policy_gradient_loss | 0.0414 | -| std | 0.0143 | -| value_loss | 4.29e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12915 | -| time_elapsed | 68959 | -| total_timesteps | 1653120 | -| train/ | | -| approx_kl | 0.0050270124 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 129140 | -| policy_gradient_loss | 0.00277 | -| std | 0.0143 | -| value_loss | 2.75e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12916 | -| time_elapsed | 68968 | -| total_timesteps | 1653248 | -| train/ | | -| approx_kl | 0.12507236 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 129150 | -| policy_gradient_loss | -0.0169 | -| std | 0.0143 | -| value_loss | 0.000249 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12917 | -| time_elapsed | 68972 | -| total_timesteps | 1653376 | -| train/ | | -| approx_kl | 0.12336152 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -1.18e+03 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 129160 | -| policy_gradient_loss | -0.00381 | -| std | 0.0142 | -| value_loss | 1.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12918 | -| time_elapsed | 68975 | -| total_timesteps | 1653504 | -| train/ | | -| approx_kl | 0.006798461 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -750 | -| learning_rate | 0.0003 | -| loss | -0.00628 | -| n_updates | 129170 | -| policy_gradient_loss | 0.000359 | -| std | 0.0142 | -| value_loss | 5.97e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12919 | -| time_elapsed | 68979 | -| total_timesteps | 1653632 | -| train/ | | -| approx_kl | 0.06919653 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -428 | -| learning_rate | 0.0003 | -| loss | 0.0497 | -| n_updates | 129180 | -| policy_gradient_loss | 0.0076 | -| std | 0.0142 | -| value_loss | 8.74e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12920 | -| time_elapsed | 68984 | -| total_timesteps | 1653760 | -| train/ | | -| approx_kl | 0.0049735657 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -1.57e+04 | -| learning_rate | 0.0003 | -| loss | 0.00557 | -| n_updates | 129190 | -| policy_gradient_loss | -0.000147 | -| std | 0.0142 | -| value_loss | 7.57e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12921 | -| time_elapsed | 68988 | -| total_timesteps | 1653888 | -| train/ | | -| approx_kl | 0.015113499 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -7.05e+03 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 129200 | -| policy_gradient_loss | 7.81e-05 | -| std | 0.0142 | -| value_loss | 8e-12 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12922 | -| time_elapsed | 68992 | -| total_timesteps | 1654016 | -| train/ | | -| approx_kl | 0.00047848234 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -449 | -| learning_rate | 0.0003 | -| loss | 0.00627 | -| n_updates | 129210 | -| policy_gradient_loss | -0.00579 | -| std | 0.0142 | -| value_loss | 9.19e-13 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12923 | -| time_elapsed | 69000 | -| total_timesteps | 1654144 | -| train/ | | -| approx_kl | 0.011446899 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.00911 | -| n_updates | 129220 | -| policy_gradient_loss | 0.00684 | -| std | 0.0142 | -| value_loss | 5.06e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12924 | -| time_elapsed | 69003 | -| total_timesteps | 1654272 | -| train/ | | -| approx_kl | 0.00712809 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.000326 | -| learning_rate | 0.0003 | -| loss | 0.00963 | -| n_updates | 129230 | -| policy_gradient_loss | 0.000741 | -| std | 0.0142 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12925 | -| time_elapsed | 69008 | -| total_timesteps | 1654400 | -| train/ | | -| approx_kl | 0.09391774 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.000291 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 129240 | -| policy_gradient_loss | 0.00337 | -| std | 0.0142 | -| value_loss | 2.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12926 | -| time_elapsed | 69011 | -| total_timesteps | 1654528 | -| train/ | | -| approx_kl | 0.014132181 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 129250 | -| policy_gradient_loss | 0.00951 | -| std | 0.0142 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12927 | -| time_elapsed | 69014 | -| total_timesteps | 1654656 | -| train/ | | -| approx_kl | 0.047256805 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 129260 | -| policy_gradient_loss | 0.00356 | -| std | 0.0142 | -| value_loss | 1.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12928 | -| time_elapsed | 69018 | -| total_timesteps | 1654784 | -| train/ | | -| approx_kl | 0.033937745 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.00638 | -| n_updates | 129270 | -| policy_gradient_loss | 0.0165 | -| std | 0.0142 | -| value_loss | 1.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12929 | -| time_elapsed | 69022 | -| total_timesteps | 1654912 | -| train/ | | -| approx_kl | 0.021676078 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.00629 | -| n_updates | 129280 | -| policy_gradient_loss | 0.00176 | -| std | 0.0142 | -| value_loss | 1.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12930 | -| time_elapsed | 69025 | -| total_timesteps | 1655040 | -| train/ | | -| approx_kl | 0.015558243 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 129290 | -| policy_gradient_loss | -0.01 | -| std | 0.0142 | -| value_loss | 2.85e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12931 | -| time_elapsed | 69033 | -| total_timesteps | 1655168 | -| train/ | | -| approx_kl | 0.0901859 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.663 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 129300 | -| policy_gradient_loss | -0.00109 | -| std | 0.0142 | -| value_loss | 0.00112 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12932 | -| time_elapsed | 69036 | -| total_timesteps | 1655296 | -| train/ | | -| approx_kl | 0.004647178 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.00868 | -| n_updates | 129310 | -| policy_gradient_loss | 0.00492 | -| std | 0.0142 | -| value_loss | 7.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12933 | -| time_elapsed | 69039 | -| total_timesteps | 1655424 | -| train/ | | -| approx_kl | 0.008073483 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.00354 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 129320 | -| policy_gradient_loss | -0.000475 | -| std | 0.0142 | -| value_loss | 6.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12934 | -| time_elapsed | 69043 | -| total_timesteps | 1655552 | -| train/ | | -| approx_kl | 0.025483625 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.00926 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 129330 | -| policy_gradient_loss | 0.0149 | -| std | 0.0141 | -| value_loss | 3.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12935 | -| time_elapsed | 69046 | -| total_timesteps | 1655680 | -| train/ | | -| approx_kl | 0.03393505 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 129340 | -| policy_gradient_loss | 0.0167 | -| std | 0.0141 | -| value_loss | 2.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12936 | -| time_elapsed | 69049 | -| total_timesteps | 1655808 | -| train/ | | -| approx_kl | 0.05394336 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 129350 | -| policy_gradient_loss | 0.00537 | -| std | 0.0141 | -| value_loss | 1.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 12937 | -| time_elapsed | 69052 | -| total_timesteps | 1655936 | -| train/ | | -| approx_kl | 0.028182773 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.00993 | -| n_updates | 129360 | -| policy_gradient_loss | 0.0015 | -| std | 0.0141 | -| value_loss | 1.33e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12938 | -| time_elapsed | 69054 | -| total_timesteps | 1656064 | -| train/ | | -| approx_kl | 1.8873252e-06 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.00997 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 129370 | -| policy_gradient_loss | 0.0275 | -| std | 0.0141 | -| value_loss | 1.85e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12939 | -| time_elapsed | 69060 | -| total_timesteps | 1656192 | -| train/ | | -| approx_kl | 0.4509374 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | 0.00429 | -| n_updates | 129380 | -| policy_gradient_loss | -0.00606 | -| std | 0.0141 | -| value_loss | 0.00147 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12940 | -| time_elapsed | 69064 | -| total_timesteps | 1656320 | -| train/ | | -| approx_kl | 0.007982032 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.714 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 129390 | -| policy_gradient_loss | 0.00629 | -| std | 0.0141 | -| value_loss | 6.68e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12941 | -| time_elapsed | 69067 | -| total_timesteps | 1656448 | -| train/ | | -| approx_kl | 0.030422458 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.4 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 129400 | -| policy_gradient_loss | 0.00792 | -| std | 0.0141 | -| value_loss | 1.86e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12942 | -| time_elapsed | 69072 | -| total_timesteps | 1656576 | -| train/ | | -| approx_kl | 0.0050916923 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.233 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 129410 | -| policy_gradient_loss | -0.0058 | -| std | 0.0141 | -| value_loss | 1.33e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12943 | -| time_elapsed | 69076 | -| total_timesteps | 1656704 | -| train/ | | -| approx_kl | 0.05485929 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0717 | -| learning_rate | 0.0003 | -| loss | 0.00306 | -| n_updates | 129420 | -| policy_gradient_loss | -0.00185 | -| std | 0.0141 | -| value_loss | 9.26e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12944 | -| time_elapsed | 69080 | -| total_timesteps | 1656832 | -| train/ | | -| approx_kl | 0.01893477 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 129430 | -| policy_gradient_loss | 0.00393 | -| std | 0.0141 | -| value_loss | 6.03e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 12945 | -| time_elapsed | 69082 | -| total_timesteps | 1656960 | -| train/ | | -| approx_kl | 0.028314805 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 129440 | -| policy_gradient_loss | 0.00973 | -| std | 0.0141 | -| value_loss | 9e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12946 | -| time_elapsed | 69086 | -| total_timesteps | 1657088 | -| train/ | | -| approx_kl | 0.01783994 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0085 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 129450 | -| policy_gradient_loss | -0.000403 | -| std | 0.0141 | -| value_loss | 3.39e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12947 | -| time_elapsed | 69095 | -| total_timesteps | 1657216 | -| train/ | | -| approx_kl | 0.0055698375 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.953 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 129460 | -| policy_gradient_loss | -0.0031 | -| std | 0.0141 | -| value_loss | 0.000317 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12948 | -| time_elapsed | 69098 | -| total_timesteps | 1657344 | -| train/ | | -| approx_kl | 0.08519727 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.00649 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 129470 | -| policy_gradient_loss | 0.00803 | -| std | 0.0141 | -| value_loss | 3.08e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12949 | -| time_elapsed | 69101 | -| total_timesteps | 1657472 | -| train/ | | -| approx_kl | 8.391822e-05 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 129480 | -| policy_gradient_loss | -0.00355 | -| std | 0.0141 | -| value_loss | 5.18e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12950 | -| time_elapsed | 69105 | -| total_timesteps | 1657600 | -| train/ | | -| approx_kl | 0.013616159 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 129490 | -| policy_gradient_loss | 0.013 | -| std | 0.0141 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12951 | -| time_elapsed | 69109 | -| total_timesteps | 1657728 | -| train/ | | -| approx_kl | 0.003986268 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.00801 | -| n_updates | 129500 | -| policy_gradient_loss | -0.00101 | -| std | 0.0141 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12952 | -| time_elapsed | 69111 | -| total_timesteps | 1657856 | -| train/ | | -| approx_kl | 0.012097647 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 129510 | -| policy_gradient_loss | 0.00389 | -| std | 0.0141 | -| value_loss | 8.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 12953 | -| time_elapsed | 69115 | -| total_timesteps | 1657984 | -| train/ | | -| approx_kl | 0.033061203 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 129520 | -| policy_gradient_loss | -0.0033 | -| std | 0.0141 | -| value_loss | 7.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12954 | -| time_elapsed | 69118 | -| total_timesteps | 1658112 | -| train/ | | -| approx_kl | 0.040497925 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | 0.00783 | -| n_updates | 129530 | -| policy_gradient_loss | 0.0152 | -| std | 0.0141 | -| value_loss | 6.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12955 | -| time_elapsed | 69126 | -| total_timesteps | 1658240 | -| train/ | | -| approx_kl | 0.026906522 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 129540 | -| policy_gradient_loss | -0.0151 | -| std | 0.0141 | -| value_loss | 0.00279 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12956 | -| time_elapsed | 69130 | -| total_timesteps | 1658368 | -| train/ | | -| approx_kl | 0.0057597496 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.541 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 129550 | -| policy_gradient_loss | 0.00187 | -| std | 0.0141 | -| value_loss | 1.08e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12957 | -| time_elapsed | 69133 | -| total_timesteps | 1658496 | -| train/ | | -| approx_kl | 0.049309812 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -1.54 | -| learning_rate | 0.0003 | -| loss | -0.000974 | -| n_updates | 129560 | -| policy_gradient_loss | 0.00225 | -| std | 0.0141 | -| value_loss | 8e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12958 | -| time_elapsed | 69137 | -| total_timesteps | 1658624 | -| train/ | | -| approx_kl | 0.0034934264 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | -0.000232 | -| n_updates | 129570 | -| policy_gradient_loss | 0.00888 | -| std | 0.0141 | -| value_loss | 3.43e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12959 | -| time_elapsed | 69141 | -| total_timesteps | 1658752 | -| train/ | | -| approx_kl | 0.036080565 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 129580 | -| policy_gradient_loss | 0.00347 | -| std | 0.014 | -| value_loss | 3.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 12960 | -| time_elapsed | 69143 | -| total_timesteps | 1658880 | -| train/ | | -| approx_kl | 0.017922897 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.00696 | -| n_updates | 129590 | -| policy_gradient_loss | 0.00416 | -| std | 0.014 | -| value_loss | 3.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12961 | -| time_elapsed | 69147 | -| total_timesteps | 1659008 | -| train/ | | -| approx_kl | 0.028246328 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.00389 | -| learning_rate | 0.0003 | -| loss | 0.0057 | -| n_updates | 129600 | -| policy_gradient_loss | 0.00573 | -| std | 0.014 | -| value_loss | 2.35e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12962 | -| time_elapsed | 69156 | -| total_timesteps | 1659136 | -| train/ | | -| approx_kl | 0.12537095 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 129610 | -| policy_gradient_loss | -0.0143 | -| std | 0.014 | -| value_loss | 0.00391 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12963 | -| time_elapsed | 69160 | -| total_timesteps | 1659264 | -| train/ | | -| approx_kl | 0.0012863604 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.0341 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 129620 | -| policy_gradient_loss | -0.00437 | -| std | 0.014 | -| value_loss | 0.00128 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12964 | -| time_elapsed | 69164 | -| total_timesteps | 1659392 | -| train/ | | -| approx_kl | 2.1568034e-05 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.000522 | -| n_updates | 129630 | -| policy_gradient_loss | -0.00269 | -| std | 0.014 | -| value_loss | 2.53e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12965 | -| time_elapsed | 69167 | -| total_timesteps | 1659520 | -| train/ | | -| approx_kl | 0.016955707 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.00864 | -| n_updates | 129640 | -| policy_gradient_loss | 0.0186 | -| std | 0.014 | -| value_loss | 3.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12966 | -| time_elapsed | 69170 | -| total_timesteps | 1659648 | -| train/ | | -| approx_kl | 0.003681798 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.00842 | -| n_updates | 129650 | -| policy_gradient_loss | -0.003 | -| std | 0.0141 | -| value_loss | 2.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12967 | -| time_elapsed | 69173 | -| total_timesteps | 1659776 | -| train/ | | -| approx_kl | 0.027112292 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 129660 | -| policy_gradient_loss | 0.0116 | -| std | 0.0141 | -| value_loss | 1.57e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 12968 | -| time_elapsed | 69177 | -| total_timesteps | 1659904 | -| train/ | | -| approx_kl | 0.03974827 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.00256 | -| n_updates | 129670 | -| policy_gradient_loss | 0.0017 | -| std | 0.0141 | -| value_loss | 1.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12969 | -| time_elapsed | 69180 | -| total_timesteps | 1660032 | -| train/ | | -| approx_kl | 0.068229444 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | 0.0374 | -| n_updates | 129680 | -| policy_gradient_loss | 0.0126 | -| std | 0.0141 | -| value_loss | 9.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12970 | -| time_elapsed | 69190 | -| total_timesteps | 1660160 | -| train/ | | -| approx_kl | 0.04315271 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 129690 | -| policy_gradient_loss | -0.0128 | -| std | 0.0141 | -| value_loss | 0.000373 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12971 | -| time_elapsed | 69193 | -| total_timesteps | 1660288 | -| train/ | | -| approx_kl | 0.005626184 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.0439 | -| learning_rate | 0.0003 | -| loss | -0.00629 | -| n_updates | 129700 | -| policy_gradient_loss | 0.00017 | -| std | 0.0141 | -| value_loss | 8.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12972 | -| time_elapsed | 69196 | -| total_timesteps | 1660416 | -| train/ | | -| approx_kl | 0.026375575 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 129710 | -| policy_gradient_loss | 0.00635 | -| std | 0.0141 | -| value_loss | 3.71e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12973 | -| time_elapsed | 69200 | -| total_timesteps | 1660544 | -| train/ | | -| approx_kl | 0.0074615264 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 129720 | -| policy_gradient_loss | -0.00433 | -| std | 0.0141 | -| value_loss | 2.85e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12974 | -| time_elapsed | 69203 | -| total_timesteps | 1660672 | -| train/ | | -| approx_kl | 0.1727925 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.0762 | -| n_updates | 129730 | -| policy_gradient_loss | 0.0157 | -| std | 0.0141 | -| value_loss | 1.98e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12975 | -| time_elapsed | 69206 | -| total_timesteps | 1660800 | -| train/ | | -| approx_kl | 0.026673615 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 129740 | -| policy_gradient_loss | 0.0173 | -| std | 0.0141 | -| value_loss | 4.43e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 12976 | -| time_elapsed | 69208 | -| total_timesteps | 1660928 | -| train/ | | -| approx_kl | 0.0041530803 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 129750 | -| policy_gradient_loss | 0.0314 | -| std | 0.0141 | -| value_loss | 2.96e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12977 | -| time_elapsed | 69212 | -| total_timesteps | 1661056 | -| train/ | | -| approx_kl | 0.007868533 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 129760 | -| policy_gradient_loss | 0.0273 | -| std | 0.0141 | -| value_loss | 1.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12978 | -| time_elapsed | 69217 | -| total_timesteps | 1661184 | -| train/ | | -| approx_kl | 0.015242864 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.781 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 129770 | -| policy_gradient_loss | -0.0139 | -| std | 0.0141 | -| value_loss | 0.00419 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 12979 | -| time_elapsed | 69222 | -| total_timesteps | 1661312 | -| train/ | | -| approx_kl | 0.022348315 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -4.12 | -| learning_rate | 0.0003 | -| loss | 0.000258 | -| n_updates | 129780 | -| policy_gradient_loss | -0.000323 | -| std | 0.0141 | -| value_loss | 3.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 12980 | -| time_elapsed | 69225 | -| total_timesteps | 1661440 | -| train/ | | -| approx_kl | 2.058642e-05 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -8.99 | -| learning_rate | 0.0003 | -| loss | 0.000955 | -| n_updates | 129790 | -| policy_gradient_loss | -0.00598 | -| std | 0.0141 | -| value_loss | 1.07e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 12981 | -| time_elapsed | 69229 | -| total_timesteps | 1661568 | -| train/ | | -| approx_kl | 0.020882871 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 129800 | -| policy_gradient_loss | 0.00905 | -| std | 0.0141 | -| value_loss | 7.65e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 12982 | -| time_elapsed | 69232 | -| total_timesteps | 1661696 | -| train/ | | -| approx_kl | 0.00020245183 | -| clip_fraction | 0.0531 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | 0.000513 | -| n_updates | 129810 | -| policy_gradient_loss | 0.000462 | -| std | 0.0141 | -| value_loss | 4.35e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 12983 | -| time_elapsed | 69235 | -| total_timesteps | 1661824 | -| train/ | | -| approx_kl | 0.0063319206 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00258 | -| n_updates | 129820 | -| policy_gradient_loss | 0.0121 | -| std | 0.0141 | -| value_loss | 1.52e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 12984 | -| time_elapsed | 69237 | -| total_timesteps | 1661952 | -| train/ | | -| approx_kl | 0.021397233 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.00831 | -| learning_rate | 0.0003 | -| loss | -0.00636 | -| n_updates | 129830 | -| policy_gradient_loss | 0.0117 | -| std | 0.0142 | -| value_loss | 1.21e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12985 | -| time_elapsed | 69241 | -| total_timesteps | 1662080 | -| train/ | | -| approx_kl | 0.04871442 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.00394 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 129840 | -| policy_gradient_loss | 0.0109 | -| std | 0.0142 | -| value_loss | 7.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12986 | -| time_elapsed | 69247 | -| total_timesteps | 1662208 | -| train/ | | -| approx_kl | 0.016007952 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 129850 | -| policy_gradient_loss | -0.0203 | -| std | 0.0142 | -| value_loss | 0.000459 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12987 | -| time_elapsed | 69250 | -| total_timesteps | 1662336 | -| train/ | | -| approx_kl | 0.012669383 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.00229 | -| learning_rate | 0.0003 | -| loss | 0.00424 | -| n_updates | 129860 | -| policy_gradient_loss | 0.0124 | -| std | 0.0142 | -| value_loss | 1.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12988 | -| time_elapsed | 69253 | -| total_timesteps | 1662464 | -| train/ | | -| approx_kl | 0.006747147 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 129870 | -| policy_gradient_loss | 0.0204 | -| std | 0.0142 | -| value_loss | 3.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12989 | -| time_elapsed | 69257 | -| total_timesteps | 1662592 | -| train/ | | -| approx_kl | 0.007938188 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 129880 | -| policy_gradient_loss | 0.000224 | -| std | 0.0142 | -| value_loss | 3.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12990 | -| time_elapsed | 69261 | -| total_timesteps | 1662720 | -| train/ | | -| approx_kl | 0.01827959 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 129890 | -| policy_gradient_loss | 0.0364 | -| std | 0.0142 | -| value_loss | 1.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12991 | -| time_elapsed | 69264 | -| total_timesteps | 1662848 | -| train/ | | -| approx_kl | 0.03553202 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 129900 | -| policy_gradient_loss | -0.00533 | -| std | 0.0142 | -| value_loss | 1.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 12992 | -| time_elapsed | 69266 | -| total_timesteps | 1662976 | -| train/ | | -| approx_kl | 0.03277332 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 129910 | -| policy_gradient_loss | 0.00138 | -| std | 0.0142 | -| value_loss | 8.5e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12993 | -| time_elapsed | 69270 | -| total_timesteps | 1663104 | -| train/ | | -| approx_kl | 0.0044180877 | -| clip_fraction | 0.0453 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.000687 | -| n_updates | 129920 | -| policy_gradient_loss | 0.000191 | -| std | 0.0142 | -| value_loss | 5.96e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12994 | -| time_elapsed | 69277 | -| total_timesteps | 1663232 | -| train/ | | -| approx_kl | 0.13673943 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.395 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 129930 | -| policy_gradient_loss | -0.0162 | -| std | 0.0142 | -| value_loss | 0.00131 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12995 | -| time_elapsed | 69281 | -| total_timesteps | 1663360 | -| train/ | | -| approx_kl | 0.0022887974 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.739 | -| learning_rate | 0.0003 | -| loss | -0.000463 | -| n_updates | 129940 | -| policy_gradient_loss | 0.0322 | -| std | 0.0142 | -| value_loss | 1.07e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12996 | -| time_elapsed | 69284 | -| total_timesteps | 1663488 | -| train/ | | -| approx_kl | 0.019223021 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.44 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 129950 | -| policy_gradient_loss | 0.0186 | -| std | 0.0143 | -| value_loss | 7.99e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12997 | -| time_elapsed | 69287 | -| total_timesteps | 1663616 | -| train/ | | -| approx_kl | 0.00016985787 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 129960 | -| policy_gradient_loss | 0.00608 | -| std | 0.0143 | -| value_loss | 1.5e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12998 | -| time_elapsed | 69290 | -| total_timesteps | 1663744 | -| train/ | | -| approx_kl | 0.047241315 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.00622 | -| learning_rate | 0.0003 | -| loss | 0.05 | -| n_updates | 129970 | -| policy_gradient_loss | 0.0379 | -| std | 0.0143 | -| value_loss | 5.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 24 | -| iterations | 12999 | -| time_elapsed | 69293 | -| total_timesteps | 1663872 | -| train/ | | -| approx_kl | 0.034586936 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.055 | -| n_updates | 129980 | -| policy_gradient_loss | 0.0357 | -| std | 0.0143 | -| value_loss | 5.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13000 | -| time_elapsed | 69297 | -| total_timesteps | 1664000 | -| train/ | | -| approx_kl | 0.006700036 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 129990 | -| policy_gradient_loss | 0.00269 | -| std | 0.0143 | -| value_loss | 3.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13001 | -| time_elapsed | 69301 | -| total_timesteps | 1664128 | -| train/ | | -| approx_kl | 0.01221445 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.00279 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 130000 | -| policy_gradient_loss | 0.00593 | -| std | 0.0143 | -| value_loss | 1.61e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13002 | -| time_elapsed | 69307 | -| total_timesteps | 1664256 | -| train/ | | -| approx_kl | 0.2681118 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 130010 | -| policy_gradient_loss | -0.0153 | -| std | 0.0143 | -| value_loss | 0.001 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13003 | -| time_elapsed | 69311 | -| total_timesteps | 1664384 | -| train/ | | -| approx_kl | 0.049059346 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.00867 | -| learning_rate | 0.0003 | -| loss | 0.00341 | -| n_updates | 130020 | -| policy_gradient_loss | 0.00666 | -| std | 0.0143 | -| value_loss | 3.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13004 | -| time_elapsed | 69315 | -| total_timesteps | 1664512 | -| train/ | | -| approx_kl | 0.035992697 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 130030 | -| policy_gradient_loss | 0.00682 | -| std | 0.0143 | -| value_loss | 3.19e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13005 | -| time_elapsed | 69318 | -| total_timesteps | 1664640 | -| train/ | | -| approx_kl | 0.085490845 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.0801 | -| n_updates | 130040 | -| policy_gradient_loss | 0.0524 | -| std | 0.0143 | -| value_loss | 3.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13006 | -| time_elapsed | 69322 | -| total_timesteps | 1664768 | -| train/ | | -| approx_kl | 0.042962704 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.0456 | -| n_updates | 130050 | -| policy_gradient_loss | 0.0374 | -| std | 0.0143 | -| value_loss | 1.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13007 | -| time_elapsed | 69325 | -| total_timesteps | 1664896 | -| train/ | | -| approx_kl | 0.00688771 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 130060 | -| policy_gradient_loss | 0.00505 | -| std | 0.0143 | -| value_loss | 3.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13008 | -| time_elapsed | 69328 | -| total_timesteps | 1665024 | -| train/ | | -| approx_kl | 0.009798771 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00774 | -| n_updates | 130070 | -| policy_gradient_loss | -0.00296 | -| std | 0.0143 | -| value_loss | 9.37e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13009 | -| time_elapsed | 69336 | -| total_timesteps | 1665152 | -| train/ | | -| approx_kl | 0.2338619 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 130080 | -| policy_gradient_loss | -0.0169 | -| std | 0.0143 | -| value_loss | 0.000368 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13010 | -| time_elapsed | 69340 | -| total_timesteps | 1665280 | -| train/ | | -| approx_kl | 0.0525778 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.947 | -| learning_rate | 0.0003 | -| loss | 0.0344 | -| n_updates | 130090 | -| policy_gradient_loss | 0.0249 | -| std | 0.0143 | -| value_loss | 1.32e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13011 | -| time_elapsed | 69344 | -| total_timesteps | 1665408 | -| train/ | | -| approx_kl | 0.0057422174 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -6.56 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 130100 | -| policy_gradient_loss | -0.000892 | -| std | 0.0143 | -| value_loss | 8.29e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13012 | -| time_elapsed | 69348 | -| total_timesteps | 1665536 | -| train/ | | -| approx_kl | 0.018599728 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.784 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 130110 | -| policy_gradient_loss | 0.0139 | -| std | 0.0143 | -| value_loss | 2.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13013 | -| time_elapsed | 69351 | -| total_timesteps | 1665664 | -| train/ | | -| approx_kl | 0.006307712 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | 0.00169 | -| n_updates | 130120 | -| policy_gradient_loss | 0.00781 | -| std | 0.0143 | -| value_loss | 2.04e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13014 | -| time_elapsed | 69355 | -| total_timesteps | 1665792 | -| train/ | | -| approx_kl | 0.0059199724 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.00126 | -| learning_rate | 0.0003 | -| loss | -0.000727 | -| n_updates | 130130 | -| policy_gradient_loss | 0.0146 | -| std | 0.0143 | -| value_loss | 9.42e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13015 | -| time_elapsed | 69359 | -| total_timesteps | 1665920 | -| train/ | | -| approx_kl | 0.009440168 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.00343 | -| learning_rate | 0.0003 | -| loss | -0.00994 | -| n_updates | 130140 | -| policy_gradient_loss | -0.00392 | -| std | 0.0143 | -| value_loss | 6.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13016 | -| time_elapsed | 69361 | -| total_timesteps | 1666048 | -| train/ | | -| approx_kl | 0.016709024 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.0096 | -| n_updates | 130150 | -| policy_gradient_loss | -0.00256 | -| std | 0.0143 | -| value_loss | 3.57e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13017 | -| time_elapsed | 69368 | -| total_timesteps | 1666176 | -| train/ | | -| approx_kl | 0.0037886435 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.000291 | -| n_updates | 130160 | -| policy_gradient_loss | 0.0198 | -| std | 0.0143 | -| value_loss | 0.00114 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13018 | -| time_elapsed | 69371 | -| total_timesteps | 1666304 | -| train/ | | -| approx_kl | 0.07589303 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 130170 | -| policy_gradient_loss | -0.000127 | -| std | 0.0143 | -| value_loss | 4.72e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13019 | -| time_elapsed | 69374 | -| total_timesteps | 1666432 | -| train/ | | -| approx_kl | 0.060571883 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 130180 | -| policy_gradient_loss | 0.00884 | -| std | 0.0143 | -| value_loss | 5.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13020 | -| time_elapsed | 69377 | -| total_timesteps | 1666560 | -| train/ | | -| approx_kl | 0.056722857 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -9.03 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 130190 | -| policy_gradient_loss | -0.00299 | -| std | 0.0143 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13021 | -| time_elapsed | 69380 | -| total_timesteps | 1666688 | -| train/ | | -| approx_kl | 0.020591598 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0696 | -| learning_rate | 0.0003 | -| loss | 0.00778 | -| n_updates | 130200 | -| policy_gradient_loss | 0.00889 | -| std | 0.0143 | -| value_loss | 1.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13022 | -| time_elapsed | 69383 | -| total_timesteps | 1666816 | -| train/ | | -| approx_kl | 0.032570202 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.00912 | -| n_updates | 130210 | -| policy_gradient_loss | 0.00451 | -| std | 0.0143 | -| value_loss | 7.41e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13023 | -| time_elapsed | 69388 | -| total_timesteps | 1666944 | -| train/ | | -| approx_kl | 0.0005870443 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.000454 | -| n_updates | 130220 | -| policy_gradient_loss | 0.00626 | -| std | 0.0143 | -| value_loss | 2.08e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13024 | -| time_elapsed | 69391 | -| total_timesteps | 1667072 | -| train/ | | -| approx_kl | 0.005324871 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 130230 | -| policy_gradient_loss | 0.00225 | -| std | 0.0142 | -| value_loss | 1.5e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13025 | -| time_elapsed | 69396 | -| total_timesteps | 1667200 | -| train/ | | -| approx_kl | 0.0024966188 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.831 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 130240 | -| policy_gradient_loss | -0.00522 | -| std | 0.0142 | -| value_loss | 0.00309 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13026 | -| time_elapsed | 69400 | -| total_timesteps | 1667328 | -| train/ | | -| approx_kl | 0.07510095 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.00913 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 130250 | -| policy_gradient_loss | 0.00692 | -| std | 0.0142 | -| value_loss | 3.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13027 | -| time_elapsed | 69404 | -| total_timesteps | 1667456 | -| train/ | | -| approx_kl | 0.021029936 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 130260 | -| policy_gradient_loss | 0.00616 | -| std | 0.0142 | -| value_loss | 4.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13028 | -| time_elapsed | 69407 | -| total_timesteps | 1667584 | -| train/ | | -| approx_kl | 0.009627519 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0858 | -| learning_rate | 0.0003 | -| loss | -0.00358 | -| n_updates | 130270 | -| policy_gradient_loss | 0.00358 | -| std | 0.0142 | -| value_loss | 2.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13029 | -| time_elapsed | 69410 | -| total_timesteps | 1667712 | -| train/ | | -| approx_kl | 0.03923227 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 130280 | -| policy_gradient_loss | 0.0123 | -| std | 0.0142 | -| value_loss | 1.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13030 | -| time_elapsed | 69414 | -| total_timesteps | 1667840 | -| train/ | | -| approx_kl | 0.038317595 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 130290 | -| policy_gradient_loss | -0.00207 | -| std | 0.0142 | -| value_loss | 1.36e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13031 | -| time_elapsed | 69417 | -| total_timesteps | 1667968 | -| train/ | | -| approx_kl | 0.1675587 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 130300 | -| policy_gradient_loss | 0.0207 | -| std | 0.0142 | -| value_loss | 4.54e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13032 | -| time_elapsed | 69420 | -| total_timesteps | 1668096 | -| train/ | | -| approx_kl | 0.0071187927 | -| clip_fraction | 0.0484 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 130310 | -| policy_gradient_loss | -0.00091 | -| std | 0.0142 | -| value_loss | 2.18e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13033 | -| time_elapsed | 69427 | -| total_timesteps | 1668224 | -| train/ | | -| approx_kl | 0.11213498 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 130320 | -| policy_gradient_loss | -0.0196 | -| std | 0.0142 | -| value_loss | 0.000425 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13034 | -| time_elapsed | 69430 | -| total_timesteps | 1668352 | -| train/ | | -| approx_kl | 1.9208994e-05 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -2.39 | -| learning_rate | 0.0003 | -| loss | 0.000162 | -| n_updates | 130330 | -| policy_gradient_loss | -8.08e-05 | -| std | 0.0142 | -| value_loss | 2.19e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13035 | -| time_elapsed | 69434 | -| total_timesteps | 1668480 | -| train/ | | -| approx_kl | 0.015667886 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -7.88 | -| learning_rate | 0.0003 | -| loss | 0.00266 | -| n_updates | 130340 | -| policy_gradient_loss | 0.00938 | -| std | 0.0142 | -| value_loss | 1.26e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13036 | -| time_elapsed | 69436 | -| total_timesteps | 1668608 | -| train/ | | -| approx_kl | 0.0032241442 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | 0.00394 | -| n_updates | 130350 | -| policy_gradient_loss | -0.000476 | -| std | 0.0142 | -| value_loss | 1.71e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13037 | -| time_elapsed | 69439 | -| total_timesteps | 1668736 | -| train/ | | -| approx_kl | 0.022498937 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.00036 | -| n_updates | 130360 | -| policy_gradient_loss | 0.00317 | -| std | 0.0142 | -| value_loss | 4.36e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13038 | -| time_elapsed | 69442 | -| total_timesteps | 1668864 | -| train/ | | -| approx_kl | 0.080042474 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 130370 | -| policy_gradient_loss | 0.0505 | -| std | 0.0142 | -| value_loss | 2.35e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 13039 | -| time_elapsed | 69444 | -| total_timesteps | 1668992 | -| train/ | | -| approx_kl | 0.012648113 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | 0.00049 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 130380 | -| policy_gradient_loss | 0.00227 | -| std | 0.0142 | -| value_loss | 1.42e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13040 | -| time_elapsed | 69446 | -| total_timesteps | 1669120 | -| train/ | | -| approx_kl | 0.010156484 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.00699 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 130390 | -| policy_gradient_loss | 0.000217 | -| std | 0.0142 | -| value_loss | 9.66e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13041 | -| time_elapsed | 69455 | -| total_timesteps | 1669248 | -| train/ | | -| approx_kl | 0.040790696 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -0.708 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 130400 | -| policy_gradient_loss | -0.0149 | -| std | 0.0142 | -| value_loss | 0.00201 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13042 | -| time_elapsed | 69458 | -| total_timesteps | 1669376 | -| train/ | | -| approx_kl | 0.02534043 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.83 | -| explained_variance | -3.38 | -| learning_rate | 0.0003 | -| loss | 0.00665 | -| n_updates | 130410 | -| policy_gradient_loss | 0.00382 | -| std | 0.0142 | -| value_loss | 2.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13043 | -| time_elapsed | 69462 | -| total_timesteps | 1669504 | -| train/ | | -| approx_kl | 0.014101174 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | 0.00454 | -| n_updates | 130420 | -| policy_gradient_loss | 0.000597 | -| std | 0.0142 | -| value_loss | 1.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13044 | -| time_elapsed | 69465 | -| total_timesteps | 1669632 | -| train/ | | -| approx_kl | 0.042773463 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -1.97 | -| learning_rate | 0.0003 | -| loss | 0.00784 | -| n_updates | 130430 | -| policy_gradient_loss | 0.00467 | -| std | 0.0141 | -| value_loss | 2.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13045 | -| time_elapsed | 69469 | -| total_timesteps | 1669760 | -| train/ | | -| approx_kl | 0.04380031 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 130440 | -| policy_gradient_loss | -0.00135 | -| std | 0.0141 | -| value_loss | 1.43e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13046 | -| time_elapsed | 69472 | -| total_timesteps | 1669888 | -| train/ | | -| approx_kl | 0.055428322 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 130450 | -| policy_gradient_loss | 0.00614 | -| std | 0.0141 | -| value_loss | 6.69e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13047 | -| time_elapsed | 69476 | -| total_timesteps | 1670016 | -| train/ | | -| approx_kl | 0.00034826575 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | -0.000933 | -| n_updates | 130460 | -| policy_gradient_loss | 0.000565 | -| std | 0.0141 | -| value_loss | 3.84e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13048 | -| time_elapsed | 69485 | -| total_timesteps | 1670144 | -| train/ | | -| approx_kl | 0.04876342 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | 0.472 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 130470 | -| policy_gradient_loss | -0.0115 | -| std | 0.0141 | -| value_loss | 0.00103 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13049 | -| time_elapsed | 69489 | -| total_timesteps | 1670272 | -| train/ | | -| approx_kl | 0.05423823 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.741 | -| learning_rate | 0.0003 | -| loss | 0.00205 | -| n_updates | 130480 | -| policy_gradient_loss | -0.000275 | -| std | 0.0141 | -| value_loss | 1.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13050 | -| time_elapsed | 69493 | -| total_timesteps | 1670400 | -| train/ | | -| approx_kl | 0.030876478 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 130490 | -| policy_gradient_loss | 0.00509 | -| std | 0.0141 | -| value_loss | 2.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13051 | -| time_elapsed | 69497 | -| total_timesteps | 1670528 | -| train/ | | -| approx_kl | 0.054021623 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | 0.000301 | -| n_updates | 130500 | -| policy_gradient_loss | -0.00217 | -| std | 0.0141 | -| value_loss | 4.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13052 | -| time_elapsed | 69500 | -| total_timesteps | 1670656 | -| train/ | | -| approx_kl | 0.038580056 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 130510 | -| policy_gradient_loss | 0.00526 | -| std | 0.0141 | -| value_loss | 3.76e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13053 | -| time_elapsed | 69504 | -| total_timesteps | 1670784 | -| train/ | | -| approx_kl | 0.13812372 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | 0.0549 | -| n_updates | 130520 | -| policy_gradient_loss | 0.012 | -| std | 0.0141 | -| value_loss | 3.71e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13054 | -| time_elapsed | 69507 | -| total_timesteps | 1670912 | -| train/ | | -| approx_kl | 0.0062733768 | -| clip_fraction | 0.0406 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 130530 | -| policy_gradient_loss | -0.000192 | -| std | 0.0141 | -| value_loss | 1.33e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13055 | -| time_elapsed | 69511 | -| total_timesteps | 1671040 | -| train/ | | -| approx_kl | 0.02806006 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.00314 | -| n_updates | 130540 | -| policy_gradient_loss | -0.000302 | -| std | 0.0141 | -| value_loss | 9.37e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13056 | -| time_elapsed | 69518 | -| total_timesteps | 1671168 | -| train/ | | -| approx_kl | 0.050256304 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 130550 | -| policy_gradient_loss | -0.0152 | -| std | 0.0141 | -| value_loss | 0.00326 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13057 | -| time_elapsed | 69521 | -| total_timesteps | 1671296 | -| train/ | | -| approx_kl | 5.6921504e-05 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 2.84 | -| explained_variance | -220 | -| learning_rate | 0.0003 | -| loss | -7.87e-05 | -| n_updates | 130560 | -| policy_gradient_loss | 0.00122 | -| std | 0.0141 | -| value_loss | 1.18e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13058 | -| time_elapsed | 69524 | -| total_timesteps | 1671424 | -| train/ | | -| approx_kl | 0.0037968517 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.00097 | -| n_updates | 130570 | -| policy_gradient_loss | 0.00184 | -| std | 0.014 | -| value_loss | 0.00035 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13059 | -| time_elapsed | 69527 | -| total_timesteps | 1671552 | -| train/ | | -| approx_kl | 0.06793078 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.00701 | -| learning_rate | 0.0003 | -| loss | 0.0487 | -| n_updates | 130580 | -| policy_gradient_loss | 0.0467 | -| std | 0.014 | -| value_loss | 0.000332 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13060 | -| time_elapsed | 69529 | -| total_timesteps | 1671680 | -| train/ | | -| approx_kl | 0.05905416 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.688 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 130590 | -| policy_gradient_loss | 0.00487 | -| std | 0.014 | -| value_loss | 0.000185 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13061 | -| time_elapsed | 69531 | -| total_timesteps | 1671808 | -| train/ | | -| approx_kl | 0.0111895725 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | -0.000509 | -| n_updates | 130600 | -| policy_gradient_loss | 0.00381 | -| std | 0.014 | -| value_loss | 0.000145 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 13062 | -| time_elapsed | 69532 | -| total_timesteps | 1671936 | -| train/ | | -| approx_kl | 0.07393457 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.548 | -| learning_rate | 0.0003 | -| loss | 0.0396 | -| n_updates | 130610 | -| policy_gradient_loss | 0.0367 | -| std | 0.014 | -| value_loss | 0.000246 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13063 | -| time_elapsed | 69534 | -| total_timesteps | 1672064 | -| train/ | | -| approx_kl | 0.011338105 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 130620 | -| policy_gradient_loss | 0.00234 | -| std | 0.014 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13064 | -| time_elapsed | 69539 | -| total_timesteps | 1672192 | -| train/ | | -| approx_kl | 0.012858421 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 130630 | -| policy_gradient_loss | -0.0129 | -| std | 0.014 | -| value_loss | 0.000346 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13065 | -| time_elapsed | 69542 | -| total_timesteps | 1672320 | -| train/ | | -| approx_kl | 0.18261006 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 130640 | -| policy_gradient_loss | 0.0594 | -| std | 0.014 | -| value_loss | 1.03e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13066 | -| time_elapsed | 69546 | -| total_timesteps | 1672448 | -| train/ | | -| approx_kl | 0.0060241637 | -| clip_fraction | 0.0203 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | 0.00129 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 130650 | -| policy_gradient_loss | -0.00245 | -| std | 0.014 | -| value_loss | 8.77e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13067 | -| time_elapsed | 69549 | -| total_timesteps | 1672576 | -| train/ | | -| approx_kl | 0.0037940047 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 130660 | -| policy_gradient_loss | 0.00106 | -| std | 0.014 | -| value_loss | 1.24e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13068 | -| time_elapsed | 69552 | -| total_timesteps | 1672704 | -| train/ | | -| approx_kl | 0.0075234063 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.000633 | -| learning_rate | 0.0003 | -| loss | -0.000771 | -| n_updates | 130670 | -| policy_gradient_loss | 0.00733 | -| std | 0.014 | -| value_loss | 4.76e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13069 | -| time_elapsed | 69555 | -| total_timesteps | 1672832 | -| train/ | | -| approx_kl | 0.0308642 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.85 | -| explained_variance | -0.0073 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 130680 | -| policy_gradient_loss | 0.00746 | -| std | 0.0139 | -| value_loss | 1.56e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13070 | -| time_elapsed | 69559 | -| total_timesteps | 1672960 | -| train/ | | -| approx_kl | 0.003906082 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | 0.0042 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 130690 | -| policy_gradient_loss | 0.00546 | -| std | 0.0139 | -| value_loss | 4.18e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13071 | -| time_elapsed | 69562 | -| total_timesteps | 1673088 | -| train/ | | -| approx_kl | 0.01942985 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 130700 | -| policy_gradient_loss | -0.00796 | -| std | 0.0139 | -| value_loss | 4.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13072 | -| time_elapsed | 69570 | -| total_timesteps | 1673216 | -| train/ | | -| approx_kl | 0.026314761 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.745 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 130710 | -| policy_gradient_loss | -0.0108 | -| std | 0.0139 | -| value_loss | 0.0015 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13073 | -| time_elapsed | 69574 | -| total_timesteps | 1673344 | -| train/ | | -| approx_kl | 0.031618632 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | 0.000324 | -| n_updates | 130720 | -| policy_gradient_loss | 0.000293 | -| std | 0.0139 | -| value_loss | 1.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13074 | -| time_elapsed | 69579 | -| total_timesteps | 1673472 | -| train/ | | -| approx_kl | 0.16590664 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -266 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 130730 | -| policy_gradient_loss | -0.00514 | -| std | 0.0139 | -| value_loss | 4.02e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13075 | -| time_elapsed | 69582 | -| total_timesteps | 1673600 | -| train/ | | -| approx_kl | 0.0019872515 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -68.7 | -| learning_rate | 0.0003 | -| loss | 0.00588 | -| n_updates | 130740 | -| policy_gradient_loss | -0.00781 | -| std | 0.0139 | -| value_loss | 4.59e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13076 | -| time_elapsed | 69585 | -| total_timesteps | 1673728 | -| train/ | | -| approx_kl | 0.03311369 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -15.4 | -| learning_rate | 0.0003 | -| loss | 0.007 | -| n_updates | 130750 | -| policy_gradient_loss | 0.00697 | -| std | 0.0139 | -| value_loss | 9.31e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13077 | -| time_elapsed | 69589 | -| total_timesteps | 1673856 | -| train/ | | -| approx_kl | 0.008539033 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -0.00742 | -| n_updates | 130760 | -| policy_gradient_loss | -0.00108 | -| std | 0.0139 | -| value_loss | 1.49e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13078 | -| time_elapsed | 69591 | -| total_timesteps | 1673984 | -| train/ | | -| approx_kl | 0.0104213245 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.626 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 130770 | -| policy_gradient_loss | -0.00143 | -| std | 0.0139 | -| value_loss | 7.44e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13079 | -| time_elapsed | 69594 | -| total_timesteps | 1674112 | -| train/ | | -| approx_kl | 0.022210222 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 130780 | -| policy_gradient_loss | -0.000883 | -| std | 0.0139 | -| value_loss | 4.92e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13080 | -| time_elapsed | 69604 | -| total_timesteps | 1674240 | -| train/ | | -| approx_kl | 0.035777964 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | 0.00447 | -| n_updates | 130790 | -| policy_gradient_loss | 0.00965 | -| std | 0.0139 | -| value_loss | 0.000115 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13081 | -| time_elapsed | 69608 | -| total_timesteps | 1674368 | -| train/ | | -| approx_kl | 0.0032338295 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0946 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 130800 | -| policy_gradient_loss | -0.00548 | -| std | 0.0139 | -| value_loss | 6.69e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13082 | -| time_elapsed | 69611 | -| total_timesteps | 1674496 | -| train/ | | -| approx_kl | 0.009486346 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.00153 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 130810 | -| policy_gradient_loss | 0.00676 | -| std | 0.0138 | -| value_loss | 5.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13083 | -| time_elapsed | 69616 | -| total_timesteps | 1674624 | -| train/ | | -| approx_kl | 0.030788718 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.00777 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 130820 | -| policy_gradient_loss | 0.0197 | -| std | 0.0138 | -| value_loss | 3.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13084 | -| time_elapsed | 69619 | -| total_timesteps | 1674752 | -| train/ | | -| approx_kl | 0.006326486 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 130830 | -| policy_gradient_loss | -0.0022 | -| std | 0.0138 | -| value_loss | 2.68e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13085 | -| time_elapsed | 69623 | -| total_timesteps | 1674880 | -| train/ | | -| approx_kl | 0.0868219 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 130840 | -| policy_gradient_loss | 0.000158 | -| std | 0.0138 | -| value_loss | 3.23e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13086 | -| time_elapsed | 69626 | -| total_timesteps | 1675008 | -| train/ | | -| approx_kl | 8.443091e-05 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | 0.00163 | -| n_updates | 130850 | -| policy_gradient_loss | -0.00543 | -| std | 0.0138 | -| value_loss | 9.5e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13087 | -| time_elapsed | 69634 | -| total_timesteps | 1675136 | -| train/ | | -| approx_kl | 0.06037076 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | 0.504 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 130860 | -| policy_gradient_loss | -0.0154 | -| std | 0.0138 | -| value_loss | 0.000746 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13088 | -| time_elapsed | 69638 | -| total_timesteps | 1675264 | -| train/ | | -| approx_kl | 0.10490415 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 130870 | -| policy_gradient_loss | 0.0291 | -| std | 0.0138 | -| value_loss | 2.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13089 | -| time_elapsed | 69642 | -| total_timesteps | 1675392 | -| train/ | | -| approx_kl | 0.058949284 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 130880 | -| policy_gradient_loss | 0.0276 | -| std | 0.0138 | -| value_loss | 6.37e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13090 | -| time_elapsed | 69646 | -| total_timesteps | 1675520 | -| train/ | | -| approx_kl | 0.008599471 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.509 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 130890 | -| policy_gradient_loss | 0.00482 | -| std | 0.0138 | -| value_loss | 3.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13091 | -| time_elapsed | 69650 | -| total_timesteps | 1675648 | -| train/ | | -| approx_kl | 0.014006542 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 130900 | -| policy_gradient_loss | 0.00568 | -| std | 0.0138 | -| value_loss | 1.78e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13092 | -| time_elapsed | 69653 | -| total_timesteps | 1675776 | -| train/ | | -| approx_kl | 0.00070236344 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0576 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 130910 | -| policy_gradient_loss | 0.00541 | -| std | 0.0138 | -| value_loss | 1.18e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13093 | -| time_elapsed | 69656 | -| total_timesteps | 1675904 | -| train/ | | -| approx_kl | 0.09907295 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 130920 | -| policy_gradient_loss | 0.00611 | -| std | 0.0138 | -| value_loss | 8.43e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13094 | -| time_elapsed | 69659 | -| total_timesteps | 1676032 | -| train/ | | -| approx_kl | 0.08668352 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 130930 | -| policy_gradient_loss | 0.00189 | -| std | 0.0138 | -| value_loss | 5.29e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13095 | -| time_elapsed | 69666 | -| total_timesteps | 1676160 | -| train/ | | -| approx_kl | 0.022739206 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 130940 | -| policy_gradient_loss | -0.0109 | -| std | 0.0138 | -| value_loss | 0.00031 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13096 | -| time_elapsed | 69670 | -| total_timesteps | 1676288 | -| train/ | | -| approx_kl | 0.006804385 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 130950 | -| policy_gradient_loss | 0.00175 | -| std | 0.0138 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13097 | -| time_elapsed | 69673 | -| total_timesteps | 1676416 | -| train/ | | -| approx_kl | 0.010971434 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -3 | -| learning_rate | 0.0003 | -| loss | 0.000555 | -| n_updates | 130960 | -| policy_gradient_loss | 0.00244 | -| std | 0.0138 | -| value_loss | 1.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13098 | -| time_elapsed | 69676 | -| total_timesteps | 1676544 | -| train/ | | -| approx_kl | 0.090595916 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.598 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 130970 | -| policy_gradient_loss | 0.0043 | -| std | 0.0138 | -| value_loss | 5.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13099 | -| time_elapsed | 69678 | -| total_timesteps | 1676672 | -| train/ | | -| approx_kl | 0.017645296 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.000656 | -| n_updates | 130980 | -| policy_gradient_loss | 0.0111 | -| std | 0.0138 | -| value_loss | 3.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13100 | -| time_elapsed | 69683 | -| total_timesteps | 1676800 | -| train/ | | -| approx_kl | 0.022667155 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 130990 | -| policy_gradient_loss | 0.00945 | -| std | 0.0138 | -| value_loss | 1.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13101 | -| time_elapsed | 69686 | -| total_timesteps | 1676928 | -| train/ | | -| approx_kl | 0.11712988 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | 0.0885 | -| n_updates | 131000 | -| policy_gradient_loss | 0.0558 | -| std | 0.0138 | -| value_loss | 6.67e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13102 | -| time_elapsed | 69690 | -| total_timesteps | 1677056 | -| train/ | | -| approx_kl | 0.00034806132 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 131010 | -| policy_gradient_loss | 0.0118 | -| std | 0.0138 | -| value_loss | 2.22e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13103 | -| time_elapsed | 69696 | -| total_timesteps | 1677184 | -| train/ | | -| approx_kl | 0.05889743 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -6.83 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 131020 | -| policy_gradient_loss | -0.0118 | -| std | 0.0138 | -| value_loss | 0.00219 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13104 | -| time_elapsed | 69701 | -| total_timesteps | 1677312 | -| train/ | | -| approx_kl | 0.029448533 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -18.4 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 131030 | -| policy_gradient_loss | -0.000197 | -| std | 0.0138 | -| value_loss | 2.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13105 | -| time_elapsed | 69704 | -| total_timesteps | 1677440 | -| train/ | | -| approx_kl | 0.0015527904 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.000313 | -| n_updates | 131040 | -| policy_gradient_loss | 0.0212 | -| std | 0.0138 | -| value_loss | 2.13e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13106 | -| time_elapsed | 69707 | -| total_timesteps | 1677568 | -| train/ | | -| approx_kl | 0.03129957 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 131050 | -| policy_gradient_loss | 0.00959 | -| std | 0.0138 | -| value_loss | 4.2e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13107 | -| time_elapsed | 69712 | -| total_timesteps | 1677696 | -| train/ | | -| approx_kl | 0.09430863 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.0609 | -| n_updates | 131060 | -| policy_gradient_loss | 0.0272 | -| std | 0.0138 | -| value_loss | 8.96e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13108 | -| time_elapsed | 69715 | -| total_timesteps | 1677824 | -| train/ | | -| approx_kl | 0.009128502 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | 0.00451 | -| learning_rate | 0.0003 | -| loss | -0.00711 | -| n_updates | 131070 | -| policy_gradient_loss | 0.0174 | -| std | 0.0138 | -| value_loss | 7.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13109 | -| time_elapsed | 69719 | -| total_timesteps | 1677952 | -| train/ | | -| approx_kl | 0.00402213 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 131080 | -| policy_gradient_loss | 0.00842 | -| std | 0.0138 | -| value_loss | 4.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13110 | -| time_elapsed | 69722 | -| total_timesteps | 1678080 | -| train/ | | -| approx_kl | 0.007425876 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 131090 | -| policy_gradient_loss | 0.0181 | -| std | 0.0138 | -| value_loss | 4.19e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13111 | -| time_elapsed | 69727 | -| total_timesteps | 1678208 | -| train/ | | -| approx_kl | 0.051025543 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | 0.807 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 131100 | -| policy_gradient_loss | -0.0151 | -| std | 0.0138 | -| value_loss | 0.00046 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13112 | -| time_elapsed | 69731 | -| total_timesteps | 1678336 | -| train/ | | -| approx_kl | 0.031651057 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 131110 | -| policy_gradient_loss | -0.00834 | -| std | 0.0138 | -| value_loss | 3.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13113 | -| time_elapsed | 69735 | -| total_timesteps | 1678464 | -| train/ | | -| approx_kl | 0.007700668 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 131120 | -| policy_gradient_loss | -0.00395 | -| std | 0.0138 | -| value_loss | 8.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13114 | -| time_elapsed | 69737 | -| total_timesteps | 1678592 | -| train/ | | -| approx_kl | 0.025976121 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.00716 | -| learning_rate | 0.0003 | -| loss | 0.00461 | -| n_updates | 131130 | -| policy_gradient_loss | -0.00184 | -| std | 0.0138 | -| value_loss | 6.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13115 | -| time_elapsed | 69742 | -| total_timesteps | 1678720 | -| train/ | | -| approx_kl | 0.05349773 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.86 | -| explained_variance | -0.00932 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 131140 | -| policy_gradient_loss | 0.00429 | -| std | 0.0138 | -| value_loss | 1.16e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13116 | -| time_elapsed | 69745 | -| total_timesteps | 1678848 | -| train/ | | -| approx_kl | 0.0017375955 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00599 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 131150 | -| policy_gradient_loss | 0.00169 | -| std | 0.0138 | -| value_loss | 2.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13117 | -| time_elapsed | 69749 | -| total_timesteps | 1678976 | -| train/ | | -| approx_kl | 0.015151234 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 131160 | -| policy_gradient_loss | -0.00564 | -| std | 0.0138 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13118 | -| time_elapsed | 69753 | -| total_timesteps | 1679104 | -| train/ | | -| approx_kl | 0.024425428 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 131170 | -| policy_gradient_loss | 0.0363 | -| std | 0.0138 | -| value_loss | 9.4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13119 | -| time_elapsed | 69762 | -| total_timesteps | 1679232 | -| train/ | | -| approx_kl | 0.033894036 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.885 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 131180 | -| policy_gradient_loss | -0.0144 | -| std | 0.0138 | -| value_loss | 0.00126 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13120 | -| time_elapsed | 69764 | -| total_timesteps | 1679360 | -| train/ | | -| approx_kl | 0.010674251 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -69.7 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 131190 | -| policy_gradient_loss | -0.00744 | -| std | 0.0138 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13121 | -| time_elapsed | 69767 | -| total_timesteps | 1679488 | -| train/ | | -| approx_kl | 0.027368043 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -54.9 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 131200 | -| policy_gradient_loss | 0.00407 | -| std | 0.0138 | -| value_loss | 4.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13122 | -| time_elapsed | 69771 | -| total_timesteps | 1679616 | -| train/ | | -| approx_kl | 0.006075809 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -9.36 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 131210 | -| policy_gradient_loss | -0.00165 | -| std | 0.0138 | -| value_loss | 6.03e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13123 | -| time_elapsed | 69774 | -| total_timesteps | 1679744 | -| train/ | | -| approx_kl | 0.106441416 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 131220 | -| policy_gradient_loss | 0.00728 | -| std | 0.0138 | -| value_loss | 3.46e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13124 | -| time_elapsed | 69778 | -| total_timesteps | 1679872 | -| train/ | | -| approx_kl | 0.01711538 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 131230 | -| policy_gradient_loss | 0.013 | -| std | 0.0138 | -| value_loss | 1.26e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13125 | -| time_elapsed | 69783 | -| total_timesteps | 1680000 | -| train/ | | -| approx_kl | 0.022575427 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0018 | -| learning_rate | 0.0003 | -| loss | -0.000129 | -| n_updates | 131240 | -| policy_gradient_loss | -0.00195 | -| std | 0.0138 | -| value_loss | 8.96e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13126 | -| time_elapsed | 69786 | -| total_timesteps | 1680128 | -| train/ | | -| approx_kl | 0.003056765 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.000542 | -| learning_rate | 0.0003 | -| loss | 0.00895 | -| n_updates | 131250 | -| policy_gradient_loss | -0.000151 | -| std | 0.0138 | -| value_loss | 4.59e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13127 | -| time_elapsed | 69793 | -| total_timesteps | 1680256 | -| train/ | | -| approx_kl | 0.013714884 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.701 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 131260 | -| policy_gradient_loss | -0.0122 | -| std | 0.0138 | -| value_loss | 0.00524 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13128 | -| time_elapsed | 69797 | -| total_timesteps | 1680384 | -| train/ | | -| approx_kl | 0.14587359 | -| clip_fraction | 0.599 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 131270 | -| policy_gradient_loss | 0.0686 | -| std | 0.0138 | -| value_loss | 7.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13129 | -| time_elapsed | 69800 | -| total_timesteps | 1680512 | -| train/ | | -| approx_kl | 0.050900318 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 131280 | -| policy_gradient_loss | -0.00474 | -| std | 0.0138 | -| value_loss | 2.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13130 | -| time_elapsed | 69803 | -| total_timesteps | 1680640 | -| train/ | | -| approx_kl | 0.024352578 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 131290 | -| policy_gradient_loss | -0.00121 | -| std | 0.0138 | -| value_loss | 1.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13131 | -| time_elapsed | 69806 | -| total_timesteps | 1680768 | -| train/ | | -| approx_kl | 0.034485504 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.00378 | -| n_updates | 131300 | -| policy_gradient_loss | 0.00218 | -| std | 0.0138 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13132 | -| time_elapsed | 69810 | -| total_timesteps | 1680896 | -| train/ | | -| approx_kl | 0.15992868 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | 0.0998 | -| n_updates | 131310 | -| policy_gradient_loss | 0.0203 | -| std | 0.0138 | -| value_loss | 6.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13133 | -| time_elapsed | 69814 | -| total_timesteps | 1681024 | -| train/ | | -| approx_kl | 0.009308623 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | -0.00789 | -| n_updates | 131320 | -| policy_gradient_loss | -0.0029 | -| std | 0.0138 | -| value_loss | 4.62e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13134 | -| time_elapsed | 69822 | -| total_timesteps | 1681152 | -| train/ | | -| approx_kl | 0.03218648 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 131330 | -| policy_gradient_loss | -0.00637 | -| std | 0.0138 | -| value_loss | 3.65e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13135 | -| time_elapsed | 69826 | -| total_timesteps | 1681280 | -| train/ | | -| approx_kl | 0.0034542265 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.0191 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 131340 | -| policy_gradient_loss | -0.00676 | -| std | 0.0138 | -| value_loss | 0.000311 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13136 | -| time_elapsed | 69829 | -| total_timesteps | 1681408 | -| train/ | | -| approx_kl | 0.008477915 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00664 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 131350 | -| policy_gradient_loss | -0.00216 | -| std | 0.0138 | -| value_loss | 1.93e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13137 | -| time_elapsed | 69831 | -| total_timesteps | 1681536 | -| train/ | | -| approx_kl | 0.013312753 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.00203 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 131360 | -| policy_gradient_loss | -0.00315 | -| std | 0.0137 | -| value_loss | 2.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13138 | -| time_elapsed | 69835 | -| total_timesteps | 1681664 | -| train/ | | -| approx_kl | 0.010713647 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.00159 | -| n_updates | 131370 | -| policy_gradient_loss | 0.000812 | -| std | 0.0137 | -| value_loss | 1.16e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13139 | -| time_elapsed | 69837 | -| total_timesteps | 1681792 | -| train/ | | -| approx_kl | 0.00036129216 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.00296 | -| n_updates | 131380 | -| policy_gradient_loss | -0.00625 | -| std | 0.0137 | -| value_loss | 9.05e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13140 | -| time_elapsed | 69840 | -| total_timesteps | 1681920 | -| train/ | | -| approx_kl | 0.007980734 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 131390 | -| policy_gradient_loss | -0.00179 | -| std | 0.0137 | -| value_loss | 5.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13141 | -| time_elapsed | 69844 | -| total_timesteps | 1682048 | -| train/ | | -| approx_kl | 0.015190198 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | -0.00913 | -| n_updates | 131400 | -| policy_gradient_loss | -0.00477 | -| std | 0.0137 | -| value_loss | 2.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13142 | -| time_elapsed | 69850 | -| total_timesteps | 1682176 | -| train/ | | -| approx_kl | 0.031708557 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -5.35 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 131410 | -| policy_gradient_loss | -0.0142 | -| std | 0.0137 | -| value_loss | 0.00202 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13143 | -| time_elapsed | 69854 | -| total_timesteps | 1682304 | -| train/ | | -| approx_kl | 0.002109934 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 131420 | -| policy_gradient_loss | -0.0107 | -| std | 0.0137 | -| value_loss | 6.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13144 | -| time_elapsed | 69858 | -| total_timesteps | 1682432 | -| train/ | | -| approx_kl | 0.025523623 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.358 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 131430 | -| policy_gradient_loss | -0.0109 | -| std | 0.0137 | -| value_loss | 2.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13145 | -| time_elapsed | 69861 | -| total_timesteps | 1682560 | -| train/ | | -| approx_kl | 0.08721095 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 131440 | -| policy_gradient_loss | 0.0185 | -| std | 0.0137 | -| value_loss | 1.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13146 | -| time_elapsed | 69865 | -| total_timesteps | 1682688 | -| train/ | | -| approx_kl | 0.013818651 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.0022 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 131450 | -| policy_gradient_loss | 0.00379 | -| std | 0.0137 | -| value_loss | 1.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13147 | -| time_elapsed | 69869 | -| total_timesteps | 1682816 | -| train/ | | -| approx_kl | 0.09166925 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00565 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 131460 | -| policy_gradient_loss | 0.00282 | -| std | 0.0137 | -| value_loss | 7.76e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13148 | -| time_elapsed | 69873 | -| total_timesteps | 1682944 | -| train/ | | -| approx_kl | 2.367096e-05 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | 0.000453 | -| n_updates | 131470 | -| policy_gradient_loss | -0.00227 | -| std | 0.0137 | -| value_loss | 4.45e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13149 | -| time_elapsed | 69874 | -| total_timesteps | 1683072 | -| train/ | | -| approx_kl | 0.017727839 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.00719 | -| n_updates | 131480 | -| policy_gradient_loss | 0.0204 | -| std | 0.0137 | -| value_loss | 2.64e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13150 | -| time_elapsed | 69880 | -| total_timesteps | 1683200 | -| train/ | | -| approx_kl | 0.022476198 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.791 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 131490 | -| policy_gradient_loss | -0.0138 | -| std | 0.0137 | -| value_loss | 0.00254 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13151 | -| time_elapsed | 69885 | -| total_timesteps | 1683328 | -| train/ | | -| approx_kl | 0.0062249815 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.508 | -| learning_rate | 0.0003 | -| loss | 0.00481 | -| n_updates | 131500 | -| policy_gradient_loss | 0.0147 | -| std | 0.0137 | -| value_loss | 1.81e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13152 | -| time_elapsed | 69887 | -| total_timesteps | 1683456 | -| train/ | | -| approx_kl | 0.000247919 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -338 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 131510 | -| policy_gradient_loss | -0.00266 | -| std | 0.0137 | -| value_loss | 1.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13153 | -| time_elapsed | 69890 | -| total_timesteps | 1683584 | -| train/ | | -| approx_kl | 0.06402307 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -19.7 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 131520 | -| policy_gradient_loss | 0.00114 | -| std | 0.0137 | -| value_loss | 9.2e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13154 | -| time_elapsed | 69893 | -| total_timesteps | 1683712 | -| train/ | | -| approx_kl | 0.05421446 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -3.37 | -| learning_rate | 0.0003 | -| loss | 0.00511 | -| n_updates | 131530 | -| policy_gradient_loss | 0.00144 | -| std | 0.0137 | -| value_loss | 1.77e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13155 | -| time_elapsed | 69897 | -| total_timesteps | 1683840 | -| train/ | | -| approx_kl | 0.022535566 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.476 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 131540 | -| policy_gradient_loss | -0.00477 | -| std | 0.0137 | -| value_loss | 7.22e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13156 | -| time_elapsed | 69899 | -| total_timesteps | 1683968 | -| train/ | | -| approx_kl | 0.081765585 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.0838 | -| n_updates | 131550 | -| policy_gradient_loss | 0.0606 | -| std | 0.0137 | -| value_loss | 4.88e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13157 | -| time_elapsed | 69903 | -| total_timesteps | 1684096 | -| train/ | | -| approx_kl | 0.013572293 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.0013 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 131560 | -| policy_gradient_loss | 0.00433 | -| std | 0.0137 | -| value_loss | 3.71e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13158 | -| time_elapsed | 69911 | -| total_timesteps | 1684224 | -| train/ | | -| approx_kl | 0.027596537 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 131570 | -| policy_gradient_loss | -0.0134 | -| std | 0.0137 | -| value_loss | 0.000339 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13159 | -| time_elapsed | 69914 | -| total_timesteps | 1684352 | -| train/ | | -| approx_kl | 0.15093619 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0052 | -| learning_rate | 0.0003 | -| loss | 0.0807 | -| n_updates | 131580 | -| policy_gradient_loss | 0.0203 | -| std | 0.0137 | -| value_loss | 6.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13160 | -| time_elapsed | 69918 | -| total_timesteps | 1684480 | -| train/ | | -| approx_kl | 0.0039102803 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 131590 | -| policy_gradient_loss | -0.00695 | -| std | 0.0137 | -| value_loss | 2.48e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13161 | -| time_elapsed | 69922 | -| total_timesteps | 1684608 | -| train/ | | -| approx_kl | 0.0039774515 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | -0.000734 | -| n_updates | 131600 | -| policy_gradient_loss | 0.000466 | -| std | 0.0137 | -| value_loss | 1.42e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13162 | -| time_elapsed | 69925 | -| total_timesteps | 1684736 | -| train/ | | -| approx_kl | 0.0021863412 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 131610 | -| policy_gradient_loss | 0.00481 | -| std | 0.0137 | -| value_loss | 1.9e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13163 | -| time_elapsed | 69928 | -| total_timesteps | 1684864 | -| train/ | | -| approx_kl | 0.00038893986 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00672 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 131620 | -| policy_gradient_loss | 0.0267 | -| std | 0.0137 | -| value_loss | 1.08e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 24 | -| iterations | 13164 | -| time_elapsed | 69931 | -| total_timesteps | 1684992 | -| train/ | | -| approx_kl | 0.015046982 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00906 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 131630 | -| policy_gradient_loss | 0.0452 | -| std | 0.0137 | -| value_loss | 7.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13165 | -| time_elapsed | 69934 | -| total_timesteps | 1685120 | -| train/ | | -| approx_kl | 0.026825987 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00905 | -| learning_rate | 0.0003 | -| loss | 0.0318 | -| n_updates | 131640 | -| policy_gradient_loss | 0.0397 | -| std | 0.0137 | -| value_loss | 5.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13166 | -| time_elapsed | 69943 | -| total_timesteps | 1685248 | -| train/ | | -| approx_kl | 0.031579915 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | 0.00559 | -| n_updates | 131650 | -| policy_gradient_loss | 0.00557 | -| std | 0.0137 | -| value_loss | 0.00127 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13167 | -| time_elapsed | 69948 | -| total_timesteps | 1685376 | -| train/ | | -| approx_kl | 0.02468775 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 131660 | -| policy_gradient_loss | 0.000524 | -| std | 0.0137 | -| value_loss | 6.94e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13168 | -| time_elapsed | 69951 | -| total_timesteps | 1685504 | -| train/ | | -| approx_kl | 0.000987317 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 0.00244 | -| n_updates | 131670 | -| policy_gradient_loss | 0.00346 | -| std | 0.0137 | -| value_loss | 2.28e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13169 | -| time_elapsed | 69954 | -| total_timesteps | 1685632 | -| train/ | | -| approx_kl | 0.08245261 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.0388 | -| n_updates | 131680 | -| policy_gradient_loss | 0.00477 | -| std | 0.0137 | -| value_loss | 1.75e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13170 | -| time_elapsed | 69957 | -| total_timesteps | 1685760 | -| train/ | | -| approx_kl | 0.052318346 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 131690 | -| policy_gradient_loss | 0.00867 | -| std | 0.0137 | -| value_loss | 8.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 24 | -| iterations | 13171 | -| time_elapsed | 69961 | -| total_timesteps | 1685888 | -| train/ | | -| approx_kl | 0.019742873 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.000663 | -| n_updates | 131700 | -| policy_gradient_loss | 0.00386 | -| std | 0.0137 | -| value_loss | 5.62e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13172 | -| time_elapsed | 69964 | -| total_timesteps | 1686016 | -| train/ | | -| approx_kl | 0.07906301 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | 0.0774 | -| n_updates | 131710 | -| policy_gradient_loss | 0.0498 | -| std | 0.0137 | -| value_loss | 4.17e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13173 | -| time_elapsed | 69973 | -| total_timesteps | 1686144 | -| train/ | | -| approx_kl | 0.017399244 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.869 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 131720 | -| policy_gradient_loss | 0.0129 | -| std | 0.0137 | -| value_loss | 0.00137 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13174 | -| time_elapsed | 69976 | -| total_timesteps | 1686272 | -| train/ | | -| approx_kl | 0.03178035 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.0147 | -| learning_rate | 0.0003 | -| loss | 0.00857 | -| n_updates | 131730 | -| policy_gradient_loss | 0.0033 | -| std | 0.0137 | -| value_loss | 5.48e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13175 | -| time_elapsed | 69980 | -| total_timesteps | 1686400 | -| train/ | | -| approx_kl | 0.073715165 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 131740 | -| policy_gradient_loss | 0.00661 | -| std | 0.0137 | -| value_loss | 3.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13176 | -| time_elapsed | 69983 | -| total_timesteps | 1686528 | -| train/ | | -| approx_kl | 0.02219227 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00942 | -| n_updates | 131750 | -| policy_gradient_loss | 0.011 | -| std | 0.0137 | -| value_loss | 1.16e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13177 | -| time_elapsed | 69985 | -| total_timesteps | 1686656 | -| train/ | | -| approx_kl | 0.02850691 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00632 | -| n_updates | 131760 | -| policy_gradient_loss | 0.00333 | -| std | 0.0137 | -| value_loss | 6.77e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13178 | -| time_elapsed | 69987 | -| total_timesteps | 1686784 | -| train/ | | -| approx_kl | 0.007851029 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.00143 | -| n_updates | 131770 | -| policy_gradient_loss | 0.00106 | -| std | 0.0137 | -| value_loss | 1.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 24 | -| iterations | 13179 | -| time_elapsed | 69989 | -| total_timesteps | 1686912 | -| train/ | | -| approx_kl | 0.024296582 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 131780 | -| policy_gradient_loss | 0.00566 | -| std | 0.0137 | -| value_loss | 1.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13180 | -| time_elapsed | 69993 | -| total_timesteps | 1687040 | -| train/ | | -| approx_kl | 0.14151074 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 131790 | -| policy_gradient_loss | 0.0131 | -| std | 0.0137 | -| value_loss | 1.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13181 | -| time_elapsed | 69999 | -| total_timesteps | 1687168 | -| train/ | | -| approx_kl | 0.035548795 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.732 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 131800 | -| policy_gradient_loss | -0.0153 | -| std | 0.0137 | -| value_loss | 0.000491 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13182 | -| time_elapsed | 70003 | -| total_timesteps | 1687296 | -| train/ | | -| approx_kl | 0.00025446154 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -17.9 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 131810 | -| policy_gradient_loss | 0.00349 | -| std | 0.0137 | -| value_loss | 3.03e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13183 | -| time_elapsed | 70007 | -| total_timesteps | 1687424 | -| train/ | | -| approx_kl | 0.04175337 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -14 | -| learning_rate | 0.0003 | -| loss | 0.00551 | -| n_updates | 131820 | -| policy_gradient_loss | 0.00573 | -| std | 0.0137 | -| value_loss | 1.7e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13184 | -| time_elapsed | 70011 | -| total_timesteps | 1687552 | -| train/ | | -| approx_kl | 0.02209925 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -1.84 | -| learning_rate | 0.0003 | -| loss | 0.00708 | -| n_updates | 131830 | -| policy_gradient_loss | 0.00144 | -| std | 0.0137 | -| value_loss | 3.21e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13185 | -| time_elapsed | 70015 | -| total_timesteps | 1687680 | -| train/ | | -| approx_kl | 0.0023973687 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.00775 | -| n_updates | 131840 | -| policy_gradient_loss | -0.00158 | -| std | 0.0137 | -| value_loss | 1.92e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13186 | -| time_elapsed | 70019 | -| total_timesteps | 1687808 | -| train/ | | -| approx_kl | 0.0010212553 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.000602 | -| n_updates | 131850 | -| policy_gradient_loss | 0.0223 | -| std | 0.0137 | -| value_loss | 1.15e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13187 | -| time_elapsed | 70023 | -| total_timesteps | 1687936 | -| train/ | | -| approx_kl | 0.03171612 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.000884 | -| learning_rate | 0.0003 | -| loss | 0.0438 | -| n_updates | 131860 | -| policy_gradient_loss | 0.0894 | -| std | 0.0137 | -| value_loss | 1.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13188 | -| time_elapsed | 70026 | -| total_timesteps | 1688064 | -| train/ | | -| approx_kl | 0.018721692 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.00256 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 131870 | -| policy_gradient_loss | 0.00299 | -| std | 0.0137 | -| value_loss | 8.46e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13189 | -| time_elapsed | 70031 | -| total_timesteps | 1688192 | -| train/ | | -| approx_kl | 0.07900794 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.843 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 131880 | -| policy_gradient_loss | -0.0124 | -| std | 0.0137 | -| value_loss | 0.00161 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13190 | -| time_elapsed | 70034 | -| total_timesteps | 1688320 | -| train/ | | -| approx_kl | 0.0037324033 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -24.4 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 131890 | -| policy_gradient_loss | 0.00311 | -| std | 0.0137 | -| value_loss | 2.02e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13191 | -| time_elapsed | 70037 | -| total_timesteps | 1688448 | -| train/ | | -| approx_kl | 0.039696112 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -21.1 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 131900 | -| policy_gradient_loss | 0.00252 | -| std | 0.0137 | -| value_loss | 7.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13192 | -| time_elapsed | 70040 | -| total_timesteps | 1688576 | -| train/ | | -| approx_kl | 0.011569625 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 131910 | -| policy_gradient_loss | 0.00488 | -| std | 0.0137 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13193 | -| time_elapsed | 70043 | -| total_timesteps | 1688704 | -| train/ | | -| approx_kl | 0.013916339 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.0269 | -| n_updates | 131920 | -| policy_gradient_loss | -0.0135 | -| std | 0.0137 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13194 | -| time_elapsed | 70047 | -| total_timesteps | 1688832 | -| train/ | | -| approx_kl | 0.0043040775 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | -0.000151 | -| n_updates | 131930 | -| policy_gradient_loss | 0.0213 | -| std | 0.0137 | -| value_loss | 1.44e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13195 | -| time_elapsed | 70050 | -| total_timesteps | 1688960 | -| train/ | | -| approx_kl | 0.008209846 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 131940 | -| policy_gradient_loss | -0.00752 | -| std | 0.0137 | -| value_loss | 4.52e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13196 | -| time_elapsed | 70054 | -| total_timesteps | 1689088 | -| train/ | | -| approx_kl | 0.0037160409 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.00249 | -| learning_rate | 0.0003 | -| loss | 0.00263 | -| n_updates | 131950 | -| policy_gradient_loss | 0.00479 | -| std | 0.0137 | -| value_loss | 6.12e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13197 | -| time_elapsed | 70062 | -| total_timesteps | 1689216 | -| train/ | | -| approx_kl | 0.09308307 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | 0.0411 | -| n_updates | 131960 | -| policy_gradient_loss | 0.00917 | -| std | 0.0137 | -| value_loss | 0.000134 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13198 | -| time_elapsed | 70065 | -| total_timesteps | 1689344 | -| train/ | | -| approx_kl | 0.009272646 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 131970 | -| policy_gradient_loss | 0.0207 | -| std | 0.0137 | -| value_loss | 3.67e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13199 | -| time_elapsed | 70069 | -| total_timesteps | 1689472 | -| train/ | | -| approx_kl | 0.015478028 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00377 | -| learning_rate | 0.0003 | -| loss | 0.00575 | -| n_updates | 131980 | -| policy_gradient_loss | 0.00694 | -| std | 0.0137 | -| value_loss | 4.29e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13200 | -| time_elapsed | 70073 | -| total_timesteps | 1689600 | -| train/ | | -| approx_kl | 0.0009084926 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00713 | -| learning_rate | 0.0003 | -| loss | -0.00686 | -| n_updates | 131990 | -| policy_gradient_loss | -0.0126 | -| std | 0.0137 | -| value_loss | 7.25e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13201 | -| time_elapsed | 70079 | -| total_timesteps | 1689728 | -| train/ | | -| approx_kl | 0.05854647 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.0049 | -| learning_rate | 0.0003 | -| loss | 0.0383 | -| n_updates | 132000 | -| policy_gradient_loss | 0.00632 | -| std | 0.0137 | -| value_loss | 2.69e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13202 | -| time_elapsed | 70083 | -| total_timesteps | 1689856 | -| train/ | | -| approx_kl | 0.0019324631 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 132010 | -| policy_gradient_loss | 0.00248 | -| std | 0.0137 | -| value_loss | 4.1e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13203 | -| time_elapsed | 70087 | -| total_timesteps | 1689984 | -| train/ | | -| approx_kl | 0.08734542 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | 0.0455 | -| n_updates | 132020 | -| policy_gradient_loss | 0.0148 | -| std | 0.0137 | -| value_loss | 4.73e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13204 | -| time_elapsed | 70090 | -| total_timesteps | 1690112 | -| train/ | | -| approx_kl | 0.015933003 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 132030 | -| policy_gradient_loss | -0.00619 | -| std | 0.0137 | -| value_loss | 3.7e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13205 | -| time_elapsed | 70099 | -| total_timesteps | 1690240 | -| train/ | | -| approx_kl | 0.00091470825 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 132040 | -| policy_gradient_loss | -0.0031 | -| std | 0.0137 | -| value_loss | 0.00237 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13206 | -| time_elapsed | 70102 | -| total_timesteps | 1690368 | -| train/ | | -| approx_kl | 0.004749151 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 132050 | -| policy_gradient_loss | -0.0044 | -| std | 0.0137 | -| value_loss | 3.26e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13207 | -| time_elapsed | 70105 | -| total_timesteps | 1690496 | -| train/ | | -| approx_kl | 0.00028235838 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.000305 | -| n_updates | 132060 | -| policy_gradient_loss | 0.000813 | -| std | 0.0137 | -| value_loss | 6.87e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13208 | -| time_elapsed | 70109 | -| total_timesteps | 1690624 | -| train/ | | -| approx_kl | 0.00016107224 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | -0.000815 | -| n_updates | 132070 | -| policy_gradient_loss | 0.000878 | -| std | 0.0137 | -| value_loss | 7.57e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13209 | -| time_elapsed | 70113 | -| total_timesteps | 1690752 | -| train/ | | -| approx_kl | 0.01702786 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 132080 | -| policy_gradient_loss | 0.0202 | -| std | 0.0137 | -| value_loss | 2.22e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13210 | -| time_elapsed | 70116 | -| total_timesteps | 1690880 | -| train/ | | -| approx_kl | 0.0058684945 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -0.000388 | -| n_updates | 132090 | -| policy_gradient_loss | 0.00745 | -| std | 0.0137 | -| value_loss | 1.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13211 | -| time_elapsed | 70119 | -| total_timesteps | 1691008 | -| train/ | | -| approx_kl | 0.08346173 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.00843 | -| n_updates | 132100 | -| policy_gradient_loss | 0.00418 | -| std | 0.0137 | -| value_loss | 1.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13212 | -| time_elapsed | 70128 | -| total_timesteps | 1691136 | -| train/ | | -| approx_kl | 0.102190465 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 132110 | -| policy_gradient_loss | -0.0154 | -| std | 0.0137 | -| value_loss | 0.000399 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13213 | -| time_elapsed | 70132 | -| total_timesteps | 1691264 | -| train/ | | -| approx_kl | 0.00040458608 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 132120 | -| policy_gradient_loss | 0.00636 | -| std | 0.0137 | -| value_loss | 7.97e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13214 | -| time_elapsed | 70137 | -| total_timesteps | 1691392 | -| train/ | | -| approx_kl | 0.0022741347 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 132130 | -| policy_gradient_loss | 0.0164 | -| std | 0.0137 | -| value_loss | 9.09e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13215 | -| time_elapsed | 70140 | -| total_timesteps | 1691520 | -| train/ | | -| approx_kl | 0.014556483 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.606 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 132140 | -| policy_gradient_loss | 0.024 | -| std | 0.0137 | -| value_loss | 3.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13216 | -| time_elapsed | 70144 | -| total_timesteps | 1691648 | -| train/ | | -| approx_kl | 0.04596333 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 132150 | -| policy_gradient_loss | -0.00258 | -| std | 0.0137 | -| value_loss | 2.66e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13217 | -| time_elapsed | 70147 | -| total_timesteps | 1691776 | -| train/ | | -| approx_kl | 0.07262643 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | 0.05 | -| n_updates | 132160 | -| policy_gradient_loss | 0.0082 | -| std | 0.0137 | -| value_loss | 1.4e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13218 | -| time_elapsed | 70150 | -| total_timesteps | 1691904 | -| train/ | | -| approx_kl | 0.06292396 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 132170 | -| policy_gradient_loss | 0.00524 | -| std | 0.0137 | -| value_loss | 1.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13219 | -| time_elapsed | 70154 | -| total_timesteps | 1692032 | -| train/ | | -| approx_kl | 0.018308507 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00953 | -| learning_rate | 0.0003 | -| loss | -0.00932 | -| n_updates | 132180 | -| policy_gradient_loss | 9.66e-05 | -| std | 0.0137 | -| value_loss | 7.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13220 | -| time_elapsed | 70162 | -| total_timesteps | 1692160 | -| train/ | | -| approx_kl | 0.022909744 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | 0.00624 | -| n_updates | 132190 | -| policy_gradient_loss | 0.00615 | -| std | 0.0137 | -| value_loss | 0.000711 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13221 | -| time_elapsed | 70166 | -| total_timesteps | 1692288 | -| train/ | | -| approx_kl | 0.027807994 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.00567 | -| learning_rate | 0.0003 | -| loss | 0.00831 | -| n_updates | 132200 | -| policy_gradient_loss | 0.00719 | -| std | 0.0137 | -| value_loss | 9.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13222 | -| time_elapsed | 70169 | -| total_timesteps | 1692416 | -| train/ | | -| approx_kl | 0.051179044 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.571 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 132210 | -| policy_gradient_loss | 0.00981 | -| std | 0.0137 | -| value_loss | 0.000109 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13223 | -| time_elapsed | 70173 | -| total_timesteps | 1692544 | -| train/ | | -| approx_kl | 0.012834923 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 132220 | -| policy_gradient_loss | 0.0113 | -| std | 0.0137 | -| value_loss | 2.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13224 | -| time_elapsed | 70176 | -| total_timesteps | 1692672 | -| train/ | | -| approx_kl | 0.005097934 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 132230 | -| policy_gradient_loss | 0.00469 | -| std | 0.0137 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13225 | -| time_elapsed | 70179 | -| total_timesteps | 1692800 | -| train/ | | -| approx_kl | 0.008552067 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.87 | -| explained_variance | 0.00592 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 132240 | -| policy_gradient_loss | -0.0063 | -| std | 0.0136 | -| value_loss | 3.58e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13226 | -| time_elapsed | 70183 | -| total_timesteps | 1692928 | -| train/ | | -| approx_kl | 0.00047325203 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00381 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 132250 | -| policy_gradient_loss | -0.000654 | -| std | 0.0136 | -| value_loss | 1.15e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13227 | -| time_elapsed | 70187 | -| total_timesteps | 1693056 | -| train/ | | -| approx_kl | 0.0013766112 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00474 | -| learning_rate | 0.0003 | -| loss | 3.01e-05 | -| n_updates | 132260 | -| policy_gradient_loss | 0.000557 | -| std | 0.0136 | -| value_loss | 1.58e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13228 | -| time_elapsed | 70193 | -| total_timesteps | 1693184 | -| train/ | | -| approx_kl | 0.009711985 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.687 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 132270 | -| policy_gradient_loss | -0.00154 | -| std | 0.0136 | -| value_loss | 0.00625 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13229 | -| time_elapsed | 70196 | -| total_timesteps | 1693312 | -| train/ | | -| approx_kl | 0.041050926 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.0211 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 132280 | -| policy_gradient_loss | -0.00225 | -| std | 0.0136 | -| value_loss | 0.00012 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13230 | -| time_elapsed | 70200 | -| total_timesteps | 1693440 | -| train/ | | -| approx_kl | 0.02754366 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 132290 | -| policy_gradient_loss | 0.00228 | -| std | 0.0136 | -| value_loss | 5.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13231 | -| time_elapsed | 70204 | -| total_timesteps | 1693568 | -| train/ | | -| approx_kl | 0.031089196 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.00917 | -| n_updates | 132300 | -| policy_gradient_loss | 0.00399 | -| std | 0.0136 | -| value_loss | 4.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13232 | -| time_elapsed | 70208 | -| total_timesteps | 1693696 | -| train/ | | -| approx_kl | 0.019295631 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0059 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 132310 | -| policy_gradient_loss | 0.0025 | -| std | 0.0136 | -| value_loss | 3.13e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13233 | -| time_elapsed | 70211 | -| total_timesteps | 1693824 | -| train/ | | -| approx_kl | 0.0265599 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00229 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 132320 | -| policy_gradient_loss | 0.031 | -| std | 0.0136 | -| value_loss | 1.28e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13234 | -| time_elapsed | 70215 | -| total_timesteps | 1693952 | -| train/ | | -| approx_kl | 0.031869534 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0539 | -| n_updates | 132330 | -| policy_gradient_loss | 0.0584 | -| std | 0.0136 | -| value_loss | 1.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13235 | -| time_elapsed | 70217 | -| total_timesteps | 1694080 | -| train/ | | -| approx_kl | 0.007494581 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.00649 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 132340 | -| policy_gradient_loss | 0.0045 | -| std | 0.0136 | -| value_loss | 8.6e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13236 | -| time_elapsed | 70223 | -| total_timesteps | 1694208 | -| train/ | | -| approx_kl | 0.13726169 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | 0.0447 | -| n_updates | 132350 | -| policy_gradient_loss | 0.000785 | -| std | 0.0136 | -| value_loss | 0.000535 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13237 | -| time_elapsed | 70226 | -| total_timesteps | 1694336 | -| train/ | | -| approx_kl | 0.008848283 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0957 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 132360 | -| policy_gradient_loss | 0.0192 | -| std | 0.0136 | -| value_loss | 9.94e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13238 | -| time_elapsed | 70231 | -| total_timesteps | 1694464 | -| train/ | | -| approx_kl | 0.0046967817 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00485 | -| learning_rate | 0.0003 | -| loss | 0.0085 | -| n_updates | 132370 | -| policy_gradient_loss | 0.0287 | -| std | 0.0136 | -| value_loss | 1.71e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13239 | -| time_elapsed | 70234 | -| total_timesteps | 1694592 | -| train/ | | -| approx_kl | 0.03969939 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.00934 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 132380 | -| policy_gradient_loss | 0.00348 | -| std | 0.0136 | -| value_loss | 7.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13240 | -| time_elapsed | 70237 | -| total_timesteps | 1694720 | -| train/ | | -| approx_kl | 0.028774349 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 132390 | -| policy_gradient_loss | -0.00643 | -| std | 0.0136 | -| value_loss | 4.69e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13241 | -| time_elapsed | 70238 | -| total_timesteps | 1694848 | -| train/ | | -| approx_kl | 3.7387013e-05 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 132400 | -| policy_gradient_loss | 0.00845 | -| std | 0.0136 | -| value_loss | 3.36e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13242 | -| time_elapsed | 70242 | -| total_timesteps | 1694976 | -| train/ | | -| approx_kl | 0.0013293447 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.00389 | -| n_updates | 132410 | -| policy_gradient_loss | 0.0295 | -| std | 0.0136 | -| value_loss | 2.68e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13243 | -| time_elapsed | 70245 | -| total_timesteps | 1695104 | -| train/ | | -| approx_kl | 0.018660583 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 132420 | -| policy_gradient_loss | 0.0485 | -| std | 0.0136 | -| value_loss | 1.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13244 | -| time_elapsed | 70251 | -| total_timesteps | 1695232 | -| train/ | | -| approx_kl | 0.06064049 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.745 | -| learning_rate | 0.0003 | -| loss | 0.0383 | -| n_updates | 132430 | -| policy_gradient_loss | 0.0254 | -| std | 0.0136 | -| value_loss | 0.00417 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13245 | -| time_elapsed | 70255 | -| total_timesteps | 1695360 | -| train/ | | -| approx_kl | 0.035319068 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 132440 | -| policy_gradient_loss | 0.0439 | -| std | 0.0136 | -| value_loss | 5.22e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13246 | -| time_elapsed | 70258 | -| total_timesteps | 1695488 | -| train/ | | -| approx_kl | 0.0078089014 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00482 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 132450 | -| policy_gradient_loss | 0.00458 | -| std | 0.0136 | -| value_loss | 1.06e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13247 | -| time_elapsed | 70261 | -| total_timesteps | 1695616 | -| train/ | | -| approx_kl | 0.010568719 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.00597 | -| learning_rate | 0.0003 | -| loss | -0.00814 | -| n_updates | 132460 | -| policy_gradient_loss | -0.00257 | -| std | 0.0136 | -| value_loss | 4.74e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13248 | -| time_elapsed | 70264 | -| total_timesteps | 1695744 | -| train/ | | -| approx_kl | 0.0037433286 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | -0.000318 | -| n_updates | 132470 | -| policy_gradient_loss | 0.00475 | -| std | 0.0136 | -| value_loss | 7.01e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13249 | -| time_elapsed | 70268 | -| total_timesteps | 1695872 | -| train/ | | -| approx_kl | 0.010157461 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00253 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 132480 | -| policy_gradient_loss | 0.00943 | -| std | 0.0135 | -| value_loss | 0.000764 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13250 | -| time_elapsed | 70271 | -| total_timesteps | 1696000 | -| train/ | | -| approx_kl | 0.035975844 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 132490 | -| policy_gradient_loss | 0.00996 | -| std | 0.0135 | -| value_loss | 4.9e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13251 | -| time_elapsed | 70274 | -| total_timesteps | 1696128 | -| train/ | | -| approx_kl | 0.011638095 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.00381 | -| learning_rate | 0.0003 | -| loss | -0.00953 | -| n_updates | 132500 | -| policy_gradient_loss | 0.0244 | -| std | 0.0135 | -| value_loss | 9.65e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13252 | -| time_elapsed | 70280 | -| total_timesteps | 1696256 | -| train/ | | -| approx_kl | 0.03843723 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.88 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 132510 | -| policy_gradient_loss | -0.0114 | -| std | 0.0135 | -| value_loss | 0.00161 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13253 | -| time_elapsed | 70284 | -| total_timesteps | 1696384 | -| train/ | | -| approx_kl | 0.045663625 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 132520 | -| policy_gradient_loss | 0.00975 | -| std | 0.0135 | -| value_loss | 1.39e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13254 | -| time_elapsed | 70288 | -| total_timesteps | 1696512 | -| train/ | | -| approx_kl | 0.02550581 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 132530 | -| policy_gradient_loss | 0.00766 | -| std | 0.0135 | -| value_loss | 4.45e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13255 | -| time_elapsed | 70292 | -| total_timesteps | 1696640 | -| train/ | | -| approx_kl | 0.043380998 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 132540 | -| policy_gradient_loss | 0.00675 | -| std | 0.0135 | -| value_loss | 3.33e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13256 | -| time_elapsed | 70297 | -| total_timesteps | 1696768 | -| train/ | | -| approx_kl | 0.1965552 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 132550 | -| policy_gradient_loss | 0.0222 | -| std | 0.0135 | -| value_loss | 2.53e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13257 | -| time_elapsed | 70300 | -| total_timesteps | 1696896 | -| train/ | | -| approx_kl | 0.0006435658 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 132560 | -| policy_gradient_loss | -0.0106 | -| std | 0.0135 | -| value_loss | 6.16e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13258 | -| time_elapsed | 70304 | -| total_timesteps | 1697024 | -| train/ | | -| approx_kl | 0.0067765852 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 132570 | -| policy_gradient_loss | 0.000131 | -| std | 0.0135 | -| value_loss | 5.13e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13259 | -| time_elapsed | 70311 | -| total_timesteps | 1697152 | -| train/ | | -| approx_kl | 0.0049725333 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 132580 | -| policy_gradient_loss | -0.0147 | -| std | 0.0135 | -| value_loss | 0.00271 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13260 | -| time_elapsed | 70314 | -| total_timesteps | 1697280 | -| train/ | | -| approx_kl | 0.0043967385 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | -0.000925 | -| n_updates | 132590 | -| policy_gradient_loss | 0.00705 | -| std | 0.0135 | -| value_loss | 4.88e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13261 | -| time_elapsed | 70317 | -| total_timesteps | 1697408 | -| train/ | | -| approx_kl | 0.009348345 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 132600 | -| policy_gradient_loss | 0.0164 | -| std | 0.0135 | -| value_loss | 2.74e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13262 | -| time_elapsed | 70321 | -| total_timesteps | 1697536 | -| train/ | | -| approx_kl | 0.005414895 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.00481 | -| n_updates | 132610 | -| policy_gradient_loss | 0.00734 | -| std | 0.0135 | -| value_loss | 9.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13263 | -| time_elapsed | 70324 | -| total_timesteps | 1697664 | -| train/ | | -| approx_kl | 0.039765548 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 132620 | -| policy_gradient_loss | 0.00887 | -| std | 0.0135 | -| value_loss | 5.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13264 | -| time_elapsed | 70329 | -| total_timesteps | 1697792 | -| train/ | | -| approx_kl | 0.011703726 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.00264 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 132630 | -| policy_gradient_loss | 0.0172 | -| std | 0.0134 | -| value_loss | 7.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13265 | -| time_elapsed | 70333 | -| total_timesteps | 1697920 | -| train/ | | -| approx_kl | 0.05112184 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.000472 | -| learning_rate | 0.0003 | -| loss | 0.00429 | -| n_updates | 132640 | -| policy_gradient_loss | -0.000165 | -| std | 0.0134 | -| value_loss | 2.55e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13266 | -| time_elapsed | 70336 | -| total_timesteps | 1698048 | -| train/ | | -| approx_kl | 0.05510273 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 132650 | -| policy_gradient_loss | 0.00642 | -| std | 0.0134 | -| value_loss | 1.3e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13267 | -| time_elapsed | 70344 | -| total_timesteps | 1698176 | -| train/ | | -| approx_kl | 0.11731537 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.261 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 132660 | -| policy_gradient_loss | -0.0148 | -| std | 0.0134 | -| value_loss | 0.00116 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13268 | -| time_elapsed | 70346 | -| total_timesteps | 1698304 | -| train/ | | -| approx_kl | 0.02191666 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.0231 | -| learning_rate | 0.0003 | -| loss | 0.00686 | -| n_updates | 132670 | -| policy_gradient_loss | 0.023 | -| std | 0.0134 | -| value_loss | 3.84e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13269 | -| time_elapsed | 70350 | -| total_timesteps | 1698432 | -| train/ | | -| approx_kl | 0.06921981 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 132680 | -| policy_gradient_loss | 0.0124 | -| std | 0.0134 | -| value_loss | 9.58e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13270 | -| time_elapsed | 70353 | -| total_timesteps | 1698560 | -| train/ | | -| approx_kl | 0.00027834345 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.00277 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 132690 | -| policy_gradient_loss | -0.00473 | -| std | 0.0134 | -| value_loss | 3.98e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13271 | -| time_elapsed | 70357 | -| total_timesteps | 1698688 | -| train/ | | -| approx_kl | 0.017655266 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.000365 | -| n_updates | 132700 | -| policy_gradient_loss | 0.016 | -| std | 0.0134 | -| value_loss | 2.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13272 | -| time_elapsed | 70361 | -| total_timesteps | 1698816 | -| train/ | | -| approx_kl | 0.06002353 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.00968 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 132710 | -| policy_gradient_loss | 0.00268 | -| std | 0.0134 | -| value_loss | 1.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13273 | -| time_elapsed | 70365 | -| total_timesteps | 1698944 | -| train/ | | -| approx_kl | 0.024683177 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 132720 | -| policy_gradient_loss | 0.00415 | -| std | 0.0134 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13274 | -| time_elapsed | 70369 | -| total_timesteps | 1699072 | -| train/ | | -| approx_kl | 0.0075530857 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.00717 | -| n_updates | 132730 | -| policy_gradient_loss | 0.00362 | -| std | 0.0134 | -| value_loss | 8.59e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13275 | -| time_elapsed | 70377 | -| total_timesteps | 1699200 | -| train/ | | -| approx_kl | 0.08652056 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 132740 | -| policy_gradient_loss | -0.0127 | -| std | 0.0134 | -| value_loss | 0.0002 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13276 | -| time_elapsed | 70381 | -| total_timesteps | 1699328 | -| train/ | | -| approx_kl | 0.010997873 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0033 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 132750 | -| policy_gradient_loss | 0.00116 | -| std | 0.0134 | -| value_loss | 5.52e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13277 | -| time_elapsed | 70386 | -| total_timesteps | 1699456 | -| train/ | | -| approx_kl | 0.05305757 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0923 | -| learning_rate | 0.0003 | -| loss | 0.0528 | -| n_updates | 132760 | -| policy_gradient_loss | 0.0208 | -| std | 0.0134 | -| value_loss | 2.47e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13278 | -| time_elapsed | 70389 | -| total_timesteps | 1699584 | -| train/ | | -| approx_kl | 0.00017161109 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 132770 | -| policy_gradient_loss | -0.00159 | -| std | 0.0134 | -| value_loss | 2.98e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13279 | -| time_elapsed | 70393 | -| total_timesteps | 1699712 | -| train/ | | -| approx_kl | 0.015673902 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 132780 | -| policy_gradient_loss | 0.015 | -| std | 0.0134 | -| value_loss | 2.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13280 | -| time_elapsed | 70397 | -| total_timesteps | 1699840 | -| train/ | | -| approx_kl | 0.026315153 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 132790 | -| policy_gradient_loss | -0.00128 | -| std | 0.0134 | -| value_loss | 1.56e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13281 | -| time_elapsed | 70400 | -| total_timesteps | 1699968 | -| train/ | | -| approx_kl | 0.0041189734 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.00676 | -| n_updates | 132800 | -| policy_gradient_loss | 0.00668 | -| std | 0.0134 | -| value_loss | 9.13e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13282 | -| time_elapsed | 70405 | -| total_timesteps | 1700096 | -| train/ | | -| approx_kl | 0.010728687 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.000746 | -| n_updates | 132810 | -| policy_gradient_loss | 0.00743 | -| std | 0.0134 | -| value_loss | 5.77e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13283 | -| time_elapsed | 70411 | -| total_timesteps | 1700224 | -| train/ | | -| approx_kl | 0.057356887 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | 0.00174 | -| n_updates | 132820 | -| policy_gradient_loss | 0.00286 | -| std | 0.0134 | -| value_loss | 0.00143 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13284 | -| time_elapsed | 70415 | -| total_timesteps | 1700352 | -| train/ | | -| approx_kl | 0.0059268647 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 132830 | -| policy_gradient_loss | 0.00378 | -| std | 0.0134 | -| value_loss | 6.31e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13285 | -| time_elapsed | 70419 | -| total_timesteps | 1700480 | -| train/ | | -| approx_kl | 0.10905059 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.00267 | -| n_updates | 132840 | -| policy_gradient_loss | 0.00196 | -| std | 0.0134 | -| value_loss | 2.18e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13286 | -| time_elapsed | 70423 | -| total_timesteps | 1700608 | -| train/ | | -| approx_kl | 0.0036962032 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 132850 | -| policy_gradient_loss | 0.0216 | -| std | 0.0134 | -| value_loss | 1.12e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13287 | -| time_elapsed | 70427 | -| total_timesteps | 1700736 | -| train/ | | -| approx_kl | 0.019967854 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 132860 | -| policy_gradient_loss | 0.0261 | -| std | 0.0134 | -| value_loss | 5.15e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13288 | -| time_elapsed | 70430 | -| total_timesteps | 1700864 | -| train/ | | -| approx_kl | 0.00038745208 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.000547 | -| n_updates | 132870 | -| policy_gradient_loss | 0.00616 | -| std | 0.0134 | -| value_loss | 2.72e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13289 | -| time_elapsed | 70435 | -| total_timesteps | 1700992 | -| train/ | | -| approx_kl | 0.06078858 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 132880 | -| policy_gradient_loss | 0.0479 | -| std | 0.0134 | -| value_loss | 2.35e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13290 | -| time_elapsed | 70439 | -| total_timesteps | 1701120 | -| train/ | | -| approx_kl | 0.04409247 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 132890 | -| policy_gradient_loss | 0.0393 | -| std | 0.0134 | -| value_loss | 1.86e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13291 | -| time_elapsed | 70449 | -| total_timesteps | 1701248 | -| train/ | | -| approx_kl | 0.06671774 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.963 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 132900 | -| policy_gradient_loss | -0.0153 | -| std | 0.0134 | -| value_loss | 0.00181 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13292 | -| time_elapsed | 70453 | -| total_timesteps | 1701376 | -| train/ | | -| approx_kl | 0.010055227 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -39.5 | -| learning_rate | 0.0003 | -| loss | 0.00854 | -| n_updates | 132910 | -| policy_gradient_loss | -0.00242 | -| std | 0.0134 | -| value_loss | 6.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13293 | -| time_elapsed | 70457 | -| total_timesteps | 1701504 | -| train/ | | -| approx_kl | 0.026019413 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -132 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 132920 | -| policy_gradient_loss | -0.00179 | -| std | 0.0134 | -| value_loss | 4.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13294 | -| time_elapsed | 70460 | -| total_timesteps | 1701632 | -| train/ | | -| approx_kl | 0.06486657 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -55.8 | -| learning_rate | 0.0003 | -| loss | -0.000678 | -| n_updates | 132930 | -| policy_gradient_loss | -0.00233 | -| std | 0.0133 | -| value_loss | 3.46e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13295 | -| time_elapsed | 70464 | -| total_timesteps | 1701760 | -| train/ | | -| approx_kl | 0.03754684 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -7.13 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 132940 | -| policy_gradient_loss | -0.0096 | -| std | 0.0133 | -| value_loss | 1.11e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 24 | -| iterations | 13296 | -| time_elapsed | 70468 | -| total_timesteps | 1701888 | -| train/ | | -| approx_kl | 9.426428e-05 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | -0.000902 | -| n_updates | 132950 | -| policy_gradient_loss | -0.00138 | -| std | 0.0133 | -| value_loss | 1.23e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13297 | -| time_elapsed | 70472 | -| total_timesteps | 1702016 | -| train/ | | -| approx_kl | 0.0079341 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 132960 | -| policy_gradient_loss | 0.00017 | -| std | 0.0133 | -| value_loss | 4.58e-10 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13298 | -| time_elapsed | 70480 | -| total_timesteps | 1702144 | -| train/ | | -| approx_kl | 0.05425695 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | 0.00915 | -| n_updates | 132970 | -| policy_gradient_loss | 0.00139 | -| std | 0.0133 | -| value_loss | 0.00114 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13299 | -| time_elapsed | 70483 | -| total_timesteps | 1702272 | -| train/ | | -| approx_kl | 0.035087615 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 132980 | -| policy_gradient_loss | 0.0147 | -| std | 0.0133 | -| value_loss | 0.0011 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13300 | -| time_elapsed | 70487 | -| total_timesteps | 1702400 | -| train/ | | -| approx_kl | 0.01352708 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 132990 | -| policy_gradient_loss | 0.00571 | -| std | 0.0133 | -| value_loss | 0.000126 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13301 | -| time_elapsed | 70490 | -| total_timesteps | 1702528 | -| train/ | | -| approx_kl | 0.04550553 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.00388 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 133000 | -| policy_gradient_loss | 0.015 | -| std | 0.0133 | -| value_loss | 1.6e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13302 | -| time_elapsed | 70494 | -| total_timesteps | 1702656 | -| train/ | | -| approx_kl | 0.041041777 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 133010 | -| policy_gradient_loss | 0.00863 | -| std | 0.0133 | -| value_loss | 1.02e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13303 | -| time_elapsed | 70496 | -| total_timesteps | 1702784 | -| train/ | | -| approx_kl | 0.009622566 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 133020 | -| policy_gradient_loss | -0.00141 | -| std | 0.0133 | -| value_loss | 6.93e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13304 | -| time_elapsed | 70500 | -| total_timesteps | 1702912 | -| train/ | | -| approx_kl | 0.04834736 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 133030 | -| policy_gradient_loss | 0.00456 | -| std | 0.0133 | -| value_loss | 4.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13305 | -| time_elapsed | 70503 | -| total_timesteps | 1703040 | -| train/ | | -| approx_kl | 0.049304172 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 133040 | -| policy_gradient_loss | 0.00469 | -| std | 0.0133 | -| value_loss | 2.73e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13306 | -| time_elapsed | 70510 | -| total_timesteps | 1703168 | -| train/ | | -| approx_kl | 0.4238091 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 133050 | -| policy_gradient_loss | -0.00876 | -| std | 0.0133 | -| value_loss | 0.000996 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13307 | -| time_elapsed | 70514 | -| total_timesteps | 1703296 | -| train/ | | -| approx_kl | 0.024394523 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.449 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 133060 | -| policy_gradient_loss | -0.00145 | -| std | 0.0133 | -| value_loss | 8.89e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13308 | -| time_elapsed | 70517 | -| total_timesteps | 1703424 | -| train/ | | -| approx_kl | 0.008645229 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -7.84 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 133070 | -| policy_gradient_loss | -0.0104 | -| std | 0.0133 | -| value_loss | 1.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13309 | -| time_elapsed | 70519 | -| total_timesteps | 1703552 | -| train/ | | -| approx_kl | 0.073377095 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.0013 | -| n_updates | 133080 | -| policy_gradient_loss | -0.00699 | -| std | 0.0133 | -| value_loss | 1.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13310 | -| time_elapsed | 70523 | -| total_timesteps | 1703680 | -| train/ | | -| approx_kl | 0.016058598 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 133090 | -| policy_gradient_loss | 0.00142 | -| std | 0.0133 | -| value_loss | 1.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13311 | -| time_elapsed | 70526 | -| total_timesteps | 1703808 | -| train/ | | -| approx_kl | 0.032947276 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.000338 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 133100 | -| policy_gradient_loss | 0.00918 | -| std | 0.0133 | -| value_loss | 9.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13312 | -| time_elapsed | 70530 | -| total_timesteps | 1703936 | -| train/ | | -| approx_kl | 0.038212813 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.00713 | -| learning_rate | 0.0003 | -| loss | 0.000316 | -| n_updates | 133110 | -| policy_gradient_loss | -9.44e-05 | -| std | 0.0133 | -| value_loss | 6.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13313 | -| time_elapsed | 70534 | -| total_timesteps | 1704064 | -| train/ | | -| approx_kl | 0.017987173 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 133120 | -| policy_gradient_loss | -0.00279 | -| std | 0.0133 | -| value_loss | 5.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13314 | -| time_elapsed | 70541 | -| total_timesteps | 1704192 | -| train/ | | -| approx_kl | 0.25310868 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.451 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 133130 | -| policy_gradient_loss | -0.016 | -| std | 0.0133 | -| value_loss | 0.000928 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13315 | -| time_elapsed | 70544 | -| total_timesteps | 1704320 | -| train/ | | -| approx_kl | 0.036204092 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -7.82e+03 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 133140 | -| policy_gradient_loss | -0.009 | -| std | 0.0133 | -| value_loss | 4.76e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13316 | -| time_elapsed | 70548 | -| total_timesteps | 1704448 | -| train/ | | -| approx_kl | 0.021599 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -9.35 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 133150 | -| policy_gradient_loss | -0.000463 | -| std | 0.0133 | -| value_loss | 6.96e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13317 | -| time_elapsed | 70551 | -| total_timesteps | 1704576 | -| train/ | | -| approx_kl | 0.021458441 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | -0.000752 | -| n_updates | 133160 | -| policy_gradient_loss | 0.00229 | -| std | 0.0133 | -| value_loss | 4.15e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13318 | -| time_elapsed | 70554 | -| total_timesteps | 1704704 | -| train/ | | -| approx_kl | 0.0048490125 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.000231 | -| n_updates | 133170 | -| policy_gradient_loss | 0.00427 | -| std | 0.0132 | -| value_loss | 3.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13319 | -| time_elapsed | 70557 | -| total_timesteps | 1704832 | -| train/ | | -| approx_kl | 0.008121684 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | -0.0066 | -| n_updates | 133180 | -| policy_gradient_loss | -0.00144 | -| std | 0.0132 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13320 | -| time_elapsed | 70560 | -| total_timesteps | 1704960 | -| train/ | | -| approx_kl | 0.030978285 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.00152 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 133190 | -| policy_gradient_loss | 0.056 | -| std | 0.0132 | -| value_loss | 5.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13321 | -| time_elapsed | 70563 | -| total_timesteps | 1705088 | -| train/ | | -| approx_kl | 0.03407777 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 133200 | -| policy_gradient_loss | 0.0466 | -| std | 0.0132 | -| value_loss | 1.36e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13322 | -| time_elapsed | 70569 | -| total_timesteps | 1705216 | -| train/ | | -| approx_kl | 0.3689011 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 133210 | -| policy_gradient_loss | 0.0278 | -| std | 0.0132 | -| value_loss | 7.37e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13323 | -| time_elapsed | 70573 | -| total_timesteps | 1705344 | -| train/ | | -| approx_kl | 0.009156559 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 133220 | -| policy_gradient_loss | 0.00291 | -| std | 0.0132 | -| value_loss | 7.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13324 | -| time_elapsed | 70577 | -| total_timesteps | 1705472 | -| train/ | | -| approx_kl | 0.039089207 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.00444 | -| learning_rate | 0.0003 | -| loss | 0.029 | -| n_updates | 133230 | -| policy_gradient_loss | 0.0053 | -| std | 0.0132 | -| value_loss | 8.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13325 | -| time_elapsed | 70580 | -| total_timesteps | 1705600 | -| train/ | | -| approx_kl | 0.042755146 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.00258 | -| n_updates | 133240 | -| policy_gradient_loss | 9.81e-05 | -| std | 0.0132 | -| value_loss | 5.84e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13326 | -| time_elapsed | 70584 | -| total_timesteps | 1705728 | -| train/ | | -| approx_kl | 0.08128796 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 133250 | -| policy_gradient_loss | 0.0037 | -| std | 0.0132 | -| value_loss | 3.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13327 | -| time_elapsed | 70587 | -| total_timesteps | 1705856 | -| train/ | | -| approx_kl | 0.022520473 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 133260 | -| policy_gradient_loss | 0.0185 | -| std | 0.0132 | -| value_loss | 2.58e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13328 | -| time_elapsed | 70591 | -| total_timesteps | 1705984 | -| train/ | | -| approx_kl | 0.03106847 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0094 | -| n_updates | 133270 | -| policy_gradient_loss | 0.00198 | -| std | 0.0132 | -| value_loss | 1.79e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13329 | -| time_elapsed | 70595 | -| total_timesteps | 1706112 | -| train/ | | -| approx_kl | 0.0020607347 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | -0.000454 | -| n_updates | 133280 | -| policy_gradient_loss | 0.0221 | -| std | 0.0133 | -| value_loss | 7.39e-07 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13330 | -| time_elapsed | 70604 | -| total_timesteps | 1706240 | -| train/ | | -| approx_kl | 0.022119 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 133290 | -| policy_gradient_loss | 0.0128 | -| std | 0.0133 | -| value_loss | 9.67e-05 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13331 | -| time_elapsed | 70607 | -| total_timesteps | 1706368 | -| train/ | | -| approx_kl | 0.00074598705 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0728 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 133300 | -| policy_gradient_loss | 0.0258 | -| std | 0.0133 | -| value_loss | 4.39e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13332 | -| time_elapsed | 70610 | -| total_timesteps | 1706496 | -| train/ | | -| approx_kl | 0.029271588 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 133310 | -| policy_gradient_loss | 0.067 | -| std | 0.0133 | -| value_loss | 1.94e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13333 | -| time_elapsed | 70613 | -| total_timesteps | 1706624 | -| train/ | | -| approx_kl | 0.01704035 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.00732 | -| n_updates | 133320 | -| policy_gradient_loss | 0.00621 | -| std | 0.0133 | -| value_loss | 2.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13334 | -| time_elapsed | 70617 | -| total_timesteps | 1706752 | -| train/ | | -| approx_kl | 0.045644365 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 133330 | -| policy_gradient_loss | 0.016 | -| std | 0.0133 | -| value_loss | 3.68e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13335 | -| time_elapsed | 70621 | -| total_timesteps | 1706880 | -| train/ | | -| approx_kl | 0.04186911 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.000233 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 133340 | -| policy_gradient_loss | 0.00651 | -| std | 0.0133 | -| value_loss | 9.19e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13336 | -| time_elapsed | 70624 | -| total_timesteps | 1707008 | -| train/ | | -| approx_kl | 0.0050955624 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 133350 | -| policy_gradient_loss | 0.00421 | -| std | 0.0133 | -| value_loss | 5.8e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13337 | -| time_elapsed | 70633 | -| total_timesteps | 1707136 | -| train/ | | -| approx_kl | 0.5803596 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0219 | -| n_updates | 133360 | -| policy_gradient_loss | -0.0179 | -| std | 0.0133 | -| value_loss | 0.000137 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13338 | -| time_elapsed | 70637 | -| total_timesteps | 1707264 | -| train/ | | -| approx_kl | 0.082111515 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.0305 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 133370 | -| policy_gradient_loss | 0.0174 | -| std | 0.0133 | -| value_loss | 4.85e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13339 | -| time_elapsed | 70641 | -| total_timesteps | 1707392 | -| train/ | | -| approx_kl | 0.09839962 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.568 | -| learning_rate | 0.0003 | -| loss | 0.00836 | -| n_updates | 133380 | -| policy_gradient_loss | -0.00278 | -| std | 0.0133 | -| value_loss | 7.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13340 | -| time_elapsed | 70645 | -| total_timesteps | 1707520 | -| train/ | | -| approx_kl | 0.025697505 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -6.83 | -| learning_rate | 0.0003 | -| loss | -0.00555 | -| n_updates | 133390 | -| policy_gradient_loss | 0.0018 | -| std | 0.0133 | -| value_loss | 2.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13341 | -| time_elapsed | 70648 | -| total_timesteps | 1707648 | -| train/ | | -| approx_kl | 0.004599432 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.686 | -| learning_rate | 0.0003 | -| loss | 0.00598 | -| n_updates | 133400 | -| policy_gradient_loss | -0.00176 | -| std | 0.0133 | -| value_loss | 2.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13342 | -| time_elapsed | 70652 | -| total_timesteps | 1707776 | -| train/ | | -| approx_kl | 0.027499538 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0016 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 133410 | -| policy_gradient_loss | 0.0147 | -| std | 0.0133 | -| value_loss | 1.01e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13343 | -| time_elapsed | 70655 | -| total_timesteps | 1707904 | -| train/ | | -| approx_kl | 0.043385863 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 133420 | -| policy_gradient_loss | -0.000223 | -| std | 0.0133 | -| value_loss | 5.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13344 | -| time_elapsed | 70659 | -| total_timesteps | 1708032 | -| train/ | | -| approx_kl | 0.021295425 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 133430 | -| policy_gradient_loss | -0.0112 | -| std | 0.0133 | -| value_loss | 3.76e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13345 | -| time_elapsed | 70668 | -| total_timesteps | 1708160 | -| train/ | | -| approx_kl | 0.21758552 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 133440 | -| policy_gradient_loss | -0.0149 | -| std | 0.0133 | -| value_loss | 0.000785 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13346 | -| time_elapsed | 70671 | -| total_timesteps | 1708288 | -| train/ | | -| approx_kl | 0.019056216 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.167 | -| learning_rate | 0.0003 | -| loss | 0.00705 | -| n_updates | 133450 | -| policy_gradient_loss | 0.00587 | -| std | 0.0133 | -| value_loss | 1.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13347 | -| time_elapsed | 70675 | -| total_timesteps | 1708416 | -| train/ | | -| approx_kl | 0.014832309 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 133460 | -| policy_gradient_loss | -0.00124 | -| std | 0.0133 | -| value_loss | 3.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13348 | -| time_elapsed | 70681 | -| total_timesteps | 1708544 | -| train/ | | -| approx_kl | 0.029783864 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | 0.0197 | -| n_updates | 133470 | -| policy_gradient_loss | 0.0184 | -| std | 0.0134 | -| value_loss | 3.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13349 | -| time_elapsed | 70685 | -| total_timesteps | 1708672 | -| train/ | | -| approx_kl | 0.09182901 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.00727 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 133480 | -| policy_gradient_loss | 0.037 | -| std | 0.0134 | -| value_loss | 1.22e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13350 | -| time_elapsed | 70688 | -| total_timesteps | 1708800 | -| train/ | | -| approx_kl | 1.860736e-05 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.546 | -| learning_rate | 0.0003 | -| loss | -0.000745 | -| n_updates | 133490 | -| policy_gradient_loss | -0.00255 | -| std | 0.0135 | -| value_loss | 6.12e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13351 | -| time_elapsed | 70690 | -| total_timesteps | 1708928 | -| train/ | | -| approx_kl | 0.0003908989 | -| clip_fraction | 0.0461 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 133500 | -| policy_gradient_loss | -0.0019 | -| std | 0.0135 | -| value_loss | 7.25e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13352 | -| time_elapsed | 70694 | -| total_timesteps | 1709056 | -| train/ | | -| approx_kl | 0.00024792273 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 133510 | -| policy_gradient_loss | -0.00301 | -| std | 0.0135 | -| value_loss | 2.86e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13353 | -| time_elapsed | 70702 | -| total_timesteps | 1709184 | -| train/ | | -| approx_kl | 0.16592458 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 133520 | -| policy_gradient_loss | -0.0082 | -| std | 0.0135 | -| value_loss | 6.97e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13354 | -| time_elapsed | 70706 | -| total_timesteps | 1709312 | -| train/ | | -| approx_kl | 0.010582559 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.00501 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 133530 | -| policy_gradient_loss | 0.00601 | -| std | 0.0135 | -| value_loss | 4.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13355 | -| time_elapsed | 70711 | -| total_timesteps | 1709440 | -| train/ | | -| approx_kl | 0.024056653 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | 0.00752 | -| n_updates | 133540 | -| policy_gradient_loss | 0.00426 | -| std | 0.0135 | -| value_loss | 5.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13356 | -| time_elapsed | 70717 | -| total_timesteps | 1709568 | -| train/ | | -| approx_kl | 0.015017666 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 133550 | -| policy_gradient_loss | 0.000267 | -| std | 0.0135 | -| value_loss | 3.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13357 | -| time_elapsed | 70722 | -| total_timesteps | 1709696 | -| train/ | | -| approx_kl | 0.027275259 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 133560 | -| policy_gradient_loss | 0.0419 | -| std | 0.0135 | -| value_loss | 1.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13358 | -| time_elapsed | 70726 | -| total_timesteps | 1709824 | -| train/ | | -| approx_kl | 0.030537507 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0437 | -| n_updates | 133570 | -| policy_gradient_loss | 0.0373 | -| std | 0.0135 | -| value_loss | 1.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 24 | -| iterations | 13359 | -| time_elapsed | 70730 | -| total_timesteps | 1709952 | -| train/ | | -| approx_kl | 0.005360822 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 9.94e-06 | -| n_updates | 133580 | -| policy_gradient_loss | 0.00359 | -| std | 0.0135 | -| value_loss | 1.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13360 | -| time_elapsed | 70735 | -| total_timesteps | 1710080 | -| train/ | | -| approx_kl | 0.031526566 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 133590 | -| policy_gradient_loss | 0.00638 | -| std | 0.0135 | -| value_loss | 1.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13361 | -| time_elapsed | 70745 | -| total_timesteps | 1710208 | -| train/ | | -| approx_kl | 0.10205616 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 133600 | -| policy_gradient_loss | -0.0154 | -| std | 0.0135 | -| value_loss | 0.00036 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13362 | -| time_elapsed | 70750 | -| total_timesteps | 1710336 | -| train/ | | -| approx_kl | 0.11116425 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | 0.00895 | -| n_updates | 133610 | -| policy_gradient_loss | 0.00136 | -| std | 0.0135 | -| value_loss | 5.23e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13363 | -| time_elapsed | 70756 | -| total_timesteps | 1710464 | -| train/ | | -| approx_kl | 0.0008927025 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -26.3 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 133620 | -| policy_gradient_loss | -0.00426 | -| std | 0.0135 | -| value_loss | 2.44e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13364 | -| time_elapsed | 70761 | -| total_timesteps | 1710592 | -| train/ | | -| approx_kl | 0.005944226 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 133630 | -| policy_gradient_loss | -0.0101 | -| std | 0.0135 | -| value_loss | 3.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13365 | -| time_elapsed | 70766 | -| total_timesteps | 1710720 | -| train/ | | -| approx_kl | 0.023455638 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.000627 | -| n_updates | 133640 | -| policy_gradient_loss | -0.00232 | -| std | 0.0135 | -| value_loss | 2.04e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13366 | -| time_elapsed | 70772 | -| total_timesteps | 1710848 | -| train/ | | -| approx_kl | 0.03410268 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 133650 | -| policy_gradient_loss | 0.0143 | -| std | 0.0135 | -| value_loss | 2.49e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13367 | -| time_elapsed | 70777 | -| total_timesteps | 1710976 | -| train/ | | -| approx_kl | 0.0085978955 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.00387 | -| learning_rate | 0.0003 | -| loss | -0.00437 | -| n_updates | 133660 | -| policy_gradient_loss | 0.00256 | -| std | 0.0135 | -| value_loss | 9.47e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13368 | -| time_elapsed | 70782 | -| total_timesteps | 1711104 | -| train/ | | -| approx_kl | 0.11438317 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 133670 | -| policy_gradient_loss | 0.0218 | -| std | 0.0135 | -| value_loss | 8.19e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13369 | -| time_elapsed | 70792 | -| total_timesteps | 1711232 | -| train/ | | -| approx_kl | 1.0207608 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -8.26 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 133680 | -| policy_gradient_loss | -0.0135 | -| std | 0.0135 | -| value_loss | 0.00352 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13370 | -| time_elapsed | 70796 | -| total_timesteps | 1711360 | -| train/ | | -| approx_kl | 0.0060908045 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.923 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 133690 | -| policy_gradient_loss | 0.00928 | -| std | 0.0135 | -| value_loss | 7.8e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13371 | -| time_elapsed | 70802 | -| total_timesteps | 1711488 | -| train/ | | -| approx_kl | 0.004081115 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -2.78 | -| learning_rate | 0.0003 | -| loss | 0.00547 | -| n_updates | 133700 | -| policy_gradient_loss | 0.0171 | -| std | 0.0135 | -| value_loss | 2.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13372 | -| time_elapsed | 70808 | -| total_timesteps | 1711616 | -| train/ | | -| approx_kl | 0.037120387 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.548 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 133710 | -| policy_gradient_loss | 0.00133 | -| std | 0.0135 | -| value_loss | 1.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13373 | -| time_elapsed | 70815 | -| total_timesteps | 1711744 | -| train/ | | -| approx_kl | 0.09445492 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0991 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 133720 | -| policy_gradient_loss | 0.0124 | -| std | 0.0135 | -| value_loss | 3.89e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13374 | -| time_elapsed | 70820 | -| total_timesteps | 1711872 | -| train/ | | -| approx_kl | 0.05224189 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 133730 | -| policy_gradient_loss | -0.00446 | -| std | 0.0135 | -| value_loss | 6.98e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13375 | -| time_elapsed | 70825 | -| total_timesteps | 1712000 | -| train/ | | -| approx_kl | 0.017320516 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.00218 | -| n_updates | 133740 | -| policy_gradient_loss | 0.0055 | -| std | 0.0135 | -| value_loss | 3.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13376 | -| time_elapsed | 70830 | -| total_timesteps | 1712128 | -| train/ | | -| approx_kl | 0.028993547 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.00222 | -| learning_rate | 0.0003 | -| loss | 0.00917 | -| n_updates | 133750 | -| policy_gradient_loss | 0.00434 | -| std | 0.0135 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13377 | -| time_elapsed | 70840 | -| total_timesteps | 1712256 | -| train/ | | -| approx_kl | 0.49498323 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 133760 | -| policy_gradient_loss | -0.009 | -| std | 0.0135 | -| value_loss | 0.000299 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13378 | -| time_elapsed | 70846 | -| total_timesteps | 1712384 | -| train/ | | -| approx_kl | 0.0039833426 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 133770 | -| policy_gradient_loss | 0.00471 | -| std | 0.0135 | -| value_loss | 7.11e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13379 | -| time_elapsed | 70851 | -| total_timesteps | 1712512 | -| train/ | | -| approx_kl | 0.009474331 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.000389 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 133780 | -| policy_gradient_loss | 0.0043 | -| std | 0.0134 | -| value_loss | 1.78e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13380 | -| time_elapsed | 70857 | -| total_timesteps | 1712640 | -| train/ | | -| approx_kl | 0.077427685 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 133790 | -| policy_gradient_loss | 0.0115 | -| std | 0.0134 | -| value_loss | 1.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13381 | -| time_elapsed | 70861 | -| total_timesteps | 1712768 | -| train/ | | -| approx_kl | 0.018620828 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.00372 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 133800 | -| policy_gradient_loss | -0.00644 | -| std | 0.0134 | -| value_loss | 5.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13382 | -| time_elapsed | 70866 | -| total_timesteps | 1712896 | -| train/ | | -| approx_kl | 0.040039934 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 133810 | -| policy_gradient_loss | 0.0198 | -| std | 0.0134 | -| value_loss | 3.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13383 | -| time_elapsed | 70870 | -| total_timesteps | 1713024 | -| train/ | | -| approx_kl | 0.031846557 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.000329 | -| n_updates | 133820 | -| policy_gradient_loss | -0.00409 | -| std | 0.0134 | -| value_loss | 2.88e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13384 | -| time_elapsed | 70880 | -| total_timesteps | 1713152 | -| train/ | | -| approx_kl | 1.2411814 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | 0.0672 | -| n_updates | 133830 | -| policy_gradient_loss | 0.0545 | -| std | 0.0134 | -| value_loss | 5.81e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13385 | -| time_elapsed | 70883 | -| total_timesteps | 1713280 | -| train/ | | -| approx_kl | 0.010030957 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00399 | -| n_updates | 133840 | -| policy_gradient_loss | 0.00759 | -| std | 0.0134 | -| value_loss | 2.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13386 | -| time_elapsed | 70889 | -| total_timesteps | 1713408 | -| train/ | | -| approx_kl | 0.07330296 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 133850 | -| policy_gradient_loss | 0.0048 | -| std | 0.0134 | -| value_loss | 9.47e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13387 | -| time_elapsed | 70894 | -| total_timesteps | 1713536 | -| train/ | | -| approx_kl | 0.015545072 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0918 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 133860 | -| policy_gradient_loss | 0.0122 | -| std | 0.0134 | -| value_loss | 5.75e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13388 | -| time_elapsed | 70899 | -| total_timesteps | 1713664 | -| train/ | | -| approx_kl | 0.06547028 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 133870 | -| policy_gradient_loss | 0.00978 | -| std | 0.0134 | -| value_loss | 9.24e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13389 | -| time_elapsed | 70904 | -| total_timesteps | 1713792 | -| train/ | | -| approx_kl | 0.01396227 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 133880 | -| policy_gradient_loss | 0.0194 | -| std | 0.0134 | -| value_loss | 3.91e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 24 | -| iterations | 13390 | -| time_elapsed | 70909 | -| total_timesteps | 1713920 | -| train/ | | -| approx_kl | 0.05032167 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 133890 | -| policy_gradient_loss | 0.00599 | -| std | 0.0134 | -| value_loss | 2.88e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13391 | -| time_elapsed | 70914 | -| total_timesteps | 1714048 | -| train/ | | -| approx_kl | 0.043076485 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 133900 | -| policy_gradient_loss | -0.002 | -| std | 0.0134 | -| value_loss | 1.89e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13392 | -| time_elapsed | 70923 | -| total_timesteps | 1714176 | -| train/ | | -| approx_kl | 0.0051090764 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 133910 | -| policy_gradient_loss | -0.000729 | -| std | 0.0134 | -| value_loss | 0.00111 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13393 | -| time_elapsed | 70928 | -| total_timesteps | 1714304 | -| train/ | | -| approx_kl | 0.029606683 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.00188 | -| learning_rate | 0.0003 | -| loss | -3.45e-05 | -| n_updates | 133920 | -| policy_gradient_loss | 0.0194 | -| std | 0.0134 | -| value_loss | 9.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13394 | -| time_elapsed | 70933 | -| total_timesteps | 1714432 | -| train/ | | -| approx_kl | 0.055075787 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 133930 | -| policy_gradient_loss | 0.0104 | -| std | 0.0134 | -| value_loss | 5.27e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13395 | -| time_elapsed | 70937 | -| total_timesteps | 1714560 | -| train/ | | -| approx_kl | 6.946083e-05 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 133940 | -| policy_gradient_loss | -0.00814 | -| std | 0.0134 | -| value_loss | 3.83e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13396 | -| time_elapsed | 70941 | -| total_timesteps | 1714688 | -| train/ | | -| approx_kl | 0.0065080235 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 133950 | -| policy_gradient_loss | 0.00235 | -| std | 0.0134 | -| value_loss | 2.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13397 | -| time_elapsed | 70945 | -| total_timesteps | 1714816 | -| train/ | | -| approx_kl | 0.023024198 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 133960 | -| policy_gradient_loss | 0.0145 | -| std | 0.0134 | -| value_loss | 8.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13398 | -| time_elapsed | 70950 | -| total_timesteps | 1714944 | -| train/ | | -| approx_kl | 0.025226988 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | 1.79e-05 | -| learning_rate | 0.0003 | -| loss | 0.00349 | -| n_updates | 133970 | -| policy_gradient_loss | 8.68e-05 | -| std | 0.0134 | -| value_loss | 1.27e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13399 | -| time_elapsed | 70955 | -| total_timesteps | 1715072 | -| train/ | | -| approx_kl | 0.0029561394 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00218 | -| n_updates | 133980 | -| policy_gradient_loss | 0.00622 | -| std | 0.0134 | -| value_loss | 1.01e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13400 | -| time_elapsed | 70962 | -| total_timesteps | 1715200 | -| train/ | | -| approx_kl | 0.6412447 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.89 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 133990 | -| policy_gradient_loss | -0.0158 | -| std | 0.0134 | -| value_loss | 0.00133 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13401 | -| time_elapsed | 70967 | -| total_timesteps | 1715328 | -| train/ | | -| approx_kl | 0.067131676 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -40.7 | -| learning_rate | 0.0003 | -| loss | -0.00927 | -| n_updates | 134000 | -| policy_gradient_loss | -0.00374 | -| std | 0.0134 | -| value_loss | 3.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13402 | -| time_elapsed | 70971 | -| total_timesteps | 1715456 | -| train/ | | -| approx_kl | 0.021878436 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -46.6 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 134010 | -| policy_gradient_loss | -0.00504 | -| std | 0.0134 | -| value_loss | 1.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13403 | -| time_elapsed | 70975 | -| total_timesteps | 1715584 | -| train/ | | -| approx_kl | 0.063099965 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -6.56 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 134020 | -| policy_gradient_loss | 0.0149 | -| std | 0.0134 | -| value_loss | 2.25e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13404 | -| time_elapsed | 70980 | -| total_timesteps | 1715712 | -| train/ | | -| approx_kl | 7.1385875e-05 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.000493 | -| n_updates | 134030 | -| policy_gradient_loss | -0.000603 | -| std | 0.0134 | -| value_loss | 5.34e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13405 | -| time_elapsed | 70985 | -| total_timesteps | 1715840 | -| train/ | | -| approx_kl | 2.1289568e-05 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.000849 | -| n_updates | 134040 | -| policy_gradient_loss | -0.00477 | -| std | 0.0134 | -| value_loss | 3.56e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13406 | -| time_elapsed | 70990 | -| total_timesteps | 1715968 | -| train/ | | -| approx_kl | 3.889948e-05 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.00983 | -| learning_rate | 0.0003 | -| loss | -0.0009 | -| n_updates | 134050 | -| policy_gradient_loss | -0.00275 | -| std | 0.0134 | -| value_loss | 2.19e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13407 | -| time_elapsed | 70995 | -| total_timesteps | 1716096 | -| train/ | | -| approx_kl | 0.018611096 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.000967 | -| learning_rate | 0.0003 | -| loss | 0.00632 | -| n_updates | 134060 | -| policy_gradient_loss | 0.0227 | -| std | 0.0134 | -| value_loss | 1.35e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13408 | -| time_elapsed | 71005 | -| total_timesteps | 1716224 | -| train/ | | -| approx_kl | 0.0108787455 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.792 | -| learning_rate | 0.0003 | -| loss | 0.00984 | -| n_updates | 134070 | -| policy_gradient_loss | 0.00394 | -| std | 0.0133 | -| value_loss | 0.00232 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13409 | -| time_elapsed | 71008 | -| total_timesteps | 1716352 | -| train/ | | -| approx_kl | 0.02365297 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.00252 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 134080 | -| policy_gradient_loss | -0.00737 | -| std | 0.0133 | -| value_loss | 1.98e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13410 | -| time_elapsed | 71013 | -| total_timesteps | 1716480 | -| train/ | | -| approx_kl | 0.006346969 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 134090 | -| policy_gradient_loss | 0.00337 | -| std | 0.0133 | -| value_loss | 1.8e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13411 | -| time_elapsed | 71016 | -| total_timesteps | 1716608 | -| train/ | | -| approx_kl | 0.00082485983 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -6.15e-05 | -| n_updates | 134100 | -| policy_gradient_loss | 0.0102 | -| std | 0.0133 | -| value_loss | 2.88e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13412 | -| time_elapsed | 71020 | -| total_timesteps | 1716736 | -| train/ | | -| approx_kl | 3.92152e-05 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.000998 | -| learning_rate | 0.0003 | -| loss | -0.000334 | -| n_updates | 134110 | -| policy_gradient_loss | -0.000505 | -| std | 0.0132 | -| value_loss | 5.71e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13413 | -| time_elapsed | 71025 | -| total_timesteps | 1716864 | -| train/ | | -| approx_kl | 0.010580294 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.00546 | -| n_updates | 134120 | -| policy_gradient_loss | 0.00574 | -| std | 0.0132 | -| value_loss | 2.81e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13414 | -| time_elapsed | 71030 | -| total_timesteps | 1716992 | -| train/ | | -| approx_kl | 0.01253697 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.00142 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 134130 | -| policy_gradient_loss | -0.0061 | -| std | 0.0132 | -| value_loss | 0.00036 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13415 | -| time_elapsed | 71036 | -| total_timesteps | 1717120 | -| train/ | | -| approx_kl | 0.067035474 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.00167 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 134140 | -| policy_gradient_loss | 0.00443 | -| std | 0.0132 | -| value_loss | 0.000258 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13416 | -| time_elapsed | 71048 | -| total_timesteps | 1717248 | -| train/ | | -| approx_kl | 0.3383679 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 134150 | -| policy_gradient_loss | -0.0111 | -| std | 0.0132 | -| value_loss | 0.00361 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13417 | -| time_elapsed | 71053 | -| total_timesteps | 1717376 | -| train/ | | -| approx_kl | 0.017112931 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | 0.00436 | -| n_updates | 134160 | -| policy_gradient_loss | 0.0198 | -| std | 0.0132 | -| value_loss | 2.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13418 | -| time_elapsed | 71058 | -| total_timesteps | 1717504 | -| train/ | | -| approx_kl | 0.029128445 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | 0.00501 | -| n_updates | 134170 | -| policy_gradient_loss | 0.000175 | -| std | 0.0132 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13419 | -| time_elapsed | 71064 | -| total_timesteps | 1717632 | -| train/ | | -| approx_kl | 0.0031996886 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00367 | -| n_updates | 134180 | -| policy_gradient_loss | 0.00761 | -| std | 0.0132 | -| value_loss | 5.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13420 | -| time_elapsed | 71069 | -| total_timesteps | 1717760 | -| train/ | | -| approx_kl | 0.012954921 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 134190 | -| policy_gradient_loss | -0.0141 | -| std | 0.0132 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13421 | -| time_elapsed | 71074 | -| total_timesteps | 1717888 | -| train/ | | -| approx_kl | 0.008875923 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.00758 | -| n_updates | 134200 | -| policy_gradient_loss | -0.0031 | -| std | 0.0132 | -| value_loss | 2.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13422 | -| time_elapsed | 71078 | -| total_timesteps | 1718016 | -| train/ | | -| approx_kl | 0.0126943905 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.0093 | -| n_updates | 134210 | -| policy_gradient_loss | 0.00444 | -| std | 0.0132 | -| value_loss | 2.14e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13423 | -| time_elapsed | 71088 | -| total_timesteps | 1718144 | -| train/ | | -| approx_kl | 0.012012131 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 134220 | -| policy_gradient_loss | -0.0144 | -| std | 0.0132 | -| value_loss | 0.000716 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13424 | -| time_elapsed | 71094 | -| total_timesteps | 1718272 | -| train/ | | -| approx_kl | 0.015296774 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00719 | -| n_updates | 134230 | -| policy_gradient_loss | -0.00501 | -| std | 0.0132 | -| value_loss | 4.76e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13425 | -| time_elapsed | 71098 | -| total_timesteps | 1718400 | -| train/ | | -| approx_kl | 0.00025206385 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 134240 | -| policy_gradient_loss | -0.00143 | -| std | 0.0132 | -| value_loss | 2.23e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13426 | -| time_elapsed | 71103 | -| total_timesteps | 1718528 | -| train/ | | -| approx_kl | 0.0023248913 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 134250 | -| policy_gradient_loss | 0.000429 | -| std | 0.0132 | -| value_loss | 5.03e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13427 | -| time_elapsed | 71107 | -| total_timesteps | 1718656 | -| train/ | | -| approx_kl | 0.0012278054 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.00596 | -| n_updates | 134260 | -| policy_gradient_loss | -0.00466 | -| std | 0.0132 | -| value_loss | 6.07e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13428 | -| time_elapsed | 71111 | -| total_timesteps | 1718784 | -| train/ | | -| approx_kl | 0.00067728944 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.00908 | -| learning_rate | 0.0003 | -| loss | 0.00703 | -| n_updates | 134270 | -| policy_gradient_loss | 0.0129 | -| std | 0.0132 | -| value_loss | 1.41e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13429 | -| time_elapsed | 71115 | -| total_timesteps | 1718912 | -| train/ | | -| approx_kl | 0.0020594504 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | 0.00579 | -| n_updates | 134280 | -| policy_gradient_loss | 0.0208 | -| std | 0.0132 | -| value_loss | 1.75e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13430 | -| time_elapsed | 71119 | -| total_timesteps | 1719040 | -| train/ | | -| approx_kl | 0.038211778 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.00275 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 134290 | -| policy_gradient_loss | 6.49e-05 | -| std | 0.0132 | -| value_loss | 1.52e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13431 | -| time_elapsed | 71131 | -| total_timesteps | 1719168 | -| train/ | | -| approx_kl | 0.1386511 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.00954 | -| n_updates | 134300 | -| policy_gradient_loss | -0.0136 | -| std | 0.0132 | -| value_loss | 7.84e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13432 | -| time_elapsed | 71136 | -| total_timesteps | 1719296 | -| train/ | | -| approx_kl | 0.056362618 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | 0.00725 | -| n_updates | 134310 | -| policy_gradient_loss | -0.000429 | -| std | 0.0132 | -| value_loss | 2.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13433 | -| time_elapsed | 71141 | -| total_timesteps | 1719424 | -| train/ | | -| approx_kl | 0.019101482 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -3.43 | -| learning_rate | 0.0003 | -| loss | 0.0055 | -| n_updates | 134320 | -| policy_gradient_loss | 0.00585 | -| std | 0.0132 | -| value_loss | 9.05e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13434 | -| time_elapsed | 71145 | -| total_timesteps | 1719552 | -| train/ | | -| approx_kl | 0.07498745 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 134330 | -| policy_gradient_loss | 0.0488 | -| std | 0.0132 | -| value_loss | 2.07e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13435 | -| time_elapsed | 71149 | -| total_timesteps | 1719680 | -| train/ | | -| approx_kl | 0.03782491 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 134340 | -| policy_gradient_loss | 0.0393 | -| std | 0.0133 | -| value_loss | 3.22e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13436 | -| time_elapsed | 71154 | -| total_timesteps | 1719808 | -| train/ | | -| approx_kl | 0.010250844 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.00289 | -| n_updates | 134350 | -| policy_gradient_loss | 0.00674 | -| std | 0.0133 | -| value_loss | 4.26e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13437 | -| time_elapsed | 71158 | -| total_timesteps | 1719936 | -| train/ | | -| approx_kl | 0.16419676 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.00795 | -| learning_rate | 0.0003 | -| loss | 0.0922 | -| n_updates | 134360 | -| policy_gradient_loss | 0.0227 | -| std | 0.0133 | -| value_loss | 2.44e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13438 | -| time_elapsed | 71163 | -| total_timesteps | 1720064 | -| train/ | | -| approx_kl | 0.003530317 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.00119 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 134370 | -| policy_gradient_loss | -0.000617 | -| std | 0.0133 | -| value_loss | 1.51e-11 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13439 | -| time_elapsed | 71169 | -| total_timesteps | 1720192 | -| train/ | | -| approx_kl | 0.2725001 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.833 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 134380 | -| policy_gradient_loss | -0.00704 | -| std | 0.0133 | -| value_loss | 0.0019 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13440 | -| time_elapsed | 71174 | -| total_timesteps | 1720320 | -| train/ | | -| approx_kl | 9.068241e-05 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.00695 | -| learning_rate | 0.0003 | -| loss | 0.000741 | -| n_updates | 134390 | -| policy_gradient_loss | -0.000348 | -| std | 0.0133 | -| value_loss | 2.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13441 | -| time_elapsed | 71178 | -| total_timesteps | 1720448 | -| train/ | | -| approx_kl | 0.033484828 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0068 | -| n_updates | 134400 | -| policy_gradient_loss | -0.000463 | -| std | 0.0133 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13442 | -| time_elapsed | 71185 | -| total_timesteps | 1720576 | -| train/ | | -| approx_kl | 7.377332e-05 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 134410 | -| policy_gradient_loss | -0.00469 | -| std | 0.0133 | -| value_loss | 3.68e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13443 | -| time_elapsed | 71190 | -| total_timesteps | 1720704 | -| train/ | | -| approx_kl | 0.0046966355 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 134420 | -| policy_gradient_loss | -0.0021 | -| std | 0.0133 | -| value_loss | 1.47e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13444 | -| time_elapsed | 71195 | -| total_timesteps | 1720832 | -| train/ | | -| approx_kl | 0.0083618 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 134430 | -| policy_gradient_loss | -0.00237 | -| std | 0.0133 | -| value_loss | 3.05e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 24 | -| iterations | 13445 | -| time_elapsed | 71199 | -| total_timesteps | 1720960 | -| train/ | | -| approx_kl | 0.0017233733 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 134440 | -| policy_gradient_loss | 0.00607 | -| std | 0.0133 | -| value_loss | 6.38e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13446 | -| time_elapsed | 71204 | -| total_timesteps | 1721088 | -| train/ | | -| approx_kl | 0.05092577 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0579 | -| n_updates | 134450 | -| policy_gradient_loss | 0.0161 | -| std | 0.0133 | -| value_loss | 9.95e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13447 | -| time_elapsed | 71215 | -| total_timesteps | 1721216 | -| train/ | | -| approx_kl | 0.0069882986 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | 0.9 | -| learning_rate | 0.0003 | -| loss | 0.00728 | -| n_updates | 134460 | -| policy_gradient_loss | 0.00707 | -| std | 0.0132 | -| value_loss | 0.000925 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13448 | -| time_elapsed | 71219 | -| total_timesteps | 1721344 | -| train/ | | -| approx_kl | 0.025640696 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 2.9 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.00844 | -| n_updates | 134470 | -| policy_gradient_loss | 0.000818 | -| std | 0.0132 | -| value_loss | 7.66e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13449 | -| time_elapsed | 71224 | -| total_timesteps | 1721472 | -| train/ | | -| approx_kl | 0.0015043151 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00507 | -| n_updates | 134480 | -| policy_gradient_loss | -0.00475 | -| std | 0.0132 | -| value_loss | 4.37e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13450 | -| time_elapsed | 71228 | -| total_timesteps | 1721600 | -| train/ | | -| approx_kl | 0.00016519753 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -17 | -| learning_rate | 0.0003 | -| loss | 0.000941 | -| n_updates | 134490 | -| policy_gradient_loss | 0.00686 | -| std | 0.0132 | -| value_loss | 1.31e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13451 | -| time_elapsed | 71234 | -| total_timesteps | 1721728 | -| train/ | | -| approx_kl | 0.002330759 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.000194 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 134500 | -| policy_gradient_loss | 0.057 | -| std | 0.0132 | -| value_loss | 9.35e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13452 | -| time_elapsed | 71239 | -| total_timesteps | 1721856 | -| train/ | | -| approx_kl | 0.03015465 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.00798 | -| n_updates | 134510 | -| policy_gradient_loss | -0.000498 | -| std | 0.0132 | -| value_loss | 6.65e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13453 | -| time_elapsed | 71245 | -| total_timesteps | 1721984 | -| train/ | | -| approx_kl | 0.0078919735 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.00536 | -| n_updates | 134520 | -| policy_gradient_loss | 0.0173 | -| std | 0.0132 | -| value_loss | 3.43e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13454 | -| time_elapsed | 71250 | -| total_timesteps | 1722112 | -| train/ | | -| approx_kl | 0.007659301 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 134530 | -| policy_gradient_loss | 0.00141 | -| std | 0.0132 | -| value_loss | 1.98e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13455 | -| time_elapsed | 71263 | -| total_timesteps | 1722240 | -| train/ | | -| approx_kl | 0.023638688 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 134540 | -| policy_gradient_loss | -0.01 | -| std | 0.0132 | -| value_loss | 0.000705 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13456 | -| time_elapsed | 71268 | -| total_timesteps | 1722368 | -| train/ | | -| approx_kl | 0.01938646 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 134550 | -| policy_gradient_loss | -0.00474 | -| std | 0.0132 | -| value_loss | 1.84e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13457 | -| time_elapsed | 71272 | -| total_timesteps | 1722496 | -| train/ | | -| approx_kl | 0.07468394 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.00426 | -| learning_rate | 0.0003 | -| loss | 0.0452 | -| n_updates | 134560 | -| policy_gradient_loss | 0.017 | -| std | 0.0132 | -| value_loss | 2.5e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13458 | -| time_elapsed | 71278 | -| total_timesteps | 1722624 | -| train/ | | -| approx_kl | 0.018637078 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 134570 | -| policy_gradient_loss | 0.000663 | -| std | 0.0132 | -| value_loss | 2.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13459 | -| time_elapsed | 71282 | -| total_timesteps | 1722752 | -| train/ | | -| approx_kl | 0.049566716 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.000302 | -| learning_rate | 0.0003 | -| loss | 0.00837 | -| n_updates | 134580 | -| policy_gradient_loss | 0.0127 | -| std | 0.0132 | -| value_loss | 7.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13460 | -| time_elapsed | 71288 | -| total_timesteps | 1722880 | -| train/ | | -| approx_kl | 0.056309957 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.029 | -| n_updates | 134590 | -| policy_gradient_loss | 0.00787 | -| std | 0.0132 | -| value_loss | 3.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13461 | -| time_elapsed | 71294 | -| total_timesteps | 1723008 | -| train/ | | -| approx_kl | 0.018677905 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.00631 | -| n_updates | 134600 | -| policy_gradient_loss | 0.0256 | -| std | 0.0132 | -| value_loss | 2.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13462 | -| time_elapsed | 71305 | -| total_timesteps | 1723136 | -| train/ | | -| approx_kl | 0.40319833 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 134610 | -| policy_gradient_loss | -0.0143 | -| std | 0.0132 | -| value_loss | 0.00163 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13463 | -| time_elapsed | 71309 | -| total_timesteps | 1723264 | -| train/ | | -| approx_kl | 0.086867526 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 134620 | -| policy_gradient_loss | 0.00495 | -| std | 0.0132 | -| value_loss | 0.000141 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13464 | -| time_elapsed | 71313 | -| total_timesteps | 1723392 | -| train/ | | -| approx_kl | 1.6046688e-05 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000343 | -| n_updates | 134630 | -| policy_gradient_loss | -0.00225 | -| std | 0.0132 | -| value_loss | 9.68e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13465 | -| time_elapsed | 71318 | -| total_timesteps | 1723520 | -| train/ | | -| approx_kl | 0.016486816 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.00821 | -| learning_rate | 0.0003 | -| loss | 0.000714 | -| n_updates | 134640 | -| policy_gradient_loss | 0.0192 | -| std | 0.0132 | -| value_loss | 4.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13466 | -| time_elapsed | 71323 | -| total_timesteps | 1723648 | -| train/ | | -| approx_kl | 0.017188542 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | 0.00261 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 134650 | -| policy_gradient_loss | -0.0145 | -| std | 0.0132 | -| value_loss | 1.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13467 | -| time_elapsed | 71328 | -| total_timesteps | 1723776 | -| train/ | | -| approx_kl | 0.013201435 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.00723 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 134660 | -| policy_gradient_loss | 0.00368 | -| std | 0.0132 | -| value_loss | 9.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13468 | -| time_elapsed | 71334 | -| total_timesteps | 1723904 | -| train/ | | -| approx_kl | 0.0075675664 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 134670 | -| policy_gradient_loss | 0.0157 | -| std | 0.0132 | -| value_loss | 7.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13469 | -| time_elapsed | 71339 | -| total_timesteps | 1724032 | -| train/ | | -| approx_kl | 0.013152117 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 134680 | -| policy_gradient_loss | -0.00577 | -| std | 0.0131 | -| value_loss | 4.88e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13470 | -| time_elapsed | 71350 | -| total_timesteps | 1724160 | -| train/ | | -| approx_kl | 1.0173793 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -3.06 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 134690 | -| policy_gradient_loss | -0.00984 | -| std | 0.0131 | -| value_loss | 0.00165 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13471 | -| time_elapsed | 71354 | -| total_timesteps | 1724288 | -| train/ | | -| approx_kl | 0.048487946 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -0.636 | -| learning_rate | 0.0003 | -| loss | 0.0096 | -| n_updates | 134700 | -| policy_gradient_loss | 0.0341 | -| std | 0.0131 | -| value_loss | 6.53e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13472 | -| time_elapsed | 71358 | -| total_timesteps | 1724416 | -| train/ | | -| approx_kl | 0.07236104 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 2.91 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | 0.0847 | -| n_updates | 134710 | -| policy_gradient_loss | 0.0314 | -| std | 0.0131 | -| value_loss | 3.68e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13473 | -| time_elapsed | 71362 | -| total_timesteps | 1724544 | -| train/ | | -| approx_kl | 0.00086075347 | -| clip_fraction | 0 | -| clip_range | 0.2 | -| entropy_loss | 2.92 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | -0.00072 | -| n_updates | 134720 | -| policy_gradient_loss | -0.000194 | -| std | 0.0131 | -| value_loss | 3.72e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13474 | -| time_elapsed | 71365 | -| total_timesteps | 1724672 | -| train/ | | -| approx_kl | 0.005266331 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.92 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | -4.88e-05 | -| n_updates | 134730 | -| policy_gradient_loss | 0.00423 | -| std | 0.013 | -| value_loss | 2.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13475 | -| time_elapsed | 71369 | -| total_timesteps | 1724800 | -| train/ | | -| approx_kl | 0.028232435 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 134740 | -| policy_gradient_loss | 0.000688 | -| std | 0.013 | -| value_loss | 3.81e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13476 | -| time_elapsed | 71374 | -| total_timesteps | 1724928 | -| train/ | | -| approx_kl | 0.020178417 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.00875 | -| n_updates | 134750 | -| policy_gradient_loss | -0.005 | -| std | 0.013 | -| value_loss | 1.57e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13477 | -| time_elapsed | 71378 | -| total_timesteps | 1725056 | -| train/ | | -| approx_kl | 0.037069105 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.0775 | -| n_updates | 134760 | -| policy_gradient_loss | 0.0589 | -| std | 0.0129 | -| value_loss | 8.96e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13478 | -| time_elapsed | 71386 | -| total_timesteps | 1725184 | -| train/ | | -| approx_kl | 0.09934891 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | 0.791 | -| learning_rate | 0.0003 | -| loss | -0.00817 | -| n_updates | 134770 | -| policy_gradient_loss | 0.00142 | -| std | 0.0129 | -| value_loss | 0.00254 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13479 | -| time_elapsed | 71391 | -| total_timesteps | 1725312 | -| train/ | | -| approx_kl | 0.038328912 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0638 | -| n_updates | 134780 | -| policy_gradient_loss | 0.0224 | -| std | 0.0129 | -| value_loss | 1.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13480 | -| time_elapsed | 71399 | -| total_timesteps | 1725440 | -| train/ | | -| approx_kl | 0.037637703 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.00298 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 134790 | -| policy_gradient_loss | 0.00467 | -| std | 0.0129 | -| value_loss | 2.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13481 | -| time_elapsed | 71404 | -| total_timesteps | 1725568 | -| train/ | | -| approx_kl | 0.005356103 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 134800 | -| policy_gradient_loss | -0.000162 | -| std | 0.0129 | -| value_loss | 7.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13482 | -| time_elapsed | 71409 | -| total_timesteps | 1725696 | -| train/ | | -| approx_kl | 0.009684792 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 134810 | -| policy_gradient_loss | 0.00339 | -| std | 0.0129 | -| value_loss | 5.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13483 | -| time_elapsed | 71413 | -| total_timesteps | 1725824 | -| train/ | | -| approx_kl | 0.024579493 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 134820 | -| policy_gradient_loss | 0.0388 | -| std | 0.0129 | -| value_loss | 2.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 24 | -| iterations | 13484 | -| time_elapsed | 71418 | -| total_timesteps | 1725952 | -| train/ | | -| approx_kl | 0.006134657 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 134830 | -| policy_gradient_loss | 0.00659 | -| std | 0.0129 | -| value_loss | 2.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13485 | -| time_elapsed | 71423 | -| total_timesteps | 1726080 | -| train/ | | -| approx_kl | 0.16886917 | -| clip_fraction | 0.587 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 134840 | -| policy_gradient_loss | 0.0614 | -| std | 0.0129 | -| value_loss | 9.72e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13486 | -| time_elapsed | 71432 | -| total_timesteps | 1726208 | -| train/ | | -| approx_kl | 0.04795712 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 134850 | -| policy_gradient_loss | -0.0071 | -| std | 0.0129 | -| value_loss | 0.000445 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13487 | -| time_elapsed | 71437 | -| total_timesteps | 1726336 | -| train/ | | -| approx_kl | 0.115918025 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | 0.00162 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 134860 | -| policy_gradient_loss | -0.0078 | -| std | 0.0129 | -| value_loss | 0.000103 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13488 | -| time_elapsed | 71441 | -| total_timesteps | 1726464 | -| train/ | | -| approx_kl | 0.0029192264 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | -0.00762 | -| n_updates | 134870 | -| policy_gradient_loss | 0.00711 | -| std | 0.0129 | -| value_loss | 1.83e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13489 | -| time_elapsed | 71445 | -| total_timesteps | 1726592 | -| train/ | | -| approx_kl | 0.0115614645 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | 0.00455 | -| learning_rate | 0.0003 | -| loss | 0.000471 | -| n_updates | 134880 | -| policy_gradient_loss | 0.00908 | -| std | 0.0129 | -| value_loss | 1.81e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13490 | -| time_elapsed | 71451 | -| total_timesteps | 1726720 | -| train/ | | -| approx_kl | 0.15986992 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.0948 | -| n_updates | 134890 | -| policy_gradient_loss | 0.0192 | -| std | 0.0129 | -| value_loss | 1.03e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13491 | -| time_elapsed | 71456 | -| total_timesteps | 1726848 | -| train/ | | -| approx_kl | 0.00042487355 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 134900 | -| policy_gradient_loss | -0.00643 | -| std | 0.0129 | -| value_loss | 1.16e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13492 | -| time_elapsed | 71460 | -| total_timesteps | 1726976 | -| train/ | | -| approx_kl | 0.0014243876 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 134910 | -| policy_gradient_loss | -0.00196 | -| std | 0.0129 | -| value_loss | 3.62e-07 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13493 | -| time_elapsed | 71466 | -| total_timesteps | 1727104 | -| train/ | | -| approx_kl | 0.000104326755 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.00172 | -| n_updates | 134920 | -| policy_gradient_loss | -0.00438 | -| std | 0.0129 | -| value_loss | 3.32e-07 | --------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13494 | -| time_elapsed | 71476 | -| total_timesteps | 1727232 | -| train/ | | -| approx_kl | 0.0040386645 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | 0.721 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 134930 | -| policy_gradient_loss | 0.0051 | -| std | 0.0128 | -| value_loss | 0.00469 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13495 | -| time_elapsed | 71481 | -| total_timesteps | 1727360 | -| train/ | | -| approx_kl | 0.034051165 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.00446 | -| learning_rate | 0.0003 | -| loss | 0.000576 | -| n_updates | 134940 | -| policy_gradient_loss | 0.00259 | -| std | 0.0128 | -| value_loss | 1.6e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13496 | -| time_elapsed | 71488 | -| total_timesteps | 1727488 | -| train/ | | -| approx_kl | 0.041588597 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.451 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 134950 | -| policy_gradient_loss | 0.00735 | -| std | 0.0128 | -| value_loss | 6.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13497 | -| time_elapsed | 71493 | -| total_timesteps | 1727616 | -| train/ | | -| approx_kl | 0.06968537 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 134960 | -| policy_gradient_loss | 0.0154 | -| std | 0.0128 | -| value_loss | 4.81e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13498 | -| time_elapsed | 71499 | -| total_timesteps | 1727744 | -| train/ | | -| approx_kl | 0.023668539 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | -0.00565 | -| n_updates | 134970 | -| policy_gradient_loss | 0.00183 | -| std | 0.0128 | -| value_loss | 6.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 24 | -| iterations | 13499 | -| time_elapsed | 71503 | -| total_timesteps | 1727872 | -| train/ | | -| approx_kl | 0.010892332 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.00875 | -| learning_rate | 0.0003 | -| loss | 0.00331 | -| n_updates | 134980 | -| policy_gradient_loss | 0.00685 | -| std | 0.0128 | -| value_loss | 1.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13500 | -| time_elapsed | 71508 | -| total_timesteps | 1728000 | -| train/ | | -| approx_kl | 0.006316821 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | -0.00021 | -| n_updates | 134990 | -| policy_gradient_loss | 0.0043 | -| std | 0.0129 | -| value_loss | 5.61e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13501 | -| time_elapsed | 71513 | -| total_timesteps | 1728128 | -| train/ | | -| approx_kl | 0.08188093 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | 0.000435 | -| learning_rate | 0.0003 | -| loss | 0.0614 | -| n_updates | 135000 | -| policy_gradient_loss | 0.0134 | -| std | 0.0129 | -| value_loss | 3.25e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13502 | -| time_elapsed | 71521 | -| total_timesteps | 1728256 | -| train/ | | -| approx_kl | 0.08785814 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -4.22 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 135010 | -| policy_gradient_loss | -0.015 | -| std | 0.0129 | -| value_loss | 0.00188 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13503 | -| time_elapsed | 71525 | -| total_timesteps | 1728384 | -| train/ | | -| approx_kl | 0.054047853 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 2.93 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | 0.0318 | -| n_updates | 135020 | -| policy_gradient_loss | 0.0144 | -| std | 0.0129 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13504 | -| time_elapsed | 71530 | -| total_timesteps | 1728512 | -| train/ | | -| approx_kl | 0.0025040843 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | 3.68e-05 | -| n_updates | 135030 | -| policy_gradient_loss | 0.00469 | -| std | 0.0128 | -| value_loss | 4.13e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13505 | -| time_elapsed | 71535 | -| total_timesteps | 1728640 | -| train/ | | -| approx_kl | 0.023285907 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | 0.0068 | -| n_updates | 135040 | -| policy_gradient_loss | 0.0175 | -| std | 0.0128 | -| value_loss | 6.46e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13506 | -| time_elapsed | 71541 | -| total_timesteps | 1728768 | -| train/ | | -| approx_kl | 0.040727325 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | 0.00363 | -| learning_rate | 0.0003 | -| loss | 0.0553 | -| n_updates | 135050 | -| policy_gradient_loss | 0.0207 | -| std | 0.0127 | -| value_loss | 1.19e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 24 | -| iterations | 13507 | -| time_elapsed | 71545 | -| total_timesteps | 1728896 | -| train/ | | -| approx_kl | 0.10608451 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.00252 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 135060 | -| policy_gradient_loss | 0.00929 | -| std | 0.0127 | -| value_loss | 9.23e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13508 | -| time_elapsed | 71550 | -| total_timesteps | 1729024 | -| train/ | | -| approx_kl | 0.0018013399 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.00783 | -| learning_rate | 0.0003 | -| loss | -0.000395 | -| n_updates | 135070 | -| policy_gradient_loss | 0.00772 | -| std | 0.0127 | -| value_loss | 9.15e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13509 | -| time_elapsed | 71560 | -| total_timesteps | 1729152 | -| train/ | | -| approx_kl | 0.0090485765 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | 0.761 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 135080 | -| policy_gradient_loss | -0.0145 | -| std | 0.0127 | -| value_loss | 0.00302 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13510 | -| time_elapsed | 71564 | -| total_timesteps | 1729280 | -| train/ | | -| approx_kl | 0.09014372 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | 0.0368 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 135090 | -| policy_gradient_loss | 0.00319 | -| std | 0.0128 | -| value_loss | 6.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13511 | -| time_elapsed | 71569 | -| total_timesteps | 1729408 | -| train/ | | -| approx_kl | 0.026246386 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0859 | -| learning_rate | 0.0003 | -| loss | 0.00369 | -| n_updates | 135100 | -| policy_gradient_loss | 0.00465 | -| std | 0.0128 | -| value_loss | 1.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13512 | -| time_elapsed | 71575 | -| total_timesteps | 1729536 | -| train/ | | -| approx_kl | 0.012826372 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 135110 | -| policy_gradient_loss | 0.00586 | -| std | 0.0128 | -| value_loss | 3.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13513 | -| time_elapsed | 71580 | -| total_timesteps | 1729664 | -| train/ | | -| approx_kl | 0.09392831 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.0511 | -| n_updates | 135120 | -| policy_gradient_loss | 0.0114 | -| std | 0.0128 | -| value_loss | 2.6e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13514 | -| time_elapsed | 71583 | -| total_timesteps | 1729792 | -| train/ | | -| approx_kl | 1.4426187e-06 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 135130 | -| policy_gradient_loss | -0.00116 | -| std | 0.0127 | -| value_loss | 1.76e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13515 | -| time_elapsed | 71588 | -| total_timesteps | 1729920 | -| train/ | | -| approx_kl | 0.015754502 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.00266 | -| n_updates | 135140 | -| policy_gradient_loss | 0.0173 | -| std | 0.0127 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13516 | -| time_elapsed | 71592 | -| total_timesteps | 1730048 | -| train/ | | -| approx_kl | 0.06298777 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 135150 | -| policy_gradient_loss | 0.0114 | -| std | 0.0127 | -| value_loss | 1.82e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13517 | -| time_elapsed | 71602 | -| total_timesteps | 1730176 | -| train/ | | -| approx_kl | 0.14996873 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 2.94 | -| explained_variance | 0.52 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 135160 | -| policy_gradient_loss | -0.0113 | -| std | 0.0127 | -| value_loss | 0.000659 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13518 | -| time_elapsed | 71605 | -| total_timesteps | 1730304 | -| train/ | | -| approx_kl | 0.00041781692 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -3.06 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 135170 | -| policy_gradient_loss | -0.00333 | -| std | 0.0127 | -| value_loss | 3.75e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13519 | -| time_elapsed | 71609 | -| total_timesteps | 1730432 | -| train/ | | -| approx_kl | 0.037022997 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.961 | -| learning_rate | 0.0003 | -| loss | 0.00289 | -| n_updates | 135180 | -| policy_gradient_loss | 0.0117 | -| std | 0.0127 | -| value_loss | 5.71e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13520 | -| time_elapsed | 71613 | -| total_timesteps | 1730560 | -| train/ | | -| approx_kl | 0.27856138 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 135190 | -| policy_gradient_loss | 0.0986 | -| std | 0.0127 | -| value_loss | 6.56e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13521 | -| time_elapsed | 71616 | -| total_timesteps | 1730688 | -| train/ | | -| approx_kl | 0.0106112035 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 135200 | -| policy_gradient_loss | -0.000337 | -| std | 0.0127 | -| value_loss | 3.89e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13522 | -| time_elapsed | 71620 | -| total_timesteps | 1730816 | -| train/ | | -| approx_kl | 0.0048753424 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.00555 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 135210 | -| policy_gradient_loss | 0.00455 | -| std | 0.0127 | -| value_loss | 2.69e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13523 | -| time_elapsed | 71624 | -| total_timesteps | 1730944 | -| train/ | | -| approx_kl | 0.0085812695 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.00359 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 135220 | -| policy_gradient_loss | -0.00553 | -| std | 0.0127 | -| value_loss | 9.04e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13524 | -| time_elapsed | 71629 | -| total_timesteps | 1731072 | -| train/ | | -| approx_kl | 0.001094223 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 135230 | -| policy_gradient_loss | 0.00601 | -| std | 0.0127 | -| value_loss | 4.15e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13525 | -| time_elapsed | 71638 | -| total_timesteps | 1731200 | -| train/ | | -| approx_kl | 0.029315278 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.701 | -| learning_rate | 0.0003 | -| loss | 0.0075 | -| n_updates | 135240 | -| policy_gradient_loss | -0.000743 | -| std | 0.0127 | -| value_loss | 0.00553 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13526 | -| time_elapsed | 71642 | -| total_timesteps | 1731328 | -| train/ | | -| approx_kl | 9.185635e-06 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.76 | -| learning_rate | 0.0003 | -| loss | 0.000248 | -| n_updates | 135250 | -| policy_gradient_loss | -0.00437 | -| std | 0.0127 | -| value_loss | 1.01e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13527 | -| time_elapsed | 71646 | -| total_timesteps | 1731456 | -| train/ | | -| approx_kl | 0.00015884312 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -37.5 | -| learning_rate | 0.0003 | -| loss | -0.000758 | -| n_updates | 135260 | -| policy_gradient_loss | 0.00147 | -| std | 0.0127 | -| value_loss | 1.63e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13528 | -| time_elapsed | 71650 | -| total_timesteps | 1731584 | -| train/ | | -| approx_kl | 0.0029596738 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | 0.00503 | -| n_updates | 135270 | -| policy_gradient_loss | 0.0139 | -| std | 0.0127 | -| value_loss | 1.54e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13529 | -| time_elapsed | 71656 | -| total_timesteps | 1731712 | -| train/ | | -| approx_kl | 0.04272289 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 135280 | -| policy_gradient_loss | 0.00466 | -| std | 0.0127 | -| value_loss | 1.83e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13530 | -| time_elapsed | 71660 | -| total_timesteps | 1731840 | -| train/ | | -| approx_kl | 0.15910798 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | 0.0766 | -| n_updates | 135290 | -| policy_gradient_loss | 0.0166 | -| std | 0.0127 | -| value_loss | 5.12e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13531 | -| time_elapsed | 71666 | -| total_timesteps | 1731968 | -| train/ | | -| approx_kl | 1.5880447e-05 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.499 | -| learning_rate | 0.0003 | -| loss | 0.000409 | -| n_updates | 135300 | -| policy_gradient_loss | -0.00379 | -| std | 0.0127 | -| value_loss | 7.19e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13532 | -| time_elapsed | 71670 | -| total_timesteps | 1732096 | -| train/ | | -| approx_kl | 0.00988191 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 135310 | -| policy_gradient_loss | -0.00234 | -| std | 0.0127 | -| value_loss | 1.9e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13533 | -| time_elapsed | 71681 | -| total_timesteps | 1732224 | -| train/ | | -| approx_kl | 0.1995634 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 135320 | -| policy_gradient_loss | -0.000234 | -| std | 0.0127 | -| value_loss | 2.78e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13534 | -| time_elapsed | 71686 | -| total_timesteps | 1732352 | -| train/ | | -| approx_kl | 0.09293951 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.000973 | -| learning_rate | 0.0003 | -| loss | 0.0493 | -| n_updates | 135330 | -| policy_gradient_loss | 0.0112 | -| std | 0.0126 | -| value_loss | 3.25e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13535 | -| time_elapsed | 71690 | -| total_timesteps | 1732480 | -| train/ | | -| approx_kl | 1.665717e-05 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.605 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 135340 | -| policy_gradient_loss | 0.00121 | -| std | 0.0126 | -| value_loss | 6.79e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13536 | -| time_elapsed | 71695 | -| total_timesteps | 1732608 | -| train/ | | -| approx_kl | 0.013193309 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0752 | -| learning_rate | 0.0003 | -| loss | 0.0046 | -| n_updates | 135350 | -| policy_gradient_loss | 0.0159 | -| std | 0.0126 | -| value_loss | 4.69e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13537 | -| time_elapsed | 71699 | -| total_timesteps | 1732736 | -| train/ | | -| approx_kl | 0.0060190735 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 5.36e-05 | -| n_updates | 135360 | -| policy_gradient_loss | 0.0088 | -| std | 0.0126 | -| value_loss | 1.69e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13538 | -| time_elapsed | 71704 | -| total_timesteps | 1732864 | -| train/ | | -| approx_kl | 0.009577928 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 135370 | -| policy_gradient_loss | 0.0209 | -| std | 0.0126 | -| value_loss | 1.4e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 24 | -| iterations | 13539 | -| time_elapsed | 71709 | -| total_timesteps | 1732992 | -| train/ | | -| approx_kl | 0.004821927 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 135380 | -| policy_gradient_loss | 0.00302 | -| std | 0.0126 | -| value_loss | 1.68e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13540 | -| time_elapsed | 71713 | -| total_timesteps | 1733120 | -| train/ | | -| approx_kl | 0.010695014 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 135390 | -| policy_gradient_loss | 0.00392 | -| std | 0.0126 | -| value_loss | 1.37e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13541 | -| time_elapsed | 71728 | -| total_timesteps | 1733248 | -| train/ | | -| approx_kl | 0.04151985 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 135400 | -| policy_gradient_loss | -0.00481 | -| std | 0.0126 | -| value_loss | 0.0038 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13542 | -| time_elapsed | 71733 | -| total_timesteps | 1733376 | -| train/ | | -| approx_kl | 0.031565297 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 135410 | -| policy_gradient_loss | 0.00954 | -| std | 0.0126 | -| value_loss | 1.64e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13543 | -| time_elapsed | 71738 | -| total_timesteps | 1733504 | -| train/ | | -| approx_kl | 0.15594573 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.0897 | -| n_updates | 135420 | -| policy_gradient_loss | 0.0195 | -| std | 0.0126 | -| value_loss | 6.53e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13544 | -| time_elapsed | 71744 | -| total_timesteps | 1733632 | -| train/ | | -| approx_kl | 0.0002528727 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0827 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 135430 | -| policy_gradient_loss | 0.0144 | -| std | 0.0126 | -| value_loss | 9.79e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13545 | -| time_elapsed | 71749 | -| total_timesteps | 1733760 | -| train/ | | -| approx_kl | 0.0033704252 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.00459 | -| n_updates | 135440 | -| policy_gradient_loss | 0.0311 | -| std | 0.0126 | -| value_loss | 5.59e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13546 | -| time_elapsed | 71754 | -| total_timesteps | 1733888 | -| train/ | | -| approx_kl | 0.034102205 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.0428 | -| n_updates | 135450 | -| policy_gradient_loss | 0.00483 | -| std | 0.0126 | -| value_loss | 3.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13547 | -| time_elapsed | 71759 | -| total_timesteps | 1734016 | -| train/ | | -| approx_kl | 0.08805843 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 135460 | -| policy_gradient_loss | 0.0115 | -| std | 0.0126 | -| value_loss | 2.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13548 | -| time_elapsed | 71770 | -| total_timesteps | 1734144 | -| train/ | | -| approx_kl | 0.12138055 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.809 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 135470 | -| policy_gradient_loss | -0.0178 | -| std | 0.0126 | -| value_loss | 0.000408 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13549 | -| time_elapsed | 71776 | -| total_timesteps | 1734272 | -| train/ | | -| approx_kl | 0.0006333296 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | 0.00378 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 135480 | -| policy_gradient_loss | -0.0117 | -| std | 0.0126 | -| value_loss | 2.9e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13550 | -| time_elapsed | 71780 | -| total_timesteps | 1734400 | -| train/ | | -| approx_kl | 0.021758921 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -6.18 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 135490 | -| policy_gradient_loss | 0.0109 | -| std | 0.0126 | -| value_loss | 5.42e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13551 | -| time_elapsed | 71784 | -| total_timesteps | 1734528 | -| train/ | | -| approx_kl | 7.683411e-07 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -191 | -| learning_rate | 0.0003 | -| loss | -6.42e-05 | -| n_updates | 135500 | -| policy_gradient_loss | -0.0002 | -| std | 0.0126 | -| value_loss | 2.93e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13552 | -| time_elapsed | 71789 | -| total_timesteps | 1734656 | -| train/ | | -| approx_kl | 0.024412341 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -5.02 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 135510 | -| policy_gradient_loss | 0.00328 | -| std | 0.0126 | -| value_loss | 7.08e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13553 | -| time_elapsed | 71794 | -| total_timesteps | 1734784 | -| train/ | | -| approx_kl | 0.0704418 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 135520 | -| policy_gradient_loss | 0.0048 | -| std | 0.0126 | -| value_loss | 8.25e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13554 | -| time_elapsed | 71799 | -| total_timesteps | 1734912 | -| train/ | | -| approx_kl | 0.025800254 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | 0.00877 | -| n_updates | 135530 | -| policy_gradient_loss | 0.00835 | -| std | 0.0126 | -| value_loss | 9.97e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13555 | -| time_elapsed | 71804 | -| total_timesteps | 1735040 | -| train/ | | -| approx_kl | 0.07017888 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 135540 | -| policy_gradient_loss | -0.0156 | -| std | 0.0126 | -| value_loss | 8.48e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13556 | -| time_elapsed | 71814 | -| total_timesteps | 1735168 | -| train/ | | -| approx_kl | 0.08178087 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 135550 | -| policy_gradient_loss | -0.0119 | -| std | 0.0126 | -| value_loss | 0.000375 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13557 | -| time_elapsed | 71819 | -| total_timesteps | 1735296 | -| train/ | | -| approx_kl | 0.051865034 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 135560 | -| policy_gradient_loss | 0.00616 | -| std | 0.0126 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13558 | -| time_elapsed | 71824 | -| total_timesteps | 1735424 | -| train/ | | -| approx_kl | 0.017099332 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 135570 | -| policy_gradient_loss | -0.000676 | -| std | 0.0126 | -| value_loss | 6.04e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13559 | -| time_elapsed | 71829 | -| total_timesteps | 1735552 | -| train/ | | -| approx_kl | 0.05176841 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.077 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 135580 | -| policy_gradient_loss | 0.014 | -| std | 0.0126 | -| value_loss | 3.56e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13560 | -| time_elapsed | 71833 | -| total_timesteps | 1735680 | -| train/ | | -| approx_kl | 0.02024997 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 135590 | -| policy_gradient_loss | 0.00555 | -| std | 0.0126 | -| value_loss | 2.63e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13561 | -| time_elapsed | 71838 | -| total_timesteps | 1735808 | -| train/ | | -| approx_kl | 0.0372415 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 135600 | -| policy_gradient_loss | 0.0144 | -| std | 0.0126 | -| value_loss | 1.55e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13562 | -| time_elapsed | 71844 | -| total_timesteps | 1735936 | -| train/ | | -| approx_kl | 0.086444564 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.0671 | -| n_updates | 135610 | -| policy_gradient_loss | 0.0494 | -| std | 0.0126 | -| value_loss | 1.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13563 | -| time_elapsed | 71849 | -| total_timesteps | 1736064 | -| train/ | | -| approx_kl | 0.05242102 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 135620 | -| policy_gradient_loss | 0.0521 | -| std | 0.0126 | -| value_loss | 6.23e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13564 | -| time_elapsed | 71857 | -| total_timesteps | 1736192 | -| train/ | | -| approx_kl | 0.16449545 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 135630 | -| policy_gradient_loss | -0.0152 | -| std | 0.0126 | -| value_loss | 0.0011 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13565 | -| time_elapsed | 71862 | -| total_timesteps | 1736320 | -| train/ | | -| approx_kl | 0.015392997 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -234 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 135640 | -| policy_gradient_loss | -0.00533 | -| std | 0.0126 | -| value_loss | 1.26e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13566 | -| time_elapsed | 71867 | -| total_timesteps | 1736448 | -| train/ | | -| approx_kl | 0.14537758 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -1.17e+04 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 135650 | -| policy_gradient_loss | -0.00528 | -| std | 0.0126 | -| value_loss | 6.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13567 | -| time_elapsed | 71872 | -| total_timesteps | 1736576 | -| train/ | | -| approx_kl | 0.035588987 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -317 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 135660 | -| policy_gradient_loss | -0.00193 | -| std | 0.0126 | -| value_loss | 1.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13568 | -| time_elapsed | 71876 | -| total_timesteps | 1736704 | -| train/ | | -| approx_kl | 0.040325683 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -7.89e+03 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 135670 | -| policy_gradient_loss | -0.00663 | -| std | 0.0126 | -| value_loss | 1.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13569 | -| time_elapsed | 71880 | -| total_timesteps | 1736832 | -| train/ | | -| approx_kl | 0.11152515 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | 0.0556 | -| n_updates | 135680 | -| policy_gradient_loss | 0.0481 | -| std | 0.0126 | -| value_loss | 7.74e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 24 | -| iterations | 13570 | -| time_elapsed | 71884 | -| total_timesteps | 1736960 | -| train/ | | -| approx_kl | 0.016590659 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 2.95 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00485 | -| n_updates | 135690 | -| policy_gradient_loss | 0.0057 | -| std | 0.0126 | -| value_loss | 4.5e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13571 | -| time_elapsed | 71888 | -| total_timesteps | 1737088 | -| train/ | | -| approx_kl | 0.005745387 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 135700 | -| policy_gradient_loss | -0.00125 | -| std | 0.0126 | -| value_loss | 2.3e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13572 | -| time_elapsed | 71897 | -| total_timesteps | 1737216 | -| train/ | | -| approx_kl | 0.0016180351 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | 0.692 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 135710 | -| policy_gradient_loss | 0.0197 | -| std | 0.0126 | -| value_loss | 0.00573 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13573 | -| time_elapsed | 71902 | -| total_timesteps | 1737344 | -| train/ | | -| approx_kl | 0.0050237514 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.00421 | -| learning_rate | 0.0003 | -| loss | -0.00529 | -| n_updates | 135720 | -| policy_gradient_loss | 0.0221 | -| std | 0.0126 | -| value_loss | 5.08e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13574 | -| time_elapsed | 71906 | -| total_timesteps | 1737472 | -| train/ | | -| approx_kl | 0.0042336322 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 135730 | -| policy_gradient_loss | 0.00934 | -| std | 0.0126 | -| value_loss | 8.03e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13575 | -| time_elapsed | 71910 | -| total_timesteps | 1737600 | -| train/ | | -| approx_kl | 0.0865742 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.00706 | -| n_updates | 135740 | -| policy_gradient_loss | 0.00258 | -| std | 0.0126 | -| value_loss | 5.36e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13576 | -| time_elapsed | 71914 | -| total_timesteps | 1737728 | -| train/ | | -| approx_kl | 0.020415213 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | 0.00271 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 135750 | -| policy_gradient_loss | 0.00693 | -| std | 0.0125 | -| value_loss | 5.42e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13577 | -| time_elapsed | 71917 | -| total_timesteps | 1737856 | -| train/ | | -| approx_kl | 0.1040418 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 135760 | -| policy_gradient_loss | 0.00341 | -| std | 0.0125 | -| value_loss | 1.3e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 24 | -| iterations | 13578 | -| time_elapsed | 71920 | -| total_timesteps | 1737984 | -| train/ | | -| approx_kl | 0.02094738 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 135770 | -| policy_gradient_loss | 0.0208 | -| std | 0.0125 | -| value_loss | 2.1e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13579 | -| time_elapsed | 71925 | -| total_timesteps | 1738112 | -| train/ | | -| approx_kl | 0.0025451635 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -24.5 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 135780 | -| policy_gradient_loss | -0.00463 | -| std | 0.0125 | -| value_loss | 1.15e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13580 | -| time_elapsed | 71936 | -| total_timesteps | 1738240 | -| train/ | | -| approx_kl | 0.0046499264 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 135790 | -| policy_gradient_loss | -0.0123 | -| std | 0.0125 | -| value_loss | 0.00385 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13581 | -| time_elapsed | 71940 | -| total_timesteps | 1738368 | -| train/ | | -| approx_kl | 0.05439637 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | 0.00665 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 135800 | -| policy_gradient_loss | 0.0139 | -| std | 0.0125 | -| value_loss | 1.88e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13582 | -| time_elapsed | 71944 | -| total_timesteps | 1738496 | -| train/ | | -| approx_kl | 0.016700923 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.00722 | -| n_updates | 135810 | -| policy_gradient_loss | 0.00705 | -| std | 0.0125 | -| value_loss | 9.07e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13583 | -| time_elapsed | 71948 | -| total_timesteps | 1738624 | -| train/ | | -| approx_kl | 0.04539491 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.00522 | -| n_updates | 135820 | -| policy_gradient_loss | 0.00484 | -| std | 0.0125 | -| value_loss | 7.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13584 | -| time_elapsed | 71953 | -| total_timesteps | 1738752 | -| train/ | | -| approx_kl | 0.050770745 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 135830 | -| policy_gradient_loss | 0.00849 | -| std | 0.0125 | -| value_loss | 4.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13585 | -| time_elapsed | 71956 | -| total_timesteps | 1738880 | -| train/ | | -| approx_kl | 0.012591504 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 135840 | -| policy_gradient_loss | 0.00146 | -| std | 0.0125 | -| value_loss | 2.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13586 | -| time_elapsed | 71959 | -| total_timesteps | 1739008 | -| train/ | | -| approx_kl | 0.06076014 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 2.96 | -| explained_variance | -0.00325 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 135850 | -| policy_gradient_loss | 0.00563 | -| std | 0.0125 | -| value_loss | 7.88e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13587 | -| time_elapsed | 71972 | -| total_timesteps | 1739136 | -| train/ | | -| approx_kl | 0.06516854 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.447 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 135860 | -| policy_gradient_loss | -0.016 | -| std | 0.0125 | -| value_loss | 0.0012 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13588 | -| time_elapsed | 71977 | -| total_timesteps | 1739264 | -| train/ | | -| approx_kl | 0.057226613 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.0068 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 135870 | -| policy_gradient_loss | 0.0121 | -| std | 0.0125 | -| value_loss | 5.82e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13589 | -| time_elapsed | 71981 | -| total_timesteps | 1739392 | -| train/ | | -| approx_kl | 0.023847293 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.391 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 135880 | -| policy_gradient_loss | 0.0142 | -| std | 0.0125 | -| value_loss | 5.44e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13590 | -| time_elapsed | 71987 | -| total_timesteps | 1739520 | -| train/ | | -| approx_kl | 0.04143186 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.000338 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 135890 | -| policy_gradient_loss | 0.00791 | -| std | 0.0125 | -| value_loss | 3.26e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13591 | -| time_elapsed | 71993 | -| total_timesteps | 1739648 | -| train/ | | -| approx_kl | 0.07699357 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.00356 | -| learning_rate | 0.0003 | -| loss | 0.0484 | -| n_updates | 135900 | -| policy_gradient_loss | 0.0179 | -| std | 0.0125 | -| value_loss | 5.71e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13592 | -| time_elapsed | 71999 | -| total_timesteps | 1739776 | -| train/ | | -| approx_kl | 0.020466806 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.000392 | -| n_updates | 135910 | -| policy_gradient_loss | 0.00419 | -| std | 0.0124 | -| value_loss | 4.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13593 | -| time_elapsed | 72004 | -| total_timesteps | 1739904 | -| train/ | | -| approx_kl | 0.03705202 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00976 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 135920 | -| policy_gradient_loss | 0.0081 | -| std | 0.0124 | -| value_loss | 2.45e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13594 | -| time_elapsed | 72009 | -| total_timesteps | 1740032 | -| train/ | | -| approx_kl | 0.2140637 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 135930 | -| policy_gradient_loss | 0.0226 | -| std | 0.0124 | -| value_loss | 1.59e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13595 | -| time_elapsed | 72019 | -| total_timesteps | 1740160 | -| train/ | | -| approx_kl | 0.06628446 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.781 | -| learning_rate | 0.0003 | -| loss | -0.0078 | -| n_updates | 135940 | -| policy_gradient_loss | -0.0112 | -| std | 0.0124 | -| value_loss | 0.00281 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13596 | -| time_elapsed | 72024 | -| total_timesteps | 1740288 | -| train/ | | -| approx_kl | 0.017684784 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | 0.00795 | -| n_updates | 135950 | -| policy_gradient_loss | 0.0239 | -| std | 0.0124 | -| value_loss | 4.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13597 | -| time_elapsed | 72028 | -| total_timesteps | 1740416 | -| train/ | | -| approx_kl | 0.059420493 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -33.8 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 135960 | -| policy_gradient_loss | -0.00157 | -| std | 0.0124 | -| value_loss | 2.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13598 | -| time_elapsed | 72032 | -| total_timesteps | 1740544 | -| train/ | | -| approx_kl | 0.059051767 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -2.36 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 135970 | -| policy_gradient_loss | -0.00238 | -| std | 0.0124 | -| value_loss | 1.21e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13599 | -| time_elapsed | 72037 | -| total_timesteps | 1740672 | -| train/ | | -| approx_kl | 0.22760968 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | 0.0856 | -| n_updates | 135980 | -| policy_gradient_loss | 0.0189 | -| std | 0.0124 | -| value_loss | 1.97e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13600 | -| time_elapsed | 72042 | -| total_timesteps | 1740800 | -| train/ | | -| approx_kl | 0.0057460144 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 135990 | -| policy_gradient_loss | -0.000673 | -| std | 0.0124 | -| value_loss | 1.35e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13601 | -| time_elapsed | 72047 | -| total_timesteps | 1740928 | -| train/ | | -| approx_kl | 9.7288284e-05 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.000387 | -| n_updates | 136000 | -| policy_gradient_loss | 0.00215 | -| std | 0.0124 | -| value_loss | 8.52e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13602 | -| time_elapsed | 72052 | -| total_timesteps | 1741056 | -| train/ | | -| approx_kl | 0.0012616226 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.00746 | -| n_updates | 136010 | -| policy_gradient_loss | 0.00704 | -| std | 0.0124 | -| value_loss | 4.89e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13603 | -| time_elapsed | 72060 | -| total_timesteps | 1741184 | -| train/ | | -| approx_kl | 0.11395642 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.571 | -| learning_rate | 0.0003 | -| loss | -0.00919 | -| n_updates | 136020 | -| policy_gradient_loss | -0.0113 | -| std | 0.0124 | -| value_loss | 0.000709 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13604 | -| time_elapsed | 72064 | -| total_timesteps | 1741312 | -| train/ | | -| approx_kl | 0.008930724 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -7.1 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 136030 | -| policy_gradient_loss | -0.0143 | -| std | 0.0124 | -| value_loss | 6.86e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13605 | -| time_elapsed | 72069 | -| total_timesteps | 1741440 | -| train/ | | -| approx_kl | 1.0766089e-06 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -553 | -| learning_rate | 0.0003 | -| loss | -9.51e-05 | -| n_updates | 136040 | -| policy_gradient_loss | 0.000333 | -| std | 0.0124 | -| value_loss | 1.88e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13606 | -| time_elapsed | 72074 | -| total_timesteps | 1741568 | -| train/ | | -| approx_kl | 0.038613386 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -1.54e+03 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 136050 | -| policy_gradient_loss | 0.00108 | -| std | 0.0124 | -| value_loss | 1.59e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13607 | -| time_elapsed | 72077 | -| total_timesteps | 1741696 | -| train/ | | -| approx_kl | 0.022852765 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -149 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 136060 | -| policy_gradient_loss | -0.00991 | -| std | 0.0124 | -| value_loss | 1.69e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13608 | -| time_elapsed | 72082 | -| total_timesteps | 1741824 | -| train/ | | -| approx_kl | 0.0067480924 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -20.9 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 136070 | -| policy_gradient_loss | -0.00375 | -| std | 0.0124 | -| value_loss | 2.1e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 24 | -| iterations | 13609 | -| time_elapsed | 72089 | -| total_timesteps | 1741952 | -| train/ | | -| approx_kl | 0.026621675 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -3.42 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 136080 | -| policy_gradient_loss | 0.0101 | -| std | 0.0124 | -| value_loss | 4.97e-12 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13610 | -| time_elapsed | 72094 | -| total_timesteps | 1742080 | -| train/ | | -| approx_kl | 0.008072538 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.437 | -| learning_rate | 0.0003 | -| loss | -0.00722 | -| n_updates | 136090 | -| policy_gradient_loss | 0.000735 | -| std | 0.0124 | -| value_loss | 1.86e-12 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13611 | -| time_elapsed | 72105 | -| total_timesteps | 1742208 | -| train/ | | -| approx_kl | 0.004017785 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.863 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 136100 | -| policy_gradient_loss | 0.00125 | -| std | 0.0124 | -| value_loss | 0.00151 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13612 | -| time_elapsed | 72110 | -| total_timesteps | 1742336 | -| train/ | | -| approx_kl | 0.006168737 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00448 | -| learning_rate | 0.0003 | -| loss | 0.0073 | -| n_updates | 136110 | -| policy_gradient_loss | 0.00952 | -| std | 0.0124 | -| value_loss | 2.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13613 | -| time_elapsed | 72115 | -| total_timesteps | 1742464 | -| train/ | | -| approx_kl | 0.01132894 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.356 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 136120 | -| policy_gradient_loss | 0.00011 | -| std | 0.0124 | -| value_loss | 1.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13614 | -| time_elapsed | 72119 | -| total_timesteps | 1742592 | -| train/ | | -| approx_kl | 0.09360304 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 136130 | -| policy_gradient_loss | 0.0145 | -| std | 0.0124 | -| value_loss | 8.77e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13615 | -| time_elapsed | 72123 | -| total_timesteps | 1742720 | -| train/ | | -| approx_kl | 0.003000219 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 136140 | -| policy_gradient_loss | 0.0229 | -| std | 0.0124 | -| value_loss | 5.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13616 | -| time_elapsed | 72127 | -| total_timesteps | 1742848 | -| train/ | | -| approx_kl | 0.030154157 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 136150 | -| policy_gradient_loss | 0.0532 | -| std | 0.0124 | -| value_loss | 4.4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 24 | -| iterations | 13617 | -| time_elapsed | 72133 | -| total_timesteps | 1742976 | -| train/ | | -| approx_kl | 0.026382824 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 136160 | -| policy_gradient_loss | 0.0123 | -| std | 0.0124 | -| value_loss | 2.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13618 | -| time_elapsed | 72138 | -| total_timesteps | 1743104 | -| train/ | | -| approx_kl | 0.062616095 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 136170 | -| policy_gradient_loss | 0.0202 | -| std | 0.0124 | -| value_loss | 1.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13619 | -| time_elapsed | 72150 | -| total_timesteps | 1743232 | -| train/ | | -| approx_kl | 0.033177488 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.462 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 136180 | -| policy_gradient_loss | -0.00947 | -| std | 0.0124 | -| value_loss | 0.00132 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13620 | -| time_elapsed | 72158 | -| total_timesteps | 1743360 | -| train/ | | -| approx_kl | 0.06191717 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -2.7 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 136190 | -| policy_gradient_loss | 0.00803 | -| std | 0.0124 | -| value_loss | 3.08e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13621 | -| time_elapsed | 72162 | -| total_timesteps | 1743488 | -| train/ | | -| approx_kl | 0.0008938378 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.00778 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 136200 | -| policy_gradient_loss | 0.00182 | -| std | 0.0124 | -| value_loss | 9.21e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13622 | -| time_elapsed | 72167 | -| total_timesteps | 1743616 | -| train/ | | -| approx_kl | 0.020944076 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.311 | -| learning_rate | 0.0003 | -| loss | 0.00356 | -| n_updates | 136210 | -| policy_gradient_loss | 0.0197 | -| std | 0.0124 | -| value_loss | 3.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13623 | -| time_elapsed | 72171 | -| total_timesteps | 1743744 | -| train/ | | -| approx_kl | 0.006826041 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.00528 | -| learning_rate | 0.0003 | -| loss | 9.6e-05 | -| n_updates | 136220 | -| policy_gradient_loss | 0.00757 | -| std | 0.0124 | -| value_loss | 2.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 24 | -| iterations | 13624 | -| time_elapsed | 72176 | -| total_timesteps | 1743872 | -| train/ | | -| approx_kl | 0.009080563 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.00434 | -| n_updates | 136230 | -| policy_gradient_loss | 0.016 | -| std | 0.0125 | -| value_loss | 1.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13625 | -| time_elapsed | 72182 | -| total_timesteps | 1744000 | -| train/ | | -| approx_kl | 0.02477807 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00154 | -| learning_rate | 0.0003 | -| loss | 0.00615 | -| n_updates | 136240 | -| policy_gradient_loss | 0.0013 | -| std | 0.0124 | -| value_loss | 2.1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13626 | -| time_elapsed | 72186 | -| total_timesteps | 1744128 | -| train/ | | -| approx_kl | 0.002855279 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -9.35e-05 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 136250 | -| policy_gradient_loss | 0.00183 | -| std | 0.0124 | -| value_loss | 3.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13627 | -| time_elapsed | 72198 | -| total_timesteps | 1744256 | -| train/ | | -| approx_kl | 0.015709382 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.742 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 136260 | -| policy_gradient_loss | -0.0136 | -| std | 0.0124 | -| value_loss | 0.00457 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13628 | -| time_elapsed | 72204 | -| total_timesteps | 1744384 | -| train/ | | -| approx_kl | 0.0037079211 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.793 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 136270 | -| policy_gradient_loss | 0.0233 | -| std | 0.0124 | -| value_loss | 2.31e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13629 | -| time_elapsed | 72211 | -| total_timesteps | 1744512 | -| train/ | | -| approx_kl | 2.6708934e-05 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -22.8 | -| learning_rate | 0.0003 | -| loss | -0.000682 | -| n_updates | 136280 | -| policy_gradient_loss | -0.00406 | -| std | 0.0124 | -| value_loss | 8.13e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13630 | -| time_elapsed | 72217 | -| total_timesteps | 1744640 | -| train/ | | -| approx_kl | 0.04350344 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.088 | -| learning_rate | 0.0003 | -| loss | -0.000879 | -| n_updates | 136290 | -| policy_gradient_loss | -0.00738 | -| std | 0.0124 | -| value_loss | 4.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13631 | -| time_elapsed | 72223 | -| total_timesteps | 1744768 | -| train/ | | -| approx_kl | 0.007725337 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00669 | -| n_updates | 136300 | -| policy_gradient_loss | -0.00112 | -| std | 0.0124 | -| value_loss | 7.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13632 | -| time_elapsed | 72227 | -| total_timesteps | 1744896 | -| train/ | | -| approx_kl | 0.015728477 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 136310 | -| policy_gradient_loss | -0.00955 | -| std | 0.0124 | -| value_loss | 3.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13633 | -| time_elapsed | 72231 | -| total_timesteps | 1745024 | -| train/ | | -| approx_kl | 0.011864667 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.000304 | -| n_updates | 136320 | -| policy_gradient_loss | 0.000238 | -| std | 0.0124 | -| value_loss | 2.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13634 | -| time_elapsed | 72241 | -| total_timesteps | 1745152 | -| train/ | | -| approx_kl | 0.010287963 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.811 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 136330 | -| policy_gradient_loss | -0.0017 | -| std | 0.0124 | -| value_loss | 0.00281 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13635 | -| time_elapsed | 72247 | -| total_timesteps | 1745280 | -| train/ | | -| approx_kl | 0.035022732 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.002 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 136340 | -| policy_gradient_loss | 0.00696 | -| std | 0.0124 | -| value_loss | 1.39e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13636 | -| time_elapsed | 72251 | -| total_timesteps | 1745408 | -| train/ | | -| approx_kl | 0.03712068 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 136350 | -| policy_gradient_loss | 0.00417 | -| std | 0.0124 | -| value_loss | 3.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13637 | -| time_elapsed | 72257 | -| total_timesteps | 1745536 | -| train/ | | -| approx_kl | 0.04098821 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 136360 | -| policy_gradient_loss | 0.0061 | -| std | 0.0124 | -| value_loss | 5.49e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13638 | -| time_elapsed | 72262 | -| total_timesteps | 1745664 | -| train/ | | -| approx_kl | 0.00040325243 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 136370 | -| policy_gradient_loss | 0.00604 | -| std | 0.0124 | -| value_loss | 3.01e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13639 | -| time_elapsed | 72267 | -| total_timesteps | 1745792 | -| train/ | | -| approx_kl | 0.0003715381 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.00273 | -| n_updates | 136380 | -| policy_gradient_loss | -0.000664 | -| std | 0.0123 | -| value_loss | 1.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13640 | -| time_elapsed | 72271 | -| total_timesteps | 1745920 | -| train/ | | -| approx_kl | 0.013976591 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.000524 | -| learning_rate | 0.0003 | -| loss | -0.00965 | -| n_updates | 136390 | -| policy_gradient_loss | 0.00274 | -| std | 0.0123 | -| value_loss | 4.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13641 | -| time_elapsed | 72276 | -| total_timesteps | 1746048 | -| train/ | | -| approx_kl | 0.013971439 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00533 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 136400 | -| policy_gradient_loss | 0.00557 | -| std | 0.0123 | -| value_loss | 7.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13642 | -| time_elapsed | 72285 | -| total_timesteps | 1746176 | -| train/ | | -| approx_kl | 0.022828203 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.709 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 136410 | -| policy_gradient_loss | -0.00936 | -| std | 0.0123 | -| value_loss | 0.00102 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13643 | -| time_elapsed | 72290 | -| total_timesteps | 1746304 | -| train/ | | -| approx_kl | 0.00079552596 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 136420 | -| policy_gradient_loss | 0.000448 | -| std | 0.0123 | -| value_loss | 1.86e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13644 | -| time_elapsed | 72295 | -| total_timesteps | 1746432 | -| train/ | | -| approx_kl | 0.011846175 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 136430 | -| policy_gradient_loss | -0.00244 | -| std | 0.0123 | -| value_loss | 5.41e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13645 | -| time_elapsed | 72299 | -| total_timesteps | 1746560 | -| train/ | | -| approx_kl | 0.0017576381 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00539 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 136440 | -| policy_gradient_loss | 0.0119 | -| std | 0.0123 | -| value_loss | 2.25e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13646 | -| time_elapsed | 72304 | -| total_timesteps | 1746688 | -| train/ | | -| approx_kl | 0.0035227356 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.00314 | -| n_updates | 136450 | -| policy_gradient_loss | 0.0484 | -| std | 0.0123 | -| value_loss | 1.37e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13647 | -| time_elapsed | 72308 | -| total_timesteps | 1746816 | -| train/ | | -| approx_kl | 0.020262253 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 136460 | -| policy_gradient_loss | 0.0384 | -| std | 0.0123 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13648 | -| time_elapsed | 72313 | -| total_timesteps | 1746944 | -| train/ | | -| approx_kl | 0.025881786 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 136470 | -| policy_gradient_loss | 0.032 | -| std | 0.0123 | -| value_loss | 6.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13649 | -| time_elapsed | 72319 | -| total_timesteps | 1747072 | -| train/ | | -| approx_kl | 0.05260492 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 136480 | -| policy_gradient_loss | 0.00039 | -| std | 0.0123 | -| value_loss | 1.07e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13650 | -| time_elapsed | 72328 | -| total_timesteps | 1747200 | -| train/ | | -| approx_kl | 0.08297019 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 136490 | -| policy_gradient_loss | -0.0126 | -| std | 0.0123 | -| value_loss | 0.000104 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13651 | -| time_elapsed | 72335 | -| total_timesteps | 1747328 | -| train/ | | -| approx_kl | 0.0027920092 | -| clip_fraction | 0.0117 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00511 | -| learning_rate | 0.0003 | -| loss | -0.000307 | -| n_updates | 136500 | -| policy_gradient_loss | -0.000111 | -| std | 0.0123 | -| value_loss | 4.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13652 | -| time_elapsed | 72340 | -| total_timesteps | 1747456 | -| train/ | | -| approx_kl | 0.0012973794 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00142 | -| learning_rate | 0.0003 | -| loss | -0.000675 | -| n_updates | 136510 | -| policy_gradient_loss | 0.00252 | -| std | 0.0124 | -| value_loss | 4.29e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13653 | -| time_elapsed | 72345 | -| total_timesteps | 1747584 | -| train/ | | -| approx_kl | 0.02478556 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.00015 | -| learning_rate | 0.0003 | -| loss | 0.00546 | -| n_updates | 136520 | -| policy_gradient_loss | -0.000533 | -| std | 0.0124 | -| value_loss | 7.03e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13654 | -| time_elapsed | 72349 | -| total_timesteps | 1747712 | -| train/ | | -| approx_kl | 0.011177721 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.00453 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 136530 | -| policy_gradient_loss | 0.00131 | -| std | 0.0125 | -| value_loss | 6.99e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13655 | -| time_elapsed | 72354 | -| total_timesteps | 1747840 | -| train/ | | -| approx_kl | 0.0016228957 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.00629 | -| n_updates | 136540 | -| policy_gradient_loss | 0.0192 | -| std | 0.0125 | -| value_loss | 4.17e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13656 | -| time_elapsed | 72359 | -| total_timesteps | 1747968 | -| train/ | | -| approx_kl | 0.0032396438 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 136550 | -| policy_gradient_loss | 0.0298 | -| std | 0.0125 | -| value_loss | 2.67e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13657 | -| time_elapsed | 72363 | -| total_timesteps | 1748096 | -| train/ | | -| approx_kl | 0.0016783592 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.000809 | -| n_updates | 136560 | -| policy_gradient_loss | 0.00878 | -| std | 0.0125 | -| value_loss | 1.87e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13658 | -| time_elapsed | 72373 | -| total_timesteps | 1748224 | -| train/ | | -| approx_kl | 0.10875589 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.476 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 136570 | -| policy_gradient_loss | -0.00501 | -| std | 0.0125 | -| value_loss | 0.000916 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13659 | -| time_elapsed | 72378 | -| total_timesteps | 1748352 | -| train/ | | -| approx_kl | 0.048887946 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.065 | -| n_updates | 136580 | -| policy_gradient_loss | 0.0377 | -| std | 0.0125 | -| value_loss | 6.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13660 | -| time_elapsed | 72383 | -| total_timesteps | 1748480 | -| train/ | | -| approx_kl | 0.009721868 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00135 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 136590 | -| policy_gradient_loss | 0.00234 | -| std | 0.0125 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13661 | -| time_elapsed | 72388 | -| total_timesteps | 1748608 | -| train/ | | -| approx_kl | 0.012349433 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00173 | -| learning_rate | 0.0003 | -| loss | -0.000953 | -| n_updates | 136600 | -| policy_gradient_loss | 0.00749 | -| std | 0.0125 | -| value_loss | 1.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13662 | -| time_elapsed | 72393 | -| total_timesteps | 1748736 | -| train/ | | -| approx_kl | 0.21685576 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0072 | -| learning_rate | 0.0003 | -| loss | 0.0659 | -| n_updates | 136610 | -| policy_gradient_loss | 0.013 | -| std | 0.0125 | -| value_loss | 9.68e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13663 | -| time_elapsed | 72397 | -| total_timesteps | 1748864 | -| train/ | | -| approx_kl | 0.0093465075 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 136620 | -| policy_gradient_loss | 0.000218 | -| std | 0.0125 | -| value_loss | 5.83e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 24 | -| iterations | 13664 | -| time_elapsed | 72402 | -| total_timesteps | 1748992 | -| train/ | | -| approx_kl | 0.015083572 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 136630 | -| policy_gradient_loss | -0.0103 | -| std | 0.0125 | -| value_loss | 4.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13665 | -| time_elapsed | 72407 | -| total_timesteps | 1749120 | -| train/ | | -| approx_kl | 0.012957508 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 136640 | -| policy_gradient_loss | -0.00627 | -| std | 0.0124 | -| value_loss | 2.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13666 | -| time_elapsed | 72419 | -| total_timesteps | 1749248 | -| train/ | | -| approx_kl | 0.03890125 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.378 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 136650 | -| policy_gradient_loss | -0.0149 | -| std | 0.0124 | -| value_loss | 0.000977 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13667 | -| time_elapsed | 72424 | -| total_timesteps | 1749376 | -| train/ | | -| approx_kl | 0.011975393 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -7.83 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 136660 | -| policy_gradient_loss | 0.0151 | -| std | 0.0124 | -| value_loss | 6.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13668 | -| time_elapsed | 72429 | -| total_timesteps | 1749504 | -| train/ | | -| approx_kl | 0.00848493 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -6.63 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 136670 | -| policy_gradient_loss | 0.0131 | -| std | 0.0124 | -| value_loss | 2.12e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13669 | -| time_elapsed | 72433 | -| total_timesteps | 1749632 | -| train/ | | -| approx_kl | 0.03706265 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 136680 | -| policy_gradient_loss | -0.00144 | -| std | 0.0124 | -| value_loss | 6.15e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13670 | -| time_elapsed | 72439 | -| total_timesteps | 1749760 | -| train/ | | -| approx_kl | 0.030423615 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000176 | -| n_updates | 136690 | -| policy_gradient_loss | -0.00445 | -| std | 0.0124 | -| value_loss | 3.44e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 24 | -| iterations | 13671 | -| time_elapsed | 72443 | -| total_timesteps | 1749888 | -| train/ | | -| approx_kl | 0.0075363587 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00333 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 136700 | -| policy_gradient_loss | -0.00152 | -| std | 0.0124 | -| value_loss | 2.27e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13672 | -| time_elapsed | 72446 | -| total_timesteps | 1750016 | -| train/ | | -| approx_kl | 0.0010108892 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.00183 | -| learning_rate | 0.0003 | -| loss | 0.00538 | -| n_updates | 136710 | -| policy_gradient_loss | -0.00531 | -| std | 0.0124 | -| value_loss | 1.55e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13673 | -| time_elapsed | 72456 | -| total_timesteps | 1750144 | -| train/ | | -| approx_kl | 0.002262252 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | 0.000555 | -| n_updates | 136720 | -| policy_gradient_loss | -4.49e-05 | -| std | 0.0124 | -| value_loss | 0.000431 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13674 | -| time_elapsed | 72460 | -| total_timesteps | 1750272 | -| train/ | | -| approx_kl | 0.0041283085 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | -0.00958 | -| n_updates | 136730 | -| policy_gradient_loss | -0.00357 | -| std | 0.0124 | -| value_loss | 9.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13675 | -| time_elapsed | 72464 | -| total_timesteps | 1750400 | -| train/ | | -| approx_kl | 0.000573494 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 136740 | -| policy_gradient_loss | 0.00184 | -| std | 0.0124 | -| value_loss | 2.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13676 | -| time_elapsed | 72469 | -| total_timesteps | 1750528 | -| train/ | | -| approx_kl | 0.09450398 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | 0.0622 | -| n_updates | 136750 | -| policy_gradient_loss | 0.0115 | -| std | 0.0124 | -| value_loss | 3.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13677 | -| time_elapsed | 72473 | -| total_timesteps | 1750656 | -| train/ | | -| approx_kl | 0.03224311 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 136760 | -| policy_gradient_loss | -0.00648 | -| std | 0.0124 | -| value_loss | 3.18e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13678 | -| time_elapsed | 72478 | -| total_timesteps | 1750784 | -| train/ | | -| approx_kl | 0.040673744 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0817 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 136770 | -| policy_gradient_loss | 0.0519 | -| std | 0.0124 | -| value_loss | 1.99e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 24 | -| iterations | 13679 | -| time_elapsed | 72482 | -| total_timesteps | 1750912 | -| train/ | | -| approx_kl | 0.0076223817 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 136780 | -| policy_gradient_loss | 0.00304 | -| std | 0.0124 | -| value_loss | 1.15e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13680 | -| time_elapsed | 72487 | -| total_timesteps | 1751040 | -| train/ | | -| approx_kl | 0.18415852 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 136790 | -| policy_gradient_loss | 0.0806 | -| std | 0.0124 | -| value_loss | 8.92e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13681 | -| time_elapsed | 72496 | -| total_timesteps | 1751168 | -| train/ | | -| approx_kl | 0.00094482535 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 2.97 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 136800 | -| policy_gradient_loss | -0.000298 | -| std | 0.0124 | -| value_loss | 0.00233 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13682 | -| time_elapsed | 72501 | -| total_timesteps | 1751296 | -| train/ | | -| approx_kl | 0.0024879812 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 136810 | -| policy_gradient_loss | 0.00192 | -| std | 0.0123 | -| value_loss | 1.49e-06 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13683 | -| time_elapsed | 72505 | -| total_timesteps | 1751424 | -| train/ | | -| approx_kl | 0.000118664466 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 5.99e-05 | -| n_updates | 136820 | -| policy_gradient_loss | 0.00211 | -| std | 0.0123 | -| value_loss | 5.83e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13684 | -| time_elapsed | 72509 | -| total_timesteps | 1751552 | -| train/ | | -| approx_kl | 0.016566735 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 136830 | -| policy_gradient_loss | 0.0194 | -| std | 0.0123 | -| value_loss | 1.69e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13685 | -| time_elapsed | 72513 | -| total_timesteps | 1751680 | -| train/ | | -| approx_kl | 0.0076215104 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00327 | -| learning_rate | 0.0003 | -| loss | -0.00962 | -| n_updates | 136840 | -| policy_gradient_loss | 0.00106 | -| std | 0.0123 | -| value_loss | 3.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13686 | -| time_elapsed | 72517 | -| total_timesteps | 1751808 | -| train/ | | -| approx_kl | 0.007169339 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 136850 | -| policy_gradient_loss | 0.0147 | -| std | 0.0123 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 24 | -| iterations | 13687 | -| time_elapsed | 72521 | -| total_timesteps | 1751936 | -| train/ | | -| approx_kl | 0.026143543 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 136860 | -| policy_gradient_loss | 0.00407 | -| std | 0.0123 | -| value_loss | 1.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13688 | -| time_elapsed | 72525 | -| total_timesteps | 1752064 | -| train/ | | -| approx_kl | 0.00503472 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 136870 | -| policy_gradient_loss | 0.0321 | -| std | 0.0123 | -| value_loss | 6.79e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13689 | -| time_elapsed | 72533 | -| total_timesteps | 1752192 | -| train/ | | -| approx_kl | 0.08162159 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -13.5 | -| learning_rate | 0.0003 | -| loss | -0.00809 | -| n_updates | 136880 | -| policy_gradient_loss | -0.0123 | -| std | 0.0123 | -| value_loss | 0.00319 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13690 | -| time_elapsed | 72537 | -| total_timesteps | 1752320 | -| train/ | | -| approx_kl | 0.019119117 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | 0.00523 | -| n_updates | 136890 | -| policy_gradient_loss | 0.0144 | -| std | 0.0123 | -| value_loss | 1.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13691 | -| time_elapsed | 72541 | -| total_timesteps | 1752448 | -| train/ | | -| approx_kl | 0.25104943 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.65 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 136900 | -| policy_gradient_loss | 0.0673 | -| std | 0.0123 | -| value_loss | 2.37e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13692 | -| time_elapsed | 72546 | -| total_timesteps | 1752576 | -| train/ | | -| approx_kl | 0.002255545 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 136910 | -| policy_gradient_loss | 0.00799 | -| std | 0.0123 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13693 | -| time_elapsed | 72550 | -| total_timesteps | 1752704 | -| train/ | | -| approx_kl | 0.101050824 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0767 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 136920 | -| policy_gradient_loss | -0.00219 | -| std | 0.0123 | -| value_loss | 1.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13694 | -| time_elapsed | 72554 | -| total_timesteps | 1752832 | -| train/ | | -| approx_kl | 0.01977105 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 136930 | -| policy_gradient_loss | 0.0143 | -| std | 0.0123 | -| value_loss | 4.71e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 24 | -| iterations | 13695 | -| time_elapsed | 72558 | -| total_timesteps | 1752960 | -| train/ | | -| approx_kl | 0.09651629 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 136940 | -| policy_gradient_loss | 0.0826 | -| std | 0.0123 | -| value_loss | 1.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13696 | -| time_elapsed | 72564 | -| total_timesteps | 1753088 | -| train/ | | -| approx_kl | 0.060255364 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00043 | -| learning_rate | 0.0003 | -| loss | 0.0884 | -| n_updates | 136950 | -| policy_gradient_loss | 0.0717 | -| std | 0.0123 | -| value_loss | 7.95e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13697 | -| time_elapsed | 72571 | -| total_timesteps | 1753216 | -| train/ | | -| approx_kl | 0.04504809 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 136960 | -| policy_gradient_loss | 0.0329 | -| std | 0.0123 | -| value_loss | 8.05e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13698 | -| time_elapsed | 72574 | -| total_timesteps | 1753344 | -| train/ | | -| approx_kl | 0.064939916 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -3.44 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 136970 | -| policy_gradient_loss | -0.0016 | -| std | 0.0123 | -| value_loss | 3.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13699 | -| time_elapsed | 72577 | -| total_timesteps | 1753472 | -| train/ | | -| approx_kl | 0.013597982 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.273 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 136980 | -| policy_gradient_loss | 0.0196 | -| std | 0.0123 | -| value_loss | 1.73e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13700 | -| time_elapsed | 72580 | -| total_timesteps | 1753600 | -| train/ | | -| approx_kl | 0.0066667562 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.00578 | -| n_updates | 136990 | -| policy_gradient_loss | 0.0569 | -| std | 0.0123 | -| value_loss | 1.17e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13701 | -| time_elapsed | 72586 | -| total_timesteps | 1753728 | -| train/ | | -| approx_kl | 0.027646307 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 137000 | -| policy_gradient_loss | 0.05 | -| std | 0.0123 | -| value_loss | 1.02e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13702 | -| time_elapsed | 72591 | -| total_timesteps | 1753856 | -| train/ | | -| approx_kl | 0.034759894 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 137010 | -| policy_gradient_loss | 0.0527 | -| std | 0.0123 | -| value_loss | 8.72e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13703 | -| time_elapsed | 72596 | -| total_timesteps | 1753984 | -| train/ | | -| approx_kl | 0.0069897086 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00976 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 137020 | -| policy_gradient_loss | 0.007 | -| std | 0.0123 | -| value_loss | 1.13e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13704 | -| time_elapsed | 72601 | -| total_timesteps | 1754112 | -| train/ | | -| approx_kl | 0.011729812 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 137030 | -| policy_gradient_loss | 0.0024 | -| std | 0.0123 | -| value_loss | 1.91e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13705 | -| time_elapsed | 72613 | -| total_timesteps | 1754240 | -| train/ | | -| approx_kl | 0.07316255 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 137040 | -| policy_gradient_loss | -0.00976 | -| std | 0.0123 | -| value_loss | 0.00038 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13706 | -| time_elapsed | 72619 | -| total_timesteps | 1754368 | -| train/ | | -| approx_kl | 0.074213505 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00993 | -| learning_rate | 0.0003 | -| loss | 0.0521 | -| n_updates | 137050 | -| policy_gradient_loss | 0.0827 | -| std | 0.0123 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13707 | -| time_elapsed | 72624 | -| total_timesteps | 1754496 | -| train/ | | -| approx_kl | 0.014877191 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.00516 | -| n_updates | 137060 | -| policy_gradient_loss | 0.0126 | -| std | 0.0123 | -| value_loss | 1.4e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13708 | -| time_elapsed | 72628 | -| total_timesteps | 1754624 | -| train/ | | -| approx_kl | 0.10758827 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0948 | -| n_updates | 137070 | -| policy_gradient_loss | 0.0694 | -| std | 0.0123 | -| value_loss | 9.26e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13709 | -| time_elapsed | 72635 | -| total_timesteps | 1754752 | -| train/ | | -| approx_kl | 0.04159473 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0551 | -| n_updates | 137080 | -| policy_gradient_loss | 0.0361 | -| std | 0.0123 | -| value_loss | 7.36e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 24 | -| iterations | 13710 | -| time_elapsed | 72638 | -| total_timesteps | 1754880 | -| train/ | | -| approx_kl | 0.010285878 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 137090 | -| policy_gradient_loss | 0.0052 | -| std | 0.0123 | -| value_loss | 4.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13711 | -| time_elapsed | 72642 | -| total_timesteps | 1755008 | -| train/ | | -| approx_kl | 0.19287002 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | 0.0986 | -| n_updates | 137100 | -| policy_gradient_loss | 0.0249 | -| std | 0.0123 | -| value_loss | 2.36e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13712 | -| time_elapsed | 72653 | -| total_timesteps | 1755136 | -| train/ | | -| approx_kl | 0.0028281799 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 137110 | -| policy_gradient_loss | -0.0116 | -| std | 0.0123 | -| value_loss | 0.000446 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13713 | -| time_elapsed | 72658 | -| total_timesteps | 1755264 | -| train/ | | -| approx_kl | 0.0052068355 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.054 | -| learning_rate | 0.0003 | -| loss | -0.00909 | -| n_updates | 137120 | -| policy_gradient_loss | -0.00686 | -| std | 0.0123 | -| value_loss | 9.91e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13714 | -| time_elapsed | 72664 | -| total_timesteps | 1755392 | -| train/ | | -| approx_kl | 0.03046886 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -2.26 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 137130 | -| policy_gradient_loss | 0.0138 | -| std | 0.0123 | -| value_loss | 8.11e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13715 | -| time_elapsed | 72669 | -| total_timesteps | 1755520 | -| train/ | | -| approx_kl | 0.00781483 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.729 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 137140 | -| policy_gradient_loss | -0.00587 | -| std | 0.0123 | -| value_loss | 4.43e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13716 | -| time_elapsed | 72674 | -| total_timesteps | 1755648 | -| train/ | | -| approx_kl | 0.009587587 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 137150 | -| policy_gradient_loss | 0.0166 | -| std | 0.0123 | -| value_loss | 2.78e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13717 | -| time_elapsed | 72679 | -| total_timesteps | 1755776 | -| train/ | | -| approx_kl | 0.0070864945 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 137160 | -| policy_gradient_loss | 0.00459 | -| std | 0.0123 | -| value_loss | 1.35e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13718 | -| time_elapsed | 72684 | -| total_timesteps | 1755904 | -| train/ | | -| approx_kl | 0.0075679207 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 137170 | -| policy_gradient_loss | 0.00425 | -| std | 0.0123 | -| value_loss | 9.87e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13719 | -| time_elapsed | 72688 | -| total_timesteps | 1756032 | -| train/ | | -| approx_kl | 0.015421867 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.0397 | -| n_updates | 137180 | -| policy_gradient_loss | -0.0306 | -| std | 0.0123 | -| value_loss | 5.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13720 | -| time_elapsed | 72697 | -| total_timesteps | 1756160 | -| train/ | | -| approx_kl | 0.007864272 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 137190 | -| policy_gradient_loss | -0.00098 | -| std | 0.0123 | -| value_loss | 0.00239 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13721 | -| time_elapsed | 72702 | -| total_timesteps | 1756288 | -| train/ | | -| approx_kl | 0.038303725 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.7 | -| learning_rate | 0.0003 | -| loss | 0.000908 | -| n_updates | 137200 | -| policy_gradient_loss | -0.00225 | -| std | 0.0123 | -| value_loss | 4.71e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13722 | -| time_elapsed | 72706 | -| total_timesteps | 1756416 | -| train/ | | -| approx_kl | 0.1019947 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -3.47 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 137210 | -| policy_gradient_loss | -0.01 | -| std | 0.0123 | -| value_loss | 2.39e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13723 | -| time_elapsed | 72709 | -| total_timesteps | 1756544 | -| train/ | | -| approx_kl | 0.038597703 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.823 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 137220 | -| policy_gradient_loss | 0.00398 | -| std | 0.0123 | -| value_loss | 8.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13724 | -| time_elapsed | 72714 | -| total_timesteps | 1756672 | -| train/ | | -| approx_kl | 0.007570008 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 137230 | -| policy_gradient_loss | 0.00589 | -| std | 0.0123 | -| value_loss | 4.92e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13725 | -| time_elapsed | 72718 | -| total_timesteps | 1756800 | -| train/ | | -| approx_kl | 0.0073967343 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | 0.00074 | -| n_updates | 137240 | -| policy_gradient_loss | 0.0209 | -| std | 0.0122 | -| value_loss | 1.7e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 24 | -| iterations | 13726 | -| time_elapsed | 72723 | -| total_timesteps | 1756928 | -| train/ | | -| approx_kl | 0.0017313487 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.000493 | -| n_updates | 137250 | -| policy_gradient_loss | 0.0324 | -| std | 0.0122 | -| value_loss | 8.57e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13727 | -| time_elapsed | 72726 | -| total_timesteps | 1757056 | -| train/ | | -| approx_kl | 0.026467748 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | 0.00171 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 137260 | -| policy_gradient_loss | 0.041 | -| std | 0.0122 | -| value_loss | 1.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13728 | -| time_elapsed | 72736 | -| total_timesteps | 1757184 | -| train/ | | -| approx_kl | 0.030020494 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.00816 | -| n_updates | 137270 | -| policy_gradient_loss | -0.00766 | -| std | 0.0122 | -| value_loss | 0.000766 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13729 | -| time_elapsed | 72740 | -| total_timesteps | 1757312 | -| train/ | | -| approx_kl | 0.06026109 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 137280 | -| policy_gradient_loss | 0.0237 | -| std | 0.0122 | -| value_loss | 1.31e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13730 | -| time_elapsed | 72745 | -| total_timesteps | 1757440 | -| train/ | | -| approx_kl | 0.05822096 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0496 | -| n_updates | 137290 | -| policy_gradient_loss | 0.0153 | -| std | 0.0123 | -| value_loss | 7.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13731 | -| time_elapsed | 72750 | -| total_timesteps | 1757568 | -| train/ | | -| approx_kl | 0.0010601422 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00306 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 137300 | -| policy_gradient_loss | -0.00232 | -| std | 0.0123 | -| value_loss | 1.54e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13732 | -| time_elapsed | 72755 | -| total_timesteps | 1757696 | -| train/ | | -| approx_kl | 1.6907696e-05 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00108 | -| learning_rate | 0.0003 | -| loss | 0.000189 | -| n_updates | 137310 | -| policy_gradient_loss | 1.23e-05 | -| std | 0.0123 | -| value_loss | 5.9e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13733 | -| time_elapsed | 72760 | -| total_timesteps | 1757824 | -| train/ | | -| approx_kl | 0.021015527 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 137320 | -| policy_gradient_loss | 0.026 | -| std | 0.0123 | -| value_loss | 5.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 13734 | -| time_elapsed | 72764 | -| total_timesteps | 1757952 | -| train/ | | -| approx_kl | 0.03348286 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.00705 | -| n_updates | 137330 | -| policy_gradient_loss | -0.00103 | -| std | 0.0123 | -| value_loss | 3.66e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13735 | -| time_elapsed | 72769 | -| total_timesteps | 1758080 | -| train/ | | -| approx_kl | 0.0027033216 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 137340 | -| policy_gradient_loss | 0.0296 | -| std | 0.0123 | -| value_loss | 1.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13736 | -| time_elapsed | 72779 | -| total_timesteps | 1758208 | -| train/ | | -| approx_kl | 0.052895144 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.00303 | -| n_updates | 137350 | -| policy_gradient_loss | 0.00771 | -| std | 0.0123 | -| value_loss | 0.000121 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13737 | -| time_elapsed | 72784 | -| total_timesteps | 1758336 | -| train/ | | -| approx_kl | 0.020315718 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0056 | -| learning_rate | 0.0003 | -| loss | 0.00867 | -| n_updates | 137360 | -| policy_gradient_loss | 0.00881 | -| std | 0.0123 | -| value_loss | 7.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13738 | -| time_elapsed | 72789 | -| total_timesteps | 1758464 | -| train/ | | -| approx_kl | 0.082541816 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00128 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 137370 | -| policy_gradient_loss | 0.00592 | -| std | 0.0123 | -| value_loss | 3.42e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13739 | -| time_elapsed | 72794 | -| total_timesteps | 1758592 | -| train/ | | -| approx_kl | 0.02211082 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.000756 | -| learning_rate | 0.0003 | -| loss | 0.00468 | -| n_updates | 137380 | -| policy_gradient_loss | 0.0217 | -| std | 0.0123 | -| value_loss | 2.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13740 | -| time_elapsed | 72798 | -| total_timesteps | 1758720 | -| train/ | | -| approx_kl | 0.011559606 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00742 | -| learning_rate | 0.0003 | -| loss | 0.00731 | -| n_updates | 137390 | -| policy_gradient_loss | 0.00997 | -| std | 0.0123 | -| value_loss | 1.58e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13741 | -| time_elapsed | 72801 | -| total_timesteps | 1758848 | -| train/ | | -| approx_kl | 0.011112719 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -0.00861 | -| n_updates | 137400 | -| policy_gradient_loss | 0.00211 | -| std | 0.0123 | -| value_loss | 1.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 13742 | -| time_elapsed | 72805 | -| total_timesteps | 1758976 | -| train/ | | -| approx_kl | 0.117894486 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 137410 | -| policy_gradient_loss | 0.0151 | -| std | 0.0123 | -| value_loss | 9.05e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13743 | -| time_elapsed | 72810 | -| total_timesteps | 1759104 | -| train/ | | -| approx_kl | 0.0030474523 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.0026 | -| n_updates | 137420 | -| policy_gradient_loss | 0.00737 | -| std | 0.0123 | -| value_loss | 5.7e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13744 | -| time_elapsed | 72823 | -| total_timesteps | 1759232 | -| train/ | | -| approx_kl | 0.037906043 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 137430 | -| policy_gradient_loss | -0.0145 | -| std | 0.0123 | -| value_loss | 0.000406 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13745 | -| time_elapsed | 72827 | -| total_timesteps | 1759360 | -| train/ | | -| approx_kl | 0.043346085 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00622 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 137440 | -| policy_gradient_loss | -0.000889 | -| std | 0.0123 | -| value_loss | 1.77e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13746 | -| time_elapsed | 72831 | -| total_timesteps | 1759488 | -| train/ | | -| approx_kl | 0.00011767121 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | -0.00362 | -| n_updates | 137450 | -| policy_gradient_loss | -0.000158 | -| std | 0.0123 | -| value_loss | 1.87e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13747 | -| time_elapsed | 72837 | -| total_timesteps | 1759616 | -| train/ | | -| approx_kl | 0.0024144207 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.00838 | -| n_updates | 137460 | -| policy_gradient_loss | 0.0143 | -| std | 0.0123 | -| value_loss | 2.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13748 | -| time_elapsed | 72842 | -| total_timesteps | 1759744 | -| train/ | | -| approx_kl | 0.096370906 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 137470 | -| policy_gradient_loss | 0.00572 | -| std | 0.0123 | -| value_loss | 5.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13749 | -| time_elapsed | 72847 | -| total_timesteps | 1759872 | -| train/ | | -| approx_kl | 0.003285118 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.084 | -| learning_rate | 0.0003 | -| loss | -0.00827 | -| n_updates | 137480 | -| policy_gradient_loss | 0.0023 | -| std | 0.0123 | -| value_loss | 1.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13750 | -| time_elapsed | 72852 | -| total_timesteps | 1760000 | -| train/ | | -| approx_kl | 0.016900057 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 137490 | -| policy_gradient_loss | -0.00612 | -| std | 0.0123 | -| value_loss | 1.39e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13751 | -| time_elapsed | 72857 | -| total_timesteps | 1760128 | -| train/ | | -| approx_kl | 0.03151419 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00239 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 137500 | -| policy_gradient_loss | 0.0492 | -| std | 0.0123 | -| value_loss | 7.31e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13752 | -| time_elapsed | 72869 | -| total_timesteps | 1760256 | -| train/ | | -| approx_kl | 0.009375015 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 137510 | -| policy_gradient_loss | -0.0107 | -| std | 0.0123 | -| value_loss | 0.00258 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13753 | -| time_elapsed | 72875 | -| total_timesteps | 1760384 | -| train/ | | -| approx_kl | 0.043731935 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 137520 | -| policy_gradient_loss | -0.00103 | -| std | 0.0123 | -| value_loss | 1.73e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13754 | -| time_elapsed | 72879 | -| total_timesteps | 1760512 | -| train/ | | -| approx_kl | 0.04422305 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.406 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 137530 | -| policy_gradient_loss | -0.000475 | -| std | 0.0123 | -| value_loss | 5.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13755 | -| time_elapsed | 72884 | -| total_timesteps | 1760640 | -| train/ | | -| approx_kl | 0.030931266 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 137540 | -| policy_gradient_loss | -0.00369 | -| std | 0.0123 | -| value_loss | 2.6e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13756 | -| time_elapsed | 72888 | -| total_timesteps | 1760768 | -| train/ | | -| approx_kl | 0.0145788975 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 137550 | -| policy_gradient_loss | -0.00112 | -| std | 0.0123 | -| value_loss | 1.6e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 24 | -| iterations | 13757 | -| time_elapsed | 72894 | -| total_timesteps | 1760896 | -| train/ | | -| approx_kl | 0.06360205 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.0573 | -| n_updates | 137560 | -| policy_gradient_loss | 0.0279 | -| std | 0.0123 | -| value_loss | 1.01e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13758 | -| time_elapsed | 72898 | -| total_timesteps | 1761024 | -| train/ | | -| approx_kl | 0.00012318278 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.00062 | -| n_updates | 137570 | -| policy_gradient_loss | -0.000688 | -| std | 0.0123 | -| value_loss | 6.32e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13759 | -| time_elapsed | 72908 | -| total_timesteps | 1761152 | -| train/ | | -| approx_kl | 0.07423054 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.504 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 137580 | -| policy_gradient_loss | -0.0146 | -| std | 0.0123 | -| value_loss | 0.00106 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13760 | -| time_elapsed | 72913 | -| total_timesteps | 1761280 | -| train/ | | -| approx_kl | 0.062965766 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -245 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 137590 | -| policy_gradient_loss | 0.00763 | -| std | 0.0123 | -| value_loss | 3.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13761 | -| time_elapsed | 72917 | -| total_timesteps | 1761408 | -| train/ | | -| approx_kl | 0.040281765 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | 0.00511 | -| n_updates | 137600 | -| policy_gradient_loss | 0.00351 | -| std | 0.0123 | -| value_loss | 3.07e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13762 | -| time_elapsed | 72922 | -| total_timesteps | 1761536 | -| train/ | | -| approx_kl | 0.05987056 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 137610 | -| policy_gradient_loss | 0.00841 | -| std | 0.0123 | -| value_loss | 5.96e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13763 | -| time_elapsed | 72926 | -| total_timesteps | 1761664 | -| train/ | | -| approx_kl | 0.023781098 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.285 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 137620 | -| policy_gradient_loss | -0.000989 | -| std | 0.0123 | -| value_loss | 8.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13764 | -| time_elapsed | 72931 | -| total_timesteps | 1761792 | -| train/ | | -| approx_kl | 0.005950529 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00437 | -| learning_rate | 0.0003 | -| loss | -0.00887 | -| n_updates | 137630 | -| policy_gradient_loss | 0.00609 | -| std | 0.0123 | -| value_loss | 4.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13765 | -| time_elapsed | 72936 | -| total_timesteps | 1761920 | -| train/ | | -| approx_kl | 0.015702799 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 5.66e-05 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 137640 | -| policy_gradient_loss | 0.00139 | -| std | 0.0123 | -| value_loss | 3.09e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13766 | -| time_elapsed | 72941 | -| total_timesteps | 1762048 | -| train/ | | -| approx_kl | 0.10101967 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.00875 | -| learning_rate | 0.0003 | -| loss | 0.0521 | -| n_updates | 137650 | -| policy_gradient_loss | 0.0202 | -| std | 0.0123 | -| value_loss | 2.03e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13767 | -| time_elapsed | 72949 | -| total_timesteps | 1762176 | -| train/ | | -| approx_kl | 0.068641976 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | -0.000723 | -| n_updates | 137660 | -| policy_gradient_loss | -0.0117 | -| std | 0.0123 | -| value_loss | 0.0021 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13768 | -| time_elapsed | 72955 | -| total_timesteps | 1762304 | -| train/ | | -| approx_kl | 0.022465711 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.000648 | -| n_updates | 137670 | -| policy_gradient_loss | 0.00432 | -| std | 0.0123 | -| value_loss | 0.00188 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13769 | -| time_elapsed | 72960 | -| total_timesteps | 1762432 | -| train/ | | -| approx_kl | 0.040345814 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.00548 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 137680 | -| policy_gradient_loss | 0.0166 | -| std | 0.0123 | -| value_loss | 0.000153 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13770 | -| time_elapsed | 72965 | -| total_timesteps | 1762560 | -| train/ | | -| approx_kl | 0.047725096 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 137690 | -| policy_gradient_loss | 0.0203 | -| std | 0.0122 | -| value_loss | 0.000224 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13771 | -| time_elapsed | 72970 | -| total_timesteps | 1762688 | -| train/ | | -| approx_kl | 0.08204195 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.453 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 137700 | -| policy_gradient_loss | 0.0125 | -| std | 0.0122 | -| value_loss | 9.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13772 | -| time_elapsed | 72973 | -| total_timesteps | 1762816 | -| train/ | | -| approx_kl | 0.015833182 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.00188 | -| n_updates | 137710 | -| policy_gradient_loss | 0.0188 | -| std | 0.0122 | -| value_loss | 3.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 24 | -| iterations | 13773 | -| time_elapsed | 72977 | -| total_timesteps | 1762944 | -| train/ | | -| approx_kl | 0.05866146 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 137720 | -| policy_gradient_loss | 0.00996 | -| std | 0.0122 | -| value_loss | 2.07e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13774 | -| time_elapsed | 72983 | -| total_timesteps | 1763072 | -| train/ | | -| approx_kl | 0.00037702918 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 137730 | -| policy_gradient_loss | -0.00339 | -| std | 0.0122 | -| value_loss | 1.64e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13775 | -| time_elapsed | 72992 | -| total_timesteps | 1763200 | -| train/ | | -| approx_kl | 0.071204714 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 137740 | -| policy_gradient_loss | -0.0165 | -| std | 0.0122 | -| value_loss | 0.000245 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13776 | -| time_elapsed | 72996 | -| total_timesteps | 1763328 | -| train/ | | -| approx_kl | 0.19883426 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | 0.0876 | -| n_updates | 137750 | -| policy_gradient_loss | 0.0192 | -| std | 0.0122 | -| value_loss | 5.52e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13777 | -| time_elapsed | 72999 | -| total_timesteps | 1763456 | -| train/ | | -| approx_kl | 0.0035285773 | -| clip_fraction | 0.0336 | -| clip_range | 0.2 | -| entropy_loss | 2.98 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.000394 | -| n_updates | 137760 | -| policy_gradient_loss | 0.00108 | -| std | 0.0122 | -| value_loss | 4.16e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13778 | -| time_elapsed | 73004 | -| total_timesteps | 1763584 | -| train/ | | -| approx_kl | 0.00015722681 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0073 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 137770 | -| policy_gradient_loss | 0.000936 | -| std | 0.0122 | -| value_loss | 1.19e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13779 | -| time_elapsed | 73008 | -| total_timesteps | 1763712 | -| train/ | | -| approx_kl | 0.0017643883 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 137780 | -| policy_gradient_loss | 0.00481 | -| std | 0.0122 | -| value_loss | 7.5e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13780 | -| time_elapsed | 73013 | -| total_timesteps | 1763840 | -| train/ | | -| approx_kl | 0.004336867 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 137790 | -| policy_gradient_loss | 0.0178 | -| std | 0.0122 | -| value_loss | 3.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13781 | -| time_elapsed | 73018 | -| total_timesteps | 1763968 | -| train/ | | -| approx_kl | 0.017805658 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 137800 | -| policy_gradient_loss | 0.0195 | -| std | 0.0122 | -| value_loss | 1.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13782 | -| time_elapsed | 73023 | -| total_timesteps | 1764096 | -| train/ | | -| approx_kl | 0.011170001 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 137810 | -| policy_gradient_loss | -0.002 | -| std | 0.0122 | -| value_loss | 1.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13783 | -| time_elapsed | 73033 | -| total_timesteps | 1764224 | -| train/ | | -| approx_kl | 0.03196585 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 137820 | -| policy_gradient_loss | -0.0114 | -| std | 0.0122 | -| value_loss | 0.00296 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13784 | -| time_elapsed | 73038 | -| total_timesteps | 1764352 | -| train/ | | -| approx_kl | 0.069619045 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.757 | -| learning_rate | 0.0003 | -| loss | -0.000832 | -| n_updates | 137830 | -| policy_gradient_loss | -0.00258 | -| std | 0.0122 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13785 | -| time_elapsed | 73042 | -| total_timesteps | 1764480 | -| train/ | | -| approx_kl | 0.064271316 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.527 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 137840 | -| policy_gradient_loss | 0.00264 | -| std | 0.0122 | -| value_loss | 1.68e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13786 | -| time_elapsed | 73046 | -| total_timesteps | 1764608 | -| train/ | | -| approx_kl | 0.1926286 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 137850 | -| policy_gradient_loss | 0.00763 | -| std | 0.0122 | -| value_loss | 7.24e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13787 | -| time_elapsed | 73051 | -| total_timesteps | 1764736 | -| train/ | | -| approx_kl | 0.008641301 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0887 | -| learning_rate | 0.0003 | -| loss | -0.00032 | -| n_updates | 137860 | -| policy_gradient_loss | 0.000313 | -| std | 0.0122 | -| value_loss | 3.62e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13788 | -| time_elapsed | 73055 | -| total_timesteps | 1764864 | -| train/ | | -| approx_kl | 2.7897768e-06 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | 6.32e-05 | -| n_updates | 137870 | -| policy_gradient_loss | 0.00158 | -| std | 0.0122 | -| value_loss | 3.04e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 24 | -| iterations | 13789 | -| time_elapsed | 73059 | -| total_timesteps | 1764992 | -| train/ | | -| approx_kl | 0.00055244984 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 137880 | -| policy_gradient_loss | -0.00679 | -| std | 0.0122 | -| value_loss | 1.31e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13790 | -| time_elapsed | 73064 | -| total_timesteps | 1765120 | -| train/ | | -| approx_kl | 0.00043160887 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 137890 | -| policy_gradient_loss | 0.000154 | -| std | 0.0122 | -| value_loss | 8.96e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13791 | -| time_elapsed | 73075 | -| total_timesteps | 1765248 | -| train/ | | -| approx_kl | 0.07848355 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 137900 | -| policy_gradient_loss | -0.014 | -| std | 0.0122 | -| value_loss | 0.000415 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13792 | -| time_elapsed | 73080 | -| total_timesteps | 1765376 | -| train/ | | -| approx_kl | 0.05349221 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -3.72 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 137910 | -| policy_gradient_loss | 0.001 | -| std | 0.0122 | -| value_loss | 4.47e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13793 | -| time_elapsed | 73085 | -| total_timesteps | 1765504 | -| train/ | | -| approx_kl | 0.05574102 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -80.4 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 137920 | -| policy_gradient_loss | 0.00343 | -| std | 0.0122 | -| value_loss | 3.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13794 | -| time_elapsed | 73090 | -| total_timesteps | 1765632 | -| train/ | | -| approx_kl | 0.059799396 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -11.6 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 137930 | -| policy_gradient_loss | -0.0084 | -| std | 0.0122 | -| value_loss | 5.12e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13795 | -| time_elapsed | 73094 | -| total_timesteps | 1765760 | -| train/ | | -| approx_kl | 0.048495844 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -2.7 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 137940 | -| policy_gradient_loss | 0.0178 | -| std | 0.0122 | -| value_loss | 1.55e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 24 | -| iterations | 13796 | -| time_elapsed | 73099 | -| total_timesteps | 1765888 | -| train/ | | -| approx_kl | 0.06782383 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.521 | -| learning_rate | 0.0003 | -| loss | 0.0373 | -| n_updates | 137950 | -| policy_gradient_loss | 0.0103 | -| std | 0.0122 | -| value_loss | 8.24e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13797 | -| time_elapsed | 73105 | -| total_timesteps | 1766016 | -| train/ | | -| approx_kl | 0.000429858 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 137960 | -| policy_gradient_loss | -0.000672 | -| std | 0.0122 | -| value_loss | 6.64e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13798 | -| time_elapsed | 73116 | -| total_timesteps | 1766144 | -| train/ | | -| approx_kl | 0.048158206 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | 0.497 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 137970 | -| policy_gradient_loss | -0.016 | -| std | 0.0122 | -| value_loss | 0.00131 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13799 | -| time_elapsed | 73121 | -| total_timesteps | 1766272 | -| train/ | | -| approx_kl | 0.008537838 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | -0.00949 | -| n_updates | 137980 | -| policy_gradient_loss | 8.32e-05 | -| std | 0.0122 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13800 | -| time_elapsed | 73125 | -| total_timesteps | 1766400 | -| train/ | | -| approx_kl | 0.088822514 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -3.02 | -| learning_rate | 0.0003 | -| loss | -0.00851 | -| n_updates | 137990 | -| policy_gradient_loss | -0.00343 | -| std | 0.0122 | -| value_loss | 1.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13801 | -| time_elapsed | 73131 | -| total_timesteps | 1766528 | -| train/ | | -| approx_kl | 0.020659624 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.911 | -| learning_rate | 0.0003 | -| loss | -0.00967 | -| n_updates | 138000 | -| policy_gradient_loss | -0.00407 | -| std | 0.0122 | -| value_loss | 5.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13802 | -| time_elapsed | 73137 | -| total_timesteps | 1766656 | -| train/ | | -| approx_kl | 0.096706055 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 138010 | -| policy_gradient_loss | 0.0129 | -| std | 0.0122 | -| value_loss | 2.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13803 | -| time_elapsed | 73141 | -| total_timesteps | 1766784 | -| train/ | | -| approx_kl | 0.015933972 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 138020 | -| policy_gradient_loss | 0.00681 | -| std | 0.0122 | -| value_loss | 1.77e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 24 | -| iterations | 13804 | -| time_elapsed | 73146 | -| total_timesteps | 1766912 | -| train/ | | -| approx_kl | 0.03934308 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 138030 | -| policy_gradient_loss | 0.0103 | -| std | 0.0122 | -| value_loss | 1.19e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13805 | -| time_elapsed | 73151 | -| total_timesteps | 1767040 | -| train/ | | -| approx_kl | 0.10627747 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 138040 | -| policy_gradient_loss | 0.0826 | -| std | 0.0122 | -| value_loss | 9.29e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13806 | -| time_elapsed | 73164 | -| total_timesteps | 1767168 | -| train/ | | -| approx_kl | 0.015758937 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -9.03 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 138050 | -| policy_gradient_loss | -0.0102 | -| std | 0.0122 | -| value_loss | 0.00415 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13807 | -| time_elapsed | 73170 | -| total_timesteps | 1767296 | -| train/ | | -| approx_kl | 0.014909447 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.567 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 138060 | -| policy_gradient_loss | 0.00904 | -| std | 0.0122 | -| value_loss | 2.98e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13808 | -| time_elapsed | 73176 | -| total_timesteps | 1767424 | -| train/ | | -| approx_kl | 0.052860517 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -4.05 | -| learning_rate | 0.0003 | -| loss | -0.00506 | -| n_updates | 138070 | -| policy_gradient_loss | -0.00248 | -| std | 0.0122 | -| value_loss | 2.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13809 | -| time_elapsed | 73180 | -| total_timesteps | 1767552 | -| train/ | | -| approx_kl | 0.09617448 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.899 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 138080 | -| policy_gradient_loss | 0.041 | -| std | 0.0122 | -| value_loss | 8e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13810 | -| time_elapsed | 73186 | -| total_timesteps | 1767680 | -| train/ | | -| approx_kl | 0.049184814 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 138090 | -| policy_gradient_loss | 0.0445 | -| std | 0.0122 | -| value_loss | 5.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13811 | -| time_elapsed | 73191 | -| total_timesteps | 1767808 | -| train/ | | -| approx_kl | 0.009479004 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 138100 | -| policy_gradient_loss | 0.00339 | -| std | 0.0122 | -| value_loss | 4.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 24 | -| iterations | 13812 | -| time_elapsed | 73196 | -| total_timesteps | 1767936 | -| train/ | | -| approx_kl | 0.013915679 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.00915 | -| n_updates | 138110 | -| policy_gradient_loss | -0.00301 | -| std | 0.0122 | -| value_loss | 2.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13813 | -| time_elapsed | 73200 | -| total_timesteps | 1768064 | -| train/ | | -| approx_kl | 0.005437502 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 138120 | -| policy_gradient_loss | 0.00797 | -| std | 0.0122 | -| value_loss | 1.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13814 | -| time_elapsed | 73210 | -| total_timesteps | 1768192 | -| train/ | | -| approx_kl | 0.094630174 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | 0.616 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 138130 | -| policy_gradient_loss | -0.00425 | -| std | 0.0122 | -| value_loss | 0.000992 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13815 | -| time_elapsed | 73215 | -| total_timesteps | 1768320 | -| train/ | | -| approx_kl | 0.03941128 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 138140 | -| policy_gradient_loss | 0.0392 | -| std | 0.0121 | -| value_loss | 1.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13816 | -| time_elapsed | 73219 | -| total_timesteps | 1768448 | -| train/ | | -| approx_kl | 0.008771593 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.495 | -| learning_rate | 0.0003 | -| loss | 0.00169 | -| n_updates | 138150 | -| policy_gradient_loss | 0.00823 | -| std | 0.0121 | -| value_loss | 4.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13817 | -| time_elapsed | 73224 | -| total_timesteps | 1768576 | -| train/ | | -| approx_kl | 0.017646264 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 138160 | -| policy_gradient_loss | 0.00246 | -| std | 0.0121 | -| value_loss | 2.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13818 | -| time_elapsed | 73229 | -| total_timesteps | 1768704 | -| train/ | | -| approx_kl | 0.06403112 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0752 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 138170 | -| policy_gradient_loss | 0.0112 | -| std | 0.0121 | -| value_loss | 1.57e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13819 | -| time_elapsed | 73233 | -| total_timesteps | 1768832 | -| train/ | | -| approx_kl | 0.02094219 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 138180 | -| policy_gradient_loss | 0.00422 | -| std | 0.0121 | -| value_loss | 9.87e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 24 | -| iterations | 13820 | -| time_elapsed | 73238 | -| total_timesteps | 1768960 | -| train/ | | -| approx_kl | 0.11664356 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 138190 | -| policy_gradient_loss | 0.00648 | -| std | 0.0121 | -| value_loss | 7.79e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13821 | -| time_elapsed | 73244 | -| total_timesteps | 1769088 | -| train/ | | -| approx_kl | 1.0489952e-05 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.000275 | -| n_updates | 138200 | -| policy_gradient_loss | -0.00162 | -| std | 0.0121 | -| value_loss | 5.19e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13822 | -| time_elapsed | 73255 | -| total_timesteps | 1769216 | -| train/ | | -| approx_kl | 0.02573516 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 2.99 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 138210 | -| policy_gradient_loss | -0.00883 | -| std | 0.0121 | -| value_loss | 0.00189 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13823 | -| time_elapsed | 73259 | -| total_timesteps | 1769344 | -| train/ | | -| approx_kl | 0.035666525 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.00152 | -| learning_rate | 0.0003 | -| loss | 0.00906 | -| n_updates | 138220 | -| policy_gradient_loss | -0.00106 | -| std | 0.0121 | -| value_loss | 3e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13824 | -| time_elapsed | 73264 | -| total_timesteps | 1769472 | -| train/ | | -| approx_kl | 6.8033114e-06 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | -0.000494 | -| n_updates | 138230 | -| policy_gradient_loss | -0.00745 | -| std | 0.0121 | -| value_loss | 4.31e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13825 | -| time_elapsed | 73269 | -| total_timesteps | 1769600 | -| train/ | | -| approx_kl | 0.00035808142 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0849 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 138240 | -| policy_gradient_loss | -0.00946 | -| std | 0.0121 | -| value_loss | 7.29e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13826 | -| time_elapsed | 73274 | -| total_timesteps | 1769728 | -| train/ | | -| approx_kl | 4.459964e-05 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -63.1 | -| learning_rate | 0.0003 | -| loss | 0.000918 | -| n_updates | 138250 | -| policy_gradient_loss | 0.00137 | -| std | 0.0121 | -| value_loss | 8.96e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13827 | -| time_elapsed | 73279 | -| total_timesteps | 1769856 | -| train/ | | -| approx_kl | 0.0025194227 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 138260 | -| policy_gradient_loss | 0.0272 | -| std | 0.012 | -| value_loss | 3.13e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 24 | -| iterations | 13828 | -| time_elapsed | 73284 | -| total_timesteps | 1769984 | -| train/ | | -| approx_kl | 0.0021378878 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.00981 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 138270 | -| policy_gradient_loss | 0.000575 | -| std | 0.0121 | -| value_loss | 1.59e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13829 | -| time_elapsed | 73287 | -| total_timesteps | 1770112 | -| train/ | | -| approx_kl | 0.039705012 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 138280 | -| policy_gradient_loss | 0.000742 | -| std | 0.0121 | -| value_loss | 9.43e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13830 | -| time_elapsed | 73298 | -| total_timesteps | 1770240 | -| train/ | | -| approx_kl | 0.09714354 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | 0.856 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 138290 | -| policy_gradient_loss | -0.00642 | -| std | 0.012 | -| value_loss | 0.00266 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13831 | -| time_elapsed | 73303 | -| total_timesteps | 1770368 | -| train/ | | -| approx_kl | 0.011145954 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 138300 | -| policy_gradient_loss | 0.0185 | -| std | 0.012 | -| value_loss | 5.28e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13832 | -| time_elapsed | 73307 | -| total_timesteps | 1770496 | -| train/ | | -| approx_kl | 0.05924308 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 138310 | -| policy_gradient_loss | 0.0169 | -| std | 0.012 | -| value_loss | 4.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13833 | -| time_elapsed | 73311 | -| total_timesteps | 1770624 | -| train/ | | -| approx_kl | 0.017044712 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 138320 | -| policy_gradient_loss | 0.0308 | -| std | 0.012 | -| value_loss | 3.79e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13834 | -| time_elapsed | 73316 | -| total_timesteps | 1770752 | -| train/ | | -| approx_kl | 0.005061154 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 138330 | -| policy_gradient_loss | 0.00547 | -| std | 0.012 | -| value_loss | 2.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 24 | -| iterations | 13835 | -| time_elapsed | 73320 | -| total_timesteps | 1770880 | -| train/ | | -| approx_kl | 0.01195625 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 138340 | -| policy_gradient_loss | 0.0273 | -| std | 0.012 | -| value_loss | 3.22e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13836 | -| time_elapsed | 73327 | -| total_timesteps | 1771008 | -| train/ | | -| approx_kl | 0.016062543 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.00805 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 138350 | -| policy_gradient_loss | 0.00167 | -| std | 0.012 | -| value_loss | 1.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13837 | -| time_elapsed | 73340 | -| total_timesteps | 1771136 | -| train/ | | -| approx_kl | 0.020343754 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 138360 | -| policy_gradient_loss | -0.0134 | -| std | 0.012 | -| value_loss | 0.000383 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13838 | -| time_elapsed | 73344 | -| total_timesteps | 1771264 | -| train/ | | -| approx_kl | 0.040970266 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | 0.0194 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 138370 | -| policy_gradient_loss | -0.00609 | -| std | 0.012 | -| value_loss | 4.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13839 | -| time_elapsed | 73349 | -| total_timesteps | 1771392 | -| train/ | | -| approx_kl | 0.074370585 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 138380 | -| policy_gradient_loss | 0.0174 | -| std | 0.012 | -| value_loss | 6.22e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13840 | -| time_elapsed | 73353 | -| total_timesteps | 1771520 | -| train/ | | -| approx_kl | 0.00049099047 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.000429 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 138390 | -| policy_gradient_loss | -0.00896 | -| std | 0.012 | -| value_loss | 1.33e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13841 | -| time_elapsed | 73357 | -| total_timesteps | 1771648 | -| train/ | | -| approx_kl | 0.02282702 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.00862 | -| learning_rate | 0.0003 | -| loss | -0.00913 | -| n_updates | 138400 | -| policy_gradient_loss | 0.0203 | -| std | 0.012 | -| value_loss | 9.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13842 | -| time_elapsed | 73362 | -| total_timesteps | 1771776 | -| train/ | | -| approx_kl | 0.066571906 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.00988 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 138410 | -| policy_gradient_loss | 0.00955 | -| std | 0.012 | -| value_loss | 6.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 24 | -| iterations | 13843 | -| time_elapsed | 73366 | -| total_timesteps | 1771904 | -| train/ | | -| approx_kl | 0.016611375 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 138420 | -| policy_gradient_loss | 0.0172 | -| std | 0.012 | -| value_loss | 3.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13844 | -| time_elapsed | 73371 | -| total_timesteps | 1772032 | -| train/ | | -| approx_kl | 0.036984216 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.00558 | -| n_updates | 138430 | -| policy_gradient_loss | -0.00124 | -| std | 0.012 | -| value_loss | 2.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13845 | -| time_elapsed | 73382 | -| total_timesteps | 1772160 | -| train/ | | -| approx_kl | 0.005165685 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 138440 | -| policy_gradient_loss | -0.0148 | -| std | 0.012 | -| value_loss | 3.29e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13846 | -| time_elapsed | 73387 | -| total_timesteps | 1772288 | -| train/ | | -| approx_kl | 0.0033237552 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 138450 | -| policy_gradient_loss | 0.00218 | -| std | 0.012 | -| value_loss | 2.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13847 | -| time_elapsed | 73392 | -| total_timesteps | 1772416 | -| train/ | | -| approx_kl | 0.025593402 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.553 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 138460 | -| policy_gradient_loss | 0.0206 | -| std | 0.012 | -| value_loss | 1.44e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13848 | -| time_elapsed | 73397 | -| total_timesteps | 1772544 | -| train/ | | -| approx_kl | 0.06030645 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 138470 | -| policy_gradient_loss | 0.0102 | -| std | 0.012 | -| value_loss | 2.47e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13849 | -| time_elapsed | 73402 | -| total_timesteps | 1772672 | -| train/ | | -| approx_kl | 0.02128394 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0063 | -| learning_rate | 0.0003 | -| loss | 0.00652 | -| n_updates | 138480 | -| policy_gradient_loss | 0.0306 | -| std | 0.012 | -| value_loss | 4.66e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13850 | -| time_elapsed | 73407 | -| total_timesteps | 1772800 | -| train/ | | -| approx_kl | 0.04159021 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.00526 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 138490 | -| policy_gradient_loss | 0.000203 | -| std | 0.012 | -| value_loss | 2.26e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13851 | -| time_elapsed | 73413 | -| total_timesteps | 1772928 | -| train/ | | -| approx_kl | 0.0031644036 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 138500 | -| policy_gradient_loss | 0.0354 | -| std | 0.012 | -| value_loss | 9.54e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13852 | -| time_elapsed | 73418 | -| total_timesteps | 1773056 | -| train/ | | -| approx_kl | 0.030633798 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 138510 | -| policy_gradient_loss | 0.0518 | -| std | 0.012 | -| value_loss | 9.24e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13853 | -| time_elapsed | 73428 | -| total_timesteps | 1773184 | -| train/ | | -| approx_kl | 0.030988595 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -8.21 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 138520 | -| policy_gradient_loss | -0.0141 | -| std | 0.012 | -| value_loss | 0.00399 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13854 | -| time_elapsed | 73434 | -| total_timesteps | 1773312 | -| train/ | | -| approx_kl | 0.2785629 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3 | -| explained_variance | -3.17 | -| learning_rate | 0.0003 | -| loss | 0.0927 | -| n_updates | 138530 | -| policy_gradient_loss | 0.0691 | -| std | 0.012 | -| value_loss | 4.45e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13855 | -| time_elapsed | 73438 | -| total_timesteps | 1773440 | -| train/ | | -| approx_kl | 0.0031112814 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -5.06 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 138540 | -| policy_gradient_loss | 0.00445 | -| std | 0.012 | -| value_loss | 2.59e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13856 | -| time_elapsed | 73442 | -| total_timesteps | 1773568 | -| train/ | | -| approx_kl | 0.0173158 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 138550 | -| policy_gradient_loss | -0.00992 | -| std | 0.012 | -| value_loss | 1.18e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13857 | -| time_elapsed | 73446 | -| total_timesteps | 1773696 | -| train/ | | -| approx_kl | 0.029251412 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.33 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 138560 | -| policy_gradient_loss | 0.033 | -| std | 0.012 | -| value_loss | 4.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13858 | -| time_elapsed | 73451 | -| total_timesteps | 1773824 | -| train/ | | -| approx_kl | 0.006461876 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 138570 | -| policy_gradient_loss | 0.0028 | -| std | 0.012 | -| value_loss | 3.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 24 | -| iterations | 13859 | -| time_elapsed | 73456 | -| total_timesteps | 1773952 | -| train/ | | -| approx_kl | 0.20132884 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 138580 | -| policy_gradient_loss | 0.0867 | -| std | 0.012 | -| value_loss | 1.55e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13860 | -| time_elapsed | 73460 | -| total_timesteps | 1774080 | -| train/ | | -| approx_kl | 0.0076815817 | -| clip_fraction | 0.0422 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.00599 | -| n_updates | 138590 | -| policy_gradient_loss | -0.00364 | -| std | 0.012 | -| value_loss | 1.18e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13861 | -| time_elapsed | 73469 | -| total_timesteps | 1774208 | -| train/ | | -| approx_kl | 0.04182904 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.383 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 138600 | -| policy_gradient_loss | -0.0136 | -| std | 0.012 | -| value_loss | 0.00124 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13862 | -| time_elapsed | 73478 | -| total_timesteps | 1774336 | -| train/ | | -| approx_kl | 0.027110023 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -6.49 | -| learning_rate | 0.0003 | -| loss | -0.0194 | -| n_updates | 138610 | -| policy_gradient_loss | -0.0102 | -| std | 0.012 | -| value_loss | 1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13863 | -| time_elapsed | 73484 | -| total_timesteps | 1774464 | -| train/ | | -| approx_kl | 0.003987731 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -17.9 | -| learning_rate | 0.0003 | -| loss | -0.000599 | -| n_updates | 138620 | -| policy_gradient_loss | 0.00265 | -| std | 0.012 | -| value_loss | 3.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13864 | -| time_elapsed | 73490 | -| total_timesteps | 1774592 | -| train/ | | -| approx_kl | 0.013059806 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -1.88 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 138630 | -| policy_gradient_loss | -0.00503 | -| std | 0.0119 | -| value_loss | 5.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13865 | -| time_elapsed | 73494 | -| total_timesteps | 1774720 | -| train/ | | -| approx_kl | 0.028998531 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0413 | -| n_updates | 138640 | -| policy_gradient_loss | 0.0437 | -| std | 0.0119 | -| value_loss | 6.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13866 | -| time_elapsed | 73499 | -| total_timesteps | 1774848 | -| train/ | | -| approx_kl | 0.034249164 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.00483 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 138650 | -| policy_gradient_loss | 0.0378 | -| std | 0.0119 | -| value_loss | 1.15e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 24 | -| iterations | 13867 | -| time_elapsed | 73505 | -| total_timesteps | 1774976 | -| train/ | | -| approx_kl | 0.04068061 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.00259 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 138660 | -| policy_gradient_loss | 0.0601 | -| std | 0.0119 | -| value_loss | 1.08e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13868 | -| time_elapsed | 73509 | -| total_timesteps | 1775104 | -| train/ | | -| approx_kl | 0.04281482 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.00314 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 138670 | -| policy_gradient_loss | 0.0539 | -| std | 0.0119 | -| value_loss | 1.03e-08 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13869 | -| time_elapsed | 73520 | -| total_timesteps | 1775232 | -| train/ | | -| approx_kl | 0.048529 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.248 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 138680 | -| policy_gradient_loss | -0.00976 | -| std | 0.0119 | -| value_loss | 0.00127 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13870 | -| time_elapsed | 73525 | -| total_timesteps | 1775360 | -| train/ | | -| approx_kl | 0.06299498 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -3.04 | -| learning_rate | 0.0003 | -| loss | 0.0539 | -| n_updates | 138690 | -| policy_gradient_loss | 0.0369 | -| std | 0.0119 | -| value_loss | 9.61e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13871 | -| time_elapsed | 73528 | -| total_timesteps | 1775488 | -| train/ | | -| approx_kl | 0.0072807968 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 138700 | -| policy_gradient_loss | -0.0186 | -| std | 0.0119 | -| value_loss | 5.52e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13872 | -| time_elapsed | 73533 | -| total_timesteps | 1775616 | -| train/ | | -| approx_kl | 0.03163932 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 138710 | -| policy_gradient_loss | -0.0187 | -| std | 0.0119 | -| value_loss | 2.91e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13873 | -| time_elapsed | 73538 | -| total_timesteps | 1775744 | -| train/ | | -| approx_kl | 0.050646946 | -| clip_fraction | 0.589 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.0549 | -| n_updates | 138720 | -| policy_gradient_loss | 0.0404 | -| std | 0.0119 | -| value_loss | 1.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13874 | -| time_elapsed | 73542 | -| total_timesteps | 1775872 | -| train/ | | -| approx_kl | 0.009683978 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 138730 | -| policy_gradient_loss | 0.00267 | -| std | 0.0119 | -| value_loss | 4.04e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13875 | -| time_elapsed | 73547 | -| total_timesteps | 1776000 | -| train/ | | -| approx_kl | 0.00015175063 | -| clip_fraction | 0.0688 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.000478 | -| n_updates | 138740 | -| policy_gradient_loss | -0.000139 | -| std | 0.0119 | -| value_loss | 1.92e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13876 | -| time_elapsed | 73552 | -| total_timesteps | 1776128 | -| train/ | | -| approx_kl | 0.016799688 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.00352 | -| learning_rate | 0.0003 | -| loss | 0.0045 | -| n_updates | 138750 | -| policy_gradient_loss | 0.00751 | -| std | 0.0119 | -| value_loss | 1.46e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13877 | -| time_elapsed | 73562 | -| total_timesteps | 1776256 | -| train/ | | -| approx_kl | 0.03021699 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 138760 | -| policy_gradient_loss | -0.0129 | -| std | 0.0119 | -| value_loss | 5.13e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13878 | -| time_elapsed | 73566 | -| total_timesteps | 1776384 | -| train/ | | -| approx_kl | 0.042145163 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.00352 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 138770 | -| policy_gradient_loss | 0.0129 | -| std | 0.0119 | -| value_loss | 1.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13879 | -| time_elapsed | 73569 | -| total_timesteps | 1776512 | -| train/ | | -| approx_kl | 0.048508525 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.00695 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 138780 | -| policy_gradient_loss | 0.00914 | -| std | 0.0119 | -| value_loss | 2.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13880 | -| time_elapsed | 73573 | -| total_timesteps | 1776640 | -| train/ | | -| approx_kl | 0.0097031165 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.00826 | -| n_updates | 138790 | -| policy_gradient_loss | -0.000612 | -| std | 0.0119 | -| value_loss | 1.35e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13881 | -| time_elapsed | 73577 | -| total_timesteps | 1776768 | -| train/ | | -| approx_kl | 0.037245605 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 138800 | -| policy_gradient_loss | 0.0349 | -| std | 0.0119 | -| value_loss | 2.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 24 | -| iterations | 13882 | -| time_elapsed | 73582 | -| total_timesteps | 1776896 | -| train/ | | -| approx_kl | 0.014131462 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 138810 | -| policy_gradient_loss | 0.00227 | -| std | 0.0119 | -| value_loss | 2.47e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13883 | -| time_elapsed | 73586 | -| total_timesteps | 1777024 | -| train/ | | -| approx_kl | 0.0023940327 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 138820 | -| policy_gradient_loss | 0.00662 | -| std | 0.0119 | -| value_loss | 2.84e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13884 | -| time_elapsed | 73597 | -| total_timesteps | 1777152 | -| train/ | | -| approx_kl | 0.4849092 | -| clip_fraction | 0.524 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | 0.00449 | -| n_updates | 138830 | -| policy_gradient_loss | -0.00118 | -| std | 0.0119 | -| value_loss | 0.000217 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13885 | -| time_elapsed | 73603 | -| total_timesteps | 1777280 | -| train/ | | -| approx_kl | 0.04608034 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 138840 | -| policy_gradient_loss | 0.00576 | -| std | 0.0119 | -| value_loss | 3.22e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13886 | -| time_elapsed | 73610 | -| total_timesteps | 1777408 | -| train/ | | -| approx_kl | 1.6877428e-05 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0719 | -| learning_rate | 0.0003 | -| loss | -0.000507 | -| n_updates | 138850 | -| policy_gradient_loss | 0.00553 | -| std | 0.0119 | -| value_loss | 9.98e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13887 | -| time_elapsed | 73613 | -| total_timesteps | 1777536 | -| train/ | | -| approx_kl | 2.0470005e-05 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | 0.00299 | -| learning_rate | 0.0003 | -| loss | 0.000363 | -| n_updates | 138860 | -| policy_gradient_loss | -0.000266 | -| std | 0.0118 | -| value_loss | 2.35e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13888 | -| time_elapsed | 73617 | -| total_timesteps | 1777664 | -| train/ | | -| approx_kl | 0.04933718 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 138870 | -| policy_gradient_loss | 0.0522 | -| std | 0.0118 | -| value_loss | 5.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13889 | -| time_elapsed | 73621 | -| total_timesteps | 1777792 | -| train/ | | -| approx_kl | 0.044074975 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | 0.0444 | -| n_updates | 138880 | -| policy_gradient_loss | 0.0528 | -| std | 0.0118 | -| value_loss | 2.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 24 | -| iterations | 13890 | -| time_elapsed | 73626 | -| total_timesteps | 1777920 | -| train/ | | -| approx_kl | 0.00840757 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 138890 | -| policy_gradient_loss | 0.00491 | -| std | 0.0118 | -| value_loss | 1.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13891 | -| time_elapsed | 73630 | -| total_timesteps | 1778048 | -| train/ | | -| approx_kl | 0.017878814 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 138900 | -| policy_gradient_loss | 0.0113 | -| std | 0.0118 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13892 | -| time_elapsed | 73639 | -| total_timesteps | 1778176 | -| train/ | | -| approx_kl | 0.012220914 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 138910 | -| policy_gradient_loss | -0.0137 | -| std | 0.0118 | -| value_loss | 0.00398 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13893 | -| time_elapsed | 73643 | -| total_timesteps | 1778304 | -| train/ | | -| approx_kl | 0.102367125 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -10.7 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 138920 | -| policy_gradient_loss | -0.000253 | -| std | 0.0118 | -| value_loss | 5.25e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13894 | -| time_elapsed | 73648 | -| total_timesteps | 1778432 | -| train/ | | -| approx_kl | 0.0041415696 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -4.79 | -| learning_rate | 0.0003 | -| loss | 0.00488 | -| n_updates | 138930 | -| policy_gradient_loss | -0.000702 | -| std | 0.0118 | -| value_loss | 7.39e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13895 | -| time_elapsed | 73654 | -| total_timesteps | 1778560 | -| train/ | | -| approx_kl | 0.008001651 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | 0.00733 | -| n_updates | 138940 | -| policy_gradient_loss | 0.00732 | -| std | 0.0118 | -| value_loss | 2.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13896 | -| time_elapsed | 73659 | -| total_timesteps | 1778688 | -| train/ | | -| approx_kl | 0.07362792 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.0318 | -| n_updates | 138950 | -| policy_gradient_loss | 0.0123 | -| std | 0.0119 | -| value_loss | 3.7e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13897 | -| time_elapsed | 73665 | -| total_timesteps | 1778816 | -| train/ | | -| approx_kl | 0.0032187612 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 138960 | -| policy_gradient_loss | 0.0287 | -| std | 0.0119 | -| value_loss | 2.5e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 24 | -| iterations | 13898 | -| time_elapsed | 73669 | -| total_timesteps | 1778944 | -| train/ | | -| approx_kl | 0.032330457 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 138970 | -| policy_gradient_loss | 0.0998 | -| std | 0.0119 | -| value_loss | 2.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13899 | -| time_elapsed | 73675 | -| total_timesteps | 1779072 | -| train/ | | -| approx_kl | 0.022295207 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0831 | -| learning_rate | 0.0003 | -| loss | -0.00851 | -| n_updates | 138980 | -| policy_gradient_loss | 0.00111 | -| std | 0.0119 | -| value_loss | 5.59e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13900 | -| time_elapsed | 73684 | -| total_timesteps | 1779200 | -| train/ | | -| approx_kl | 0.12548012 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 138990 | -| policy_gradient_loss | -0.016 | -| std | 0.012 | -| value_loss | 8.28e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13901 | -| time_elapsed | 73689 | -| total_timesteps | 1779328 | -| train/ | | -| approx_kl | 0.0041948296 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 139000 | -| policy_gradient_loss | 0.000654 | -| std | 0.012 | -| value_loss | 1.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13902 | -| time_elapsed | 73693 | -| total_timesteps | 1779456 | -| train/ | | -| approx_kl | 0.0010590339 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.00237 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 139010 | -| policy_gradient_loss | 0.000914 | -| std | 0.0119 | -| value_loss | 1.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13903 | -| time_elapsed | 73698 | -| total_timesteps | 1779584 | -| train/ | | -| approx_kl | 0.018843144 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.00264 | -| n_updates | 139020 | -| policy_gradient_loss | 0.00713 | -| std | 0.0119 | -| value_loss | 5.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13904 | -| time_elapsed | 73704 | -| total_timesteps | 1779712 | -| train/ | | -| approx_kl | 0.016243726 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.00386 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 139030 | -| policy_gradient_loss | 0.0027 | -| std | 0.0119 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13905 | -| time_elapsed | 73709 | -| total_timesteps | 1779840 | -| train/ | | -| approx_kl | 0.058394317 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | 0.00961 | -| n_updates | 139040 | -| policy_gradient_loss | -0.00361 | -| std | 0.0119 | -| value_loss | 4.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 13906 | -| time_elapsed | 73715 | -| total_timesteps | 1779968 | -| train/ | | -| approx_kl | 0.10085791 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 139050 | -| policy_gradient_loss | 0.000124 | -| std | 0.0119 | -| value_loss | 2.39e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13907 | -| time_elapsed | 73719 | -| total_timesteps | 1780096 | -| train/ | | -| approx_kl | 0.07252269 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 139060 | -| policy_gradient_loss | -0.00698 | -| std | 0.0119 | -| value_loss | 1.96e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13908 | -| time_elapsed | 73728 | -| total_timesteps | 1780224 | -| train/ | | -| approx_kl | 0.007429686 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 139070 | -| policy_gradient_loss | -0.0195 | -| std | 0.0119 | -| value_loss | 2.85e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13909 | -| time_elapsed | 73733 | -| total_timesteps | 1780352 | -| train/ | | -| approx_kl | 9.587733e-05 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.00729 | -| learning_rate | 0.0003 | -| loss | 0.000158 | -| n_updates | 139080 | -| policy_gradient_loss | 0.0023 | -| std | 0.0119 | -| value_loss | 3.92e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13910 | -| time_elapsed | 73738 | -| total_timesteps | 1780480 | -| train/ | | -| approx_kl | 0.017525502 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.00348 | -| n_updates | 139090 | -| policy_gradient_loss | 0.0201 | -| std | 0.0119 | -| value_loss | 1.24e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13911 | -| time_elapsed | 73743 | -| total_timesteps | 1780608 | -| train/ | | -| approx_kl | 0.06390843 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 139100 | -| policy_gradient_loss | 0.0109 | -| std | 0.0119 | -| value_loss | 8.28e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13912 | -| time_elapsed | 73748 | -| total_timesteps | 1780736 | -| train/ | | -| approx_kl | 0.00035017496 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | -0.000476 | -| n_updates | 139110 | -| policy_gradient_loss | 0.00293 | -| std | 0.0119 | -| value_loss | 5.2e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13913 | -| time_elapsed | 73753 | -| total_timesteps | 1780864 | -| train/ | | -| approx_kl | 0.021154154 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.0272 | -| n_updates | 139120 | -| policy_gradient_loss | 0.0191 | -| std | 0.0119 | -| value_loss | 6.79e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 13914 | -| time_elapsed | 73758 | -| total_timesteps | 1780992 | -| train/ | | -| approx_kl | 0.036975347 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.00426 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 139130 | -| policy_gradient_loss | 0.0107 | -| std | 0.0119 | -| value_loss | 9.62e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13915 | -| time_elapsed | 73763 | -| total_timesteps | 1781120 | -| train/ | | -| approx_kl | 0.021495022 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.0026 | -| learning_rate | 0.0003 | -| loss | -0.00748 | -| n_updates | 139140 | -| policy_gradient_loss | 0.0149 | -| std | 0.0119 | -| value_loss | 5.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13916 | -| time_elapsed | 73775 | -| total_timesteps | 1781248 | -| train/ | | -| approx_kl | 0.054682806 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 139150 | -| policy_gradient_loss | -0.0168 | -| std | 0.0119 | -| value_loss | 0.000477 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13917 | -| time_elapsed | 73779 | -| total_timesteps | 1781376 | -| train/ | | -| approx_kl | 0.014597343 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -59.3 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 139160 | -| policy_gradient_loss | 0.00672 | -| std | 0.0119 | -| value_loss | 6.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13918 | -| time_elapsed | 73784 | -| total_timesteps | 1781504 | -| train/ | | -| approx_kl | 0.062843814 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -52.6 | -| learning_rate | 0.0003 | -| loss | -0.000524 | -| n_updates | 139170 | -| policy_gradient_loss | -0.000902 | -| std | 0.0119 | -| value_loss | 1.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13919 | -| time_elapsed | 73788 | -| total_timesteps | 1781632 | -| train/ | | -| approx_kl | 0.18529244 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -56.4 | -| learning_rate | 0.0003 | -| loss | 0.00418 | -| n_updates | 139180 | -| policy_gradient_loss | -0.00259 | -| std | 0.0119 | -| value_loss | 1.54e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13920 | -| time_elapsed | 73793 | -| total_timesteps | 1781760 | -| train/ | | -| approx_kl | 0.011160223 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -3.32 | -| learning_rate | 0.0003 | -| loss | 0.00069 | -| n_updates | 139190 | -| policy_gradient_loss | 0.0199 | -| std | 0.0119 | -| value_loss | 6.67e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 13921 | -| time_elapsed | 73797 | -| total_timesteps | 1781888 | -| train/ | | -| approx_kl | 0.060005337 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -1.49 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 139200 | -| policy_gradient_loss | 0.00754 | -| std | 0.0119 | -| value_loss | 2.67e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13922 | -| time_elapsed | 73802 | -| total_timesteps | 1782016 | -| train/ | | -| approx_kl | 0.10170651 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | 0.0589 | -| n_updates | 139210 | -| policy_gradient_loss | 0.0452 | -| std | 0.0119 | -| value_loss | 1.05e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13923 | -| time_elapsed | 73814 | -| total_timesteps | 1782144 | -| train/ | | -| approx_kl | 0.0011812062 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 139220 | -| policy_gradient_loss | -0.00239 | -| std | 0.0119 | -| value_loss | 0.00126 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13924 | -| time_elapsed | 73818 | -| total_timesteps | 1782272 | -| train/ | | -| approx_kl | 0.011162533 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | 0.0042 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 139230 | -| policy_gradient_loss | 0.0101 | -| std | 0.0119 | -| value_loss | 3.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13925 | -| time_elapsed | 73822 | -| total_timesteps | 1782400 | -| train/ | | -| approx_kl | 0.0010816301 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 139240 | -| policy_gradient_loss | 0.00383 | -| std | 0.0119 | -| value_loss | 4.26e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13926 | -| time_elapsed | 73826 | -| total_timesteps | 1782528 | -| train/ | | -| approx_kl | 0.029909797 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | 0.000377 | -| n_updates | 139250 | -| policy_gradient_loss | -0.00406 | -| std | 0.0119 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13927 | -| time_elapsed | 73831 | -| total_timesteps | 1782656 | -| train/ | | -| approx_kl | 0.008250429 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 139260 | -| policy_gradient_loss | -0.000435 | -| std | 0.0119 | -| value_loss | 1.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13928 | -| time_elapsed | 73836 | -| total_timesteps | 1782784 | -| train/ | | -| approx_kl | 0.014853641 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.00768 | -| n_updates | 139270 | -| policy_gradient_loss | 0.00321 | -| std | 0.0119 | -| value_loss | 8.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 24 | -| iterations | 13929 | -| time_elapsed | 73841 | -| total_timesteps | 1782912 | -| train/ | | -| approx_kl | 0.015391102 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 139280 | -| policy_gradient_loss | -0.00247 | -| std | 0.0119 | -| value_loss | 6.71e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13930 | -| time_elapsed | 73847 | -| total_timesteps | 1783040 | -| train/ | | -| approx_kl | 3.592763e-05 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.000545 | -| n_updates | 139290 | -| policy_gradient_loss | 0.000936 | -| std | 0.0119 | -| value_loss | 3.71e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13931 | -| time_elapsed | 73858 | -| total_timesteps | 1783168 | -| train/ | | -| approx_kl | 0.1540856 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 139300 | -| policy_gradient_loss | -0.0145 | -| std | 0.0119 | -| value_loss | 0.000311 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13932 | -| time_elapsed | 73864 | -| total_timesteps | 1783296 | -| train/ | | -| approx_kl | 0.026559735 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -2.31 | -| learning_rate | 0.0003 | -| loss | -0.000282 | -| n_updates | 139310 | -| policy_gradient_loss | 0.00316 | -| std | 0.0119 | -| value_loss | 1.56e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13933 | -| time_elapsed | 73869 | -| total_timesteps | 1783424 | -| train/ | | -| approx_kl | 0.07362204 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -9 | -| learning_rate | 0.0003 | -| loss | 0.00291 | -| n_updates | 139320 | -| policy_gradient_loss | 0.00622 | -| std | 0.0119 | -| value_loss | 3.47e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13934 | -| time_elapsed | 73874 | -| total_timesteps | 1783552 | -| train/ | | -| approx_kl | 0.03244681 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 139330 | -| policy_gradient_loss | 0.00358 | -| std | 0.0119 | -| value_loss | 9.88e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13935 | -| time_elapsed | 73879 | -| total_timesteps | 1783680 | -| train/ | | -| approx_kl | 0.012836006 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 139340 | -| policy_gradient_loss | 0.00235 | -| std | 0.0119 | -| value_loss | 5.16e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13936 | -| time_elapsed | 73884 | -| total_timesteps | 1783808 | -| train/ | | -| approx_kl | 0.0354658 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.00526 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 139350 | -| policy_gradient_loss | 0.0158 | -| std | 0.0119 | -| value_loss | 3e-10 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 13937 | -| time_elapsed | 73889 | -| total_timesteps | 1783936 | -| train/ | | -| approx_kl | 0.04681422 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.000542 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 139360 | -| policy_gradient_loss | 0.0148 | -| std | 0.0119 | -| value_loss | 3.64e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13938 | -| time_elapsed | 73895 | -| total_timesteps | 1784064 | -| train/ | | -| approx_kl | 0.08308144 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.0511 | -| n_updates | 139370 | -| policy_gradient_loss | 0.0202 | -| std | 0.0119 | -| value_loss | 4.67e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13939 | -| time_elapsed | 73903 | -| total_timesteps | 1784192 | -| train/ | | -| approx_kl | 0.0041687903 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.01 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 139380 | -| policy_gradient_loss | -0.0104 | -| std | 0.0119 | -| value_loss | 0.00196 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13940 | -| time_elapsed | 73907 | -| total_timesteps | 1784320 | -| train/ | | -| approx_kl | 0.010717585 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.404 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 139390 | -| policy_gradient_loss | 0.0438 | -| std | 0.0119 | -| value_loss | 2.6e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13941 | -| time_elapsed | 73912 | -| total_timesteps | 1784448 | -| train/ | | -| approx_kl | 1.5855767e-06 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | -4.25e-06 | -| n_updates | 139400 | -| policy_gradient_loss | 0.0199 | -| std | 0.0119 | -| value_loss | 6.7e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13942 | -| time_elapsed | 73916 | -| total_timesteps | 1784576 | -| train/ | | -| approx_kl | 0.103107125 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | 0.0438 | -| n_updates | 139410 | -| policy_gradient_loss | 0.00823 | -| std | 0.0118 | -| value_loss | 2.02e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13943 | -| time_elapsed | 73922 | -| total_timesteps | 1784704 | -| train/ | | -| approx_kl | 0.0038168333 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | 0.000217 | -| n_updates | 139420 | -| policy_gradient_loss | 0.00985 | -| std | 0.0118 | -| value_loss | 2.59e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13944 | -| time_elapsed | 73927 | -| total_timesteps | 1784832 | -| train/ | | -| approx_kl | 0.08954671 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | 0.0821 | -| n_updates | 139430 | -| policy_gradient_loss | 0.0514 | -| std | 0.0118 | -| value_loss | 7.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13945 | -| time_elapsed | 73932 | -| total_timesteps | 1784960 | -| train/ | | -| approx_kl | 0.042594332 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 139440 | -| policy_gradient_loss | 0.0371 | -| std | 0.0118 | -| value_loss | 9.65e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13946 | -| time_elapsed | 73937 | -| total_timesteps | 1785088 | -| train/ | | -| approx_kl | 0.04893022 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.0466 | -| n_updates | 139450 | -| policy_gradient_loss | 0.0537 | -| std | 0.0118 | -| value_loss | 7.46e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13947 | -| time_elapsed | 73947 | -| total_timesteps | 1785216 | -| train/ | | -| approx_kl | 0.07107306 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | 0.774 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 139460 | -| policy_gradient_loss | -0.0132 | -| std | 0.0118 | -| value_loss | 0.000698 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13948 | -| time_elapsed | 73951 | -| total_timesteps | 1785344 | -| train/ | | -| approx_kl | 0.02866817 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -7.56 | -| learning_rate | 0.0003 | -| loss | -0.000851 | -| n_updates | 139470 | -| policy_gradient_loss | -0.00107 | -| std | 0.0118 | -| value_loss | 2.43e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13949 | -| time_elapsed | 73955 | -| total_timesteps | 1785472 | -| train/ | | -| approx_kl | 3.943406e-05 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -70 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 139480 | -| policy_gradient_loss | -0.0081 | -| std | 0.0118 | -| value_loss | 1.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13950 | -| time_elapsed | 73959 | -| total_timesteps | 1785600 | -| train/ | | -| approx_kl | 0.011719263 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -48.6 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 139490 | -| policy_gradient_loss | -0.013 | -| std | 0.0118 | -| value_loss | 1.23e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13951 | -| time_elapsed | 73963 | -| total_timesteps | 1785728 | -| train/ | | -| approx_kl | 0.003406437 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.02 | -| explained_variance | -7.27 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 139500 | -| policy_gradient_loss | 0.00136 | -| std | 0.0118 | -| value_loss | 3.73e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13952 | -| time_elapsed | 73968 | -| total_timesteps | 1785856 | -| train/ | | -| approx_kl | 0.043107856 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.709 | -| learning_rate | 0.0003 | -| loss | 0.00826 | -| n_updates | 139510 | -| policy_gradient_loss | 0.00993 | -| std | 0.0117 | -| value_loss | 1.56e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 13953 | -| time_elapsed | 73973 | -| total_timesteps | 1785984 | -| train/ | | -| approx_kl | 0.065103196 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -84.4 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 139520 | -| policy_gradient_loss | -0.00496 | -| std | 0.0117 | -| value_loss | 4.48e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13954 | -| time_elapsed | 73977 | -| total_timesteps | 1786112 | -| train/ | | -| approx_kl | 0.050836317 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 139530 | -| policy_gradient_loss | -0.00259 | -| std | 0.0117 | -| value_loss | 1.54e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13955 | -| time_elapsed | 73990 | -| total_timesteps | 1786240 | -| train/ | | -| approx_kl | 0.4874633 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -6.1 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 139540 | -| policy_gradient_loss | -0.0157 | -| std | 0.0117 | -| value_loss | 0.00333 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13956 | -| time_elapsed | 73996 | -| total_timesteps | 1786368 | -| train/ | | -| approx_kl | 0.00027804775 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -88.4 | -| learning_rate | 0.0003 | -| loss | 0.00262 | -| n_updates | 139550 | -| policy_gradient_loss | -0.0052 | -| std | 0.0117 | -| value_loss | 2.6e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13957 | -| time_elapsed | 74001 | -| total_timesteps | 1786496 | -| train/ | | -| approx_kl | 0.017179437 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -6.18 | -| learning_rate | 0.0003 | -| loss | 0.00511 | -| n_updates | 139560 | -| policy_gradient_loss | 0.012 | -| std | 0.0117 | -| value_loss | 7.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13958 | -| time_elapsed | 74005 | -| total_timesteps | 1786624 | -| train/ | | -| approx_kl | 0.063541874 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 139570 | -| policy_gradient_loss | 0.00585 | -| std | 0.0117 | -| value_loss | 2.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13959 | -| time_elapsed | 74011 | -| total_timesteps | 1786752 | -| train/ | | -| approx_kl | 0.04103412 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.552 | -| learning_rate | 0.0003 | -| loss | 0.00311 | -| n_updates | 139580 | -| policy_gradient_loss | 0.0142 | -| std | 0.0117 | -| value_loss | 4.85e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 24 | -| iterations | 13960 | -| time_elapsed | 74016 | -| total_timesteps | 1786880 | -| train/ | | -| approx_kl | 0.0081815105 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 139590 | -| policy_gradient_loss | -0.00436 | -| std | 0.0117 | -| value_loss | 3.74e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13961 | -| time_elapsed | 74020 | -| total_timesteps | 1787008 | -| train/ | | -| approx_kl | 0.06438169 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.00147 | -| learning_rate | 0.0003 | -| loss | 0.0594 | -| n_updates | 139600 | -| policy_gradient_loss | 0.00828 | -| std | 0.0117 | -| value_loss | 6.12e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13962 | -| time_elapsed | 74030 | -| total_timesteps | 1787136 | -| train/ | | -| approx_kl | 1.3288667 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 139610 | -| policy_gradient_loss | -0.0141 | -| std | 0.0117 | -| value_loss | 6.61e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13963 | -| time_elapsed | 74034 | -| total_timesteps | 1787264 | -| train/ | | -| approx_kl | 0.081767246 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.0381 | -| learning_rate | 0.0003 | -| loss | 0.0449 | -| n_updates | 139620 | -| policy_gradient_loss | 0.0119 | -| std | 0.0117 | -| value_loss | 0.000175 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13964 | -| time_elapsed | 74037 | -| total_timesteps | 1787392 | -| train/ | | -| approx_kl | 0.015387204 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0696 | -| learning_rate | 0.0003 | -| loss | -0.000749 | -| n_updates | 139630 | -| policy_gradient_loss | 0.0163 | -| std | 0.0117 | -| value_loss | 8.19e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13965 | -| time_elapsed | 74041 | -| total_timesteps | 1787520 | -| train/ | | -| approx_kl | 0.03446458 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 139640 | -| policy_gradient_loss | -0.00289 | -| std | 0.0117 | -| value_loss | 5.31e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13966 | -| time_elapsed | 74044 | -| total_timesteps | 1787648 | -| train/ | | -| approx_kl | 0.0047080065 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 139650 | -| policy_gradient_loss | 0.00258 | -| std | 0.0117 | -| value_loss | 2.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13967 | -| time_elapsed | 74048 | -| total_timesteps | 1787776 | -| train/ | | -| approx_kl | 0.025258739 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 139660 | -| policy_gradient_loss | -0.000712 | -| std | 0.0117 | -| value_loss | 1.94e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13968 | -| time_elapsed | 74051 | -| total_timesteps | 1787904 | -| train/ | | -| approx_kl | 0.00814034 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 139670 | -| policy_gradient_loss | -0.00733 | -| std | 0.0117 | -| value_loss | 8.08e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13969 | -| time_elapsed | 74054 | -| total_timesteps | 1788032 | -| train/ | | -| approx_kl | 0.00058699865 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 139680 | -| policy_gradient_loss | -0.000407 | -| std | 0.0117 | -| value_loss | 7.07e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13970 | -| time_elapsed | 74062 | -| total_timesteps | 1788160 | -| train/ | | -| approx_kl | 0.11354529 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 139690 | -| policy_gradient_loss | -0.0116 | -| std | 0.0117 | -| value_loss | 0.000332 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13971 | -| time_elapsed | 74065 | -| total_timesteps | 1788288 | -| train/ | | -| approx_kl | 0.03236662 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -90.7 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 139700 | -| policy_gradient_loss | 0.000313 | -| std | 0.0116 | -| value_loss | 4.95e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13972 | -| time_elapsed | 74069 | -| total_timesteps | 1788416 | -| train/ | | -| approx_kl | 0.115643695 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -6.86e+03 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 139710 | -| policy_gradient_loss | -0.0109 | -| std | 0.0116 | -| value_loss | 1.87e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13973 | -| time_elapsed | 74074 | -| total_timesteps | 1788544 | -| train/ | | -| approx_kl | 0.026668143 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -7.78e+03 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 139720 | -| policy_gradient_loss | -0.0108 | -| std | 0.0116 | -| value_loss | 1.15e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13974 | -| time_elapsed | 74079 | -| total_timesteps | 1788672 | -| train/ | | -| approx_kl | 0.22314115 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -8.03 | -| learning_rate | 0.0003 | -| loss | 0.00294 | -| n_updates | 139730 | -| policy_gradient_loss | 0.000493 | -| std | 0.0116 | -| value_loss | 3.78e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13975 | -| time_elapsed | 74084 | -| total_timesteps | 1788800 | -| train/ | | -| approx_kl | 0.06495492 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -1.94 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 139740 | -| policy_gradient_loss | 0.00202 | -| std | 0.0116 | -| value_loss | 1.43e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 13976 | -| time_elapsed | 74089 | -| total_timesteps | 1788928 | -| train/ | | -| approx_kl | 0.0040313536 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.934 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 139750 | -| policy_gradient_loss | 0.0119 | -| std | 0.0116 | -| value_loss | 5.44e-12 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13977 | -| time_elapsed | 74094 | -| total_timesteps | 1789056 | -| train/ | | -| approx_kl | 0.012919278 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.431 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 139760 | -| policy_gradient_loss | -0.000687 | -| std | 0.0116 | -| value_loss | 8.96e-13 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13978 | -| time_elapsed | 74101 | -| total_timesteps | 1789184 | -| train/ | | -| approx_kl | 0.014057355 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 139770 | -| policy_gradient_loss | -0.00961 | -| std | 0.0116 | -| value_loss | 0.000261 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13979 | -| time_elapsed | 74105 | -| total_timesteps | 1789312 | -| train/ | | -| approx_kl | 0.017395 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 139780 | -| policy_gradient_loss | 0.00489 | -| std | 0.0116 | -| value_loss | 5.46e-07 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13980 | -| time_elapsed | 74110 | -| total_timesteps | 1789440 | -| train/ | | -| approx_kl | 0.00054856436 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -1.97 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 139790 | -| policy_gradient_loss | -0.00208 | -| std | 0.0116 | -| value_loss | 1.37e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13981 | -| time_elapsed | 74114 | -| total_timesteps | 1789568 | -| train/ | | -| approx_kl | 0.029842662 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | 0.00558 | -| n_updates | 139800 | -| policy_gradient_loss | 0.0119 | -| std | 0.0117 | -| value_loss | 7.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13982 | -| time_elapsed | 74118 | -| total_timesteps | 1789696 | -| train/ | | -| approx_kl | 0.030533476 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | 0.0602 | -| n_updates | 139810 | -| policy_gradient_loss | 0.037 | -| std | 0.0117 | -| value_loss | 4.92e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13983 | -| time_elapsed | 74122 | -| total_timesteps | 1789824 | -| train/ | | -| approx_kl | 0.012723817 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.00423 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 139820 | -| policy_gradient_loss | 0.0263 | -| std | 0.0117 | -| value_loss | 1.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 13984 | -| time_elapsed | 74126 | -| total_timesteps | 1789952 | -| train/ | | -| approx_kl | 0.008129558 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.00629 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 139830 | -| policy_gradient_loss | 0.0397 | -| std | 0.0117 | -| value_loss | 8.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13985 | -| time_elapsed | 74130 | -| total_timesteps | 1790080 | -| train/ | | -| approx_kl | 0.027407154 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.00913 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 139840 | -| policy_gradient_loss | 0.0958 | -| std | 0.0117 | -| value_loss | 5.3e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13986 | -| time_elapsed | 74138 | -| total_timesteps | 1790208 | -| train/ | | -| approx_kl | 0.0025113085 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 139850 | -| policy_gradient_loss | 0.00101 | -| std | 0.0116 | -| value_loss | 0.00239 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13987 | -| time_elapsed | 74144 | -| total_timesteps | 1790336 | -| train/ | | -| approx_kl | 0.013158634 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.006 | -| n_updates | 139860 | -| policy_gradient_loss | 0.00498 | -| std | 0.0116 | -| value_loss | 1.1e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13988 | -| time_elapsed | 74148 | -| total_timesteps | 1790464 | -| train/ | | -| approx_kl | 0.20252454 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.000547 | -| learning_rate | 0.0003 | -| loss | 0.0963 | -| n_updates | 139870 | -| policy_gradient_loss | 0.0247 | -| std | 0.0117 | -| value_loss | 6.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13989 | -| time_elapsed | 74152 | -| total_timesteps | 1790592 | -| train/ | | -| approx_kl | 0.013896631 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.000901 | -| n_updates | 139880 | -| policy_gradient_loss | 0.000679 | -| std | 0.0116 | -| value_loss | 4.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13990 | -| time_elapsed | 74157 | -| total_timesteps | 1790720 | -| train/ | | -| approx_kl | 0.062515974 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0483 | -| n_updates | 139890 | -| policy_gradient_loss | 0.0288 | -| std | 0.0117 | -| value_loss | 7.44e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13991 | -| time_elapsed | 74160 | -| total_timesteps | 1790848 | -| train/ | | -| approx_kl | 0.0025869175 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.00273 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 139900 | -| policy_gradient_loss | 0.00195 | -| std | 0.0117 | -| value_loss | 1.76e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 13992 | -| time_elapsed | 74164 | -| total_timesteps | 1790976 | -| train/ | | -| approx_kl | 0.007977927 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.0041 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 139910 | -| policy_gradient_loss | 0.0198 | -| std | 0.0117 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13993 | -| time_elapsed | 74167 | -| total_timesteps | 1791104 | -| train/ | | -| approx_kl | 0.007306102 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 139920 | -| policy_gradient_loss | -0.00132 | -| std | 0.0117 | -| value_loss | 7.55e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13994 | -| time_elapsed | 74178 | -| total_timesteps | 1791232 | -| train/ | | -| approx_kl | 0.33971784 | -| clip_fraction | 0.0703 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.766 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 139930 | -| policy_gradient_loss | -0.0158 | -| std | 0.0117 | -| value_loss | 0.000536 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13995 | -| time_elapsed | 74184 | -| total_timesteps | 1791360 | -| train/ | | -| approx_kl | 0.023771798 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -9.13 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 139940 | -| policy_gradient_loss | -0.00131 | -| std | 0.0117 | -| value_loss | 0.000214 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13996 | -| time_elapsed | 74188 | -| total_timesteps | 1791488 | -| train/ | | -| approx_kl | 0.010782694 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | -0.00853 | -| n_updates | 139950 | -| policy_gradient_loss | -0.0037 | -| std | 0.0117 | -| value_loss | 1.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13997 | -| time_elapsed | 74193 | -| total_timesteps | 1791616 | -| train/ | | -| approx_kl | 0.032543942 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 139960 | -| policy_gradient_loss | 0.0105 | -| std | 0.0117 | -| value_loss | 2.49e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13998 | -| time_elapsed | 74199 | -| total_timesteps | 1791744 | -| train/ | | -| approx_kl | 0.24366167 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.000498 | -| learning_rate | 0.0003 | -| loss | 0.19 | -| n_updates | 139970 | -| policy_gradient_loss | 0.105 | -| std | 0.0117 | -| value_loss | 3.09e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 13999 | -| time_elapsed | 74204 | -| total_timesteps | 1791872 | -| train/ | | -| approx_kl | 0.0018181428 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 139980 | -| policy_gradient_loss | 0.00334 | -| std | 0.0117 | -| value_loss | 1.68e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14000 | -| time_elapsed | 74210 | -| total_timesteps | 1792000 | -| train/ | | -| approx_kl | 0.016200121 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 139990 | -| policy_gradient_loss | -0.00589 | -| std | 0.0117 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14001 | -| time_elapsed | 74215 | -| total_timesteps | 1792128 | -| train/ | | -| approx_kl | 0.005328595 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.00183 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 140000 | -| policy_gradient_loss | 0.00569 | -| std | 0.0117 | -| value_loss | 5.81e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14002 | -| time_elapsed | 74226 | -| total_timesteps | 1792256 | -| train/ | | -| approx_kl | 0.5202789 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 140010 | -| policy_gradient_loss | -0.0154 | -| std | 0.0116 | -| value_loss | 1.43e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14003 | -| time_elapsed | 74231 | -| total_timesteps | 1792384 | -| train/ | | -| approx_kl | 0.008805571 | -| clip_fraction | 0.043 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00255 | -| n_updates | 140020 | -| policy_gradient_loss | 0.000115 | -| std | 0.0116 | -| value_loss | 1.57e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14004 | -| time_elapsed | 74238 | -| total_timesteps | 1792512 | -| train/ | | -| approx_kl | 0.0596169 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 140030 | -| policy_gradient_loss | 0.00752 | -| std | 0.0116 | -| value_loss | 1.76e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14005 | -| time_elapsed | 74243 | -| total_timesteps | 1792640 | -| train/ | | -| approx_kl | 0.11672127 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.00228 | -| learning_rate | 0.0003 | -| loss | 0.00518 | -| n_updates | 140040 | -| policy_gradient_loss | -0.0015 | -| std | 0.0116 | -| value_loss | 6.48e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14006 | -| time_elapsed | 74249 | -| total_timesteps | 1792768 | -| train/ | | -| approx_kl | 0.0001982511 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.00051 | -| n_updates | 140050 | -| policy_gradient_loss | -9.37e-05 | -| std | 0.0116 | -| value_loss | 3.37e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14007 | -| time_elapsed | 74253 | -| total_timesteps | 1792896 | -| train/ | | -| approx_kl | 0.00021700608 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 140060 | -| policy_gradient_loss | -3.37e-06 | -| std | 0.0116 | -| value_loss | 3.01e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14008 | -| time_elapsed | 74257 | -| total_timesteps | 1793024 | -| train/ | | -| approx_kl | 0.007927688 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.00841 | -| learning_rate | 0.0003 | -| loss | 0.0257 | -| n_updates | 140070 | -| policy_gradient_loss | 0.00422 | -| std | 0.0116 | -| value_loss | 1.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14009 | -| time_elapsed | 74268 | -| total_timesteps | 1793152 | -| train/ | | -| approx_kl | 0.038594484 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 140080 | -| policy_gradient_loss | -0.00469 | -| std | 0.0116 | -| value_loss | 0.00149 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14010 | -| time_elapsed | 74272 | -| total_timesteps | 1793280 | -| train/ | | -| approx_kl | 0.00047078496 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 140090 | -| policy_gradient_loss | 0.00873 | -| std | 0.0116 | -| value_loss | 6.56e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14011 | -| time_elapsed | 74277 | -| total_timesteps | 1793408 | -| train/ | | -| approx_kl | 0.22317812 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.03 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 140100 | -| policy_gradient_loss | 0.0252 | -| std | 0.0116 | -| value_loss | 4.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14012 | -| time_elapsed | 74281 | -| total_timesteps | 1793536 | -| train/ | | -| approx_kl | 0.030588442 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | 0.00243 | -| n_updates | 140110 | -| policy_gradient_loss | 0.0109 | -| std | 0.0116 | -| value_loss | 2.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14013 | -| time_elapsed | 74286 | -| total_timesteps | 1793664 | -| train/ | | -| approx_kl | 0.007211563 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 140120 | -| policy_gradient_loss | 0.0278 | -| std | 0.0116 | -| value_loss | 1.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14014 | -| time_elapsed | 74291 | -| total_timesteps | 1793792 | -| train/ | | -| approx_kl | 0.014664847 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00615 | -| n_updates | 140130 | -| policy_gradient_loss | 0.00215 | -| std | 0.0116 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14015 | -| time_elapsed | 74295 | -| total_timesteps | 1793920 | -| train/ | | -| approx_kl | 0.0022123605 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.000486 | -| n_updates | 140140 | -| policy_gradient_loss | 0.00698 | -| std | 0.0116 | -| value_loss | 1.08e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14016 | -| time_elapsed | 74299 | -| total_timesteps | 1794048 | -| train/ | | -| approx_kl | 0.18595988 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 140150 | -| policy_gradient_loss | 0.0852 | -| std | 0.0116 | -| value_loss | 4.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14017 | -| time_elapsed | 74307 | -| total_timesteps | 1794176 | -| train/ | | -| approx_kl | 0.018156381 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.713 | -| learning_rate | 0.0003 | -| loss | -0.00974 | -| n_updates | 140160 | -| policy_gradient_loss | -0.00467 | -| std | 0.0116 | -| value_loss | 0.00555 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14018 | -| time_elapsed | 74312 | -| total_timesteps | 1794304 | -| train/ | | -| approx_kl | 0.00042972434 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.000754 | -| n_updates | 140170 | -| policy_gradient_loss | 0.00111 | -| std | 0.0116 | -| value_loss | 4.04e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14019 | -| time_elapsed | 74317 | -| total_timesteps | 1794432 | -| train/ | | -| approx_kl | 0.019237567 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 140180 | -| policy_gradient_loss | 0.0224 | -| std | 0.0116 | -| value_loss | 7.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14020 | -| time_elapsed | 74322 | -| total_timesteps | 1794560 | -| train/ | | -| approx_kl | 0.09014597 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 140190 | -| policy_gradient_loss | 0.0165 | -| std | 0.0116 | -| value_loss | 3.48e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14021 | -| time_elapsed | 74328 | -| total_timesteps | 1794688 | -| train/ | | -| approx_kl | 0.00032972824 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.000886 | -| n_updates | 140200 | -| policy_gradient_loss | 0.000743 | -| std | 0.0116 | -| value_loss | 1.81e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14022 | -| time_elapsed | 74334 | -| total_timesteps | 1794816 | -| train/ | | -| approx_kl | 0.029723411 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.00433 | -| n_updates | 140210 | -| policy_gradient_loss | 0.0297 | -| std | 0.0116 | -| value_loss | 1.45e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 24 | -| iterations | 14023 | -| time_elapsed | 74338 | -| total_timesteps | 1794944 | -| train/ | | -| approx_kl | 0.08259089 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 140220 | -| policy_gradient_loss | 0.0155 | -| std | 0.0116 | -| value_loss | 1.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14024 | -| time_elapsed | 74344 | -| total_timesteps | 1795072 | -| train/ | | -| approx_kl | 0.023133257 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 140230 | -| policy_gradient_loss | 0.0318 | -| std | 0.0116 | -| value_loss | 5.1e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14025 | -| time_elapsed | 74353 | -| total_timesteps | 1795200 | -| train/ | | -| approx_kl | 0.0141220875 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 140240 | -| policy_gradient_loss | 0.0108 | -| std | 0.0116 | -| value_loss | 0.00121 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14026 | -| time_elapsed | 74357 | -| total_timesteps | 1795328 | -| train/ | | -| approx_kl | 0.009094415 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 140250 | -| policy_gradient_loss | 0.0254 | -| std | 0.0116 | -| value_loss | 2.83e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14027 | -| time_elapsed | 74362 | -| total_timesteps | 1795456 | -| train/ | | -| approx_kl | 0.050923698 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | -2.36e-05 | -| n_updates | 140260 | -| policy_gradient_loss | -0.00671 | -| std | 0.0116 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14028 | -| time_elapsed | 74368 | -| total_timesteps | 1795584 | -| train/ | | -| approx_kl | 0.024470203 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | 0.00218 | -| n_updates | 140270 | -| policy_gradient_loss | 0.000303 | -| std | 0.0116 | -| value_loss | 7.61e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14029 | -| time_elapsed | 74373 | -| total_timesteps | 1795712 | -| train/ | | -| approx_kl | 0.0021068659 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.00702 | -| n_updates | 140280 | -| policy_gradient_loss | 0.00168 | -| std | 0.0116 | -| value_loss | 4.83e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14030 | -| time_elapsed | 74379 | -| total_timesteps | 1795840 | -| train/ | | -| approx_kl | 0.015775679 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 140290 | -| policy_gradient_loss | 0.00234 | -| std | 0.0116 | -| value_loss | 3.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 24 | -| iterations | 14031 | -| time_elapsed | 74384 | -| total_timesteps | 1795968 | -| train/ | | -| approx_kl | 0.07967091 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.0802 | -| n_updates | 140300 | -| policy_gradient_loss | 0.0308 | -| std | 0.0116 | -| value_loss | 2.46e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14032 | -| time_elapsed | 74389 | -| total_timesteps | 1796096 | -| train/ | | -| approx_kl | 0.01608463 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.00732 | -| n_updates | 140310 | -| policy_gradient_loss | 0.0173 | -| std | 0.0116 | -| value_loss | 1.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14033 | -| time_elapsed | 74399 | -| total_timesteps | 1796224 | -| train/ | | -| approx_kl | 0.031315252 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 140320 | -| policy_gradient_loss | 0.00486 | -| std | 0.0116 | -| value_loss | 0.00172 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14034 | -| time_elapsed | 74405 | -| total_timesteps | 1796352 | -| train/ | | -| approx_kl | 0.031501845 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 140330 | -| policy_gradient_loss | 0.00296 | -| std | 0.0116 | -| value_loss | 2.61e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14035 | -| time_elapsed | 74410 | -| total_timesteps | 1796480 | -| train/ | | -| approx_kl | 0.24076456 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.00497 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 140340 | -| policy_gradient_loss | 0.0301 | -| std | 0.0116 | -| value_loss | 6.03e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14036 | -| time_elapsed | 74415 | -| total_timesteps | 1796608 | -| train/ | | -| approx_kl | 0.0043361313 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 140350 | -| policy_gradient_loss | -0.000444 | -| std | 0.0116 | -| value_loss | 2.59e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14037 | -| time_elapsed | 74419 | -| total_timesteps | 1796736 | -| train/ | | -| approx_kl | 0.010220423 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.00253 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 140360 | -| policy_gradient_loss | 0.00996 | -| std | 0.0116 | -| value_loss | 0.000991 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14038 | -| time_elapsed | 74424 | -| total_timesteps | 1796864 | -| train/ | | -| approx_kl | 0.017999798 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.333 | -| learning_rate | 0.0003 | -| loss | -0.000566 | -| n_updates | 140370 | -| policy_gradient_loss | 0.0029 | -| std | 0.0115 | -| value_loss | 0.00194 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14039 | -| time_elapsed | 74429 | -| total_timesteps | 1796992 | -| train/ | | -| approx_kl | 0.045329448 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.513 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 140380 | -| policy_gradient_loss | 0.0158 | -| std | 0.0115 | -| value_loss | 4.78e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14040 | -| time_elapsed | 74434 | -| total_timesteps | 1797120 | -| train/ | | -| approx_kl | 0.051603455 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.00256 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 140390 | -| policy_gradient_loss | 0.00592 | -| std | 0.0115 | -| value_loss | 2.53e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14041 | -| time_elapsed | 74446 | -| total_timesteps | 1797248 | -| train/ | | -| approx_kl | 0.0018826467 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.739 | -| learning_rate | 0.0003 | -| loss | 0.00981 | -| n_updates | 140400 | -| policy_gradient_loss | 0.0019 | -| std | 0.0115 | -| value_loss | 0.00503 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14042 | -| time_elapsed | 74450 | -| total_timesteps | 1797376 | -| train/ | | -| approx_kl | 0.022432722 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 140410 | -| policy_gradient_loss | -0.00576 | -| std | 0.0115 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14043 | -| time_elapsed | 74454 | -| total_timesteps | 1797504 | -| train/ | | -| approx_kl | 0.013220677 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.00489 | -| n_updates | 140420 | -| policy_gradient_loss | 0.00279 | -| std | 0.0115 | -| value_loss | 1.1e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14044 | -| time_elapsed | 74459 | -| total_timesteps | 1797632 | -| train/ | | -| approx_kl | 0.03729514 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 140430 | -| policy_gradient_loss | -0.00796 | -| std | 0.0115 | -| value_loss | 5.62e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14045 | -| time_elapsed | 74463 | -| total_timesteps | 1797760 | -| train/ | | -| approx_kl | 0.10508652 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0341 | -| n_updates | 140440 | -| policy_gradient_loss | 0.00213 | -| std | 0.0115 | -| value_loss | 4.79e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 24 | -| iterations | 14046 | -| time_elapsed | 74468 | -| total_timesteps | 1797888 | -| train/ | | -| approx_kl | 0.07582201 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 140450 | -| policy_gradient_loss | 0.0161 | -| std | 0.0115 | -| value_loss | 3.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14047 | -| time_elapsed | 74472 | -| total_timesteps | 1798016 | -| train/ | | -| approx_kl | 0.029655393 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 140460 | -| policy_gradient_loss | 0.0145 | -| std | 0.0115 | -| value_loss | 2.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14048 | -| time_elapsed | 74483 | -| total_timesteps | 1798144 | -| train/ | | -| approx_kl | 0.004719759 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | 0.00304 | -| n_updates | 140470 | -| policy_gradient_loss | 0.00272 | -| std | 0.0115 | -| value_loss | 0.00219 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14049 | -| time_elapsed | 74488 | -| total_timesteps | 1798272 | -| train/ | | -| approx_kl | 0.06515968 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.04 | -| explained_variance | 0.101 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 140480 | -| policy_gradient_loss | 0.0254 | -| std | 0.0115 | -| value_loss | 4.71e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14050 | -| time_elapsed | 74492 | -| total_timesteps | 1798400 | -| train/ | | -| approx_kl | 0.0068986323 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 140490 | -| policy_gradient_loss | 0.00968 | -| std | 0.0115 | -| value_loss | 3.3e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14051 | -| time_elapsed | 74497 | -| total_timesteps | 1798528 | -| train/ | | -| approx_kl | 0.064733654 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 140500 | -| policy_gradient_loss | 0.0134 | -| std | 0.0115 | -| value_loss | 1.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14052 | -| time_elapsed | 74501 | -| total_timesteps | 1798656 | -| train/ | | -| approx_kl | 0.017331982 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.00771 | -| n_updates | 140510 | -| policy_gradient_loss | 0.0315 | -| std | 0.0115 | -| value_loss | 1.37e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14053 | -| time_elapsed | 74506 | -| total_timesteps | 1798784 | -| train/ | | -| approx_kl | 0.08225555 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0664 | -| learning_rate | 0.0003 | -| loss | 0.0509 | -| n_updates | 140520 | -| policy_gradient_loss | 0.0159 | -| std | 0.0115 | -| value_loss | 4.68e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14054 | -| time_elapsed | 74512 | -| total_timesteps | 1798912 | -| train/ | | -| approx_kl | 0.00032661622 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 140530 | -| policy_gradient_loss | -0.00306 | -| std | 0.0115 | -| value_loss | 4.87e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14055 | -| time_elapsed | 74516 | -| total_timesteps | 1799040 | -| train/ | | -| approx_kl | 0.021656748 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 140540 | -| policy_gradient_loss | 0.0214 | -| std | 0.0115 | -| value_loss | 4.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14056 | -| time_elapsed | 74524 | -| total_timesteps | 1799168 | -| train/ | | -| approx_kl | 0.07834353 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -2.04 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 140550 | -| policy_gradient_loss | -0.0143 | -| std | 0.0115 | -| value_loss | 0.00202 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14057 | -| time_elapsed | 74528 | -| total_timesteps | 1799296 | -| train/ | | -| approx_kl | 0.09456309 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -5.72 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 140560 | -| policy_gradient_loss | -0.0101 | -| std | 0.0115 | -| value_loss | 0.000118 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14058 | -| time_elapsed | 74533 | -| total_timesteps | 1799424 | -| train/ | | -| approx_kl | 0.025725434 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.789 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 140570 | -| policy_gradient_loss | 0.0132 | -| std | 0.0115 | -| value_loss | 2.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14059 | -| time_elapsed | 74537 | -| total_timesteps | 1799552 | -| train/ | | -| approx_kl | 0.038326688 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 140580 | -| policy_gradient_loss | 0.00927 | -| std | 0.0115 | -| value_loss | 2.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14060 | -| time_elapsed | 74542 | -| total_timesteps | 1799680 | -| train/ | | -| approx_kl | 0.19609293 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | 0.00197 | -| learning_rate | 0.0003 | -| loss | 0.0782 | -| n_updates | 140590 | -| policy_gradient_loss | 0.0171 | -| std | 0.0115 | -| value_loss | 1.66e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14061 | -| time_elapsed | 74546 | -| total_timesteps | 1799808 | -| train/ | | -| approx_kl | 0.00023751007 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.00559 | -| learning_rate | 0.0003 | -| loss | 0.00187 | -| n_updates | 140600 | -| policy_gradient_loss | -0.00386 | -| std | 0.0114 | -| value_loss | 1.38e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14062 | -| time_elapsed | 74550 | -| total_timesteps | 1799936 | -| train/ | | -| approx_kl | 0.009594351 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.05 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | -0.00444 | -| n_updates | 140610 | -| policy_gradient_loss | 0.0141 | -| std | 0.0114 | -| value_loss | 1.54e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14063 | -| time_elapsed | 74554 | -| total_timesteps | 1800064 | -| train/ | | -| approx_kl | 0.26954672 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 140620 | -| policy_gradient_loss | 0.0851 | -| std | 0.0114 | -| value_loss | 5.32e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14064 | -| time_elapsed | 74563 | -| total_timesteps | 1800192 | -| train/ | | -| approx_kl | 0.05369199 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -8.27 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 140630 | -| policy_gradient_loss | -0.0147 | -| std | 0.0114 | -| value_loss | 0.00242 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14065 | -| time_elapsed | 74568 | -| total_timesteps | 1800320 | -| train/ | | -| approx_kl | 9.479001e-06 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -3.41 | -| learning_rate | 0.0003 | -| loss | -4.25e-05 | -| n_updates | 140640 | -| policy_gradient_loss | 0.00202 | -| std | 0.0114 | -| value_loss | 8.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14066 | -| time_elapsed | 74571 | -| total_timesteps | 1800448 | -| train/ | | -| approx_kl | 0.0038557611 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -3.3 | -| learning_rate | 0.0003 | -| loss | -0.00408 | -| n_updates | 140650 | -| policy_gradient_loss | -0.00187 | -| std | 0.0113 | -| value_loss | 2e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14067 | -| time_elapsed | 74576 | -| total_timesteps | 1800576 | -| train/ | | -| approx_kl | 0.011512244 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.000646 | -| n_updates | 140660 | -| policy_gradient_loss | 0.0255 | -| std | 0.0114 | -| value_loss | 4.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14068 | -| time_elapsed | 74583 | -| total_timesteps | 1800704 | -| train/ | | -| approx_kl | 0.006636878 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | 0.000525 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 140670 | -| policy_gradient_loss | 0.0345 | -| std | 0.0114 | -| value_loss | 5.29e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14069 | -| time_elapsed | 74589 | -| total_timesteps | 1800832 | -| train/ | | -| approx_kl | 0.07337606 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 140680 | -| policy_gradient_loss | 0.029 | -| std | 0.0114 | -| value_loss | 1.2e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14070 | -| time_elapsed | 74594 | -| total_timesteps | 1800960 | -| train/ | | -| approx_kl | 0.06430824 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 140690 | -| policy_gradient_loss | 0.00847 | -| std | 0.0114 | -| value_loss | 9.92e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14071 | -| time_elapsed | 74598 | -| total_timesteps | 1801088 | -| train/ | | -| approx_kl | 0.017545957 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.00984 | -| learning_rate | 0.0003 | -| loss | 0.00996 | -| n_updates | 140700 | -| policy_gradient_loss | 0.00256 | -| std | 0.0114 | -| value_loss | 6.07e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14072 | -| time_elapsed | 74607 | -| total_timesteps | 1801216 | -| train/ | | -| approx_kl | 0.0384327 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | 0.758 | -| learning_rate | 0.0003 | -| loss | 0.00391 | -| n_updates | 140710 | -| policy_gradient_loss | 0.000638 | -| std | 0.0114 | -| value_loss | 0.004 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14073 | -| time_elapsed | 74611 | -| total_timesteps | 1801344 | -| train/ | | -| approx_kl | 0.03181467 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | 0.0095 | -| n_updates | 140720 | -| policy_gradient_loss | 0.0236 | -| std | 0.0114 | -| value_loss | 4.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14074 | -| time_elapsed | 74615 | -| total_timesteps | 1801472 | -| train/ | | -| approx_kl | 0.068898275 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 140730 | -| policy_gradient_loss | 0.0122 | -| std | 0.0114 | -| value_loss | 8.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14075 | -| time_elapsed | 74619 | -| total_timesteps | 1801600 | -| train/ | | -| approx_kl | 0.017630603 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 140740 | -| policy_gradient_loss | 0.0271 | -| std | 0.0114 | -| value_loss | 2.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14076 | -| time_elapsed | 74624 | -| total_timesteps | 1801728 | -| train/ | | -| approx_kl | 0.076845594 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | 0.00875 | -| n_updates | 140750 | -| policy_gradient_loss | 0.000932 | -| std | 0.0114 | -| value_loss | 1.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14077 | -| time_elapsed | 74628 | -| total_timesteps | 1801856 | -| train/ | | -| approx_kl | 0.14256084 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.0929 | -| n_updates | 140760 | -| policy_gradient_loss | 0.0636 | -| std | 0.0114 | -| value_loss | 1.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 24 | -| iterations | 14078 | -| time_elapsed | 74632 | -| total_timesteps | 1801984 | -| train/ | | -| approx_kl | 0.022870295 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 140770 | -| policy_gradient_loss | 0.0091 | -| std | 0.0113 | -| value_loss | 1.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14079 | -| time_elapsed | 74636 | -| total_timesteps | 1802112 | -| train/ | | -| approx_kl | 0.22545455 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | 0.0854 | -| n_updates | 140780 | -| policy_gradient_loss | 0.0224 | -| std | 0.0113 | -| value_loss | 3.86e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14080 | -| time_elapsed | 74650 | -| total_timesteps | 1802240 | -| train/ | | -| approx_kl | 0.00079691876 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.00391 | -| n_updates | 140790 | -| policy_gradient_loss | 0.00247 | -| std | 0.0113 | -| value_loss | 1.51e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14081 | -| time_elapsed | 74655 | -| total_timesteps | 1802368 | -| train/ | | -| approx_kl | 0.052428994 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | 0.00151 | -| learning_rate | 0.0003 | -| loss | 0.0622 | -| n_updates | 140800 | -| policy_gradient_loss | 0.0122 | -| std | 0.0113 | -| value_loss | 2.47e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14082 | -| time_elapsed | 74659 | -| total_timesteps | 1802496 | -| train/ | | -| approx_kl | 0.0015645009 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.00365 | -| learning_rate | 0.0003 | -| loss | 0.000418 | -| n_updates | 140810 | -| policy_gradient_loss | 0.00179 | -| std | 0.0113 | -| value_loss | 6.04e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14083 | -| time_elapsed | 74664 | -| total_timesteps | 1802624 | -| train/ | | -| approx_kl | 0.06362158 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.051 | -| n_updates | 140820 | -| policy_gradient_loss | 0.047 | -| std | 0.0113 | -| value_loss | 3.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14084 | -| time_elapsed | 74668 | -| total_timesteps | 1802752 | -| train/ | | -| approx_kl | 0.054411393 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 140830 | -| policy_gradient_loss | 0.0606 | -| std | 0.0113 | -| value_loss | 4.08e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14085 | -| time_elapsed | 74673 | -| total_timesteps | 1802880 | -| train/ | | -| approx_kl | 0.008419953 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.00568 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 140840 | -| policy_gradient_loss | 0.00509 | -| std | 0.0113 | -| value_loss | 3.58e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14086 | -| time_elapsed | 74679 | -| total_timesteps | 1803008 | -| train/ | | -| approx_kl | 0.19341771 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.00573 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 140850 | -| policy_gradient_loss | 0.029 | -| std | 0.0113 | -| value_loss | 1.39e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14087 | -| time_elapsed | 74692 | -| total_timesteps | 1803136 | -| train/ | | -| approx_kl | 0.018798983 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 140860 | -| policy_gradient_loss | -0.0108 | -| std | 0.0113 | -| value_loss | 6.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14088 | -| time_elapsed | 74696 | -| total_timesteps | 1803264 | -| train/ | | -| approx_kl | 0.047448527 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 140870 | -| policy_gradient_loss | -0.00187 | -| std | 0.0113 | -| value_loss | 3.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14089 | -| time_elapsed | 74699 | -| total_timesteps | 1803392 | -| train/ | | -| approx_kl | 0.088537574 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 140880 | -| policy_gradient_loss | 0.0115 | -| std | 0.0112 | -| value_loss | 1.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14090 | -| time_elapsed | 74703 | -| total_timesteps | 1803520 | -| train/ | | -| approx_kl | 0.008689115 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00153 | -| n_updates | 140890 | -| policy_gradient_loss | -0.000177 | -| std | 0.0112 | -| value_loss | 3.92e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14091 | -| time_elapsed | 74707 | -| total_timesteps | 1803648 | -| train/ | | -| approx_kl | 0.0055814325 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 140900 | -| policy_gradient_loss | 0.00291 | -| std | 0.0112 | -| value_loss | 3.21e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14092 | -| time_elapsed | 74712 | -| total_timesteps | 1803776 | -| train/ | | -| approx_kl | 0.22897519 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | 0.0963 | -| n_updates | 140910 | -| policy_gradient_loss | 0.0231 | -| std | 0.0112 | -| value_loss | 2.75e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14093 | -| time_elapsed | 74717 | -| total_timesteps | 1803904 | -| train/ | | -| approx_kl | 0.00050523505 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 140920 | -| policy_gradient_loss | 0.000344 | -| std | 0.0112 | -| value_loss | 1.98e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14094 | -| time_elapsed | 74723 | -| total_timesteps | 1804032 | -| train/ | | -| approx_kl | 0.017500626 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 140930 | -| policy_gradient_loss | -0.00591 | -| std | 0.0112 | -| value_loss | 1.42e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14095 | -| time_elapsed | 74735 | -| total_timesteps | 1804160 | -| train/ | | -| approx_kl | 0.014994822 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | -0.00316 | -| n_updates | 140940 | -| policy_gradient_loss | -0.00436 | -| std | 0.0112 | -| value_loss | 0.00186 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14096 | -| time_elapsed | 74742 | -| total_timesteps | 1804288 | -| train/ | | -| approx_kl | 0.017524887 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 140950 | -| policy_gradient_loss | 0.00503 | -| std | 0.0112 | -| value_loss | 6.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14097 | -| time_elapsed | 74746 | -| total_timesteps | 1804416 | -| train/ | | -| approx_kl | 0.11174747 | -| clip_fraction | 0.586 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.00346 | -| learning_rate | 0.0003 | -| loss | 0.0854 | -| n_updates | 140960 | -| policy_gradient_loss | 0.0662 | -| std | 0.0112 | -| value_loss | 1.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14098 | -| time_elapsed | 74750 | -| total_timesteps | 1804544 | -| train/ | | -| approx_kl | 0.018889463 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00501 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 140970 | -| policy_gradient_loss | 0.00344 | -| std | 0.0112 | -| value_loss | 1.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14099 | -| time_elapsed | 74756 | -| total_timesteps | 1804672 | -| train/ | | -| approx_kl | 0.015496485 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00451 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 140980 | -| policy_gradient_loss | -0.00125 | -| std | 0.0112 | -| value_loss | 7.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14100 | -| time_elapsed | 74760 | -| total_timesteps | 1804800 | -| train/ | | -| approx_kl | 0.09530924 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0484 | -| n_updates | 140990 | -| policy_gradient_loss | 0.0191 | -| std | 0.0112 | -| value_loss | 5.88e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14101 | -| time_elapsed | 74765 | -| total_timesteps | 1804928 | -| train/ | | -| approx_kl | 0.0319459 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.00731 | -| n_updates | 141000 | -| policy_gradient_loss | 0.0102 | -| std | 0.0112 | -| value_loss | 2.69e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14102 | -| time_elapsed | 74770 | -| total_timesteps | 1805056 | -| train/ | | -| approx_kl | 0.04441067 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00914 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 141010 | -| policy_gradient_loss | -0.000246 | -| std | 0.0112 | -| value_loss | 2.65e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14103 | -| time_elapsed | 74779 | -| total_timesteps | 1805184 | -| train/ | | -| approx_kl | 0.0011722688 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.728 | -| learning_rate | 0.0003 | -| loss | 0.000999 | -| n_updates | 141020 | -| policy_gradient_loss | -0.000423 | -| std | 0.0112 | -| value_loss | 0.00547 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14104 | -| time_elapsed | 74784 | -| total_timesteps | 1805312 | -| train/ | | -| approx_kl | 0.048015464 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.00998 | -| n_updates | 141030 | -| policy_gradient_loss | 0.0175 | -| std | 0.0112 | -| value_loss | 8.85e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14105 | -| time_elapsed | 74789 | -| total_timesteps | 1805440 | -| train/ | | -| approx_kl | 0.0070594237 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.000127 | -| n_updates | 141040 | -| policy_gradient_loss | 0.00958 | -| std | 0.0112 | -| value_loss | 8.81e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14106 | -| time_elapsed | 74792 | -| total_timesteps | 1805568 | -| train/ | | -| approx_kl | 0.10578002 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 141050 | -| policy_gradient_loss | 0.0103 | -| std | 0.0112 | -| value_loss | 2.76e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14107 | -| time_elapsed | 74796 | -| total_timesteps | 1805696 | -| train/ | | -| approx_kl | 0.0047233496 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00556 | -| learning_rate | 0.0003 | -| loss | -0.000943 | -| n_updates | 141060 | -| policy_gradient_loss | 0.0401 | -| std | 0.0112 | -| value_loss | 6.13e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14108 | -| time_elapsed | 74800 | -| total_timesteps | 1805824 | -| train/ | | -| approx_kl | 0.025275124 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.00597 | -| n_updates | 141070 | -| policy_gradient_loss | 0.0486 | -| std | 0.0112 | -| value_loss | 6.25e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14109 | -| time_elapsed | 74806 | -| total_timesteps | 1805952 | -| train/ | | -| approx_kl | 0.0004858789 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | 0.00327 | -| n_updates | 141080 | -| policy_gradient_loss | 0.0113 | -| std | 0.0112 | -| value_loss | 5.68e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14110 | -| time_elapsed | 74811 | -| total_timesteps | 1806080 | -| train/ | | -| approx_kl | 0.0970884 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.008 | -| learning_rate | 0.0003 | -| loss | 0.0751 | -| n_updates | 141090 | -| policy_gradient_loss | 0.0736 | -| std | 0.0112 | -| value_loss | 3.5e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14111 | -| time_elapsed | 74822 | -| total_timesteps | 1806208 | -| train/ | | -| approx_kl | 0.05035906 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 141100 | -| policy_gradient_loss | -0.00784 | -| std | 0.0112 | -| value_loss | 0.000167 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14112 | -| time_elapsed | 74827 | -| total_timesteps | 1806336 | -| train/ | | -| approx_kl | 0.026694678 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.006 | -| n_updates | 141110 | -| policy_gradient_loss | 0.000139 | -| std | 0.0112 | -| value_loss | 4.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14113 | -| time_elapsed | 74832 | -| total_timesteps | 1806464 | -| train/ | | -| approx_kl | 0.014092136 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | -0.0066 | -| n_updates | 141120 | -| policy_gradient_loss | -0.00239 | -| std | 0.0112 | -| value_loss | 3.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14114 | -| time_elapsed | 74836 | -| total_timesteps | 1806592 | -| train/ | | -| approx_kl | 0.01582757 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00972 | -| learning_rate | 0.0003 | -| loss | 0.00363 | -| n_updates | 141130 | -| policy_gradient_loss | 0.00146 | -| std | 0.0112 | -| value_loss | 1.71e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14115 | -| time_elapsed | 74840 | -| total_timesteps | 1806720 | -| train/ | | -| approx_kl | 0.0026247846 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 141140 | -| policy_gradient_loss | 0.000707 | -| std | 0.0112 | -| value_loss | 9.84e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14116 | -| time_elapsed | 74844 | -| total_timesteps | 1806848 | -| train/ | | -| approx_kl | 0.014524506 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.00889 | -| n_updates | 141150 | -| policy_gradient_loss | 0.000149 | -| std | 0.0112 | -| value_loss | 9.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14117 | -| time_elapsed | 74848 | -| total_timesteps | 1806976 | -| train/ | | -| approx_kl | 0.021916052 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 141160 | -| policy_gradient_loss | 0.0357 | -| std | 0.0112 | -| value_loss | 7.77e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14118 | -| time_elapsed | 74852 | -| total_timesteps | 1807104 | -| train/ | | -| approx_kl | 0.04432147 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00805 | -| learning_rate | 0.0003 | -| loss | 0.0296 | -| n_updates | 141170 | -| policy_gradient_loss | 0.0748 | -| std | 0.0112 | -| value_loss | 5.62e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14119 | -| time_elapsed | 74861 | -| total_timesteps | 1807232 | -| train/ | | -| approx_kl | 0.04888875 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 141180 | -| policy_gradient_loss | -0.00709 | -| std | 0.0112 | -| value_loss | 6.59e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14120 | -| time_elapsed | 74865 | -| total_timesteps | 1807360 | -| train/ | | -| approx_kl | 7.783994e-06 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.000229 | -| learning_rate | 0.0003 | -| loss | -0.000286 | -| n_updates | 141190 | -| policy_gradient_loss | 0.0558 | -| std | 0.0112 | -| value_loss | 4.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14121 | -| time_elapsed | 74870 | -| total_timesteps | 1807488 | -| train/ | | -| approx_kl | 0.026502563 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00245 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 141200 | -| policy_gradient_loss | 0.0521 | -| std | 0.0113 | -| value_loss | 1.37e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14122 | -| time_elapsed | 74875 | -| total_timesteps | 1807616 | -| train/ | | -| approx_kl | 0.03558252 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.084 | -| n_updates | 141210 | -| policy_gradient_loss | 0.0362 | -| std | 0.0113 | -| value_loss | 3.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14123 | -| time_elapsed | 74880 | -| total_timesteps | 1807744 | -| train/ | | -| approx_kl | 0.049874596 | -| clip_fraction | 0.558 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.00467 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 141220 | -| policy_gradient_loss | 0.0687 | -| std | 0.0113 | -| value_loss | 1.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 24 | -| iterations | 14124 | -| time_elapsed | 74885 | -| total_timesteps | 1807872 | -| train/ | | -| approx_kl | 0.04007686 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.000778 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 141230 | -| policy_gradient_loss | 0.058 | -| std | 0.0113 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14125 | -| time_elapsed | 74891 | -| total_timesteps | 1808000 | -| train/ | | -| approx_kl | 0.00890751 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.00297 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 141240 | -| policy_gradient_loss | 0.00647 | -| std | 0.0113 | -| value_loss | 9.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14126 | -| time_elapsed | 74897 | -| total_timesteps | 1808128 | -| train/ | | -| approx_kl | 0.048703022 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.000769 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 141250 | -| policy_gradient_loss | 0.00367 | -| std | 0.0113 | -| value_loss | 2.9e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14127 | -| time_elapsed | 74909 | -| total_timesteps | 1808256 | -| train/ | | -| approx_kl | 0.0668218 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -3.76 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 141260 | -| policy_gradient_loss | -0.0142 | -| std | 0.0113 | -| value_loss | 0.00221 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14128 | -| time_elapsed | 74915 | -| total_timesteps | 1808384 | -| train/ | | -| approx_kl | 0.06624508 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -13.6 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 141270 | -| policy_gradient_loss | 0.028 | -| std | 0.0113 | -| value_loss | 1.67e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14129 | -| time_elapsed | 74920 | -| total_timesteps | 1808512 | -| train/ | | -| approx_kl | 0.047211803 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -33.7 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 141280 | -| policy_gradient_loss | 0.0192 | -| std | 0.0113 | -| value_loss | 5.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14130 | -| time_elapsed | 74925 | -| total_timesteps | 1808640 | -| train/ | | -| approx_kl | 0.051839937 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -6.33 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 141290 | -| policy_gradient_loss | 0.0323 | -| std | 0.0113 | -| value_loss | 8.92e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14131 | -| time_elapsed | 74930 | -| total_timesteps | 1808768 | -| train/ | | -| approx_kl | 0.008279966 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.908 | -| learning_rate | 0.0003 | -| loss | 0.000783 | -| n_updates | 141300 | -| policy_gradient_loss | 0.00458 | -| std | 0.0113 | -| value_loss | 8.62e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14132 | -| time_elapsed | 74935 | -| total_timesteps | 1808896 | -| train/ | | -| approx_kl | 0.21587856 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.0912 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 141310 | -| policy_gradient_loss | 0.0269 | -| std | 0.0113 | -| value_loss | 8.47e-10 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14133 | -| time_elapsed | 74939 | -| total_timesteps | 1809024 | -| train/ | | -| approx_kl | 0.00021216273 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.06 | -| explained_variance | -0.00966 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 141320 | -| policy_gradient_loss | -0.00034 | -| std | 0.0113 | -| value_loss | 7.52e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14134 | -| time_elapsed | 74947 | -| total_timesteps | 1809152 | -| train/ | | -| approx_kl | 7.095747e-05 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | 0.00091 | -| n_updates | 141330 | -| policy_gradient_loss | 0.0003 | -| std | 0.0113 | -| value_loss | 0.00311 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14135 | -| time_elapsed | 74951 | -| total_timesteps | 1809280 | -| train/ | | -| approx_kl | 0.0021141404 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | 0.0919 | -| learning_rate | 0.0003 | -| loss | 0.00375 | -| n_updates | 141340 | -| policy_gradient_loss | 0.00107 | -| std | 0.0112 | -| value_loss | 3.57e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14136 | -| time_elapsed | 74955 | -| total_timesteps | 1809408 | -| train/ | | -| approx_kl | 0.04629897 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -2.45 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 141350 | -| policy_gradient_loss | 0.0166 | -| std | 0.0112 | -| value_loss | 5.71e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14137 | -| time_elapsed | 74960 | -| total_timesteps | 1809536 | -| train/ | | -| approx_kl | 0.011791572 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.479 | -| learning_rate | 0.0003 | -| loss | 0.00301 | -| n_updates | 141360 | -| policy_gradient_loss | 0.0104 | -| std | 0.0112 | -| value_loss | 2.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14138 | -| time_elapsed | 74965 | -| total_timesteps | 1809664 | -| train/ | | -| approx_kl | 0.053338915 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 141370 | -| policy_gradient_loss | 0.00639 | -| std | 0.0112 | -| value_loss | 1.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14139 | -| time_elapsed | 74969 | -| total_timesteps | 1809792 | -| train/ | | -| approx_kl | 0.059854385 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.049 | -| n_updates | 141380 | -| policy_gradient_loss | 0.0225 | -| std | 0.0112 | -| value_loss | 1.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14140 | -| time_elapsed | 74973 | -| total_timesteps | 1809920 | -| train/ | | -| approx_kl | 0.02011542 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | -0.00862 | -| n_updates | 141390 | -| policy_gradient_loss | 0.00281 | -| std | 0.0112 | -| value_loss | 9.21e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14141 | -| time_elapsed | 74978 | -| total_timesteps | 1810048 | -| train/ | | -| approx_kl | 0.047685128 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 141400 | -| policy_gradient_loss | -0.00549 | -| std | 0.0112 | -| value_loss | 8.49e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14142 | -| time_elapsed | 74987 | -| total_timesteps | 1810176 | -| train/ | | -| approx_kl | 0.07438128 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -9.15 | -| learning_rate | 0.0003 | -| loss | -0.00591 | -| n_updates | 141410 | -| policy_gradient_loss | -0.00263 | -| std | 0.0112 | -| value_loss | 0.00282 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14143 | -| time_elapsed | 74991 | -| total_timesteps | 1810304 | -| train/ | | -| approx_kl | 0.002187178 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | 1.34e-05 | -| n_updates | 141420 | -| policy_gradient_loss | 0.00597 | -| std | 0.0112 | -| value_loss | 3.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14144 | -| time_elapsed | 74996 | -| total_timesteps | 1810432 | -| train/ | | -| approx_kl | 0.16769347 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 141430 | -| policy_gradient_loss | 0.0115 | -| std | 0.0112 | -| value_loss | 2.44e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14145 | -| time_elapsed | 75002 | -| total_timesteps | 1810560 | -| train/ | | -| approx_kl | 0.0017283713 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -0.937 | -| learning_rate | 0.0003 | -| loss | 0.00642 | -| n_updates | 141440 | -| policy_gradient_loss | 0.016 | -| std | 0.0112 | -| value_loss | 9.45e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14146 | -| time_elapsed | 75008 | -| total_timesteps | 1810688 | -| train/ | | -| approx_kl | 0.004631103 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.07 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 141450 | -| policy_gradient_loss | 0.000618 | -| std | 0.0112 | -| value_loss | 6.78e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14147 | -| time_elapsed | 75013 | -| total_timesteps | 1810816 | -| train/ | | -| approx_kl | 0.014940038 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -4.57 | -| learning_rate | 0.0003 | -| loss | 4.87e-05 | -| n_updates | 141460 | -| policy_gradient_loss | 0.00669 | -| std | 0.0112 | -| value_loss | 1.48e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14148 | -| time_elapsed | 75018 | -| total_timesteps | 1810944 | -| train/ | | -| approx_kl | 0.2754793 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 141470 | -| policy_gradient_loss | 0.118 | -| std | 0.0112 | -| value_loss | 1.29e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14149 | -| time_elapsed | 75022 | -| total_timesteps | 1811072 | -| train/ | | -| approx_kl | 0.011386547 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.00163 | -| learning_rate | 0.0003 | -| loss | 0.000637 | -| n_updates | 141480 | -| policy_gradient_loss | -0.000215 | -| std | 0.0112 | -| value_loss | 5.15e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14150 | -| time_elapsed | 75029 | -| total_timesteps | 1811200 | -| train/ | | -| approx_kl | 0.011317083 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 141490 | -| policy_gradient_loss | -0.00184 | -| std | 0.0112 | -| value_loss | 3.88e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14151 | -| time_elapsed | 75033 | -| total_timesteps | 1811328 | -| train/ | | -| approx_kl | 0.013800083 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00314 | -| n_updates | 141500 | -| policy_gradient_loss | 0.00693 | -| std | 0.0112 | -| value_loss | 2.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14152 | -| time_elapsed | 75039 | -| total_timesteps | 1811456 | -| train/ | | -| approx_kl | 0.056570966 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.00444 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 141510 | -| policy_gradient_loss | 0.0167 | -| std | 0.0112 | -| value_loss | 1.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14153 | -| time_elapsed | 75044 | -| total_timesteps | 1811584 | -| train/ | | -| approx_kl | 0.06636468 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 141520 | -| policy_gradient_loss | 0.0146 | -| std | 0.0112 | -| value_loss | 1.16e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14154 | -| time_elapsed | 75048 | -| total_timesteps | 1811712 | -| train/ | | -| approx_kl | 0.019216128 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.000658 | -| n_updates | 141530 | -| policy_gradient_loss | -0.00387 | -| std | 0.0112 | -| value_loss | 8.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14155 | -| time_elapsed | 75053 | -| total_timesteps | 1811840 | -| train/ | | -| approx_kl | 0.054350376 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 141540 | -| policy_gradient_loss | 0.00701 | -| std | 0.0111 | -| value_loss | 5.98e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 24 | -| iterations | 14156 | -| time_elapsed | 75058 | -| total_timesteps | 1811968 | -| train/ | | -| approx_kl | 0.021426369 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.00882 | -| n_updates | 141550 | -| policy_gradient_loss | 0.0103 | -| std | 0.0112 | -| value_loss | 4.85e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14157 | -| time_elapsed | 75063 | -| total_timesteps | 1812096 | -| train/ | | -| approx_kl | 0.109043814 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 141560 | -| policy_gradient_loss | 0.00686 | -| std | 0.0112 | -| value_loss | 4.29e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14158 | -| time_elapsed | 75072 | -| total_timesteps | 1812224 | -| train/ | | -| approx_kl | 0.030801738 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 141570 | -| policy_gradient_loss | 0.0222 | -| std | 0.0112 | -| value_loss | 7.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14159 | -| time_elapsed | 75078 | -| total_timesteps | 1812352 | -| train/ | | -| approx_kl | 0.041493136 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.00211 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 141580 | -| policy_gradient_loss | 0.00356 | -| std | 0.0112 | -| value_loss | 3.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14160 | -| time_elapsed | 75084 | -| total_timesteps | 1812480 | -| train/ | | -| approx_kl | 0.022667535 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.00357 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 141590 | -| policy_gradient_loss | 0.00422 | -| std | 0.0112 | -| value_loss | 7.4e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14161 | -| time_elapsed | 75089 | -| total_timesteps | 1812608 | -| train/ | | -| approx_kl | 0.1216864 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 141600 | -| policy_gradient_loss | 0.00437 | -| std | 0.0111 | -| value_loss | 7.95e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14162 | -| time_elapsed | 75094 | -| total_timesteps | 1812736 | -| train/ | | -| approx_kl | 0.029924793 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0841 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 141610 | -| policy_gradient_loss | 0.0323 | -| std | 0.0111 | -| value_loss | 3.49e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14163 | -| time_elapsed | 75100 | -| total_timesteps | 1812864 | -| train/ | | -| approx_kl | 0.0061068903 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0837 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 141620 | -| policy_gradient_loss | -0.00955 | -| std | 0.0111 | -| value_loss | 5.75e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14164 | -| time_elapsed | 75105 | -| total_timesteps | 1812992 | -| train/ | | -| approx_kl | 0.022139562 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.00854 | -| n_updates | 141630 | -| policy_gradient_loss | 0.0111 | -| std | 0.0111 | -| value_loss | 4.99e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14165 | -| time_elapsed | 75109 | -| total_timesteps | 1813120 | -| train/ | | -| approx_kl | 0.09855257 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | 0.0607 | -| n_updates | 141640 | -| policy_gradient_loss | 0.0122 | -| std | 0.0111 | -| value_loss | 2.97e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14166 | -| time_elapsed | 75120 | -| total_timesteps | 1813248 | -| train/ | | -| approx_kl | 0.05533014 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 141650 | -| policy_gradient_loss | -0.0156 | -| std | 0.0111 | -| value_loss | 9.54e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14167 | -| time_elapsed | 75125 | -| total_timesteps | 1813376 | -| train/ | | -| approx_kl | 0.018688807 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -113 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 141660 | -| policy_gradient_loss | -0.000786 | -| std | 0.0111 | -| value_loss | 3.56e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14168 | -| time_elapsed | 75130 | -| total_timesteps | 1813504 | -| train/ | | -| approx_kl | 0.021965811 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -173 | -| learning_rate | 0.0003 | -| loss | -0.0051 | -| n_updates | 141670 | -| policy_gradient_loss | -0.00239 | -| std | 0.0111 | -| value_loss | 2.05e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14169 | -| time_elapsed | 75135 | -| total_timesteps | 1813632 | -| train/ | | -| approx_kl | 0.03463128 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -13.7 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 141680 | -| policy_gradient_loss | -0.00429 | -| std | 0.0111 | -| value_loss | 7.22e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14170 | -| time_elapsed | 75140 | -| total_timesteps | 1813760 | -| train/ | | -| approx_kl | 0.03484627 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.989 | -| learning_rate | 0.0003 | -| loss | 0.0348 | -| n_updates | 141690 | -| policy_gradient_loss | 0.0169 | -| std | 0.0111 | -| value_loss | 1.44e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14171 | -| time_elapsed | 75145 | -| total_timesteps | 1813888 | -| train/ | | -| approx_kl | 0.015385708 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | 0.00935 | -| n_updates | 141700 | -| policy_gradient_loss | 0.022 | -| std | 0.0111 | -| value_loss | 8.02e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14172 | -| time_elapsed | 75149 | -| total_timesteps | 1814016 | -| train/ | | -| approx_kl | 0.29851994 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.00232 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 141710 | -| policy_gradient_loss | 0.0984 | -| std | 0.0111 | -| value_loss | 3.77e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14173 | -| time_elapsed | 75160 | -| total_timesteps | 1814144 | -| train/ | | -| approx_kl | 0.016633697 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.778 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 141720 | -| policy_gradient_loss | -0.0123 | -| std | 0.0111 | -| value_loss | 0.00386 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14174 | -| time_elapsed | 75165 | -| total_timesteps | 1814272 | -| train/ | | -| approx_kl | 0.09282647 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.0574 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 141730 | -| policy_gradient_loss | 0.012 | -| std | 0.0111 | -| value_loss | 3.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14175 | -| time_elapsed | 75170 | -| total_timesteps | 1814400 | -| train/ | | -| approx_kl | 0.018179826 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 141740 | -| policy_gradient_loss | 0.0179 | -| std | 0.0111 | -| value_loss | 9.02e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14176 | -| time_elapsed | 75174 | -| total_timesteps | 1814528 | -| train/ | | -| approx_kl | 0.0935689 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.0712 | -| n_updates | 141750 | -| policy_gradient_loss | 0.0193 | -| std | 0.0111 | -| value_loss | 2.66e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14177 | -| time_elapsed | 75180 | -| total_timesteps | 1814656 | -| train/ | | -| approx_kl | 0.023179129 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 141760 | -| policy_gradient_loss | 0.0386 | -| std | 0.0111 | -| value_loss | 2.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14178 | -| time_elapsed | 75185 | -| total_timesteps | 1814784 | -| train/ | | -| approx_kl | 0.038603146 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 141770 | -| policy_gradient_loss | -0.00912 | -| std | 0.0111 | -| value_loss | 2.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 24 | -| iterations | 14179 | -| time_elapsed | 75189 | -| total_timesteps | 1814912 | -| train/ | | -| approx_kl | 0.024888437 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.00715 | -| n_updates | 141780 | -| policy_gradient_loss | 0.00316 | -| std | 0.0111 | -| value_loss | 1.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14180 | -| time_elapsed | 75194 | -| total_timesteps | 1815040 | -| train/ | | -| approx_kl | 0.0051368806 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 141790 | -| policy_gradient_loss | -0.00137 | -| std | 0.0111 | -| value_loss | 8.65e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14181 | -| time_elapsed | 75203 | -| total_timesteps | 1815168 | -| train/ | | -| approx_kl | 0.13614993 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 141800 | -| policy_gradient_loss | -0.0153 | -| std | 0.0111 | -| value_loss | 9.69e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14182 | -| time_elapsed | 75209 | -| total_timesteps | 1815296 | -| train/ | | -| approx_kl | 0.06675949 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.000105 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 141810 | -| policy_gradient_loss | 0.0163 | -| std | 0.0111 | -| value_loss | 3.83e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14183 | -| time_elapsed | 75214 | -| total_timesteps | 1815424 | -| train/ | | -| approx_kl | 0.03717048 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 141820 | -| policy_gradient_loss | 0.0173 | -| std | 0.0111 | -| value_loss | 2.81e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14184 | -| time_elapsed | 75217 | -| total_timesteps | 1815552 | -| train/ | | -| approx_kl | 0.0548876 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 141830 | -| policy_gradient_loss | 0.00717 | -| std | 0.0111 | -| value_loss | 2.54e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14185 | -| time_elapsed | 75222 | -| total_timesteps | 1815680 | -| train/ | | -| approx_kl | 0.22457474 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0086 | -| learning_rate | 0.0003 | -| loss | 0.0997 | -| n_updates | 141840 | -| policy_gradient_loss | 0.0223 | -| std | 0.0111 | -| value_loss | 2.17e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14186 | -| time_elapsed | 75227 | -| total_timesteps | 1815808 | -| train/ | | -| approx_kl | 0.011795751 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.00859 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 141850 | -| policy_gradient_loss | -0.000975 | -| std | 0.0111 | -| value_loss | 1.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14187 | -| time_elapsed | 75232 | -| total_timesteps | 1815936 | -| train/ | | -| approx_kl | 0.019791862 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 141860 | -| policy_gradient_loss | -0.0047 | -| std | 0.0111 | -| value_loss | 1.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14188 | -| time_elapsed | 75236 | -| total_timesteps | 1816064 | -| train/ | | -| approx_kl | 0.034588277 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.0067 | -| n_updates | 141870 | -| policy_gradient_loss | 0.0136 | -| std | 0.0111 | -| value_loss | 8.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14189 | -| time_elapsed | 75242 | -| total_timesteps | 1816192 | -| train/ | | -| approx_kl | 0.007947631 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.796 | -| learning_rate | 0.0003 | -| loss | -0.000184 | -| n_updates | 141880 | -| policy_gradient_loss | -0.000211 | -| std | 0.0111 | -| value_loss | 0.00342 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14190 | -| time_elapsed | 75247 | -| total_timesteps | 1816320 | -| train/ | | -| approx_kl | 0.12340595 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 141890 | -| policy_gradient_loss | 0.0121 | -| std | 0.0111 | -| value_loss | 6.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14191 | -| time_elapsed | 75251 | -| total_timesteps | 1816448 | -| train/ | | -| approx_kl | 0.08003373 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 141900 | -| policy_gradient_loss | 0.00754 | -| std | 0.0111 | -| value_loss | 1.42e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14192 | -| time_elapsed | 75255 | -| total_timesteps | 1816576 | -| train/ | | -| approx_kl | 0.040410057 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 141910 | -| policy_gradient_loss | 0.0116 | -| std | 0.0111 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14193 | -| time_elapsed | 75260 | -| total_timesteps | 1816704 | -| train/ | | -| approx_kl | 0.044532668 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0192 | -| n_updates | 141920 | -| policy_gradient_loss | 0.0145 | -| std | 0.0111 | -| value_loss | 2.11e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14194 | -| time_elapsed | 75265 | -| total_timesteps | 1816832 | -| train/ | | -| approx_kl | 0.11358422 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0816 | -| n_updates | 141930 | -| policy_gradient_loss | 0.067 | -| std | 0.0111 | -| value_loss | 2.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14195 | -| time_elapsed | 75270 | -| total_timesteps | 1816960 | -| train/ | | -| approx_kl | 0.018738065 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0831 | -| learning_rate | 0.0003 | -| loss | -0.00226 | -| n_updates | 141940 | -| policy_gradient_loss | 0.00465 | -| std | 0.0111 | -| value_loss | 5.79e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14196 | -| time_elapsed | 75274 | -| total_timesteps | 1817088 | -| train/ | | -| approx_kl | 0.017079 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 141950 | -| policy_gradient_loss | -0.00525 | -| std | 0.0111 | -| value_loss | 5.29e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14197 | -| time_elapsed | 75285 | -| total_timesteps | 1817216 | -| train/ | | -| approx_kl | 0.021657847 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.773 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 141960 | -| policy_gradient_loss | 0.000624 | -| std | 0.0111 | -| value_loss | 0.00432 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14198 | -| time_elapsed | 75290 | -| total_timesteps | 1817344 | -| train/ | | -| approx_kl | 0.00017985748 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 141970 | -| policy_gradient_loss | 0.0102 | -| std | 0.0111 | -| value_loss | 2.62e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14199 | -| time_elapsed | 75295 | -| total_timesteps | 1817472 | -| train/ | | -| approx_kl | 0.0029841652 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.447 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 141980 | -| policy_gradient_loss | 0.0162 | -| std | 0.0111 | -| value_loss | 1.28e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14200 | -| time_elapsed | 75301 | -| total_timesteps | 1817600 | -| train/ | | -| approx_kl | 0.09413934 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 141990 | -| policy_gradient_loss | 0.00762 | -| std | 0.0111 | -| value_loss | 6.36e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14201 | -| time_elapsed | 75305 | -| total_timesteps | 1817728 | -| train/ | | -| approx_kl | 0.07693508 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.0253 | -| n_updates | 142000 | -| policy_gradient_loss | 0.00912 | -| std | 0.0111 | -| value_loss | 4.32e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14202 | -| time_elapsed | 75309 | -| total_timesteps | 1817856 | -| train/ | | -| approx_kl | 0.02144675 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 142010 | -| policy_gradient_loss | 0.0107 | -| std | 0.0111 | -| value_loss | 9.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14203 | -| time_elapsed | 75313 | -| total_timesteps | 1817984 | -| train/ | | -| approx_kl | 0.051445626 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 142020 | -| policy_gradient_loss | 0.0112 | -| std | 0.0111 | -| value_loss | 1.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14204 | -| time_elapsed | 75317 | -| total_timesteps | 1818112 | -| train/ | | -| approx_kl | 0.13457108 | -| clip_fraction | 0.563 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00836 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 142030 | -| policy_gradient_loss | 0.0779 | -| std | 0.0111 | -| value_loss | 7.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14205 | -| time_elapsed | 75329 | -| total_timesteps | 1818240 | -| train/ | | -| approx_kl | 0.016861632 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -14.1 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 142040 | -| policy_gradient_loss | -0.01 | -| std | 0.0111 | -| value_loss | 0.00347 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14206 | -| time_elapsed | 75334 | -| total_timesteps | 1818368 | -| train/ | | -| approx_kl | 0.0071355975 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 142050 | -| policy_gradient_loss | -0.000373 | -| std | 0.0111 | -| value_loss | 8.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14207 | -| time_elapsed | 75339 | -| total_timesteps | 1818496 | -| train/ | | -| approx_kl | 0.014005061 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -75.5 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 142060 | -| policy_gradient_loss | -0.00169 | -| std | 0.0111 | -| value_loss | 9.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14208 | -| time_elapsed | 75344 | -| total_timesteps | 1818624 | -| train/ | | -| approx_kl | 0.09827524 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -1.27e+03 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 142070 | -| policy_gradient_loss | -0.000697 | -| std | 0.011 | -| value_loss | 3.17e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14209 | -| time_elapsed | 75349 | -| total_timesteps | 1818752 | -| train/ | | -| approx_kl | 0.16439158 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -1.17e+04 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 142080 | -| policy_gradient_loss | 0.0206 | -| std | 0.011 | -| value_loss | 1.21e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 24 | -| iterations | 14210 | -| time_elapsed | 75355 | -| total_timesteps | 1818880 | -| train/ | | -| approx_kl | 0.023972072 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -11.2 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 142090 | -| policy_gradient_loss | 0.00042 | -| std | 0.011 | -| value_loss | 5.12e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14211 | -| time_elapsed | 75358 | -| total_timesteps | 1819008 | -| train/ | | -| approx_kl | 0.11500529 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -8.23 | -| learning_rate | 0.0003 | -| loss | 0.00803 | -| n_updates | 142100 | -| policy_gradient_loss | 0.00029 | -| std | 0.011 | -| value_loss | 5.17e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14212 | -| time_elapsed | 75372 | -| total_timesteps | 1819136 | -| train/ | | -| approx_kl | 0.04609091 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 142110 | -| policy_gradient_loss | -0.00346 | -| std | 0.011 | -| value_loss | 7.88e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14213 | -| time_elapsed | 75377 | -| total_timesteps | 1819264 | -| train/ | | -| approx_kl | 0.12239684 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 142120 | -| policy_gradient_loss | 0.00895 | -| std | 0.011 | -| value_loss | 5.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14214 | -| time_elapsed | 75384 | -| total_timesteps | 1819392 | -| train/ | | -| approx_kl | 0.029805683 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -3.6 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 142130 | -| policy_gradient_loss | -0.00586 | -| std | 0.011 | -| value_loss | 1.14e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14215 | -| time_elapsed | 75389 | -| total_timesteps | 1819520 | -| train/ | | -| approx_kl | 0.159435 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.373 | -| learning_rate | 0.0003 | -| loss | 0.0838 | -| n_updates | 142140 | -| policy_gradient_loss | 0.0287 | -| std | 0.011 | -| value_loss | 1.6e-08 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14216 | -| time_elapsed | 75392 | -| total_timesteps | 1819648 | -| train/ | | -| approx_kl | 0.0030478695 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 142150 | -| policy_gradient_loss | -0.00418 | -| std | 0.011 | -| value_loss | 1.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14217 | -| time_elapsed | 75394 | -| total_timesteps | 1819776 | -| train/ | | -| approx_kl | 0.028208245 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00374 | -| learning_rate | 0.0003 | -| loss | -0.000754 | -| n_updates | 142160 | -| policy_gradient_loss | 0.0218 | -| std | 0.011 | -| value_loss | 2.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14218 | -| time_elapsed | 75399 | -| total_timesteps | 1819904 | -| train/ | | -| approx_kl | 0.08132887 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 142170 | -| policy_gradient_loss | 0.0156 | -| std | 0.011 | -| value_loss | 9.44e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14219 | -| time_elapsed | 75403 | -| total_timesteps | 1820032 | -| train/ | | -| approx_kl | 0.00057572406 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | -0.000447 | -| n_updates | 142180 | -| policy_gradient_loss | 0.00541 | -| std | 0.011 | -| value_loss | 5.94e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14220 | -| time_elapsed | 75413 | -| total_timesteps | 1820160 | -| train/ | | -| approx_kl | 0.01052778 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 142190 | -| policy_gradient_loss | -0.00057 | -| std | 0.011 | -| value_loss | 3.86e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14221 | -| time_elapsed | 75418 | -| total_timesteps | 1820288 | -| train/ | | -| approx_kl | 0.010373196 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00453 | -| learning_rate | 0.0003 | -| loss | 0.000754 | -| n_updates | 142200 | -| policy_gradient_loss | 0.0254 | -| std | 0.011 | -| value_loss | 7.13e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14222 | -| time_elapsed | 75424 | -| total_timesteps | 1820416 | -| train/ | | -| approx_kl | 0.0017649666 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | -0.000481 | -| n_updates | 142210 | -| policy_gradient_loss | 0.0321 | -| std | 0.011 | -| value_loss | 1.35e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14223 | -| time_elapsed | 75429 | -| total_timesteps | 1820544 | -| train/ | | -| approx_kl | 0.10427913 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.0661 | -| n_updates | 142220 | -| policy_gradient_loss | 0.015 | -| std | 0.011 | -| value_loss | 5.41e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14224 | -| time_elapsed | 75435 | -| total_timesteps | 1820672 | -| train/ | | -| approx_kl | 0.02655066 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 142230 | -| policy_gradient_loss | 0.0293 | -| std | 0.011 | -| value_loss | 4.77e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14225 | -| time_elapsed | 75439 | -| total_timesteps | 1820800 | -| train/ | | -| approx_kl | 0.09044211 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 142240 | -| policy_gradient_loss | 0.0155 | -| std | 0.011 | -| value_loss | 4.36e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14226 | -| time_elapsed | 75443 | -| total_timesteps | 1820928 | -| train/ | | -| approx_kl | 0.00034494651 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00859 | -| learning_rate | 0.0003 | -| loss | -0.000889 | -| n_updates | 142250 | -| policy_gradient_loss | 0.0176 | -| std | 0.011 | -| value_loss | 2.37e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14227 | -| time_elapsed | 75448 | -| total_timesteps | 1821056 | -| train/ | | -| approx_kl | 0.035932776 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 142260 | -| policy_gradient_loss | 0.00633 | -| std | 0.011 | -| value_loss | 2.16e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14228 | -| time_elapsed | 75458 | -| total_timesteps | 1821184 | -| train/ | | -| approx_kl | 0.007982532 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | -0.00939 | -| n_updates | 142270 | -| policy_gradient_loss | 0.0159 | -| std | 0.011 | -| value_loss | 6.38e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14229 | -| time_elapsed | 75464 | -| total_timesteps | 1821312 | -| train/ | | -| approx_kl | 0.0025935322 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 142280 | -| policy_gradient_loss | 0.00228 | -| std | 0.011 | -| value_loss | 1.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14230 | -| time_elapsed | 75467 | -| total_timesteps | 1821440 | -| train/ | | -| approx_kl | 0.032404106 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.0046 | -| learning_rate | 0.0003 | -| loss | 0.00989 | -| n_updates | 142290 | -| policy_gradient_loss | 0.0296 | -| std | 0.011 | -| value_loss | 1.41e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14231 | -| time_elapsed | 75471 | -| total_timesteps | 1821568 | -| train/ | | -| approx_kl | 2.1646265e-05 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.000273 | -| n_updates | 142300 | -| policy_gradient_loss | 0.0314 | -| std | 0.011 | -| value_loss | 1.03e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14232 | -| time_elapsed | 75476 | -| total_timesteps | 1821696 | -| train/ | | -| approx_kl | 0.040255938 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.00783 | -| n_updates | 142310 | -| policy_gradient_loss | 0.0469 | -| std | 0.011 | -| value_loss | 8.92e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14233 | -| time_elapsed | 75481 | -| total_timesteps | 1821824 | -| train/ | | -| approx_kl | 0.00034078816 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00817 | -| learning_rate | 0.0003 | -| loss | -3.79e-05 | -| n_updates | 142320 | -| policy_gradient_loss | 0.01 | -| std | 0.011 | -| value_loss | 1.16e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 24 | -| iterations | 14234 | -| time_elapsed | 75486 | -| total_timesteps | 1821952 | -| train/ | | -| approx_kl | 0.00024100672 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.000882 | -| learning_rate | 0.0003 | -| loss | 0.00242 | -| n_updates | 142330 | -| policy_gradient_loss | -0.00369 | -| std | 0.0111 | -| value_loss | 1.02e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14235 | -| time_elapsed | 75490 | -| total_timesteps | 1822080 | -| train/ | | -| approx_kl | 0.000319215 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 142340 | -| policy_gradient_loss | 0.00257 | -| std | 0.0111 | -| value_loss | 2.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14236 | -| time_elapsed | 75498 | -| total_timesteps | 1822208 | -| train/ | | -| approx_kl | 0.004963067 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.766 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 142350 | -| policy_gradient_loss | 0.000182 | -| std | 0.0111 | -| value_loss | 0.00459 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14237 | -| time_elapsed | 75503 | -| total_timesteps | 1822336 | -| train/ | | -| approx_kl | 0.0356611 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.0197 | -| n_updates | 142360 | -| policy_gradient_loss | 0.0117 | -| std | 0.0111 | -| value_loss | 3.92e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14238 | -| time_elapsed | 75507 | -| total_timesteps | 1822464 | -| train/ | | -| approx_kl | 0.044267982 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 142370 | -| policy_gradient_loss | 0.01 | -| std | 0.0111 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14239 | -| time_elapsed | 75512 | -| total_timesteps | 1822592 | -| train/ | | -| approx_kl | 0.095226385 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0888 | -| learning_rate | 0.0003 | -| loss | 0.0569 | -| n_updates | 142380 | -| policy_gradient_loss | 0.0429 | -| std | 0.0111 | -| value_loss | 1.27e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14240 | -| time_elapsed | 75517 | -| total_timesteps | 1822720 | -| train/ | | -| approx_kl | 0.06868636 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 142390 | -| policy_gradient_loss | 0.0571 | -| std | 0.0111 | -| value_loss | 3.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14241 | -| time_elapsed | 75522 | -| total_timesteps | 1822848 | -| train/ | | -| approx_kl | 0.051287252 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 142400 | -| policy_gradient_loss | 0.0519 | -| std | 0.0111 | -| value_loss | 7.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 24 | -| iterations | 14242 | -| time_elapsed | 75528 | -| total_timesteps | 1822976 | -| train/ | | -| approx_kl | 0.0016661445 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -194 | -| learning_rate | 0.0003 | -| loss | -0.000863 | -| n_updates | 142410 | -| policy_gradient_loss | 0.0164 | -| std | 0.0111 | -| value_loss | 8.61e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14243 | -| time_elapsed | 75534 | -| total_timesteps | 1823104 | -| train/ | | -| approx_kl | 0.30144578 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.0744 | -| n_updates | 142420 | -| policy_gradient_loss | 0.0152 | -| std | 0.0111 | -| value_loss | 1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14244 | -| time_elapsed | 75544 | -| total_timesteps | 1823232 | -| train/ | | -| approx_kl | 0.07345834 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.08 | -| explained_variance | 0.102 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 142430 | -| policy_gradient_loss | -0.0132 | -| std | 0.0111 | -| value_loss | 0.00125 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14245 | -| time_elapsed | 75549 | -| total_timesteps | 1823360 | -| train/ | | -| approx_kl | 0.009327708 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -114 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 142440 | -| policy_gradient_loss | -0.00317 | -| std | 0.011 | -| value_loss | 1.78e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14246 | -| time_elapsed | 75553 | -| total_timesteps | 1823488 | -| train/ | | -| approx_kl | 0.0060121147 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -1.83 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 142450 | -| policy_gradient_loss | -0.00137 | -| std | 0.011 | -| value_loss | 1.7e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14247 | -| time_elapsed | 75559 | -| total_timesteps | 1823616 | -| train/ | | -| approx_kl | 0.011018263 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -2.41 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 142460 | -| policy_gradient_loss | 0.011 | -| std | 0.011 | -| value_loss | 3.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14248 | -| time_elapsed | 75562 | -| total_timesteps | 1823744 | -| train/ | | -| approx_kl | 0.037206262 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 142470 | -| policy_gradient_loss | -0.00452 | -| std | 0.011 | -| value_loss | 7.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 24 | -| iterations | 14249 | -| time_elapsed | 75566 | -| total_timesteps | 1823872 | -| train/ | | -| approx_kl | 0.037026294 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | 0.00305 | -| n_updates | 142480 | -| policy_gradient_loss | -0.00335 | -| std | 0.011 | -| value_loss | 3.26e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14250 | -| time_elapsed | 75571 | -| total_timesteps | 1824000 | -| train/ | | -| approx_kl | 0.0067035384 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -0.00813 | -| n_updates | 142490 | -| policy_gradient_loss | -0.00156 | -| std | 0.011 | -| value_loss | 2.67e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14251 | -| time_elapsed | 75575 | -| total_timesteps | 1824128 | -| train/ | | -| approx_kl | 0.020543752 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00194 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 142500 | -| policy_gradient_loss | -0.00665 | -| std | 0.011 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14252 | -| time_elapsed | 75585 | -| total_timesteps | 1824256 | -| train/ | | -| approx_kl | 0.03776031 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.79 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 142510 | -| policy_gradient_loss | -0.000322 | -| std | 0.011 | -| value_loss | 0.00351 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14253 | -| time_elapsed | 75590 | -| total_timesteps | 1824384 | -| train/ | | -| approx_kl | 0.20686825 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 142520 | -| policy_gradient_loss | 0.0254 | -| std | 0.011 | -| value_loss | 1.38e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14254 | -| time_elapsed | 75595 | -| total_timesteps | 1824512 | -| train/ | | -| approx_kl | 0.014278773 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.00247 | -| n_updates | 142530 | -| policy_gradient_loss | 0.00174 | -| std | 0.011 | -| value_loss | 2.59e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14255 | -| time_elapsed | 75600 | -| total_timesteps | 1824640 | -| train/ | | -| approx_kl | 0.0021939906 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 142540 | -| policy_gradient_loss | 0.000304 | -| std | 0.011 | -| value_loss | 1.22e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14256 | -| time_elapsed | 75604 | -| total_timesteps | 1824768 | -| train/ | | -| approx_kl | 0.026660593 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 142550 | -| policy_gradient_loss | 0.00317 | -| std | 0.011 | -| value_loss | 1.12e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 24 | -| iterations | 14257 | -| time_elapsed | 75609 | -| total_timesteps | 1824896 | -| train/ | | -| approx_kl | 0.01652158 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.00254 | -| n_updates | 142560 | -| policy_gradient_loss | 0.0155 | -| std | 0.011 | -| value_loss | 4.71e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14258 | -| time_elapsed | 75613 | -| total_timesteps | 1825024 | -| train/ | | -| approx_kl | 0.2660703 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 142570 | -| policy_gradient_loss | 0.0809 | -| std | 0.011 | -| value_loss | 3.25e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14259 | -| time_elapsed | 75624 | -| total_timesteps | 1825152 | -| train/ | | -| approx_kl | 0.07254702 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 142580 | -| policy_gradient_loss | -0.0113 | -| std | 0.011 | -| value_loss | 2.14e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14260 | -| time_elapsed | 75628 | -| total_timesteps | 1825280 | -| train/ | | -| approx_kl | 0.056906167 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.0505 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 142590 | -| policy_gradient_loss | 0.0062 | -| std | 0.011 | -| value_loss | 7.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14261 | -| time_elapsed | 75631 | -| total_timesteps | 1825408 | -| train/ | | -| approx_kl | 0.017375644 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00912 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 142600 | -| policy_gradient_loss | -0.00143 | -| std | 0.011 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14262 | -| time_elapsed | 75635 | -| total_timesteps | 1825536 | -| train/ | | -| approx_kl | 0.05450192 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00977 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 142610 | -| policy_gradient_loss | 0.0146 | -| std | 0.011 | -| value_loss | 1.02e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14263 | -| time_elapsed | 75638 | -| total_timesteps | 1825664 | -| train/ | | -| approx_kl | 0.019139074 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 142620 | -| policy_gradient_loss | 0.00608 | -| std | 0.011 | -| value_loss | 4.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14264 | -| time_elapsed | 75642 | -| total_timesteps | 1825792 | -| train/ | | -| approx_kl | 0.052827477 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0035 | -| n_updates | 142630 | -| policy_gradient_loss | 0.00349 | -| std | 0.011 | -| value_loss | 3.93e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14265 | -| time_elapsed | 75645 | -| total_timesteps | 1825920 | -| train/ | | -| approx_kl | 0.13633165 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00993 | -| learning_rate | 0.0003 | -| loss | 0.0957 | -| n_updates | 142640 | -| policy_gradient_loss | 0.067 | -| std | 0.011 | -| value_loss | 3.26e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14266 | -| time_elapsed | 75649 | -| total_timesteps | 1826048 | -| train/ | | -| approx_kl | 0.073707685 | -| clip_fraction | 0.594 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00892 | -| learning_rate | 0.0003 | -| loss | 0.0724 | -| n_updates | 142650 | -| policy_gradient_loss | 0.0742 | -| std | 0.011 | -| value_loss | 2.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14267 | -| time_elapsed | 75657 | -| total_timesteps | 1826176 | -| train/ | | -| approx_kl | 0.042309288 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.234 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 142660 | -| policy_gradient_loss | -0.0136 | -| std | 0.011 | -| value_loss | 0.0011 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14268 | -| time_elapsed | 75663 | -| total_timesteps | 1826304 | -| train/ | | -| approx_kl | 0.020854227 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | 0.00664 | -| n_updates | 142670 | -| policy_gradient_loss | 0.0106 | -| std | 0.011 | -| value_loss | 4.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14269 | -| time_elapsed | 75668 | -| total_timesteps | 1826432 | -| train/ | | -| approx_kl | 0.03523372 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -4.35 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 142680 | -| policy_gradient_loss | -0.00443 | -| std | 0.011 | -| value_loss | 3.59e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14270 | -| time_elapsed | 75673 | -| total_timesteps | 1826560 | -| train/ | | -| approx_kl | 0.20997047 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | 0.0495 | -| n_updates | 142690 | -| policy_gradient_loss | 0.0124 | -| std | 0.011 | -| value_loss | 9.24e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14271 | -| time_elapsed | 75678 | -| total_timesteps | 1826688 | -| train/ | | -| approx_kl | 0.049105473 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.351 | -| learning_rate | 0.0003 | -| loss | 0.00347 | -| n_updates | 142700 | -| policy_gradient_loss | 0.012 | -| std | 0.011 | -| value_loss | 4.69e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14272 | -| time_elapsed | 75684 | -| total_timesteps | 1826816 | -| train/ | | -| approx_kl | 0.030735992 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.0296 | -| n_updates | 142710 | -| policy_gradient_loss | 0.0239 | -| std | 0.011 | -| value_loss | 2.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14273 | -| time_elapsed | 75689 | -| total_timesteps | 1826944 | -| train/ | | -| approx_kl | 0.011752455 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.00314 | -| n_updates | 142720 | -| policy_gradient_loss | 0.0156 | -| std | 0.011 | -| value_loss | 2.39e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14274 | -| time_elapsed | 75695 | -| total_timesteps | 1827072 | -| train/ | | -| approx_kl | 0.0126853045 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0665 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 142730 | -| policy_gradient_loss | 0.0251 | -| std | 0.011 | -| value_loss | 1.02e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14275 | -| time_elapsed | 75703 | -| total_timesteps | 1827200 | -| train/ | | -| approx_kl | 0.015291413 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 142740 | -| policy_gradient_loss | -0.0132 | -| std | 0.011 | -| value_loss | 9.58e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14276 | -| time_elapsed | 75708 | -| total_timesteps | 1827328 | -| train/ | | -| approx_kl | 0.0071155024 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00773 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 142750 | -| policy_gradient_loss | -0.0101 | -| std | 0.011 | -| value_loss | 3.05e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14277 | -| time_elapsed | 75714 | -| total_timesteps | 1827456 | -| train/ | | -| approx_kl | 0.00039652316 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 142760 | -| policy_gradient_loss | 0.00331 | -| std | 0.011 | -| value_loss | 3.09e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14278 | -| time_elapsed | 75718 | -| total_timesteps | 1827584 | -| train/ | | -| approx_kl | 0.24377711 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -231 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 142770 | -| policy_gradient_loss | -0.00376 | -| std | 0.011 | -| value_loss | 3.51e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14279 | -| time_elapsed | 75722 | -| total_timesteps | 1827712 | -| train/ | | -| approx_kl | 0.01036597 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.805 | -| learning_rate | 0.0003 | -| loss | -0.00826 | -| n_updates | 142780 | -| policy_gradient_loss | 0.00043 | -| std | 0.011 | -| value_loss | 3.91e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14280 | -| time_elapsed | 75727 | -| total_timesteps | 1827840 | -| train/ | | -| approx_kl | 0.07238844 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 142790 | -| policy_gradient_loss | 0.0421 | -| std | 0.011 | -| value_loss | 1.59e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 24 | -| iterations | 14281 | -| time_elapsed | 75733 | -| total_timesteps | 1827968 | -| train/ | | -| approx_kl | 0.021034736 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 142800 | -| policy_gradient_loss | 0.00646 | -| std | 0.011 | -| value_loss | 3.69e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14282 | -| time_elapsed | 75736 | -| total_timesteps | 1828096 | -| train/ | | -| approx_kl | 0.016354607 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00858 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 142810 | -| policy_gradient_loss | -0.00718 | -| std | 0.011 | -| value_loss | 1.99e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14283 | -| time_elapsed | 75746 | -| total_timesteps | 1828224 | -| train/ | | -| approx_kl | 0.009906381 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 142820 | -| policy_gradient_loss | 0.00431 | -| std | 0.011 | -| value_loss | 0.00214 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14284 | -| time_elapsed | 75751 | -| total_timesteps | 1828352 | -| train/ | | -| approx_kl | 0.021063713 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 142830 | -| policy_gradient_loss | 0.00201 | -| std | 0.011 | -| value_loss | 9.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14285 | -| time_elapsed | 75756 | -| total_timesteps | 1828480 | -| train/ | | -| approx_kl | 0.015522677 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00388 | -| learning_rate | 0.0003 | -| loss | 0.0076 | -| n_updates | 142840 | -| policy_gradient_loss | 0.0133 | -| std | 0.011 | -| value_loss | 1.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14286 | -| time_elapsed | 75761 | -| total_timesteps | 1828608 | -| train/ | | -| approx_kl | 0.11060931 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 142850 | -| policy_gradient_loss | 0.0106 | -| std | 0.011 | -| value_loss | 1.29e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14287 | -| time_elapsed | 75765 | -| total_timesteps | 1828736 | -| train/ | | -| approx_kl | 6.215647e-06 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | -0.000194 | -| n_updates | 142860 | -| policy_gradient_loss | 0.0011 | -| std | 0.011 | -| value_loss | 7.99e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14288 | -| time_elapsed | 75771 | -| total_timesteps | 1828864 | -| train/ | | -| approx_kl | 0.020187384 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.00771 | -| n_updates | 142870 | -| policy_gradient_loss | 0.018 | -| std | 0.011 | -| value_loss | 4.93e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 24 | -| iterations | 14289 | -| time_elapsed | 75776 | -| total_timesteps | 1828992 | -| train/ | | -| approx_kl | 0.030858453 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 142880 | -| policy_gradient_loss | 0.0111 | -| std | 0.011 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14290 | -| time_elapsed | 75780 | -| total_timesteps | 1829120 | -| train/ | | -| approx_kl | 0.008027175 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 142890 | -| policy_gradient_loss | 0.0212 | -| std | 0.011 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14291 | -| time_elapsed | 75793 | -| total_timesteps | 1829248 | -| train/ | | -| approx_kl | 0.034228638 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.00656 | -| n_updates | 142900 | -| policy_gradient_loss | -0.00134 | -| std | 0.011 | -| value_loss | 0.000636 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14292 | -| time_elapsed | 75798 | -| total_timesteps | 1829376 | -| train/ | | -| approx_kl | 0.101524994 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0894 | -| learning_rate | 0.0003 | -| loss | 0.0722 | -| n_updates | 142910 | -| policy_gradient_loss | 0.0644 | -| std | 0.011 | -| value_loss | 1.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14293 | -| time_elapsed | 75803 | -| total_timesteps | 1829504 | -| train/ | | -| approx_kl | 0.051867776 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.00276 | -| learning_rate | 0.0003 | -| loss | 0.0592 | -| n_updates | 142920 | -| policy_gradient_loss | 0.0493 | -| std | 0.011 | -| value_loss | 5.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14294 | -| time_elapsed | 75808 | -| total_timesteps | 1829632 | -| train/ | | -| approx_kl | 0.009048048 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00041 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 142930 | -| policy_gradient_loss | 0.00276 | -| std | 0.011 | -| value_loss | 3.46e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14295 | -| time_elapsed | 75812 | -| total_timesteps | 1829760 | -| train/ | | -| approx_kl | 0.2146307 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.00842 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 142940 | -| policy_gradient_loss | 0.0859 | -| std | 0.011 | -| value_loss | 1.66e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 24 | -| iterations | 14296 | -| time_elapsed | 75816 | -| total_timesteps | 1829888 | -| train/ | | -| approx_kl | 0.005564644 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 142950 | -| policy_gradient_loss | -0.00131 | -| std | 0.011 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14297 | -| time_elapsed | 75820 | -| total_timesteps | 1830016 | -| train/ | | -| approx_kl | 0.018207567 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 142960 | -| policy_gradient_loss | -0.0131 | -| std | 0.011 | -| value_loss | 9.73e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14298 | -| time_elapsed | 75831 | -| total_timesteps | 1830144 | -| train/ | | -| approx_kl | 0.0064150523 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 142970 | -| policy_gradient_loss | -0.00272 | -| std | 0.011 | -| value_loss | 0.0016 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14299 | -| time_elapsed | 75835 | -| total_timesteps | 1830272 | -| train/ | | -| approx_kl | 0.036606856 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.0404 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 142980 | -| policy_gradient_loss | 0.00394 | -| std | 0.011 | -| value_loss | 0.000159 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14300 | -| time_elapsed | 75841 | -| total_timesteps | 1830400 | -| train/ | | -| approx_kl | 0.084493995 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 142990 | -| policy_gradient_loss | 0.00537 | -| std | 0.011 | -| value_loss | 5.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14301 | -| time_elapsed | 75845 | -| total_timesteps | 1830528 | -| train/ | | -| approx_kl | 0.028931316 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0099 | -| learning_rate | 0.0003 | -| loss | 0.00785 | -| n_updates | 143000 | -| policy_gradient_loss | 0.00873 | -| std | 0.011 | -| value_loss | 2.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14302 | -| time_elapsed | 75850 | -| total_timesteps | 1830656 | -| train/ | | -| approx_kl | 0.05192158 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 143010 | -| policy_gradient_loss | 0.0218 | -| std | 0.011 | -| value_loss | 1.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14303 | -| time_elapsed | 75855 | -| total_timesteps | 1830784 | -| train/ | | -| approx_kl | 0.059057273 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 143020 | -| policy_gradient_loss | 0.00981 | -| std | 0.011 | -| value_loss | 8.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 24 | -| iterations | 14304 | -| time_elapsed | 75860 | -| total_timesteps | 1830912 | -| train/ | | -| approx_kl | 0.091405675 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 143030 | -| policy_gradient_loss | 0.00337 | -| std | 0.011 | -| value_loss | 5.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14305 | -| time_elapsed | 75864 | -| total_timesteps | 1831040 | -| train/ | | -| approx_kl | 0.029021125 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.00904 | -| n_updates | 143040 | -| policy_gradient_loss | 0.0109 | -| std | 0.011 | -| value_loss | 4.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14306 | -| time_elapsed | 75875 | -| total_timesteps | 1831168 | -| train/ | | -| approx_kl | 0.008968197 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | 0.00298 | -| n_updates | 143050 | -| policy_gradient_loss | 0.00237 | -| std | 0.011 | -| value_loss | 0.00386 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14307 | -| time_elapsed | 75880 | -| total_timesteps | 1831296 | -| train/ | | -| approx_kl | 0.02837134 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0882 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 143060 | -| policy_gradient_loss | -0.0032 | -| std | 0.011 | -| value_loss | 3.68e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14308 | -| time_elapsed | 75885 | -| total_timesteps | 1831424 | -| train/ | | -| approx_kl | 0.013033927 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 143070 | -| policy_gradient_loss | -0.0113 | -| std | 0.011 | -| value_loss | 9.21e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14309 | -| time_elapsed | 75889 | -| total_timesteps | 1831552 | -| train/ | | -| approx_kl | 0.18004636 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0737 | -| n_updates | 143080 | -| policy_gradient_loss | 0.0143 | -| std | 0.011 | -| value_loss | 3.78e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14310 | -| time_elapsed | 75894 | -| total_timesteps | 1831680 | -| train/ | | -| approx_kl | 0.0077849925 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.06 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 143090 | -| policy_gradient_loss | 0.00102 | -| std | 0.011 | -| value_loss | 2.55e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14311 | -| time_elapsed | 75899 | -| total_timesteps | 1831808 | -| train/ | | -| approx_kl | 0.019771576 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.09 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 143100 | -| policy_gradient_loss | -0.00229 | -| std | 0.011 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14312 | -| time_elapsed | 75904 | -| total_timesteps | 1831936 | -| train/ | | -| approx_kl | 0.0038474253 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.000102 | -| n_updates | 143110 | -| policy_gradient_loss | 0.00147 | -| std | 0.0109 | -| value_loss | 1.33e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14313 | -| time_elapsed | 75909 | -| total_timesteps | 1832064 | -| train/ | | -| approx_kl | 0.0020787306 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | 0.00305 | -| n_updates | 143120 | -| policy_gradient_loss | -0.000463 | -| std | 0.0109 | -| value_loss | 2.35e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14314 | -| time_elapsed | 75918 | -| total_timesteps | 1832192 | -| train/ | | -| approx_kl | 0.15218423 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 143130 | -| policy_gradient_loss | -0.0141 | -| std | 0.0109 | -| value_loss | 0.000889 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14315 | -| time_elapsed | 75923 | -| total_timesteps | 1832320 | -| train/ | | -| approx_kl | 0.02867142 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | -0.00395 | -| n_updates | 143140 | -| policy_gradient_loss | 0.0259 | -| std | 0.011 | -| value_loss | 1.39e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14316 | -| time_elapsed | 75928 | -| total_timesteps | 1832448 | -| train/ | | -| approx_kl | 0.009473204 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 143150 | -| policy_gradient_loss | 0.00369 | -| std | 0.011 | -| value_loss | 4.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14317 | -| time_elapsed | 75934 | -| total_timesteps | 1832576 | -| train/ | | -| approx_kl | 0.010440309 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.000409 | -| n_updates | 143160 | -| policy_gradient_loss | 0.0236 | -| std | 0.011 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14318 | -| time_elapsed | 75939 | -| total_timesteps | 1832704 | -| train/ | | -| approx_kl | 0.01708039 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 143170 | -| policy_gradient_loss | 0.00337 | -| std | 0.0109 | -| value_loss | 2.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14319 | -| time_elapsed | 75944 | -| total_timesteps | 1832832 | -| train/ | | -| approx_kl | 0.085901834 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | 0.0793 | -| n_updates | 143180 | -| policy_gradient_loss | 0.031 | -| std | 0.0109 | -| value_loss | 4.13e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14320 | -| time_elapsed | 75948 | -| total_timesteps | 1832960 | -| train/ | | -| approx_kl | 0.00023050746 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 143190 | -| policy_gradient_loss | -0.00192 | -| std | 0.0109 | -| value_loss | 1.86e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14321 | -| time_elapsed | 75953 | -| total_timesteps | 1833088 | -| train/ | | -| approx_kl | 1.1859462e-05 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | -9.67e-05 | -| n_updates | 143200 | -| policy_gradient_loss | 0.00271 | -| std | 0.0109 | -| value_loss | 7.5e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14322 | -| time_elapsed | 75964 | -| total_timesteps | 1833216 | -| train/ | | -| approx_kl | 0.027095824 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 143210 | -| policy_gradient_loss | 0.00603 | -| std | 0.0109 | -| value_loss | 0.0025 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14323 | -| time_elapsed | 75970 | -| total_timesteps | 1833344 | -| train/ | | -| approx_kl | 0.08126841 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.000772 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 143220 | -| policy_gradient_loss | 0.017 | -| std | 0.0109 | -| value_loss | 1.13e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14324 | -| time_elapsed | 75976 | -| total_timesteps | 1833472 | -| train/ | | -| approx_kl | 0.000644329 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | -0.000935 | -| n_updates | 143230 | -| policy_gradient_loss | 0.00179 | -| std | 0.0109 | -| value_loss | 1.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14325 | -| time_elapsed | 75981 | -| total_timesteps | 1833600 | -| train/ | | -| approx_kl | 0.030491672 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 143240 | -| policy_gradient_loss | 0.0325 | -| std | 0.0109 | -| value_loss | 9.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14326 | -| time_elapsed | 75987 | -| total_timesteps | 1833728 | -| train/ | | -| approx_kl | 0.008647103 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00832 | -| n_updates | 143250 | -| policy_gradient_loss | 0.00186 | -| std | 0.0109 | -| value_loss | 7.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14327 | -| time_elapsed | 75991 | -| total_timesteps | 1833856 | -| train/ | | -| approx_kl | 0.012615863 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 143260 | -| policy_gradient_loss | 0.0244 | -| std | 0.0109 | -| value_loss | 3.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 24 | -| iterations | 14328 | -| time_elapsed | 75997 | -| total_timesteps | 1833984 | -| train/ | | -| approx_kl | 0.0069764755 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.00301 | -| n_updates | 143270 | -| policy_gradient_loss | 0.015 | -| std | 0.0109 | -| value_loss | 2.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14329 | -| time_elapsed | 76001 | -| total_timesteps | 1834112 | -| train/ | | -| approx_kl | 0.060640074 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0375 | -| n_updates | 143280 | -| policy_gradient_loss | 0.0147 | -| std | 0.0109 | -| value_loss | 1.56e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14330 | -| time_elapsed | 76012 | -| total_timesteps | 1834240 | -| train/ | | -| approx_kl | 0.0053455215 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 143290 | -| policy_gradient_loss | -0.00889 | -| std | 0.0109 | -| value_loss | 0.000254 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14331 | -| time_elapsed | 76017 | -| total_timesteps | 1834368 | -| train/ | | -| approx_kl | 0.055400968 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 143300 | -| policy_gradient_loss | 0.0181 | -| std | 0.0109 | -| value_loss | 6.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14332 | -| time_elapsed | 76021 | -| total_timesteps | 1834496 | -| train/ | | -| approx_kl | 0.05431362 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | 0.035 | -| n_updates | 143310 | -| policy_gradient_loss | 0.014 | -| std | 0.0109 | -| value_loss | 1.69e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14333 | -| time_elapsed | 76026 | -| total_timesteps | 1834624 | -| train/ | | -| approx_kl | 0.119852625 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | 0.0427 | -| n_updates | 143320 | -| policy_gradient_loss | 0.0129 | -| std | 0.0109 | -| value_loss | 1.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14334 | -| time_elapsed | 76030 | -| total_timesteps | 1834752 | -| train/ | | -| approx_kl | 0.030471403 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.00529 | -| n_updates | 143330 | -| policy_gradient_loss | 0.00881 | -| std | 0.0109 | -| value_loss | 9.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 24 | -| iterations | 14335 | -| time_elapsed | 76035 | -| total_timesteps | 1834880 | -| train/ | | -| approx_kl | 0.11161913 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0856 | -| n_updates | 143340 | -| policy_gradient_loss | 0.0668 | -| std | 0.0109 | -| value_loss | 5.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14336 | -| time_elapsed | 76040 | -| total_timesteps | 1835008 | -| train/ | | -| approx_kl | 0.070726074 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | 0.0808 | -| n_updates | 143350 | -| policy_gradient_loss | 0.0622 | -| std | 0.0109 | -| value_loss | 5.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14337 | -| time_elapsed | 76050 | -| total_timesteps | 1835136 | -| train/ | | -| approx_kl | 0.05172171 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | 0.934 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 143360 | -| policy_gradient_loss | -0.0126 | -| std | 0.0109 | -| value_loss | 0.000244 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14338 | -| time_elapsed | 76056 | -| total_timesteps | 1835264 | -| train/ | | -| approx_kl | 0.0054833163 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 143370 | -| policy_gradient_loss | -0.0125 | -| std | 0.0109 | -| value_loss | 3.53e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14339 | -| time_elapsed | 76060 | -| total_timesteps | 1835392 | -| train/ | | -| approx_kl | 0.020944176 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 143380 | -| policy_gradient_loss | -0.00539 | -| std | 0.0109 | -| value_loss | 2.48e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14340 | -| time_elapsed | 76065 | -| total_timesteps | 1835520 | -| train/ | | -| approx_kl | 0.23460457 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0889 | -| n_updates | 143390 | -| policy_gradient_loss | 0.0198 | -| std | 0.0109 | -| value_loss | 3.1e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14341 | -| time_elapsed | 76070 | -| total_timesteps | 1835648 | -| train/ | | -| approx_kl | 0.0065382915 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.005 | -| learning_rate | 0.0003 | -| loss | -0.00562 | -| n_updates | 143400 | -| policy_gradient_loss | 0.000856 | -| std | 0.0109 | -| value_loss | 9.31e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14342 | -| time_elapsed | 76075 | -| total_timesteps | 1835776 | -| train/ | | -| approx_kl | 0.02579801 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 143410 | -| policy_gradient_loss | 0.0186 | -| std | 0.0109 | -| value_loss | 4.95e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14343 | -| time_elapsed | 76079 | -| total_timesteps | 1835904 | -| train/ | | -| approx_kl | 0.034125946 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0617 | -| n_updates | 143420 | -| policy_gradient_loss | 0.0224 | -| std | 0.0109 | -| value_loss | 3.18e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14344 | -| time_elapsed | 76083 | -| total_timesteps | 1836032 | -| train/ | | -| approx_kl | 0.04995506 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -8.55e-06 | -| n_updates | 143430 | -| policy_gradient_loss | -0.009 | -| std | 0.0109 | -| value_loss | 2.76e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14345 | -| time_elapsed | 76094 | -| total_timesteps | 1836160 | -| train/ | | -| approx_kl | 0.25293025 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 143440 | -| policy_gradient_loss | -0.0113 | -| std | 0.0109 | -| value_loss | 1.71e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14346 | -| time_elapsed | 76098 | -| total_timesteps | 1836288 | -| train/ | | -| approx_kl | 0.05016443 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 143450 | -| policy_gradient_loss | 0.0143 | -| std | 0.0109 | -| value_loss | 1.37e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14347 | -| time_elapsed | 76103 | -| total_timesteps | 1836416 | -| train/ | | -| approx_kl | 0.2233522 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0773 | -| n_updates | 143460 | -| policy_gradient_loss | 0.0198 | -| std | 0.0109 | -| value_loss | 9.81e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14348 | -| time_elapsed | 76107 | -| total_timesteps | 1836544 | -| train/ | | -| approx_kl | 0.016099405 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.00384 | -| n_updates | 143470 | -| policy_gradient_loss | 0.00282 | -| std | 0.0109 | -| value_loss | 8.35e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14349 | -| time_elapsed | 76112 | -| total_timesteps | 1836672 | -| train/ | | -| approx_kl | 0.021635586 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.00625 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 143480 | -| policy_gradient_loss | -0.00376 | -| std | 0.0109 | -| value_loss | 4.81e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14350 | -| time_elapsed | 76117 | -| total_timesteps | 1836800 | -| train/ | | -| approx_kl | 0.13102451 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.0696 | -| n_updates | 143490 | -| policy_gradient_loss | 0.0229 | -| std | 0.0109 | -| value_loss | 4.1e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14351 | -| time_elapsed | 76122 | -| total_timesteps | 1836928 | -| train/ | | -| approx_kl | 0.11679371 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | 0.000806 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 143500 | -| policy_gradient_loss | 0.0175 | -| std | 0.0109 | -| value_loss | 4.2e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14352 | -| time_elapsed | 76127 | -| total_timesteps | 1837056 | -| train/ | | -| approx_kl | 0.005203328 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.1 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 143510 | -| policy_gradient_loss | 0.00186 | -| std | 0.0109 | -| value_loss | 3.08e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14353 | -| time_elapsed | 76136 | -| total_timesteps | 1837184 | -| train/ | | -| approx_kl | 0.17651142 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.000302 | -| n_updates | 143520 | -| policy_gradient_loss | 0.00756 | -| std | 0.0108 | -| value_loss | 0.00019 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14354 | -| time_elapsed | 76140 | -| total_timesteps | 1837312 | -| train/ | | -| approx_kl | 0.007933995 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.000349 | -| learning_rate | 0.0003 | -| loss | 0.000454 | -| n_updates | 143530 | -| policy_gradient_loss | 0.0143 | -| std | 0.0108 | -| value_loss | 4.59e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14355 | -| time_elapsed | 76145 | -| total_timesteps | 1837440 | -| train/ | | -| approx_kl | 0.3508162 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 143540 | -| policy_gradient_loss | 0.114 | -| std | 0.0108 | -| value_loss | 1.29e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14356 | -| time_elapsed | 76149 | -| total_timesteps | 1837568 | -| train/ | | -| approx_kl | 0.012317948 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 143550 | -| policy_gradient_loss | -0.00246 | -| std | 0.0108 | -| value_loss | 2.33e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14357 | -| time_elapsed | 76155 | -| total_timesteps | 1837696 | -| train/ | | -| approx_kl | 0.0037829862 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0826 | -| learning_rate | 0.0003 | -| loss | 0.00097 | -| n_updates | 143560 | -| policy_gradient_loss | 0.00307 | -| std | 0.0108 | -| value_loss | 1.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14358 | -| time_elapsed | 76160 | -| total_timesteps | 1837824 | -| train/ | | -| approx_kl | 0.003475158 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 143570 | -| policy_gradient_loss | -0.00528 | -| std | 0.0108 | -| value_loss | 3.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14359 | -| time_elapsed | 76165 | -| total_timesteps | 1837952 | -| train/ | | -| approx_kl | 0.039201017 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.00443 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 143580 | -| policy_gradient_loss | 0.0374 | -| std | 0.0108 | -| value_loss | 1.48e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14360 | -| time_elapsed | 76169 | -| total_timesteps | 1838080 | -| train/ | | -| approx_kl | 0.00843256 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 143590 | -| policy_gradient_loss | 0.0111 | -| std | 0.0108 | -| value_loss | 1.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14361 | -| time_elapsed | 76178 | -| total_timesteps | 1838208 | -| train/ | | -| approx_kl | 0.007541897 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.00445 | -| n_updates | 143600 | -| policy_gradient_loss | 0.0273 | -| std | 0.0108 | -| value_loss | 2.08e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14362 | -| time_elapsed | 76185 | -| total_timesteps | 1838336 | -| train/ | | -| approx_kl | 0.013238903 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00397 | -| learning_rate | 0.0003 | -| loss | 0.00254 | -| n_updates | 143610 | -| policy_gradient_loss | 0.00875 | -| std | 0.0108 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14363 | -| time_elapsed | 76190 | -| total_timesteps | 1838464 | -| train/ | | -| approx_kl | 0.029041257 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.00855 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 143620 | -| policy_gradient_loss | 0.0585 | -| std | 0.0108 | -| value_loss | 2.69e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14364 | -| time_elapsed | 76196 | -| total_timesteps | 1838592 | -| train/ | | -| approx_kl | 0.0062043103 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 143630 | -| policy_gradient_loss | 0.00763 | -| std | 0.0108 | -| value_loss | 1.91e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14365 | -| time_elapsed | 76201 | -| total_timesteps | 1838720 | -| train/ | | -| approx_kl | 0.012328336 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00629 | -| n_updates | 143640 | -| policy_gradient_loss | -0.000493 | -| std | 0.0108 | -| value_loss | 1.4e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14366 | -| time_elapsed | 76206 | -| total_timesteps | 1838848 | -| train/ | | -| approx_kl | 0.034711566 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 143650 | -| policy_gradient_loss | 0.0489 | -| std | 0.0108 | -| value_loss | 6.8e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14367 | -| time_elapsed | 76211 | -| total_timesteps | 1838976 | -| train/ | | -| approx_kl | 0.058314662 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 143660 | -| policy_gradient_loss | 0.075 | -| std | 0.0108 | -| value_loss | 6.16e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14368 | -| time_elapsed | 76215 | -| total_timesteps | 1839104 | -| train/ | | -| approx_kl | 0.010536741 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.00957 | -| learning_rate | 0.0003 | -| loss | -0.00769 | -| n_updates | 143670 | -| policy_gradient_loss | 0.00878 | -| std | 0.0108 | -| value_loss | 4.9e-09 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14369 | -| time_elapsed | 76225 | -| total_timesteps | 1839232 | -| train/ | | -| approx_kl | 7.503216 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | 0.0886 | -| n_updates | 143680 | -| policy_gradient_loss | 0.0778 | -| std | 0.0108 | -| value_loss | 0.00261 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14370 | -| time_elapsed | 76230 | -| total_timesteps | 1839360 | -| train/ | | -| approx_kl | 0.00011334848 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.000992 | -| n_updates | 143690 | -| policy_gradient_loss | 0.00181 | -| std | 0.0108 | -| value_loss | 6.96e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14371 | -| time_elapsed | 76235 | -| total_timesteps | 1839488 | -| train/ | | -| approx_kl | 0.0011455631 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | -0.00562 | -| n_updates | 143700 | -| policy_gradient_loss | -0.00435 | -| std | 0.0108 | -| value_loss | 6.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14372 | -| time_elapsed | 76239 | -| total_timesteps | 1839616 | -| train/ | | -| approx_kl | 0.008331059 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.641 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 143710 | -| policy_gradient_loss | -0.00884 | -| std | 0.0108 | -| value_loss | 1.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14373 | -| time_elapsed | 76244 | -| total_timesteps | 1839744 | -| train/ | | -| approx_kl | 0.034554064 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 143720 | -| policy_gradient_loss | 0.0178 | -| std | 0.0108 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 24 | -| iterations | 14374 | -| time_elapsed | 76247 | -| total_timesteps | 1839872 | -| train/ | | -| approx_kl | 0.010167433 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 143730 | -| policy_gradient_loss | 0.00978 | -| std | 0.0108 | -| value_loss | 4.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14375 | -| time_elapsed | 76252 | -| total_timesteps | 1840000 | -| train/ | | -| approx_kl | 0.011204956 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | 0.000224 | -| n_updates | 143740 | -| policy_gradient_loss | 0.0297 | -| std | 0.0108 | -| value_loss | 2.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14376 | -| time_elapsed | 76256 | -| total_timesteps | 1840128 | -| train/ | | -| approx_kl | 0.016905924 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00244 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 143750 | -| policy_gradient_loss | 0.00325 | -| std | 0.0108 | -| value_loss | 1.54e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14377 | -| time_elapsed | 76264 | -| total_timesteps | 1840256 | -| train/ | | -| approx_kl | 11.237954 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 143760 | -| policy_gradient_loss | 0.0553 | -| std | 0.0108 | -| value_loss | 2.55e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14378 | -| time_elapsed | 76268 | -| total_timesteps | 1840384 | -| train/ | | -| approx_kl | 0.07904213 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0641 | -| n_updates | 143770 | -| policy_gradient_loss | 0.0241 | -| std | 0.0108 | -| value_loss | 7.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14379 | -| time_elapsed | 76273 | -| total_timesteps | 1840512 | -| train/ | | -| approx_kl | 0.014236694 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00665 | -| n_updates | 143780 | -| policy_gradient_loss | 0.00138 | -| std | 0.0108 | -| value_loss | 5.19e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14380 | -| time_elapsed | 76276 | -| total_timesteps | 1840640 | -| train/ | | -| approx_kl | 0.0056189806 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | -0.000894 | -| n_updates | 143790 | -| policy_gradient_loss | 0.00944 | -| std | 0.0108 | -| value_loss | 4.31e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14381 | -| time_elapsed | 76279 | -| total_timesteps | 1840768 | -| train/ | | -| approx_kl | 0.09665857 | -| clip_fraction | 0.569 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 143800 | -| policy_gradient_loss | 0.0644 | -| std | 0.0108 | -| value_loss | 6.34e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14382 | -| time_elapsed | 76284 | -| total_timesteps | 1840896 | -| train/ | | -| approx_kl | 0.014937853 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 143810 | -| policy_gradient_loss | 0.00528 | -| std | 0.0108 | -| value_loss | 4.08e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14383 | -| time_elapsed | 76286 | -| total_timesteps | 1841024 | -| train/ | | -| approx_kl | 0.017376697 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 143820 | -| policy_gradient_loss | -0.00506 | -| std | 0.0108 | -| value_loss | 2.92e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14384 | -| time_elapsed | 76299 | -| total_timesteps | 1841152 | -| train/ | | -| approx_kl | 0.10144302 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.819 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 143830 | -| policy_gradient_loss | 0.0736 | -| std | 0.0108 | -| value_loss | 0.00293 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14385 | -| time_elapsed | 76304 | -| total_timesteps | 1841280 | -| train/ | | -| approx_kl | 0.064866565 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -4.37e-06 | -| n_updates | 143840 | -| policy_gradient_loss | 0.00217 | -| std | 0.0108 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14386 | -| time_elapsed | 76309 | -| total_timesteps | 1841408 | -| train/ | | -| approx_kl | 0.0077311574 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00306 | -| learning_rate | 0.0003 | -| loss | -0.00588 | -| n_updates | 143850 | -| policy_gradient_loss | 0.00764 | -| std | 0.0108 | -| value_loss | 9.95e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14387 | -| time_elapsed | 76316 | -| total_timesteps | 1841536 | -| train/ | | -| approx_kl | 0.070832305 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 143860 | -| policy_gradient_loss | 0.00546 | -| std | 0.0108 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14388 | -| time_elapsed | 76320 | -| total_timesteps | 1841664 | -| train/ | | -| approx_kl | 0.040354654 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 143870 | -| policy_gradient_loss | 0.0116 | -| std | 0.0108 | -| value_loss | 4.52e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14389 | -| time_elapsed | 76324 | -| total_timesteps | 1841792 | -| train/ | | -| approx_kl | 0.04540051 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 143880 | -| policy_gradient_loss | 0.0133 | -| std | 0.0108 | -| value_loss | 2.23e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14390 | -| time_elapsed | 76328 | -| total_timesteps | 1841920 | -| train/ | | -| approx_kl | 0.055806 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 143890 | -| policy_gradient_loss | 0.0146 | -| std | 0.0108 | -| value_loss | 1.37e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14391 | -| time_elapsed | 76331 | -| total_timesteps | 1842048 | -| train/ | | -| approx_kl | 0.009688028 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0049 | -| n_updates | 143900 | -| policy_gradient_loss | -4.18e-05 | -| std | 0.0108 | -| value_loss | 1.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14392 | -| time_elapsed | 76338 | -| total_timesteps | 1842176 | -| train/ | | -| approx_kl | 0.12037848 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 143910 | -| policy_gradient_loss | 0.000598 | -| std | 0.0108 | -| value_loss | 0.00121 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14393 | -| time_elapsed | 76343 | -| total_timesteps | 1842304 | -| train/ | | -| approx_kl | 0.03568008 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.00935 | -| n_updates | 143920 | -| policy_gradient_loss | 0.0089 | -| std | 0.0108 | -| value_loss | 4.67e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14394 | -| time_elapsed | 76349 | -| total_timesteps | 1842432 | -| train/ | | -| approx_kl | 0.12571882 | -| clip_fraction | 0.579 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00242 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 143930 | -| policy_gradient_loss | 0.0677 | -| std | 0.0108 | -| value_loss | 5.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14395 | -| time_elapsed | 76353 | -| total_timesteps | 1842560 | -| train/ | | -| approx_kl | 0.08170673 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0654 | -| n_updates | 143940 | -| policy_gradient_loss | 0.069 | -| std | 0.0108 | -| value_loss | 2.96e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14396 | -| time_elapsed | 76359 | -| total_timesteps | 1842688 | -| train/ | | -| approx_kl | 0.04892314 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0422 | -| n_updates | 143950 | -| policy_gradient_loss | 0.0518 | -| std | 0.0108 | -| value_loss | 1.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14397 | -| time_elapsed | 76364 | -| total_timesteps | 1842816 | -| train/ | | -| approx_kl | 0.053290065 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 143960 | -| policy_gradient_loss | 0.0603 | -| std | 0.0108 | -| value_loss | 2.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 24 | -| iterations | 14398 | -| time_elapsed | 76368 | -| total_timesteps | 1842944 | -| train/ | | -| approx_kl | 0.010169715 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0691 | -| learning_rate | 0.0003 | -| loss | -0.00759 | -| n_updates | 143970 | -| policy_gradient_loss | 0.00507 | -| std | 0.0108 | -| value_loss | 4.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14399 | -| time_elapsed | 76374 | -| total_timesteps | 1843072 | -| train/ | | -| approx_kl | 0.24284634 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 143980 | -| policy_gradient_loss | 0.0946 | -| std | 0.0108 | -| value_loss | 3.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14400 | -| time_elapsed | 76380 | -| total_timesteps | 1843200 | -| train/ | | -| approx_kl | 0.46306795 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 143990 | -| policy_gradient_loss | -0.0142 | -| std | 0.0108 | -| value_loss | 0.00213 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14401 | -| time_elapsed | 76385 | -| total_timesteps | 1843328 | -| train/ | | -| approx_kl | 0.022246858 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.887 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 144000 | -| policy_gradient_loss | 0.00217 | -| std | 0.0108 | -| value_loss | 1.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14402 | -| time_elapsed | 76389 | -| total_timesteps | 1843456 | -| train/ | | -| approx_kl | 0.106481634 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -218 | -| learning_rate | 0.0003 | -| loss | 0.00639 | -| n_updates | 144010 | -| policy_gradient_loss | 0.00123 | -| std | 0.0108 | -| value_loss | 5.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14403 | -| time_elapsed | 76393 | -| total_timesteps | 1843584 | -| train/ | | -| approx_kl | 0.028235562 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -55.9 | -| learning_rate | 0.0003 | -| loss | 0.00405 | -| n_updates | 144020 | -| policy_gradient_loss | 0.00429 | -| std | 0.0108 | -| value_loss | 1.08e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14404 | -| time_elapsed | 76396 | -| total_timesteps | 1843712 | -| train/ | | -| approx_kl | 0.058702826 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -8.91 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 144030 | -| policy_gradient_loss | 0.00629 | -| std | 0.0108 | -| value_loss | 2.44e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14405 | -| time_elapsed | 76400 | -| total_timesteps | 1843840 | -| train/ | | -| approx_kl | 0.08635809 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 144040 | -| policy_gradient_loss | 0.0109 | -| std | 0.0108 | -| value_loss | 4.61e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 24 | -| iterations | 14406 | -| time_elapsed | 76406 | -| total_timesteps | 1843968 | -| train/ | | -| approx_kl | 0.021939315 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.000824 | -| n_updates | 144050 | -| policy_gradient_loss | 0.0242 | -| std | 0.0108 | -| value_loss | 2.55e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14407 | -| time_elapsed | 76412 | -| total_timesteps | 1844096 | -| train/ | | -| approx_kl | 0.010270622 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 144060 | -| policy_gradient_loss | 0.0106 | -| std | 0.0108 | -| value_loss | 1.83e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14408 | -| time_elapsed | 76423 | -| total_timesteps | 1844224 | -| train/ | | -| approx_kl | 0.9219951 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.551 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 144070 | -| policy_gradient_loss | -0.0182 | -| std | 0.0108 | -| value_loss | 0.000966 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14409 | -| time_elapsed | 76429 | -| total_timesteps | 1844352 | -| train/ | | -| approx_kl | 0.0032929173 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -22.2 | -| learning_rate | 0.0003 | -| loss | -0.00719 | -| n_updates | 144080 | -| policy_gradient_loss | -0.000333 | -| std | 0.0108 | -| value_loss | 3.49e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14410 | -| time_elapsed | 76434 | -| total_timesteps | 1844480 | -| train/ | | -| approx_kl | 0.0007666112 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -2.16 | -| learning_rate | 0.0003 | -| loss | 0.00335 | -| n_updates | 144090 | -| policy_gradient_loss | 0.0142 | -| std | 0.0108 | -| value_loss | 1.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14411 | -| time_elapsed | 76438 | -| total_timesteps | 1844608 | -| train/ | | -| approx_kl | 0.023045892 | -| clip_fraction | 0.539 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.754 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 144100 | -| policy_gradient_loss | 0.0228 | -| std | 0.0108 | -| value_loss | 6.28e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14412 | -| time_elapsed | 76443 | -| total_timesteps | 1844736 | -| train/ | | -| approx_kl | 0.0060427748 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 144110 | -| policy_gradient_loss | 0.00694 | -| std | 0.0108 | -| value_loss | 4.13e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14413 | -| time_elapsed | 76447 | -| total_timesteps | 1844864 | -| train/ | | -| approx_kl | 0.0790626 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 144120 | -| policy_gradient_loss | 0.0236 | -| std | 0.0108 | -| value_loss | 1.53e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14414 | -| time_elapsed | 76452 | -| total_timesteps | 1844992 | -| train/ | | -| approx_kl | 0.027968954 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00695 | -| learning_rate | 0.0003 | -| loss | 0.00723 | -| n_updates | 144130 | -| policy_gradient_loss | -0.000296 | -| std | 0.0108 | -| value_loss | 3.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14415 | -| time_elapsed | 76456 | -| total_timesteps | 1845120 | -| train/ | | -| approx_kl | 0.0045441743 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00427 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 144140 | -| policy_gradient_loss | -0.000441 | -| std | 0.0108 | -| value_loss | 4.65e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14416 | -| time_elapsed | 76468 | -| total_timesteps | 1845248 | -| train/ | | -| approx_kl | 0.05053615 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.865 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 144150 | -| policy_gradient_loss | 0.0236 | -| std | 0.0108 | -| value_loss | 0.000977 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14417 | -| time_elapsed | 76472 | -| total_timesteps | 1845376 | -| train/ | | -| approx_kl | 0.07150748 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | 0.0583 | -| n_updates | 144160 | -| policy_gradient_loss | 0.076 | -| std | 0.0108 | -| value_loss | 6.36e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14418 | -| time_elapsed | 76476 | -| total_timesteps | 1845504 | -| train/ | | -| approx_kl | 0.0126638785 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | 0.00144 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 144170 | -| policy_gradient_loss | 0.0068 | -| std | 0.0108 | -| value_loss | 7.08e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14419 | -| time_elapsed | 76480 | -| total_timesteps | 1845632 | -| train/ | | -| approx_kl | 0.058824036 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0337 | -| n_updates | 144180 | -| policy_gradient_loss | 0.00697 | -| std | 0.0108 | -| value_loss | 6.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14420 | -| time_elapsed | 76485 | -| total_timesteps | 1845760 | -| train/ | | -| approx_kl | 0.008466475 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0786 | -| learning_rate | 0.0003 | -| loss | -0.000581 | -| n_updates | 144190 | -| policy_gradient_loss | 0.01 | -| std | 0.0108 | -| value_loss | 2.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 24 | -| iterations | 14421 | -| time_elapsed | 76491 | -| total_timesteps | 1845888 | -| train/ | | -| approx_kl | 0.03169428 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 144200 | -| policy_gradient_loss | 0.00958 | -| std | 0.0107 | -| value_loss | 1.11e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14422 | -| time_elapsed | 76496 | -| total_timesteps | 1846016 | -| train/ | | -| approx_kl | 0.10015738 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.11 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 144210 | -| policy_gradient_loss | 0.00817 | -| std | 0.0107 | -| value_loss | 1.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14423 | -| time_elapsed | 76508 | -| total_timesteps | 1846144 | -| train/ | | -| approx_kl | 0.009348545 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 144220 | -| policy_gradient_loss | -0.0108 | -| std | 0.0107 | -| value_loss | 0.0017 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14424 | -| time_elapsed | 76513 | -| total_timesteps | 1846272 | -| train/ | | -| approx_kl | 0.050583668 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 144230 | -| policy_gradient_loss | 0.00643 | -| std | 0.0107 | -| value_loss | 1.76e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14425 | -| time_elapsed | 76518 | -| total_timesteps | 1846400 | -| train/ | | -| approx_kl | 0.047078513 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00825 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 144240 | -| policy_gradient_loss | 0.0163 | -| std | 0.0107 | -| value_loss | 2.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14426 | -| time_elapsed | 76523 | -| total_timesteps | 1846528 | -| train/ | | -| approx_kl | 0.051347125 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 144250 | -| policy_gradient_loss | 0.00977 | -| std | 0.0107 | -| value_loss | 1.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14427 | -| time_elapsed | 76529 | -| total_timesteps | 1846656 | -| train/ | | -| approx_kl | 0.013165426 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0074 | -| n_updates | 144260 | -| policy_gradient_loss | 0.00204 | -| std | 0.0107 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14428 | -| time_elapsed | 76534 | -| total_timesteps | 1846784 | -| train/ | | -| approx_kl | 0.06972148 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 144270 | -| policy_gradient_loss | 0.00511 | -| std | 0.0107 | -| value_loss | 6.14e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 24 | -| iterations | 14429 | -| time_elapsed | 76539 | -| total_timesteps | 1846912 | -| train/ | | -| approx_kl | 0.0056318804 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.000537 | -| n_updates | 144280 | -| policy_gradient_loss | 0.0121 | -| std | 0.0107 | -| value_loss | 1.32e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14430 | -| time_elapsed | 76543 | -| total_timesteps | 1847040 | -| train/ | | -| approx_kl | 0.04079112 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0885 | -| learning_rate | 0.0003 | -| loss | 0.0086 | -| n_updates | 144290 | -| policy_gradient_loss | 0.00706 | -| std | 0.0107 | -| value_loss | 1.69e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14431 | -| time_elapsed | 76554 | -| total_timesteps | 1847168 | -| train/ | | -| approx_kl | 0.20387958 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -2.21 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 144300 | -| policy_gradient_loss | -0.0144 | -| std | 0.0107 | -| value_loss | 0.00216 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14432 | -| time_elapsed | 76561 | -| total_timesteps | 1847296 | -| train/ | | -| approx_kl | 0.0010403721 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -14.8 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 144310 | -| policy_gradient_loss | -0.00392 | -| std | 0.0107 | -| value_loss | 3.38e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14433 | -| time_elapsed | 76566 | -| total_timesteps | 1847424 | -| train/ | | -| approx_kl | 0.042173807 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0909 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 144320 | -| policy_gradient_loss | 0.00199 | -| std | 0.0107 | -| value_loss | 3.75e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14434 | -| time_elapsed | 76571 | -| total_timesteps | 1847552 | -| train/ | | -| approx_kl | 0.0072959773 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.00922 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 144330 | -| policy_gradient_loss | -0.00391 | -| std | 0.0107 | -| value_loss | 1.05e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14435 | -| time_elapsed | 76574 | -| total_timesteps | 1847680 | -| train/ | | -| approx_kl | 0.009224329 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00525 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 144340 | -| policy_gradient_loss | 0.0458 | -| std | 0.0107 | -| value_loss | 2.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14436 | -| time_elapsed | 76578 | -| total_timesteps | 1847808 | -| train/ | | -| approx_kl | 0.020986646 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00312 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 144350 | -| policy_gradient_loss | 0.0413 | -| std | 0.0107 | -| value_loss | 1.37e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 24 | -| iterations | 14437 | -| time_elapsed | 76581 | -| total_timesteps | 1847936 | -| train/ | | -| approx_kl | 0.04654946 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00936 | -| learning_rate | 0.0003 | -| loss | 0.0746 | -| n_updates | 144360 | -| policy_gradient_loss | 0.0845 | -| std | 0.0107 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14438 | -| time_elapsed | 76585 | -| total_timesteps | 1848064 | -| train/ | | -| approx_kl | 0.043559976 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00797 | -| learning_rate | 0.0003 | -| loss | 0.0481 | -| n_updates | 144370 | -| policy_gradient_loss | 0.0892 | -| std | 0.0107 | -| value_loss | 6.48e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14439 | -| time_elapsed | 76593 | -| total_timesteps | 1848192 | -| train/ | | -| approx_kl | 0.0024006395 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 144380 | -| policy_gradient_loss | -0.00767 | -| std | 0.0107 | -| value_loss | 0.00683 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14440 | -| time_elapsed | 76598 | -| total_timesteps | 1848320 | -| train/ | | -| approx_kl | 0.044204965 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 144390 | -| policy_gradient_loss | 0.0572 | -| std | 0.0107 | -| value_loss | 5.36e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14441 | -| time_elapsed | 76602 | -| total_timesteps | 1848448 | -| train/ | | -| approx_kl | 0.04661758 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 144400 | -| policy_gradient_loss | 0.05 | -| std | 0.0107 | -| value_loss | 8.82e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14442 | -| time_elapsed | 76607 | -| total_timesteps | 1848576 | -| train/ | | -| approx_kl | 0.040268764 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 144410 | -| policy_gradient_loss | 0.054 | -| std | 0.0107 | -| value_loss | 3.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14443 | -| time_elapsed | 76611 | -| total_timesteps | 1848704 | -| train/ | | -| approx_kl | 0.010350518 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 144420 | -| policy_gradient_loss | 0.00761 | -| std | 0.0107 | -| value_loss | 2.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14444 | -| time_elapsed | 76616 | -| total_timesteps | 1848832 | -| train/ | | -| approx_kl | 0.06291305 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.0473 | -| n_updates | 144430 | -| policy_gradient_loss | 0.00911 | -| std | 0.0107 | -| value_loss | 4.48e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 24 | -| iterations | 14445 | -| time_elapsed | 76621 | -| total_timesteps | 1848960 | -| train/ | | -| approx_kl | 0.007791103 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 144440 | -| policy_gradient_loss | 0.00794 | -| std | 0.0107 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14446 | -| time_elapsed | 76626 | -| total_timesteps | 1849088 | -| train/ | | -| approx_kl | 0.037919678 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 144450 | -| policy_gradient_loss | 0.00884 | -| std | 0.0107 | -| value_loss | 4.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14447 | -| time_elapsed | 76634 | -| total_timesteps | 1849216 | -| train/ | | -| approx_kl | 0.09062816 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.671 | -| learning_rate | 0.0003 | -| loss | 0.0134 | -| n_updates | 144460 | -| policy_gradient_loss | -0.00347 | -| std | 0.0107 | -| value_loss | 0.00367 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14448 | -| time_elapsed | 76639 | -| total_timesteps | 1849344 | -| train/ | | -| approx_kl | 0.0036749686 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.00365 | -| n_updates | 144470 | -| policy_gradient_loss | 0.00759 | -| std | 0.0107 | -| value_loss | 2.25e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14449 | -| time_elapsed | 76644 | -| total_timesteps | 1849472 | -| train/ | | -| approx_kl | 0.036383804 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.000344 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 144480 | -| policy_gradient_loss | 0.0273 | -| std | 0.0107 | -| value_loss | 2.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14450 | -| time_elapsed | 76649 | -| total_timesteps | 1849600 | -| train/ | | -| approx_kl | 0.10191292 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 144490 | -| policy_gradient_loss | 0.0177 | -| std | 0.0107 | -| value_loss | 2.92e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14451 | -| time_elapsed | 76654 | -| total_timesteps | 1849728 | -| train/ | | -| approx_kl | 0.0006889617 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00648 | -| n_updates | 144500 | -| policy_gradient_loss | -0.00784 | -| std | 0.0107 | -| value_loss | 1.55e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14452 | -| time_elapsed | 76657 | -| total_timesteps | 1849856 | -| train/ | | -| approx_kl | 1.8533319e-07 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -2.03e-05 | -| n_updates | 144510 | -| policy_gradient_loss | 0.00311 | -| std | 0.0107 | -| value_loss | 1.47e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14453 | -| time_elapsed | 76660 | -| total_timesteps | 1849984 | -| train/ | | -| approx_kl | 0.02493768 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 144520 | -| policy_gradient_loss | 0.0279 | -| std | 0.0107 | -| value_loss | 7.64e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14454 | -| time_elapsed | 76665 | -| total_timesteps | 1850112 | -| train/ | | -| approx_kl | 0.07843432 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.00555 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 144530 | -| policy_gradient_loss | 0.0126 | -| std | 0.0107 | -| value_loss | 1.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14455 | -| time_elapsed | 76677 | -| total_timesteps | 1850240 | -| train/ | | -| approx_kl | 0.032330368 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 144540 | -| policy_gradient_loss | -0.0184 | -| std | 0.0107 | -| value_loss | 0.00226 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14456 | -| time_elapsed | 76681 | -| total_timesteps | 1850368 | -| train/ | | -| approx_kl | 0.044292577 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 144550 | -| policy_gradient_loss | 0.00877 | -| std | 0.0107 | -| value_loss | 2.93e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14457 | -| time_elapsed | 76686 | -| total_timesteps | 1850496 | -| train/ | | -| approx_kl | 0.16307506 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | 0.0513 | -| n_updates | 144560 | -| policy_gradient_loss | 0.0103 | -| std | 0.0107 | -| value_loss | 6.12e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14458 | -| time_elapsed | 76690 | -| total_timesteps | 1850624 | -| train/ | | -| approx_kl | 8.251378e-05 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 144570 | -| policy_gradient_loss | -0.00381 | -| std | 0.0107 | -| value_loss | 2.74e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14459 | -| time_elapsed | 76694 | -| total_timesteps | 1850752 | -| train/ | | -| approx_kl | 0.020978356 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.000561 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 144580 | -| policy_gradient_loss | 0.0232 | -| std | 0.0107 | -| value_loss | 2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14460 | -| time_elapsed | 76699 | -| total_timesteps | 1850880 | -| train/ | | -| approx_kl | 0.07655814 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00293 | -| learning_rate | 0.0003 | -| loss | 0.0496 | -| n_updates | 144590 | -| policy_gradient_loss | 0.0149 | -| std | 0.0107 | -| value_loss | 1.3e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14461 | -| time_elapsed | 76704 | -| total_timesteps | 1851008 | -| train/ | | -| approx_kl | 0.00045846403 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00992 | -| learning_rate | 0.0003 | -| loss | -0.000965 | -| n_updates | 144600 | -| policy_gradient_loss | 0.00433 | -| std | 0.0107 | -| value_loss | 8.07e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14462 | -| time_elapsed | 76718 | -| total_timesteps | 1851136 | -| train/ | | -| approx_kl | 0.001149266 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 144610 | -| policy_gradient_loss | -0.0092 | -| std | 0.0107 | -| value_loss | 0.000603 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14463 | -| time_elapsed | 76721 | -| total_timesteps | 1851264 | -| train/ | | -| approx_kl | 0.011199201 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | 0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 144620 | -| policy_gradient_loss | -0.00783 | -| std | 0.0107 | -| value_loss | 8.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14464 | -| time_elapsed | 76727 | -| total_timesteps | 1851392 | -| train/ | | -| approx_kl | 0.03588039 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 144630 | -| policy_gradient_loss | 0.00284 | -| std | 0.0107 | -| value_loss | 3.46e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14465 | -| time_elapsed | 76733 | -| total_timesteps | 1851520 | -| train/ | | -| approx_kl | 0.061642453 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.077 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 144640 | -| policy_gradient_loss | 0.00877 | -| std | 0.0107 | -| value_loss | 1.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14466 | -| time_elapsed | 76737 | -| total_timesteps | 1851648 | -| train/ | | -| approx_kl | 0.24962282 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 144650 | -| policy_gradient_loss | 0.0142 | -| std | 0.0107 | -| value_loss | 1.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14467 | -| time_elapsed | 76742 | -| total_timesteps | 1851776 | -| train/ | | -| approx_kl | 0.01228113 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 144660 | -| policy_gradient_loss | -0.00565 | -| std | 0.0107 | -| value_loss | 7.6e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 24 | -| iterations | 14468 | -| time_elapsed | 76747 | -| total_timesteps | 1851904 | -| train/ | | -| approx_kl | 1.15484e-07 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 4.89e-05 | -| n_updates | 144670 | -| policy_gradient_loss | -0.000634 | -| std | 0.0107 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14469 | -| time_elapsed | 76752 | -| total_timesteps | 1852032 | -| train/ | | -| approx_kl | 6.798189e-05 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.12 | -| explained_variance | -0.00909 | -| learning_rate | 0.0003 | -| loss | -0.000369 | -| n_updates | 144680 | -| policy_gradient_loss | 0.013 | -| std | 0.0106 | -| value_loss | 3.72e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14470 | -| time_elapsed | 76761 | -| total_timesteps | 1852160 | -| train/ | | -| approx_kl | 0.0956772 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.749 | -| learning_rate | 0.0003 | -| loss | 0.00932 | -| n_updates | 144690 | -| policy_gradient_loss | 0.00122 | -| std | 0.0106 | -| value_loss | 0.00313 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14471 | -| time_elapsed | 76766 | -| total_timesteps | 1852288 | -| train/ | | -| approx_kl | 0.04925148 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00343 | -| learning_rate | 0.0003 | -| loss | 0.0632 | -| n_updates | 144700 | -| policy_gradient_loss | 0.0628 | -| std | 0.0106 | -| value_loss | 2.15e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14472 | -| time_elapsed | 76770 | -| total_timesteps | 1852416 | -| train/ | | -| approx_kl | 0.008550048 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0834 | -| learning_rate | 0.0003 | -| loss | 0.000133 | -| n_updates | 144710 | -| policy_gradient_loss | 0.00688 | -| std | 0.0106 | -| value_loss | 3.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14473 | -| time_elapsed | 76774 | -| total_timesteps | 1852544 | -| train/ | | -| approx_kl | 0.019201236 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 144720 | -| policy_gradient_loss | -0.00441 | -| std | 0.0106 | -| value_loss | 6.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14474 | -| time_elapsed | 76779 | -| total_timesteps | 1852672 | -| train/ | | -| approx_kl | 0.07779738 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.00449 | -| n_updates | 144730 | -| policy_gradient_loss | -0.00437 | -| std | 0.0106 | -| value_loss | 4.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14475 | -| time_elapsed | 76782 | -| total_timesteps | 1852800 | -| train/ | | -| approx_kl | 0.028926091 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.00672 | -| n_updates | 144740 | -| policy_gradient_loss | 0.00974 | -| std | 0.0106 | -| value_loss | 2.83e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 24 | -| iterations | 14476 | -| time_elapsed | 76786 | -| total_timesteps | 1852928 | -| train/ | | -| approx_kl | 0.15403391 | -| clip_fraction | 0.593 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 144750 | -| policy_gradient_loss | 0.0902 | -| std | 0.0106 | -| value_loss | 1.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14477 | -| time_elapsed | 76790 | -| total_timesteps | 1853056 | -| train/ | | -| approx_kl | 0.045071803 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.0468 | -| n_updates | 144760 | -| policy_gradient_loss | 0.043 | -| std | 0.0106 | -| value_loss | 8.68e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14478 | -| time_elapsed | 76800 | -| total_timesteps | 1853184 | -| train/ | | -| approx_kl | 0.0018064366 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.65 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 144770 | -| policy_gradient_loss | -0.001 | -| std | 0.0106 | -| value_loss | 0.00776 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14479 | -| time_elapsed | 76806 | -| total_timesteps | 1853312 | -| train/ | | -| approx_kl | 0.057287842 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 144780 | -| policy_gradient_loss | 0.0223 | -| std | 0.0106 | -| value_loss | 5.84e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14480 | -| time_elapsed | 76811 | -| total_timesteps | 1853440 | -| train/ | | -| approx_kl | 0.035923287 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00365 | -| learning_rate | 0.0003 | -| loss | 0.00632 | -| n_updates | 144790 | -| policy_gradient_loss | -0.00145 | -| std | 0.0106 | -| value_loss | 7.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14481 | -| time_elapsed | 76816 | -| total_timesteps | 1853568 | -| train/ | | -| approx_kl | 0.008140853 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.000209 | -| n_updates | 144800 | -| policy_gradient_loss | 0.00185 | -| std | 0.0106 | -| value_loss | 3.77e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14482 | -| time_elapsed | 76821 | -| total_timesteps | 1853696 | -| train/ | | -| approx_kl | 0.01888055 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 144810 | -| policy_gradient_loss | 0.000987 | -| std | 0.0106 | -| value_loss | 2.39e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14483 | -| time_elapsed | 76826 | -| total_timesteps | 1853824 | -| train/ | | -| approx_kl | 0.014927546 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 144820 | -| policy_gradient_loss | -0.00732 | -| std | 0.0106 | -| value_loss | 1.58e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 24 | -| iterations | 14484 | -| time_elapsed | 76831 | -| total_timesteps | 1853952 | -| train/ | | -| approx_kl | 0.04085876 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 144830 | -| policy_gradient_loss | 0.0128 | -| std | 0.0106 | -| value_loss | 1.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14485 | -| time_elapsed | 76835 | -| total_timesteps | 1854080 | -| train/ | | -| approx_kl | 0.33092913 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 144840 | -| policy_gradient_loss | 0.0828 | -| std | 0.0106 | -| value_loss | 5.56e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14486 | -| time_elapsed | 76845 | -| total_timesteps | 1854208 | -| train/ | | -| approx_kl | 0.0465524 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -5.3 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 144850 | -| policy_gradient_loss | -0.016 | -| std | 0.0106 | -| value_loss | 0.00245 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14487 | -| time_elapsed | 76850 | -| total_timesteps | 1854336 | -| train/ | | -| approx_kl | 0.0076982877 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -3.18 | -| learning_rate | 0.0003 | -| loss | -0.00926 | -| n_updates | 144860 | -| policy_gradient_loss | 0.000602 | -| std | 0.0106 | -| value_loss | 0.00018 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14488 | -| time_elapsed | 76856 | -| total_timesteps | 1854464 | -| train/ | | -| approx_kl | 0.19105998 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.476 | -| learning_rate | 0.0003 | -| loss | 0.0578 | -| n_updates | 144870 | -| policy_gradient_loss | 0.0158 | -| std | 0.0106 | -| value_loss | 8.49e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14489 | -| time_elapsed | 76861 | -| total_timesteps | 1854592 | -| train/ | | -| approx_kl | 0.013988861 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00815 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 144880 | -| policy_gradient_loss | -0.000501 | -| std | 0.0106 | -| value_loss | 1.78e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14490 | -| time_elapsed | 76866 | -| total_timesteps | 1854720 | -| train/ | | -| approx_kl | 0.0029276726 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.000581 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 144890 | -| policy_gradient_loss | 0.0109 | -| std | 0.0106 | -| value_loss | 6.68e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14491 | -| time_elapsed | 76870 | -| total_timesteps | 1854848 | -| train/ | | -| approx_kl | 0.084381066 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 144900 | -| policy_gradient_loss | -0.00165 | -| std | 0.0106 | -| value_loss | 3.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14492 | -| time_elapsed | 76874 | -| total_timesteps | 1854976 | -| train/ | | -| approx_kl | 0.024614403 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 144910 | -| policy_gradient_loss | 0.0118 | -| std | 0.0106 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14493 | -| time_elapsed | 76878 | -| total_timesteps | 1855104 | -| train/ | | -| approx_kl | 0.093545884 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | 0.0445 | -| n_updates | 144920 | -| policy_gradient_loss | 0.038 | -| std | 0.0106 | -| value_loss | 1.1e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14494 | -| time_elapsed | 76888 | -| total_timesteps | 1855232 | -| train/ | | -| approx_kl | 0.07938746 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.763 | -| learning_rate | 0.0003 | -| loss | 0.0452 | -| n_updates | 144930 | -| policy_gradient_loss | 0.0381 | -| std | 0.0106 | -| value_loss | 0.00196 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14495 | -| time_elapsed | 76893 | -| total_timesteps | 1855360 | -| train/ | | -| approx_kl | 0.008867367 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 144940 | -| policy_gradient_loss | -0.00476 | -| std | 0.0106 | -| value_loss | 1e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14496 | -| time_elapsed | 76897 | -| total_timesteps | 1855488 | -| train/ | | -| approx_kl | 0.08961987 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.000806 | -| learning_rate | 0.0003 | -| loss | 0.0506 | -| n_updates | 144950 | -| policy_gradient_loss | 0.0126 | -| std | 0.0106 | -| value_loss | 6.92e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14497 | -| time_elapsed | 76902 | -| total_timesteps | 1855616 | -| train/ | | -| approx_kl | 0.00028094137 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.00175 | -| n_updates | 144960 | -| policy_gradient_loss | 0.00282 | -| std | 0.0106 | -| value_loss | 0.00288 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14498 | -| time_elapsed | 76907 | -| total_timesteps | 1855744 | -| train/ | | -| approx_kl | 0.025514532 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | 0.00913 | -| n_updates | 144970 | -| policy_gradient_loss | 0.0274 | -| std | 0.0106 | -| value_loss | 6.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14499 | -| time_elapsed | 76911 | -| total_timesteps | 1855872 | -| train/ | | -| approx_kl | 0.017972644 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 144980 | -| policy_gradient_loss | 0.0129 | -| std | 0.0106 | -| value_loss | 3.8e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14500 | -| time_elapsed | 76917 | -| total_timesteps | 1856000 | -| train/ | | -| approx_kl | 0.07567805 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0485 | -| n_updates | 144990 | -| policy_gradient_loss | 0.0179 | -| std | 0.0105 | -| value_loss | 2.39e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14501 | -| time_elapsed | 76921 | -| total_timesteps | 1856128 | -| train/ | | -| approx_kl | 0.018302742 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.00194 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 145000 | -| policy_gradient_loss | 0.0173 | -| std | 0.0105 | -| value_loss | 0.000155 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14502 | -| time_elapsed | 76933 | -| total_timesteps | 1856256 | -| train/ | | -| approx_kl | 0.45016238 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.566 | -| learning_rate | 0.0003 | -| loss | 0.0728 | -| n_updates | 145010 | -| policy_gradient_loss | 0.0519 | -| std | 0.0105 | -| value_loss | 0.00882 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14503 | -| time_elapsed | 76938 | -| total_timesteps | 1856384 | -| train/ | | -| approx_kl | 0.01607025 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.00167 | -| learning_rate | 0.0003 | -| loss | 0.00352 | -| n_updates | 145020 | -| policy_gradient_loss | 0.012 | -| std | 0.0105 | -| value_loss | 7.88e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14504 | -| time_elapsed | 76941 | -| total_timesteps | 1856512 | -| train/ | | -| approx_kl | 0.11564723 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00518 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 145030 | -| policy_gradient_loss | 0.0683 | -| std | 0.0105 | -| value_loss | 3.21e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14505 | -| time_elapsed | 76946 | -| total_timesteps | 1856640 | -| train/ | | -| approx_kl | 0.062267862 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00902 | -| learning_rate | 0.0003 | -| loss | 0.0713 | -| n_updates | 145040 | -| policy_gradient_loss | 0.0634 | -| std | 0.0105 | -| value_loss | 2.7e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14506 | -| time_elapsed | 76951 | -| total_timesteps | 1856768 | -| train/ | | -| approx_kl | 0.0586077 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00643 | -| learning_rate | 0.0003 | -| loss | 0.069 | -| n_updates | 145050 | -| policy_gradient_loss | 0.0572 | -| std | 0.0105 | -| value_loss | 2.41e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 24 | -| iterations | 14507 | -| time_elapsed | 76956 | -| total_timesteps | 1856896 | -| train/ | | -| approx_kl | 0.04712873 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00529 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 145060 | -| policy_gradient_loss | 0.0632 | -| std | 0.0105 | -| value_loss | 1.93e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14508 | -| time_elapsed | 76961 | -| total_timesteps | 1857024 | -| train/ | | -| approx_kl | 0.050473623 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | -0.00573 | -| learning_rate | 0.0003 | -| loss | 0.0706 | -| n_updates | 145070 | -| policy_gradient_loss | 0.0542 | -| std | 0.0105 | -| value_loss | 1.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14509 | -| time_elapsed | 76973 | -| total_timesteps | 1857152 | -| train/ | | -| approx_kl | 0.064774826 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 145080 | -| policy_gradient_loss | 0.0149 | -| std | 0.0105 | -| value_loss | 0.000513 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14510 | -| time_elapsed | 76977 | -| total_timesteps | 1857280 | -| train/ | | -| approx_kl | 0.1271471 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.13 | -| explained_variance | 0.00183 | -| learning_rate | 0.0003 | -| loss | 0.0986 | -| n_updates | 145090 | -| policy_gradient_loss | 0.0619 | -| std | 0.0105 | -| value_loss | 1.15e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14511 | -| time_elapsed | 76982 | -| total_timesteps | 1857408 | -| train/ | | -| approx_kl | 0.0677136 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0519 | -| n_updates | 145100 | -| policy_gradient_loss | 0.0595 | -| std | 0.0105 | -| value_loss | 4.82e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14512 | -| time_elapsed | 76987 | -| total_timesteps | 1857536 | -| train/ | | -| approx_kl | 0.012071019 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 145110 | -| policy_gradient_loss | 0.00423 | -| std | 0.0105 | -| value_loss | 3.23e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14513 | -| time_elapsed | 76990 | -| total_timesteps | 1857664 | -| train/ | | -| approx_kl | 0.19548647 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 145120 | -| policy_gradient_loss | 0.0268 | -| std | 0.0105 | -| value_loss | 1.93e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14514 | -| time_elapsed | 76994 | -| total_timesteps | 1857792 | -| train/ | | -| approx_kl | 0.0039940435 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 8.74e-05 | -| n_updates | 145130 | -| policy_gradient_loss | 0.00098 | -| std | 0.0105 | -| value_loss | 1.86e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 24 | -| iterations | 14515 | -| time_elapsed | 76999 | -| total_timesteps | 1857920 | -| train/ | | -| approx_kl | 0.00025750697 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.000997 | -| n_updates | 145140 | -| policy_gradient_loss | 0.00245 | -| std | 0.0105 | -| value_loss | 4.4e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14516 | -| time_elapsed | 77004 | -| total_timesteps | 1858048 | -| train/ | | -| approx_kl | 0.03920965 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.00175 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 145150 | -| policy_gradient_loss | 0.00186 | -| std | 0.0105 | -| value_loss | 8.96e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14517 | -| time_elapsed | 77013 | -| total_timesteps | 1858176 | -| train/ | | -| approx_kl | 0.16510835 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.621 | -| learning_rate | 0.0003 | -| loss | 0.0674 | -| n_updates | 145160 | -| policy_gradient_loss | 0.0333 | -| std | 0.0105 | -| value_loss | 0.00653 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14518 | -| time_elapsed | 77018 | -| total_timesteps | 1858304 | -| train/ | | -| approx_kl | 0.027407842 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 145170 | -| policy_gradient_loss | 0.00616 | -| std | 0.0105 | -| value_loss | 7.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14519 | -| time_elapsed | 77025 | -| total_timesteps | 1858432 | -| train/ | | -| approx_kl | 0.0036794962 | -| clip_fraction | 0.068 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.00594 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 145180 | -| policy_gradient_loss | 0.000466 | -| std | 0.0105 | -| value_loss | 1.1e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14520 | -| time_elapsed | 77029 | -| total_timesteps | 1858560 | -| train/ | | -| approx_kl | 0.01101584 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 145190 | -| policy_gradient_loss | 0.0407 | -| std | 0.0105 | -| value_loss | 9.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14521 | -| time_elapsed | 77034 | -| total_timesteps | 1858688 | -| train/ | | -| approx_kl | 0.027867919 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | 0.0331 | -| n_updates | 145200 | -| policy_gradient_loss | 0.0393 | -| std | 0.0105 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14522 | -| time_elapsed | 77039 | -| total_timesteps | 1858816 | -| train/ | | -| approx_kl | 0.045114007 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 145210 | -| policy_gradient_loss | 0.0604 | -| std | 0.0105 | -| value_loss | 7.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 24 | -| iterations | 14523 | -| time_elapsed | 77044 | -| total_timesteps | 1858944 | -| train/ | | -| approx_kl | 0.008887645 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 145220 | -| policy_gradient_loss | 0.0086 | -| std | 0.0105 | -| value_loss | 7.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14524 | -| time_elapsed | 77048 | -| total_timesteps | 1859072 | -| train/ | | -| approx_kl | 0.023917403 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.00794 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 145230 | -| policy_gradient_loss | 0.00555 | -| std | 0.0105 | -| value_loss | 4.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14525 | -| time_elapsed | 77057 | -| total_timesteps | 1859200 | -| train/ | | -| approx_kl | 0.05069424 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.741 | -| learning_rate | 0.0003 | -| loss | 0.0537 | -| n_updates | 145240 | -| policy_gradient_loss | 0.0219 | -| std | 0.0105 | -| value_loss | 0.00265 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14526 | -| time_elapsed | 77062 | -| total_timesteps | 1859328 | -| train/ | | -| approx_kl | 0.026448816 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.0019 | -| learning_rate | 0.0003 | -| loss | 0.00144 | -| n_updates | 145250 | -| policy_gradient_loss | -0.00144 | -| std | 0.0105 | -| value_loss | 4.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14527 | -| time_elapsed | 77066 | -| total_timesteps | 1859456 | -| train/ | | -| approx_kl | 0.013513917 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.00606 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 145260 | -| policy_gradient_loss | -0.00591 | -| std | 0.0105 | -| value_loss | 7.09e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14528 | -| time_elapsed | 77070 | -| total_timesteps | 1859584 | -| train/ | | -| approx_kl | 0.0016786335 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.00815 | -| n_updates | 145270 | -| policy_gradient_loss | 0.0178 | -| std | 0.0105 | -| value_loss | 4.42e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14529 | -| time_elapsed | 77075 | -| total_timesteps | 1859712 | -| train/ | | -| approx_kl | 0.0037469524 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 145280 | -| policy_gradient_loss | 0.0626 | -| std | 0.0105 | -| value_loss | 1.61e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14530 | -| time_elapsed | 77078 | -| total_timesteps | 1859840 | -| train/ | | -| approx_kl | 0.052132677 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 145290 | -| policy_gradient_loss | -0.00189 | -| std | 0.0105 | -| value_loss | 1.58e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14531 | -| time_elapsed | 77082 | -| total_timesteps | 1859968 | -| train/ | | -| approx_kl | 0.2241314 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.0606 | -| n_updates | 145300 | -| policy_gradient_loss | 0.00795 | -| std | 0.0105 | -| value_loss | 1.14e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14532 | -| time_elapsed | 77086 | -| total_timesteps | 1860096 | -| train/ | | -| approx_kl | 0.1041188 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 145310 | -| policy_gradient_loss | 0.0121 | -| std | 0.0105 | -| value_loss | 9.43e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14533 | -| time_elapsed | 77098 | -| total_timesteps | 1860224 | -| train/ | | -| approx_kl | 0.008955973 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 145320 | -| policy_gradient_loss | -0.0123 | -| std | 0.0105 | -| value_loss | 0.00259 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14534 | -| time_elapsed | 77102 | -| total_timesteps | 1860352 | -| train/ | | -| approx_kl | 0.09384038 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.00173 | -| learning_rate | 0.0003 | -| loss | 0.00385 | -| n_updates | 145330 | -| policy_gradient_loss | -0.00546 | -| std | 0.0105 | -| value_loss | 6.06e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14535 | -| time_elapsed | 77107 | -| total_timesteps | 1860480 | -| train/ | | -| approx_kl | 0.0009171325 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 145340 | -| policy_gradient_loss | 0.00635 | -| std | 0.0105 | -| value_loss | 1.38e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14536 | -| time_elapsed | 77111 | -| total_timesteps | 1860608 | -| train/ | | -| approx_kl | 0.030534726 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.00847 | -| n_updates | 145350 | -| policy_gradient_loss | 0.00935 | -| std | 0.0105 | -| value_loss | 7.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14537 | -| time_elapsed | 77115 | -| total_timesteps | 1860736 | -| train/ | | -| approx_kl | 0.015488787 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | -0.000976 | -| n_updates | 145360 | -| policy_gradient_loss | 0.00862 | -| std | 0.0105 | -| value_loss | 5.78e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14538 | -| time_elapsed | 77119 | -| total_timesteps | 1860864 | -| train/ | | -| approx_kl | 0.04977786 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 145370 | -| policy_gradient_loss | 0.0126 | -| std | 0.0105 | -| value_loss | 3.87e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 24 | -| iterations | 14539 | -| time_elapsed | 77124 | -| total_timesteps | 1860992 | -| train/ | | -| approx_kl | 0.05446022 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.00205 | -| n_updates | 145380 | -| policy_gradient_loss | 0.00019 | -| std | 0.0105 | -| value_loss | 3.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14540 | -| time_elapsed | 77128 | -| total_timesteps | 1861120 | -| train/ | | -| approx_kl | 0.101193115 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 145390 | -| policy_gradient_loss | 0.00955 | -| std | 0.0105 | -| value_loss | 2.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14541 | -| time_elapsed | 77143 | -| total_timesteps | 1861248 | -| train/ | | -| approx_kl | 0.03614813 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.638 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 145400 | -| policy_gradient_loss | -0.00632 | -| std | 0.0105 | -| value_loss | 0.007 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14542 | -| time_elapsed | 77148 | -| total_timesteps | 1861376 | -| train/ | | -| approx_kl | 0.13116568 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.00609 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 145410 | -| policy_gradient_loss | 0.0795 | -| std | 0.0105 | -| value_loss | 4.63e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14543 | -| time_elapsed | 77152 | -| total_timesteps | 1861504 | -| train/ | | -| approx_kl | 0.06925502 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.00452 | -| learning_rate | 0.0003 | -| loss | 0.0645 | -| n_updates | 145420 | -| policy_gradient_loss | 0.0587 | -| std | 0.0105 | -| value_loss | 1.65e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14544 | -| time_elapsed | 77159 | -| total_timesteps | 1861632 | -| train/ | | -| approx_kl | 0.051017717 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0038 | -| learning_rate | 0.0003 | -| loss | 0.051 | -| n_updates | 145430 | -| policy_gradient_loss | 0.0542 | -| std | 0.0105 | -| value_loss | 9.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14545 | -| time_elapsed | 77164 | -| total_timesteps | 1861760 | -| train/ | | -| approx_kl | 0.059993155 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0078 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 145440 | -| policy_gradient_loss | 0.0935 | -| std | 0.0105 | -| value_loss | 5.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 24 | -| iterations | 14546 | -| time_elapsed | 77168 | -| total_timesteps | 1861888 | -| train/ | | -| approx_kl | 0.067392595 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.086 | -| n_updates | 145450 | -| policy_gradient_loss | 0.0815 | -| std | 0.0105 | -| value_loss | 2.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14547 | -| time_elapsed | 77173 | -| total_timesteps | 1862016 | -| train/ | | -| approx_kl | 0.010028124 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 145460 | -| policy_gradient_loss | 0.00716 | -| std | 0.0105 | -| value_loss | 1.78e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14548 | -| time_elapsed | 77185 | -| total_timesteps | 1862144 | -| train/ | | -| approx_kl | 0.21884926 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.756 | -| learning_rate | 0.0003 | -| loss | 0.0538 | -| n_updates | 145470 | -| policy_gradient_loss | 0.0142 | -| std | 0.0105 | -| value_loss | 0.00287 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14549 | -| time_elapsed | 77190 | -| total_timesteps | 1862272 | -| train/ | | -| approx_kl | 0.013120518 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.00434 | -| n_updates | 145480 | -| policy_gradient_loss | 0.00347 | -| std | 0.0105 | -| value_loss | 1.07e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14550 | -| time_elapsed | 77195 | -| total_timesteps | 1862400 | -| train/ | | -| approx_kl | 0.018274982 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.00344 | -| learning_rate | 0.0003 | -| loss | 0.00948 | -| n_updates | 145490 | -| policy_gradient_loss | 0.00418 | -| std | 0.0105 | -| value_loss | 2.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14551 | -| time_elapsed | 77200 | -| total_timesteps | 1862528 | -| train/ | | -| approx_kl | 0.014329273 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.00612 | -| n_updates | 145500 | -| policy_gradient_loss | 0.0029 | -| std | 0.0105 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14552 | -| time_elapsed | 77205 | -| total_timesteps | 1862656 | -| train/ | | -| approx_kl | 0.021322776 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 145510 | -| policy_gradient_loss | -0.00261 | -| std | 0.0105 | -| value_loss | 1.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14553 | -| time_elapsed | 77211 | -| total_timesteps | 1862784 | -| train/ | | -| approx_kl | 0.017191082 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.00474 | -| learning_rate | 0.0003 | -| loss | -0.00764 | -| n_updates | 145520 | -| policy_gradient_loss | -0.00376 | -| std | 0.0105 | -| value_loss | 9.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 24 | -| iterations | 14554 | -| time_elapsed | 77215 | -| total_timesteps | 1862912 | -| train/ | | -| approx_kl | 0.03765788 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.00826 | -| n_updates | 145530 | -| policy_gradient_loss | 0.0175 | -| std | 0.0105 | -| value_loss | 6.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14555 | -| time_elapsed | 77219 | -| total_timesteps | 1863040 | -| train/ | | -| approx_kl | 0.33866164 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 145540 | -| policy_gradient_loss | 0.0933 | -| std | 0.0105 | -| value_loss | 4.99e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14556 | -| time_elapsed | 77229 | -| total_timesteps | 1863168 | -| train/ | | -| approx_kl | 0.008768434 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 145550 | -| policy_gradient_loss | -0.0101 | -| std | 0.0105 | -| value_loss | 0.000746 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14557 | -| time_elapsed | 77232 | -| total_timesteps | 1863296 | -| train/ | | -| approx_kl | 0.037971135 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.0048 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 145560 | -| policy_gradient_loss | 0.0618 | -| std | 0.0105 | -| value_loss | 2.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14558 | -| time_elapsed | 77236 | -| total_timesteps | 1863424 | -| train/ | | -| approx_kl | 0.046190605 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.00314 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 145570 | -| policy_gradient_loss | 0.0597 | -| std | 0.0105 | -| value_loss | 1.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14559 | -| time_elapsed | 77239 | -| total_timesteps | 1863552 | -| train/ | | -| approx_kl | 0.009591788 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | -6.69e-05 | -| n_updates | 145580 | -| policy_gradient_loss | 0.00609 | -| std | 0.0105 | -| value_loss | 1.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14560 | -| time_elapsed | 77243 | -| total_timesteps | 1863680 | -| train/ | | -| approx_kl | 0.017654276 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 145590 | -| policy_gradient_loss | 0.00373 | -| std | 0.0105 | -| value_loss | 1.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14561 | -| time_elapsed | 77247 | -| total_timesteps | 1863808 | -| train/ | | -| approx_kl | 0.033982832 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 145600 | -| policy_gradient_loss | -0.00819 | -| std | 0.0105 | -| value_loss | 1.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14562 | -| time_elapsed | 77253 | -| total_timesteps | 1863936 | -| train/ | | -| approx_kl | 0.01115856 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 145610 | -| policy_gradient_loss | 0.00995 | -| std | 0.0105 | -| value_loss | 8.82e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14563 | -| time_elapsed | 77258 | -| total_timesteps | 1864064 | -| train/ | | -| approx_kl | 0.015226501 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 145620 | -| policy_gradient_loss | -0.000262 | -| std | 0.0105 | -| value_loss | 6.55e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14564 | -| time_elapsed | 77266 | -| total_timesteps | 1864192 | -| train/ | | -| approx_kl | 0.06536175 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.723 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 145630 | -| policy_gradient_loss | 0.0349 | -| std | 0.0105 | -| value_loss | 0.00413 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14565 | -| time_elapsed | 77271 | -| total_timesteps | 1864320 | -| train/ | | -| approx_kl | 0.058038875 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.000323 | -| learning_rate | 0.0003 | -| loss | 0.0675 | -| n_updates | 145640 | -| policy_gradient_loss | 0.0579 | -| std | 0.0105 | -| value_loss | 5.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14566 | -| time_elapsed | 77275 | -| total_timesteps | 1864448 | -| train/ | | -| approx_kl | 0.009703167 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | 0.00635 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 145650 | -| policy_gradient_loss | 0.0038 | -| std | 0.0104 | -| value_loss | 1.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14567 | -| time_elapsed | 77281 | -| total_timesteps | 1864576 | -| train/ | | -| approx_kl | 0.033127002 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 145660 | -| policy_gradient_loss | 0.0135 | -| std | 0.0104 | -| value_loss | 6.83e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14568 | -| time_elapsed | 77287 | -| total_timesteps | 1864704 | -| train/ | | -| approx_kl | 0.11612044 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -1.78 | -| learning_rate | 0.0003 | -| loss | 0.0286 | -| n_updates | 145670 | -| policy_gradient_loss | 0.00239 | -| std | 0.0104 | -| value_loss | 3.06e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14569 | -| time_elapsed | 77292 | -| total_timesteps | 1864832 | -| train/ | | -| approx_kl | 0.011183925 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 3.14 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 145680 | -| policy_gradient_loss | -0.00197 | -| std | 0.0104 | -| value_loss | 1.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 24 | -| iterations | 14570 | -| time_elapsed | 77297 | -| total_timesteps | 1864960 | -| train/ | | -| approx_kl | 0.006327628 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.000931 | -| n_updates | 145690 | -| policy_gradient_loss | 0.000298 | -| std | 0.0104 | -| value_loss | 9e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14571 | -| time_elapsed | 77304 | -| total_timesteps | 1865088 | -| train/ | | -| approx_kl | 0.008153135 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.00915 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 145700 | -| policy_gradient_loss | -0.00248 | -| std | 0.0104 | -| value_loss | 6.43e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14572 | -| time_elapsed | 77311 | -| total_timesteps | 1865216 | -| train/ | | -| approx_kl | 0.01189154 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.663 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 145710 | -| policy_gradient_loss | -0.00849 | -| std | 0.0104 | -| value_loss | 0.00444 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14573 | -| time_elapsed | 77317 | -| total_timesteps | 1865344 | -| train/ | | -| approx_kl | 0.04611089 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 145720 | -| policy_gradient_loss | 0.000849 | -| std | 0.0104 | -| value_loss | 5.2e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14574 | -| time_elapsed | 77322 | -| total_timesteps | 1865472 | -| train/ | | -| approx_kl | 0.003119493 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.00641 | -| n_updates | 145730 | -| policy_gradient_loss | 0.0325 | -| std | 0.0104 | -| value_loss | 1.09e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14575 | -| time_elapsed | 77327 | -| total_timesteps | 1865600 | -| train/ | | -| approx_kl | 0.03766802 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | 0.00592 | -| n_updates | 145740 | -| policy_gradient_loss | 0.0452 | -| std | 0.0104 | -| value_loss | 4.92e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14576 | -| time_elapsed | 77332 | -| total_timesteps | 1865728 | -| train/ | | -| approx_kl | 0.0004306147 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 145750 | -| policy_gradient_loss | 0.0113 | -| std | 0.0104 | -| value_loss | 4.09e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14577 | -| time_elapsed | 77336 | -| total_timesteps | 1865856 | -| train/ | | -| approx_kl | 0.025747292 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.00872 | -| n_updates | 145760 | -| policy_gradient_loss | 0.00599 | -| std | 0.0104 | -| value_loss | 4.16e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14578 | -| time_elapsed | 77341 | -| total_timesteps | 1865984 | -| train/ | | -| approx_kl | 0.0013213698 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 145770 | -| policy_gradient_loss | 0.000488 | -| std | 0.0104 | -| value_loss | 1.91e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14579 | -| time_elapsed | 77345 | -| total_timesteps | 1866112 | -| train/ | | -| approx_kl | 0.065901734 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 0.0505 | -| n_updates | 145780 | -| policy_gradient_loss | 0.0634 | -| std | 0.0104 | -| value_loss | 3.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14580 | -| time_elapsed | 77355 | -| total_timesteps | 1866240 | -| train/ | | -| approx_kl | 0.003170901 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.639 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 145790 | -| policy_gradient_loss | -0.000934 | -| std | 0.0104 | -| value_loss | 0.00778 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14581 | -| time_elapsed | 77361 | -| total_timesteps | 1866368 | -| train/ | | -| approx_kl | 0.03842012 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 145800 | -| policy_gradient_loss | -0.00413 | -| std | 0.0104 | -| value_loss | 4.93e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14582 | -| time_elapsed | 77366 | -| total_timesteps | 1866496 | -| train/ | | -| approx_kl | 0.004507877 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.000744 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 145810 | -| policy_gradient_loss | 0.0014 | -| std | 0.0104 | -| value_loss | 6.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14583 | -| time_elapsed | 77372 | -| total_timesteps | 1866624 | -| train/ | | -| approx_kl | 0.025190828 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.00696 | -| n_updates | 145820 | -| policy_gradient_loss | 0.00156 | -| std | 0.0104 | -| value_loss | 3.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14584 | -| time_elapsed | 77377 | -| total_timesteps | 1866752 | -| train/ | | -| approx_kl | 0.0041778795 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 145830 | -| policy_gradient_loss | -0.000952 | -| std | 0.0104 | -| value_loss | 2.68e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14585 | -| time_elapsed | 77382 | -| total_timesteps | 1866880 | -| train/ | | -| approx_kl | 0.013763176 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.000445 | -| n_updates | 145840 | -| policy_gradient_loss | 0.00518 | -| std | 0.0104 | -| value_loss | 1.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14586 | -| time_elapsed | 77386 | -| total_timesteps | 1867008 | -| train/ | | -| approx_kl | 0.03316701 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 145850 | -| policy_gradient_loss | 0.0562 | -| std | 0.0103 | -| value_loss | 9.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14587 | -| time_elapsed | 77396 | -| total_timesteps | 1867136 | -| train/ | | -| approx_kl | 0.006123142 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 145860 | -| policy_gradient_loss | -0.00201 | -| std | 0.0103 | -| value_loss | 0.0003 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14588 | -| time_elapsed | 77401 | -| total_timesteps | 1867264 | -| train/ | | -| approx_kl | 0.01925358 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 145870 | -| policy_gradient_loss | 0.00197 | -| std | 0.0103 | -| value_loss | 0.00135 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14589 | -| time_elapsed | 77406 | -| total_timesteps | 1867392 | -| train/ | | -| approx_kl | 0.07809204 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.00681 | -| learning_rate | 0.0003 | -| loss | 0.0353 | -| n_updates | 145880 | -| policy_gradient_loss | 0.00584 | -| std | 0.0103 | -| value_loss | 2.19e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14590 | -| time_elapsed | 77411 | -| total_timesteps | 1867520 | -| train/ | | -| approx_kl | 0.006152894 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.00356 | -| n_updates | 145890 | -| policy_gradient_loss | 0.0135 | -| std | 0.0104 | -| value_loss | 5.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14591 | -| time_elapsed | 77415 | -| total_timesteps | 1867648 | -| train/ | | -| approx_kl | 0.10095569 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.0803 | -| n_updates | 145900 | -| policy_gradient_loss | 0.0663 | -| std | 0.0104 | -| value_loss | 2.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14592 | -| time_elapsed | 77421 | -| total_timesteps | 1867776 | -| train/ | | -| approx_kl | 0.018675676 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 145910 | -| policy_gradient_loss | 0.00775 | -| std | 0.0104 | -| value_loss | 2.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14593 | -| time_elapsed | 77426 | -| total_timesteps | 1867904 | -| train/ | | -| approx_kl | 0.21110885 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.0793 | -| n_updates | 145920 | -| policy_gradient_loss | 0.0225 | -| std | 0.0104 | -| value_loss | 1.33e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14594 | -| time_elapsed | 77430 | -| total_timesteps | 1868032 | -| train/ | | -| approx_kl | 0.012016824 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 145930 | -| policy_gradient_loss | 0.00143 | -| std | 0.0104 | -| value_loss | 8.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14595 | -| time_elapsed | 77440 | -| total_timesteps | 1868160 | -| train/ | | -| approx_kl | 0.044260338 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 145940 | -| policy_gradient_loss | 0.0101 | -| std | 0.0103 | -| value_loss | 0.00139 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14596 | -| time_elapsed | 77444 | -| total_timesteps | 1868288 | -| train/ | | -| approx_kl | 0.059159175 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.00207 | -| learning_rate | 0.0003 | -| loss | 0.063 | -| n_updates | 145950 | -| policy_gradient_loss | 0.014 | -| std | 0.0103 | -| value_loss | 3.78e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14597 | -| time_elapsed | 77449 | -| total_timesteps | 1868416 | -| train/ | | -| approx_kl | 0.0019153561 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.00455 | -| learning_rate | 0.0003 | -| loss | 0.000253 | -| n_updates | 145960 | -| policy_gradient_loss | 0.00271 | -| std | 0.0103 | -| value_loss | 9.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14598 | -| time_elapsed | 77453 | -| total_timesteps | 1868544 | -| train/ | | -| approx_kl | 0.028412543 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.00479 | -| n_updates | 145970 | -| policy_gradient_loss | 0.0104 | -| std | 0.0104 | -| value_loss | 8.01e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14599 | -| time_elapsed | 77458 | -| total_timesteps | 1868672 | -| train/ | | -| approx_kl | 0.1844028 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | 0.0072 | -| learning_rate | 0.0003 | -| loss | 0.0992 | -| n_updates | 145980 | -| policy_gradient_loss | 0.0225 | -| std | 0.0104 | -| value_loss | 1.11e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14600 | -| time_elapsed | 77461 | -| total_timesteps | 1868800 | -| train/ | | -| approx_kl | 0.040454768 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.00446 | -| n_updates | 145990 | -| policy_gradient_loss | 0.0134 | -| std | 0.0104 | -| value_loss | 8.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14601 | -| time_elapsed | 77465 | -| total_timesteps | 1868928 | -| train/ | | -| approx_kl | 0.041021254 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 146000 | -| policy_gradient_loss | 0.0268 | -| std | 0.0103 | -| value_loss | 2.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14602 | -| time_elapsed | 77470 | -| total_timesteps | 1869056 | -| train/ | | -| approx_kl | 0.04161755 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 146010 | -| policy_gradient_loss | -0.00239 | -| std | 0.0103 | -| value_loss | 2.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14603 | -| time_elapsed | 77478 | -| total_timesteps | 1869184 | -| train/ | | -| approx_kl | 0.04454545 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 146020 | -| policy_gradient_loss | -0.0084 | -| std | 0.0103 | -| value_loss | 0.00159 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14604 | -| time_elapsed | 77483 | -| total_timesteps | 1869312 | -| train/ | | -| approx_kl | 0.43608728 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 146030 | -| policy_gradient_loss | 0.0671 | -| std | 0.0104 | -| value_loss | 3.87e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14605 | -| time_elapsed | 77488 | -| total_timesteps | 1869440 | -| train/ | | -| approx_kl | 0.23584512 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.15 | -| explained_variance | -2.71 | -| learning_rate | 0.0003 | -| loss | 0.0956 | -| n_updates | 146040 | -| policy_gradient_loss | 0.0211 | -| std | 0.0103 | -| value_loss | 8.89e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14606 | -| time_elapsed | 77493 | -| total_timesteps | 1869568 | -| train/ | | -| approx_kl | 0.045674093 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.16 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.0332 | -| n_updates | 146050 | -| policy_gradient_loss | 0.00539 | -| std | 0.0103 | -| value_loss | 6.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14607 | -| time_elapsed | 77497 | -| total_timesteps | 1869696 | -| train/ | | -| approx_kl | 0.10165711 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.16 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 146060 | -| policy_gradient_loss | 0.0131 | -| std | 0.0102 | -| value_loss | 2.86e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14608 | -| time_elapsed | 77501 | -| total_timesteps | 1869824 | -| train/ | | -| approx_kl | 0.023641648 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.16 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 146070 | -| policy_gradient_loss | 0.0176 | -| std | 0.0102 | -| value_loss | 2.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14609 | -| time_elapsed | 77504 | -| total_timesteps | 1869952 | -| train/ | | -| approx_kl | 0.009520093 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.315 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 146080 | -| policy_gradient_loss | 0.00684 | -| std | 0.0102 | -| value_loss | 5.84e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14610 | -| time_elapsed | 77508 | -| total_timesteps | 1870080 | -| train/ | | -| approx_kl | 0.07364186 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.0331 | -| n_updates | 146090 | -| policy_gradient_loss | 0.00451 | -| std | 0.0102 | -| value_loss | 4.05e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14611 | -| time_elapsed | 77516 | -| total_timesteps | 1870208 | -| train/ | | -| approx_kl | 0.03498477 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 146100 | -| policy_gradient_loss | -0.00485 | -| std | 0.0102 | -| value_loss | 0.000636 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14612 | -| time_elapsed | 77521 | -| total_timesteps | 1870336 | -| train/ | | -| approx_kl | 0.04563018 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0748 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 146110 | -| policy_gradient_loss | 0.0097 | -| std | 0.0102 | -| value_loss | 7.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14613 | -| time_elapsed | 77526 | -| total_timesteps | 1870464 | -| train/ | | -| approx_kl | 0.17748763 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.00549 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 146120 | -| policy_gradient_loss | 0.0857 | -| std | 0.0102 | -| value_loss | 8.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14614 | -| time_elapsed | 77531 | -| total_timesteps | 1870592 | -| train/ | | -| approx_kl | 0.026993614 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.00859 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 146130 | -| policy_gradient_loss | 0.0114 | -| std | 0.0102 | -| value_loss | 3.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14615 | -| time_elapsed | 77537 | -| total_timesteps | 1870720 | -| train/ | | -| approx_kl | 0.016485142 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 146140 | -| policy_gradient_loss | 0.00553 | -| std | 0.0102 | -| value_loss | 2.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14616 | -| time_elapsed | 77541 | -| total_timesteps | 1870848 | -| train/ | | -| approx_kl | 0.019163318 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 146150 | -| policy_gradient_loss | 0.0022 | -| std | 0.0102 | -| value_loss | 1.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14617 | -| time_elapsed | 77545 | -| total_timesteps | 1870976 | -| train/ | | -| approx_kl | 0.0071602166 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 146160 | -| policy_gradient_loss | 0.00125 | -| std | 0.0102 | -| value_loss | 1.15e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14618 | -| time_elapsed | 77550 | -| total_timesteps | 1871104 | -| train/ | | -| approx_kl | 0.03465717 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 146170 | -| policy_gradient_loss | 0.0549 | -| std | 0.0102 | -| value_loss | 8.07e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14619 | -| time_elapsed | 77559 | -| total_timesteps | 1871232 | -| train/ | | -| approx_kl | 0.0043593384 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 146180 | -| policy_gradient_loss | 0.00114 | -| std | 0.0102 | -| value_loss | 0.00219 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14620 | -| time_elapsed | 77563 | -| total_timesteps | 1871360 | -| train/ | | -| approx_kl | 0.0944434 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.00589 | -| learning_rate | 0.0003 | -| loss | 0.0539 | -| n_updates | 146190 | -| policy_gradient_loss | 0.00868 | -| std | 0.0102 | -| value_loss | 1.19e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14621 | -| time_elapsed | 77568 | -| total_timesteps | 1871488 | -| train/ | | -| approx_kl | 0.005025822 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.00282 | -| learning_rate | 0.0003 | -| loss | -0.000711 | -| n_updates | 146200 | -| policy_gradient_loss | 0.0106 | -| std | 0.0102 | -| value_loss | 8.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14622 | -| time_elapsed | 77573 | -| total_timesteps | 1871616 | -| train/ | | -| approx_kl | 0.08172327 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 146210 | -| policy_gradient_loss | 0.0527 | -| std | 0.0102 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14623 | -| time_elapsed | 77577 | -| total_timesteps | 1871744 | -| train/ | | -| approx_kl | 0.08480945 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.0572 | -| n_updates | 146220 | -| policy_gradient_loss | 0.0291 | -| std | 0.0102 | -| value_loss | 6.43e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14624 | -| time_elapsed | 77582 | -| total_timesteps | 1871872 | -| train/ | | -| approx_kl | 0.040772215 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 146230 | -| policy_gradient_loss | 0.0073 | -| std | 0.0101 | -| value_loss | 5.83e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14625 | -| time_elapsed | 77587 | -| total_timesteps | 1872000 | -| train/ | | -| approx_kl | 4.1761436e-05 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.00262 | -| learning_rate | 0.0003 | -| loss | 0.00167 | -| n_updates | 146240 | -| policy_gradient_loss | -0.0127 | -| std | 0.0101 | -| value_loss | 9.32e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14626 | -| time_elapsed | 77591 | -| total_timesteps | 1872128 | -| train/ | | -| approx_kl | 0.007224036 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.00201 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 146250 | -| policy_gradient_loss | -0.000769 | -| std | 0.0101 | -| value_loss | 3.86e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14627 | -| time_elapsed | 77601 | -| total_timesteps | 1872256 | -| train/ | | -| approx_kl | 0.00019790279 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 146260 | -| policy_gradient_loss | -0.00436 | -| std | 0.0101 | -| value_loss | 0.000267 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14628 | -| time_elapsed | 77605 | -| total_timesteps | 1872384 | -| train/ | | -| approx_kl | 0.005883368 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | 0.0056 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 146270 | -| policy_gradient_loss | 0.00283 | -| std | 0.0101 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14629 | -| time_elapsed | 77610 | -| total_timesteps | 1872512 | -| train/ | | -| approx_kl | 0.042066023 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 146280 | -| policy_gradient_loss | 0.00243 | -| std | 0.0101 | -| value_loss | 8.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14630 | -| time_elapsed | 77614 | -| total_timesteps | 1872640 | -| train/ | | -| approx_kl | 0.014385665 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.17 | -| explained_variance | -0.0782 | -| learning_rate | 0.0003 | -| loss | -0.00431 | -| n_updates | 146290 | -| policy_gradient_loss | 0.0149 | -| std | 0.0101 | -| value_loss | 1.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14631 | -| time_elapsed | 77619 | -| total_timesteps | 1872768 | -| train/ | | -| approx_kl | 0.050353963 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0513 | -| n_updates | 146300 | -| policy_gradient_loss | 0.0214 | -| std | 0.0101 | -| value_loss | 8.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14632 | -| time_elapsed | 77623 | -| total_timesteps | 1872896 | -| train/ | | -| approx_kl | 0.014830988 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0044 | -| n_updates | 146310 | -| policy_gradient_loss | 0.0188 | -| std | 0.0101 | -| value_loss | 4.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14633 | -| time_elapsed | 77627 | -| total_timesteps | 1873024 | -| train/ | | -| approx_kl | 0.059092168 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 146320 | -| policy_gradient_loss | 0.0283 | -| std | 0.0101 | -| value_loss | 3.2e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14634 | -| time_elapsed | 77638 | -| total_timesteps | 1873152 | -| train/ | | -| approx_kl | 0.04144335 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | 0.0134 | -| n_updates | 146330 | -| policy_gradient_loss | -0.00142 | -| std | 0.0101 | -| value_loss | 0.000279 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14635 | -| time_elapsed | 77643 | -| total_timesteps | 1873280 | -| train/ | | -| approx_kl | 0.013288625 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 146340 | -| policy_gradient_loss | 0.0104 | -| std | 0.0101 | -| value_loss | 3.27e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14636 | -| time_elapsed | 77648 | -| total_timesteps | 1873408 | -| train/ | | -| approx_kl | 0.0018442939 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00414 | -| learning_rate | 0.0003 | -| loss | -0.000672 | -| n_updates | 146350 | -| policy_gradient_loss | 0.00825 | -| std | 0.0101 | -| value_loss | 2.88e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14637 | -| time_elapsed | 77653 | -| total_timesteps | 1873536 | -| train/ | | -| approx_kl | 0.028931651 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 146360 | -| policy_gradient_loss | 0.0156 | -| std | 0.0101 | -| value_loss | 3.07e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14638 | -| time_elapsed | 77658 | -| total_timesteps | 1873664 | -| train/ | | -| approx_kl | 0.04661358 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 146370 | -| policy_gradient_loss | 0.00568 | -| std | 0.0101 | -| value_loss | 9.38e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14639 | -| time_elapsed | 77662 | -| total_timesteps | 1873792 | -| train/ | | -| approx_kl | 0.10159594 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 146380 | -| policy_gradient_loss | 0.0189 | -| std | 0.0101 | -| value_loss | 6.23e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 24 | -| iterations | 14640 | -| time_elapsed | 77667 | -| total_timesteps | 1873920 | -| train/ | | -| approx_kl | 0.028270563 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 146390 | -| policy_gradient_loss | 0.000338 | -| std | 0.0101 | -| value_loss | 5.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14641 | -| time_elapsed | 77671 | -| total_timesteps | 1874048 | -| train/ | | -| approx_kl | 0.016266331 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 146400 | -| policy_gradient_loss | 0.00913 | -| std | 0.0101 | -| value_loss | 3.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14642 | -| time_elapsed | 77680 | -| total_timesteps | 1874176 | -| train/ | | -| approx_kl | 0.030755593 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | -0.00908 | -| n_updates | 146410 | -| policy_gradient_loss | 0.00244 | -| std | 0.0101 | -| value_loss | 0.000352 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14643 | -| time_elapsed | 77685 | -| total_timesteps | 1874304 | -| train/ | | -| approx_kl | 0.041740183 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0938 | -| learning_rate | 0.0003 | -| loss | 0.0339 | -| n_updates | 146420 | -| policy_gradient_loss | 0.0163 | -| std | 0.0101 | -| value_loss | 5.8e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14644 | -| time_elapsed | 77690 | -| total_timesteps | 1874432 | -| train/ | | -| approx_kl | 0.23499036 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.0951 | -| n_updates | 146430 | -| policy_gradient_loss | 0.022 | -| std | 0.0101 | -| value_loss | 8.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14645 | -| time_elapsed | 77695 | -| total_timesteps | 1874560 | -| train/ | | -| approx_kl | 0.013361683 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0044 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 146440 | -| policy_gradient_loss | -0.00627 | -| std | 0.0101 | -| value_loss | 1.83e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14646 | -| time_elapsed | 77699 | -| total_timesteps | 1874688 | -| train/ | | -| approx_kl | 2.3506582e-06 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | -0.000166 | -| n_updates | 146450 | -| policy_gradient_loss | 0.00131 | -| std | 0.0101 | -| value_loss | 1.26e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14647 | -| time_elapsed | 77705 | -| total_timesteps | 1874816 | -| train/ | | -| approx_kl | 0.040118422 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 146460 | -| policy_gradient_loss | 0.0109 | -| std | 0.0101 | -| value_loss | 7.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 24 | -| iterations | 14648 | -| time_elapsed | 77709 | -| total_timesteps | 1874944 | -| train/ | | -| approx_kl | 0.008216229 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 146470 | -| policy_gradient_loss | 0.0375 | -| std | 0.0101 | -| value_loss | 5.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14649 | -| time_elapsed | 77714 | -| total_timesteps | 1875072 | -| train/ | | -| approx_kl | 0.015424157 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 146480 | -| policy_gradient_loss | 0.079 | -| std | 0.0101 | -| value_loss | 2.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14650 | -| time_elapsed | 77721 | -| total_timesteps | 1875200 | -| train/ | | -| approx_kl | 0.037720747 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.548 | -| learning_rate | 0.0003 | -| loss | 0.043 | -| n_updates | 146490 | -| policy_gradient_loss | 0.0407 | -| std | 0.0101 | -| value_loss | 0.0118 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14651 | -| time_elapsed | 77726 | -| total_timesteps | 1875328 | -| train/ | | -| approx_kl | 0.04098138 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.0639 | -| n_updates | 146500 | -| policy_gradient_loss | 0.0543 | -| std | 0.0101 | -| value_loss | 7.19e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14652 | -| time_elapsed | 77730 | -| total_timesteps | 1875456 | -| train/ | | -| approx_kl | 0.009137498 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00675 | -| learning_rate | 0.0003 | -| loss | 0.000916 | -| n_updates | 146510 | -| policy_gradient_loss | 0.00743 | -| std | 0.0101 | -| value_loss | 6.26e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14653 | -| time_elapsed | 77734 | -| total_timesteps | 1875584 | -| train/ | | -| approx_kl | 0.00016774889 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 146520 | -| policy_gradient_loss | 0.000649 | -| std | 0.0101 | -| value_loss | 3.11e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14654 | -| time_elapsed | 77740 | -| total_timesteps | 1875712 | -| train/ | | -| approx_kl | 0.018584855 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 146530 | -| policy_gradient_loss | 0.0119 | -| std | 0.0101 | -| value_loss | 1.88e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14655 | -| time_elapsed | 77745 | -| total_timesteps | 1875840 | -| train/ | | -| approx_kl | 0.21329676 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0835 | -| n_updates | 146540 | -| policy_gradient_loss | 0.0225 | -| std | 0.0101 | -| value_loss | 1.48e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14656 | -| time_elapsed | 77750 | -| total_timesteps | 1875968 | -| train/ | | -| approx_kl | 0.005173235 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 146550 | -| policy_gradient_loss | 0.000836 | -| std | 0.0101 | -| value_loss | 9.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14657 | -| time_elapsed | 77755 | -| total_timesteps | 1876096 | -| train/ | | -| approx_kl | 0.026647698 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 146560 | -| policy_gradient_loss | 0.0196 | -| std | 0.0101 | -| value_loss | 1.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14658 | -| time_elapsed | 77763 | -| total_timesteps | 1876224 | -| train/ | | -| approx_kl | 0.33015725 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 146570 | -| policy_gradient_loss | 0.0536 | -| std | 0.0101 | -| value_loss | 0.00379 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14659 | -| time_elapsed | 77768 | -| total_timesteps | 1876352 | -| train/ | | -| approx_kl | 0.005178009 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00016 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 146580 | -| policy_gradient_loss | 0.00928 | -| std | 0.0101 | -| value_loss | 4.35e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14660 | -| time_elapsed | 77774 | -| total_timesteps | 1876480 | -| train/ | | -| approx_kl | 0.10158882 | -| clip_fraction | 0.576 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00437 | -| learning_rate | 0.0003 | -| loss | 0.0967 | -| n_updates | 146590 | -| policy_gradient_loss | 0.0681 | -| std | 0.01 | -| value_loss | 1.55e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14661 | -| time_elapsed | 77779 | -| total_timesteps | 1876608 | -| train/ | | -| approx_kl | 0.06974202 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 146600 | -| policy_gradient_loss | 0.0707 | -| std | 0.01 | -| value_loss | 1.97e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14662 | -| time_elapsed | 77784 | -| total_timesteps | 1876736 | -| train/ | | -| approx_kl | 0.07899375 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0795 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 146610 | -| policy_gradient_loss | 0.0893 | -| std | 0.01 | -| value_loss | 3.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14663 | -| time_elapsed | 77790 | -| total_timesteps | 1876864 | -| train/ | | -| approx_kl | 0.014567576 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.0053 | -| n_updates | 146620 | -| policy_gradient_loss | 0.0126 | -| std | 0.01 | -| value_loss | 2.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14664 | -| time_elapsed | 77795 | -| total_timesteps | 1876992 | -| train/ | | -| approx_kl | 0.0012840386 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 146630 | -| policy_gradient_loss | -0.000229 | -| std | 0.01 | -| value_loss | 3.43e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14665 | -| time_elapsed | 77800 | -| total_timesteps | 1877120 | -| train/ | | -| approx_kl | 0.17679529 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -61.6 | -| learning_rate | 0.0003 | -| loss | 0.032 | -| n_updates | 146640 | -| policy_gradient_loss | 0.00163 | -| std | 0.01 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14666 | -| time_elapsed | 77809 | -| total_timesteps | 1877248 | -| train/ | | -| approx_kl | 0.0017038016 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | -0.000667 | -| n_updates | 146650 | -| policy_gradient_loss | 0.00292 | -| std | 0.01 | -| value_loss | 0.00375 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14667 | -| time_elapsed | 77813 | -| total_timesteps | 1877376 | -| train/ | | -| approx_kl | 0.014607252 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 146660 | -| policy_gradient_loss | 0.00613 | -| std | 0.01 | -| value_loss | 2.42e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14668 | -| time_elapsed | 77817 | -| total_timesteps | 1877504 | -| train/ | | -| approx_kl | 0.09635529 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 146670 | -| policy_gradient_loss | 0.00149 | -| std | 0.01 | -| value_loss | 1.68e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14669 | -| time_elapsed | 77822 | -| total_timesteps | 1877632 | -| train/ | | -| approx_kl | 0.03872878 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 146680 | -| policy_gradient_loss | 0.018 | -| std | 0.01 | -| value_loss | 1.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14670 | -| time_elapsed | 77827 | -| total_timesteps | 1877760 | -| train/ | | -| approx_kl | 0.19654319 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 146690 | -| policy_gradient_loss | 0.107 | -| std | 0.01 | -| value_loss | 1.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14671 | -| time_elapsed | 77832 | -| total_timesteps | 1877888 | -| train/ | | -| approx_kl | 0.022360953 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.00818 | -| n_updates | 146700 | -| policy_gradient_loss | 0.00817 | -| std | 0.01 | -| value_loss | 7.36e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14672 | -| time_elapsed | 77837 | -| total_timesteps | 1878016 | -| train/ | | -| approx_kl | 0.2773897 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 146710 | -| policy_gradient_loss | 0.0274 | -| std | 0.01 | -| value_loss | 3.94e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14673 | -| time_elapsed | 77848 | -| total_timesteps | 1878144 | -| train/ | | -| approx_kl | 0.0004080315 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 146720 | -| policy_gradient_loss | -0.00405 | -| std | 0.01 | -| value_loss | 0.000348 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14674 | -| time_elapsed | 77853 | -| total_timesteps | 1878272 | -| train/ | | -| approx_kl | 0.00014084298 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 146730 | -| policy_gradient_loss | 0.00272 | -| std | 0.01 | -| value_loss | 2.62e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14675 | -| time_elapsed | 77858 | -| total_timesteps | 1878400 | -| train/ | | -| approx_kl | 0.018798377 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00434 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 146740 | -| policy_gradient_loss | -0.0102 | -| std | 0.01 | -| value_loss | 1.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14676 | -| time_elapsed | 77863 | -| total_timesteps | 1878528 | -| train/ | | -| approx_kl | 0.0032143625 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 146750 | -| policy_gradient_loss | 0.00164 | -| std | 0.01 | -| value_loss | 5.82e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14677 | -| time_elapsed | 77868 | -| total_timesteps | 1878656 | -| train/ | | -| approx_kl | 0.029325234 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 146760 | -| policy_gradient_loss | 0.00629 | -| std | 0.01 | -| value_loss | 3.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14678 | -| time_elapsed | 77873 | -| total_timesteps | 1878784 | -| train/ | | -| approx_kl | 0.015214673 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.000604 | -| n_updates | 146770 | -| policy_gradient_loss | 0.000514 | -| std | 0.00999 | -| value_loss | 5.32e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14679 | -| time_elapsed | 77877 | -| total_timesteps | 1878912 | -| train/ | | -| approx_kl | 2.2341963e-05 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 146780 | -| policy_gradient_loss | -0.00105 | -| std | 0.00998 | -| value_loss | 1.58e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14680 | -| time_elapsed | 77883 | -| total_timesteps | 1879040 | -| train/ | | -| approx_kl | 0.02066892 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.00267 | -| n_updates | 146790 | -| policy_gradient_loss | 0.00111 | -| std | 0.00998 | -| value_loss | 1.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14681 | -| time_elapsed | 77892 | -| total_timesteps | 1879168 | -| train/ | | -| approx_kl | 0.014279898 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 146800 | -| policy_gradient_loss | -0.0127 | -| std | 0.00998 | -| value_loss | 0.000366 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14682 | -| time_elapsed | 77896 | -| total_timesteps | 1879296 | -| train/ | | -| approx_kl | 0.019957084 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 146810 | -| policy_gradient_loss | -0.00257 | -| std | 0.00998 | -| value_loss | 6.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14683 | -| time_elapsed | 77902 | -| total_timesteps | 1879424 | -| train/ | | -| approx_kl | 0.019723386 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00185 | -| learning_rate | 0.0003 | -| loss | 0.00565 | -| n_updates | 146820 | -| policy_gradient_loss | 0.00281 | -| std | 0.00998 | -| value_loss | 7.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14684 | -| time_elapsed | 77908 | -| total_timesteps | 1879552 | -| train/ | | -| approx_kl | 0.019236721 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 146830 | -| policy_gradient_loss | -0.00431 | -| std | 0.00998 | -| value_loss | 5.98e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14685 | -| time_elapsed | 77913 | -| total_timesteps | 1879680 | -| train/ | | -| approx_kl | 0.052922316 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 146840 | -| policy_gradient_loss | 0.00809 | -| std | 0.00999 | -| value_loss | 8.12e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14686 | -| time_elapsed | 77918 | -| total_timesteps | 1879808 | -| train/ | | -| approx_kl | 0.6597979 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.324 | -| n_updates | 146850 | -| policy_gradient_loss | 0.109 | -| std | 0.00999 | -| value_loss | 5.51e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14687 | -| time_elapsed | 77923 | -| total_timesteps | 1879936 | -| train/ | | -| approx_kl | 0.01493371 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.00476 | -| n_updates | 146860 | -| policy_gradient_loss | 0.000528 | -| std | 0.00999 | -| value_loss | 9.63e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14688 | -| time_elapsed | 77927 | -| total_timesteps | 1880064 | -| train/ | | -| approx_kl | 0.008020305 | -| clip_fraction | 0.0469 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 146870 | -| policy_gradient_loss | -0.00108 | -| std | 0.01 | -| value_loss | 5.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14689 | -| time_elapsed | 77935 | -| total_timesteps | 1880192 | -| train/ | | -| approx_kl | 0.008750193 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.457 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 146880 | -| policy_gradient_loss | -0.0127 | -| std | 0.00999 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14690 | -| time_elapsed | 77940 | -| total_timesteps | 1880320 | -| train/ | | -| approx_kl | 0.066452615 | -| clip_fraction | 0.558 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0978 | -| learning_rate | 0.0003 | -| loss | 0.0422 | -| n_updates | 146890 | -| policy_gradient_loss | 0.056 | -| std | 0.00999 | -| value_loss | 5.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14691 | -| time_elapsed | 77945 | -| total_timesteps | 1880448 | -| train/ | | -| approx_kl | 0.01348683 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -3.24 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 146900 | -| policy_gradient_loss | 0.000806 | -| std | 0.00999 | -| value_loss | 8.8e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14692 | -| time_elapsed | 77951 | -| total_timesteps | 1880576 | -| train/ | | -| approx_kl | 0.018403709 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.854 | -| learning_rate | 0.0003 | -| loss | -0.00819 | -| n_updates | 146910 | -| policy_gradient_loss | 0.00045 | -| std | 0.01 | -| value_loss | 2.74e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14693 | -| time_elapsed | 77955 | -| total_timesteps | 1880704 | -| train/ | | -| approx_kl | 0.0065739923 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 146920 | -| policy_gradient_loss | 0.00468 | -| std | 0.00999 | -| value_loss | 1.61e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14694 | -| time_elapsed | 77960 | -| total_timesteps | 1880832 | -| train/ | | -| approx_kl | 0.028040618 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0993 | -| learning_rate | 0.0003 | -| loss | 0.00377 | -| n_updates | 146930 | -| policy_gradient_loss | 0.00569 | -| std | 0.01 | -| value_loss | 1.52e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14695 | -| time_elapsed | 77965 | -| total_timesteps | 1880960 | -| train/ | | -| approx_kl | 0.003061309 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 146940 | -| policy_gradient_loss | -0.00265 | -| std | 0.01 | -| value_loss | 5.72e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14696 | -| time_elapsed | 77969 | -| total_timesteps | 1881088 | -| train/ | | -| approx_kl | 0.12793429 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.00736 | -| learning_rate | 0.0003 | -| loss | 0.0788 | -| n_updates | 146950 | -| policy_gradient_loss | 0.0152 | -| std | 0.01 | -| value_loss | 1.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14697 | -| time_elapsed | 77977 | -| total_timesteps | 1881216 | -| train/ | | -| approx_kl | 0.006700426 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 146960 | -| policy_gradient_loss | 0.00329 | -| std | 0.0101 | -| value_loss | 0.000785 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14698 | -| time_elapsed | 77981 | -| total_timesteps | 1881344 | -| train/ | | -| approx_kl | 0.14745602 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 146970 | -| policy_gradient_loss | 0.0829 | -| std | 0.0101 | -| value_loss | 1.92e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14699 | -| time_elapsed | 77986 | -| total_timesteps | 1881472 | -| train/ | | -| approx_kl | 0.016024403 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00488 | -| learning_rate | 0.0003 | -| loss | 0.00941 | -| n_updates | 146980 | -| policy_gradient_loss | 0.00879 | -| std | 0.0101 | -| value_loss | 1.36e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14700 | -| time_elapsed | 77991 | -| total_timesteps | 1881600 | -| train/ | | -| approx_kl | 0.273439 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 146990 | -| policy_gradient_loss | 0.0357 | -| std | 0.0101 | -| value_loss | 1.23e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14701 | -| time_elapsed | 77995 | -| total_timesteps | 1881728 | -| train/ | | -| approx_kl | 0.01864284 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.00884 | -| learning_rate | 0.0003 | -| loss | -0.00707 | -| n_updates | 147000 | -| policy_gradient_loss | -0.00254 | -| std | 0.0101 | -| value_loss | 6.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14702 | -| time_elapsed | 77999 | -| total_timesteps | 1881856 | -| train/ | | -| approx_kl | 0.019160789 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 147010 | -| policy_gradient_loss | 0.000243 | -| std | 0.0101 | -| value_loss | 4.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14703 | -| time_elapsed | 78004 | -| total_timesteps | 1881984 | -| train/ | | -| approx_kl | 0.018395009 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 147020 | -| policy_gradient_loss | -0.00908 | -| std | 0.0101 | -| value_loss | 3.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14704 | -| time_elapsed | 78009 | -| total_timesteps | 1882112 | -| train/ | | -| approx_kl | 0.019582167 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 147030 | -| policy_gradient_loss | 0.00532 | -| std | 0.0101 | -| value_loss | 2.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14705 | -| time_elapsed | 78022 | -| total_timesteps | 1882240 | -| train/ | | -| approx_kl | 0.014493972 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.852 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 147040 | -| policy_gradient_loss | -0.00858 | -| std | 0.0101 | -| value_loss | 0.000521 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14706 | -| time_elapsed | 78028 | -| total_timesteps | 1882368 | -| train/ | | -| approx_kl | 0.04910285 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0384 | -| n_updates | 147050 | -| policy_gradient_loss | 0.0544 | -| std | 0.0101 | -| value_loss | 1.46e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14707 | -| time_elapsed | 78033 | -| total_timesteps | 1882496 | -| train/ | | -| approx_kl | 0.0663394 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 147060 | -| policy_gradient_loss | 0.0737 | -| std | 0.0101 | -| value_loss | 5.52e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14708 | -| time_elapsed | 78038 | -| total_timesteps | 1882624 | -| train/ | | -| approx_kl | 0.013628177 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 147070 | -| policy_gradient_loss | 0.00972 | -| std | 0.0101 | -| value_loss | 1.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14709 | -| time_elapsed | 78040 | -| total_timesteps | 1882752 | -| train/ | | -| approx_kl | 0.020139594 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0485 | -| n_updates | 147080 | -| policy_gradient_loss | -0.0072 | -| std | 0.0101 | -| value_loss | 1.21e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 24 | -| iterations | 14710 | -| time_elapsed | 78043 | -| total_timesteps | 1882880 | -| train/ | | -| approx_kl | 0.25509158 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 147090 | -| policy_gradient_loss | 0.0222 | -| std | 0.0101 | -| value_loss | 7.18e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14711 | -| time_elapsed | 78046 | -| total_timesteps | 1883008 | -| train/ | | -| approx_kl | 0.011330795 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 147100 | -| policy_gradient_loss | 0.000135 | -| std | 0.0101 | -| value_loss | 4.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14712 | -| time_elapsed | 78058 | -| total_timesteps | 1883136 | -| train/ | | -| approx_kl | 0.011267819 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.938 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 147110 | -| policy_gradient_loss | -0.0113 | -| std | 0.0101 | -| value_loss | 0.000345 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14713 | -| time_elapsed | 78062 | -| total_timesteps | 1883264 | -| train/ | | -| approx_kl | 0.038519435 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.0847 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 147120 | -| policy_gradient_loss | 0.0402 | -| std | 0.0101 | -| value_loss | 9.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14714 | -| time_elapsed | 78066 | -| total_timesteps | 1883392 | -| train/ | | -| approx_kl | 0.049753673 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00238 | -| learning_rate | 0.0003 | -| loss | 0.0889 | -| n_updates | 147130 | -| policy_gradient_loss | 0.0654 | -| std | 0.0101 | -| value_loss | 7.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14715 | -| time_elapsed | 78072 | -| total_timesteps | 1883520 | -| train/ | | -| approx_kl | 0.007295166 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.00845 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 147140 | -| policy_gradient_loss | 0.00624 | -| std | 0.0101 | -| value_loss | 2.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14716 | -| time_elapsed | 78077 | -| total_timesteps | 1883648 | -| train/ | | -| approx_kl | 0.0012396425 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.000167 | -| n_updates | 147150 | -| policy_gradient_loss | 0.00258 | -| std | 0.01 | -| value_loss | 1.34e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14717 | -| time_elapsed | 78081 | -| total_timesteps | 1883776 | -| train/ | | -| approx_kl | 0.044661403 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.0075 | -| learning_rate | 0.0003 | -| loss | 0.00699 | -| n_updates | 147160 | -| policy_gradient_loss | -0.00268 | -| std | 0.01 | -| value_loss | 1.99e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14718 | -| time_elapsed | 78086 | -| total_timesteps | 1883904 | -| train/ | | -| approx_kl | 0.10679747 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.0467 | -| n_updates | 147170 | -| policy_gradient_loss | 0.00679 | -| std | 0.01 | -| value_loss | 1.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14719 | -| time_elapsed | 78092 | -| total_timesteps | 1884032 | -| train/ | | -| approx_kl | 0.004754518 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -1.61e-05 | -| n_updates | 147180 | -| policy_gradient_loss | 0.0141 | -| std | 0.01 | -| value_loss | 1.17e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14720 | -| time_elapsed | 78101 | -| total_timesteps | 1884160 | -| train/ | | -| approx_kl | 0.1157209 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.569 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 147190 | -| policy_gradient_loss | 0.0606 | -| std | 0.01 | -| value_loss | 0.0119 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14721 | -| time_elapsed | 78105 | -| total_timesteps | 1884288 | -| train/ | | -| approx_kl | 0.01963497 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 147200 | -| policy_gradient_loss | 0.00858 | -| std | 0.01 | -| value_loss | 8.63e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14722 | -| time_elapsed | 78110 | -| total_timesteps | 1884416 | -| train/ | | -| approx_kl | 0.00056230044 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.18 | -| explained_variance | 0.00718 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 147210 | -| policy_gradient_loss | 0.00101 | -| std | 0.01 | -| value_loss | 9.04e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14723 | -| time_elapsed | 78115 | -| total_timesteps | 1884544 | -| train/ | | -| approx_kl | 0.07783088 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.0885 | -| n_updates | 147220 | -| policy_gradient_loss | 0.0676 | -| std | 0.01 | -| value_loss | 1.54e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14724 | -| time_elapsed | 78119 | -| total_timesteps | 1884672 | -| train/ | | -| approx_kl | 0.01413222 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.000645 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 147230 | -| policy_gradient_loss | 0.00747 | -| std | 0.01 | -| value_loss | 4.29e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14725 | -| time_elapsed | 78123 | -| total_timesteps | 1884800 | -| train/ | | -| approx_kl | 0.00062095514 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.000162 | -| n_updates | 147240 | -| policy_gradient_loss | 0.0115 | -| std | 0.01 | -| value_loss | 1.55e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 24 | -| iterations | 14726 | -| time_elapsed | 78128 | -| total_timesteps | 1884928 | -| train/ | | -| approx_kl | 0.26935256 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00747 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 147250 | -| policy_gradient_loss | 0.0355 | -| std | 0.00999 | -| value_loss | 0.000104 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14727 | -| time_elapsed | 78131 | -| total_timesteps | 1885056 | -| train/ | | -| approx_kl | 0.0040221633 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 147260 | -| policy_gradient_loss | 0.00128 | -| std | 0.00998 | -| value_loss | 0.00022 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14728 | -| time_elapsed | 78139 | -| total_timesteps | 1885184 | -| train/ | | -| approx_kl | 0.02018485 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.688 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 147270 | -| policy_gradient_loss | 0.0185 | -| std | 0.00997 | -| value_loss | 0.00619 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14729 | -| time_elapsed | 78143 | -| total_timesteps | 1885312 | -| train/ | | -| approx_kl | 0.04694135 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.0438 | -| n_updates | 147280 | -| policy_gradient_loss | 0.0659 | -| std | 0.00997 | -| value_loss | 0.000102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14730 | -| time_elapsed | 78148 | -| total_timesteps | 1885440 | -| train/ | | -| approx_kl | 0.009137515 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00297 | -| learning_rate | 0.0003 | -| loss | 0.000923 | -| n_updates | 147290 | -| policy_gradient_loss | 0.00751 | -| std | 0.00997 | -| value_loss | 8.84e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14731 | -| time_elapsed | 78153 | -| total_timesteps | 1885568 | -| train/ | | -| approx_kl | 0.06618628 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 147300 | -| policy_gradient_loss | 0.00978 | -| std | 0.00997 | -| value_loss | 6.85e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14732 | -| time_elapsed | 78158 | -| total_timesteps | 1885696 | -| train/ | | -| approx_kl | 0.008578923 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 147310 | -| policy_gradient_loss | 0.013 | -| std | 0.00997 | -| value_loss | 4.66e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14733 | -| time_elapsed | 78163 | -| total_timesteps | 1885824 | -| train/ | | -| approx_kl | 0.1014503 | -| clip_fraction | 0.583 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0884 | -| n_updates | 147320 | -| policy_gradient_loss | 0.0727 | -| std | 0.00997 | -| value_loss | 3.4e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14734 | -| time_elapsed | 78167 | -| total_timesteps | 1885952 | -| train/ | | -| approx_kl | 0.019914633 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.00955 | -| n_updates | 147330 | -| policy_gradient_loss | 0.0063 | -| std | 0.00997 | -| value_loss | 2.82e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14735 | -| time_elapsed | 78171 | -| total_timesteps | 1886080 | -| train/ | | -| approx_kl | 0.0613864 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0417 | -| n_updates | 147340 | -| policy_gradient_loss | 0.00866 | -| std | 0.00997 | -| value_loss | 1.49e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14736 | -| time_elapsed | 78181 | -| total_timesteps | 1886208 | -| train/ | | -| approx_kl | 0.25942683 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.869 | -| learning_rate | 0.0003 | -| loss | 0.0332 | -| n_updates | 147350 | -| policy_gradient_loss | -0.000162 | -| std | 0.00998 | -| value_loss | 0.0011 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14737 | -| time_elapsed | 78186 | -| total_timesteps | 1886336 | -| train/ | | -| approx_kl | 0.010514402 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00589 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 147360 | -| policy_gradient_loss | -0.00379 | -| std | 0.00998 | -| value_loss | 7.67e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14738 | -| time_elapsed | 78190 | -| total_timesteps | 1886464 | -| train/ | | -| approx_kl | 3.6608893e-05 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.000874 | -| n_updates | 147370 | -| policy_gradient_loss | -0.00146 | -| std | 0.00998 | -| value_loss | 1.25e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14739 | -| time_elapsed | 78194 | -| total_timesteps | 1886592 | -| train/ | | -| approx_kl | 0.002458563 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | 2.64e-05 | -| n_updates | 147380 | -| policy_gradient_loss | 0.00198 | -| std | 0.00996 | -| value_loss | 2.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14740 | -| time_elapsed | 78200 | -| total_timesteps | 1886720 | -| train/ | | -| approx_kl | 0.027512072 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 147390 | -| policy_gradient_loss | 0.00774 | -| std | 0.00996 | -| value_loss | 1.93e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14741 | -| time_elapsed | 78205 | -| total_timesteps | 1886848 | -| train/ | | -| approx_kl | 0.017068103 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | 0.0048 | -| n_updates | 147400 | -| policy_gradient_loss | 0.0028 | -| std | 0.00995 | -| value_loss | 3.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 14742 | -| time_elapsed | 78210 | -| total_timesteps | 1886976 | -| train/ | | -| approx_kl | 0.03612952 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 147410 | -| policy_gradient_loss | 0.0145 | -| std | 0.00995 | -| value_loss | 2.18e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14743 | -| time_elapsed | 78215 | -| total_timesteps | 1887104 | -| train/ | | -| approx_kl | 0.04429827 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 147420 | -| policy_gradient_loss | 0.0241 | -| std | 0.00995 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14744 | -| time_elapsed | 78223 | -| total_timesteps | 1887232 | -| train/ | | -| approx_kl | 0.089793965 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | -0.00954 | -| n_updates | 147430 | -| policy_gradient_loss | -0.00543 | -| std | 0.00995 | -| value_loss | 0.0019 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14745 | -| time_elapsed | 78229 | -| total_timesteps | 1887360 | -| train/ | | -| approx_kl | 0.027625341 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0486 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 147440 | -| policy_gradient_loss | 0.0419 | -| std | 0.00995 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14746 | -| time_elapsed | 78234 | -| total_timesteps | 1887488 | -| train/ | | -| approx_kl | 0.045143735 | -| clip_fraction | 0.589 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 147450 | -| policy_gradient_loss | 0.0562 | -| std | 0.00995 | -| value_loss | 1.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14747 | -| time_elapsed | 78238 | -| total_timesteps | 1887616 | -| train/ | | -| approx_kl | 0.050243057 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 147460 | -| policy_gradient_loss | 0.0443 | -| std | 0.00995 | -| value_loss | 4.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14748 | -| time_elapsed | 78243 | -| total_timesteps | 1887744 | -| train/ | | -| approx_kl | 0.057140574 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | 0.0466 | -| n_updates | 147470 | -| policy_gradient_loss | 0.0451 | -| std | 0.00995 | -| value_loss | 3.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 14749 | -| time_elapsed | 78248 | -| total_timesteps | 1887872 | -| train/ | | -| approx_kl | 0.054324392 | -| clip_fraction | 0.563 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.0695 | -| n_updates | 147480 | -| policy_gradient_loss | 0.0639 | -| std | 0.00995 | -| value_loss | 2.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14750 | -| time_elapsed | 78253 | -| total_timesteps | 1888000 | -| train/ | | -| approx_kl | 0.048481837 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.043 | -| n_updates | 147490 | -| policy_gradient_loss | 0.0446 | -| std | 0.00995 | -| value_loss | 2.19e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14751 | -| time_elapsed | 78257 | -| total_timesteps | 1888128 | -| train/ | | -| approx_kl | 0.014461797 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00191 | -| learning_rate | 0.0003 | -| loss | -0.00796 | -| n_updates | 147500 | -| policy_gradient_loss | 0.00983 | -| std | 0.00995 | -| value_loss | 1.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14752 | -| time_elapsed | 78269 | -| total_timesteps | 1888256 | -| train/ | | -| approx_kl | 0.020651858 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 147510 | -| policy_gradient_loss | -0.00694 | -| std | 0.00995 | -| value_loss | 0.00174 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14753 | -| time_elapsed | 78275 | -| total_timesteps | 1888384 | -| train/ | | -| approx_kl | 0.0011405898 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0664 | -| learning_rate | 0.0003 | -| loss | -0.00083 | -| n_updates | 147520 | -| policy_gradient_loss | 0.00952 | -| std | 0.00995 | -| value_loss | 2.6e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14754 | -| time_elapsed | 78280 | -| total_timesteps | 1888512 | -| train/ | | -| approx_kl | 0.20656943 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00627 | -| learning_rate | 0.0003 | -| loss | 0.0952 | -| n_updates | 147530 | -| policy_gradient_loss | 0.0243 | -| std | 0.00996 | -| value_loss | 2.83e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14755 | -| time_elapsed | 78286 | -| total_timesteps | 1888640 | -| train/ | | -| approx_kl | 0.016768385 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0988 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 147540 | -| policy_gradient_loss | -0.00242 | -| std | 0.00996 | -| value_loss | 3.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14756 | -| time_elapsed | 78291 | -| total_timesteps | 1888768 | -| train/ | | -| approx_kl | 0.003354377 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00548 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 147550 | -| policy_gradient_loss | 0.00208 | -| std | 0.00996 | -| value_loss | 1.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 24 | -| iterations | 14757 | -| time_elapsed | 78296 | -| total_timesteps | 1888896 | -| train/ | | -| approx_kl | 0.013508055 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.00695 | -| n_updates | 147560 | -| policy_gradient_loss | 0.0627 | -| std | 0.00995 | -| value_loss | 1.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14758 | -| time_elapsed | 78300 | -| total_timesteps | 1889024 | -| train/ | | -| approx_kl | 0.03835533 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 147570 | -| policy_gradient_loss | 0.0513 | -| std | 0.00995 | -| value_loss | 8.41e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14759 | -| time_elapsed | 78311 | -| total_timesteps | 1889152 | -| train/ | | -| approx_kl | 0.05920948 | -| clip_fraction | 0.576 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.716 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 147580 | -| policy_gradient_loss | 0.0329 | -| std | 0.00995 | -| value_loss | 0.00502 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14760 | -| time_elapsed | 78315 | -| total_timesteps | 1889280 | -| train/ | | -| approx_kl | 0.015371786 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 147590 | -| policy_gradient_loss | 0.0075 | -| std | 0.00995 | -| value_loss | 1.34e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14761 | -| time_elapsed | 78319 | -| total_timesteps | 1889408 | -| train/ | | -| approx_kl | 0.00047380803 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.000595 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 147600 | -| policy_gradient_loss | 0.00188 | -| std | 0.00995 | -| value_loss | 2.12e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14762 | -| time_elapsed | 78324 | -| total_timesteps | 1889536 | -| train/ | | -| approx_kl | 0.08195944 | -| clip_fraction | 0.586 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0646 | -| n_updates | 147610 | -| policy_gradient_loss | 0.0718 | -| std | 0.00995 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14763 | -| time_elapsed | 78328 | -| total_timesteps | 1889664 | -| train/ | | -| approx_kl | 0.05673859 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.0623 | -| n_updates | 147620 | -| policy_gradient_loss | 0.0546 | -| std | 0.00995 | -| value_loss | 7.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14764 | -| time_elapsed | 78332 | -| total_timesteps | 1889792 | -| train/ | | -| approx_kl | 0.011986779 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.000735 | -| n_updates | 147630 | -| policy_gradient_loss | 0.0101 | -| std | 0.00995 | -| value_loss | 4.84e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14765 | -| time_elapsed | 78336 | -| total_timesteps | 1889920 | -| train/ | | -| approx_kl | 0.00029146764 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.000613 | -| n_updates | 147640 | -| policy_gradient_loss | 0.00235 | -| std | 0.00995 | -| value_loss | 3.6e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14766 | -| time_elapsed | 78342 | -| total_timesteps | 1890048 | -| train/ | | -| approx_kl | 0.023066152 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.00073 | -| n_updates | 147650 | -| policy_gradient_loss | 0.00985 | -| std | 0.00995 | -| value_loss | 2.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14767 | -| time_elapsed | 78354 | -| total_timesteps | 1890176 | -| train/ | | -| approx_kl | 0.11344363 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 147660 | -| policy_gradient_loss | 0.00799 | -| std | 0.00995 | -| value_loss | 0.00132 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14768 | -| time_elapsed | 78360 | -| total_timesteps | 1890304 | -| train/ | | -| approx_kl | 0.0004502288 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.000563 | -| n_updates | 147670 | -| policy_gradient_loss | 0.00358 | -| std | 0.00995 | -| value_loss | 3.61e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14769 | -| time_elapsed | 78364 | -| total_timesteps | 1890432 | -| train/ | | -| approx_kl | 0.032608803 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.00802 | -| n_updates | 147680 | -| policy_gradient_loss | 0.0321 | -| std | 0.00994 | -| value_loss | 9.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14770 | -| time_elapsed | 78369 | -| total_timesteps | 1890560 | -| train/ | | -| approx_kl | 0.11783253 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0489 | -| learning_rate | 0.0003 | -| loss | 0.06 | -| n_updates | 147690 | -| policy_gradient_loss | 0.0189 | -| std | 0.00994 | -| value_loss | 4.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14771 | -| time_elapsed | 78374 | -| total_timesteps | 1890688 | -| train/ | | -| approx_kl | 0.023803502 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 147700 | -| policy_gradient_loss | 0.0295 | -| std | 0.00995 | -| value_loss | 3.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14772 | -| time_elapsed | 78378 | -| total_timesteps | 1890816 | -| train/ | | -| approx_kl | 0.009480835 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.00537 | -| n_updates | 147710 | -| policy_gradient_loss | 0.00845 | -| std | 0.00995 | -| value_loss | 2.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 14773 | -| time_elapsed | 78383 | -| total_timesteps | 1890944 | -| train/ | | -| approx_kl | 0.07342488 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 147720 | -| policy_gradient_loss | 0.00266 | -| std | 0.00994 | -| value_loss | 1.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14774 | -| time_elapsed | 78389 | -| total_timesteps | 1891072 | -| train/ | | -| approx_kl | 0.029642915 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 147730 | -| policy_gradient_loss | 0.0188 | -| std | 0.00994 | -| value_loss | 8.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14775 | -| time_elapsed | 78397 | -| total_timesteps | 1891200 | -| train/ | | -| approx_kl | 0.012668673 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 147740 | -| policy_gradient_loss | -0.00377 | -| std | 0.00994 | -| value_loss | 0.000224 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14776 | -| time_elapsed | 78403 | -| total_timesteps | 1891328 | -| train/ | | -| approx_kl | 0.018558295 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00456 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 147750 | -| policy_gradient_loss | 0.00515 | -| std | 0.00994 | -| value_loss | 4.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14777 | -| time_elapsed | 78407 | -| total_timesteps | 1891456 | -| train/ | | -| approx_kl | 0.26163408 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0962 | -| n_updates | 147760 | -| policy_gradient_loss | 0.0207 | -| std | 0.00993 | -| value_loss | 1.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14778 | -| time_elapsed | 78412 | -| total_timesteps | 1891584 | -| train/ | | -| approx_kl | 0.05383686 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 147770 | -| policy_gradient_loss | 0.0241 | -| std | 0.00996 | -| value_loss | 3.75e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14779 | -| time_elapsed | 78416 | -| total_timesteps | 1891712 | -| train/ | | -| approx_kl | 0.0031337775 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00522 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 147780 | -| policy_gradient_loss | 0.00658 | -| std | 0.00997 | -| value_loss | 1.76e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14780 | -| time_elapsed | 78421 | -| total_timesteps | 1891840 | -| train/ | | -| approx_kl | 0.012219467 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00909 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 147790 | -| policy_gradient_loss | 0.0186 | -| std | 0.00998 | -| value_loss | 1.75e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14781 | -| time_elapsed | 78426 | -| total_timesteps | 1891968 | -| train/ | | -| approx_kl | 0.37148464 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 147800 | -| policy_gradient_loss | 0.106 | -| std | 0.00998 | -| value_loss | 2.65e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14782 | -| time_elapsed | 78430 | -| total_timesteps | 1892096 | -| train/ | | -| approx_kl | 0.012348838 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00112 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 147810 | -| policy_gradient_loss | -0.00246 | -| std | 0.00998 | -| value_loss | 1.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14783 | -| time_elapsed | 78438 | -| total_timesteps | 1892224 | -| train/ | | -| approx_kl | 0.06673103 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.682 | -| learning_rate | 0.0003 | -| loss | 0.000974 | -| n_updates | 147820 | -| policy_gradient_loss | -0.00656 | -| std | 0.00997 | -| value_loss | 0.0069 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14784 | -| time_elapsed | 78443 | -| total_timesteps | 1892352 | -| train/ | | -| approx_kl | 0.046361174 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 147830 | -| policy_gradient_loss | 0.0124 | -| std | 0.00997 | -| value_loss | 4.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14785 | -| time_elapsed | 78448 | -| total_timesteps | 1892480 | -| train/ | | -| approx_kl | 0.047458038 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00496 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 147840 | -| policy_gradient_loss | 0.014 | -| std | 0.00997 | -| value_loss | 4.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14786 | -| time_elapsed | 78452 | -| total_timesteps | 1892608 | -| train/ | | -| approx_kl | 0.10286021 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 147850 | -| policy_gradient_loss | -0.00119 | -| std | 0.00997 | -| value_loss | 8.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14787 | -| time_elapsed | 78457 | -| total_timesteps | 1892736 | -| train/ | | -| approx_kl | 0.04114682 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00249 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 147860 | -| policy_gradient_loss | 0.00914 | -| std | 0.00997 | -| value_loss | 2.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14788 | -| time_elapsed | 78461 | -| total_timesteps | 1892864 | -| train/ | | -| approx_kl | 0.017811403 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 147870 | -| policy_gradient_loss | 0.00968 | -| std | 0.00998 | -| value_loss | 1.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 14789 | -| time_elapsed | 78465 | -| total_timesteps | 1892992 | -| train/ | | -| approx_kl | 0.055844255 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 147880 | -| policy_gradient_loss | 0.012 | -| std | 0.00998 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14790 | -| time_elapsed | 78469 | -| total_timesteps | 1893120 | -| train/ | | -| approx_kl | 0.061347358 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 147890 | -| policy_gradient_loss | -0.00537 | -| std | 0.00998 | -| value_loss | 8.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14791 | -| time_elapsed | 78479 | -| total_timesteps | 1893248 | -| train/ | | -| approx_kl | 0.040013086 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 147900 | -| policy_gradient_loss | -0.0169 | -| std | 0.00998 | -| value_loss | 0.00181 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14792 | -| time_elapsed | 78484 | -| total_timesteps | 1893376 | -| train/ | | -| approx_kl | 0.03571545 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 147910 | -| policy_gradient_loss | 0.019 | -| std | 0.00998 | -| value_loss | 3.57e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14793 | -| time_elapsed | 78488 | -| total_timesteps | 1893504 | -| train/ | | -| approx_kl | 0.122255854 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 147920 | -| policy_gradient_loss | 0.076 | -| std | 0.00999 | -| value_loss | 3.55e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14794 | -| time_elapsed | 78493 | -| total_timesteps | 1893632 | -| train/ | | -| approx_kl | 0.08784617 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.539 | -| learning_rate | 0.0003 | -| loss | 0.0546 | -| n_updates | 147930 | -| policy_gradient_loss | 0.059 | -| std | 0.00999 | -| value_loss | 9.05e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14795 | -| time_elapsed | 78497 | -| total_timesteps | 1893760 | -| train/ | | -| approx_kl | 0.052924402 | -| clip_fraction | 0.576 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 147940 | -| policy_gradient_loss | 0.0531 | -| std | 0.01 | -| value_loss | 5.33e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 14796 | -| time_elapsed | 78501 | -| total_timesteps | 1893888 | -| train/ | | -| approx_kl | 0.0636462 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0828 | -| learning_rate | 0.0003 | -| loss | 0.0704 | -| n_updates | 147950 | -| policy_gradient_loss | 0.0643 | -| std | 0.01 | -| value_loss | 4.45e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14797 | -| time_elapsed | 78505 | -| total_timesteps | 1894016 | -| train/ | | -| approx_kl | 0.05803196 | -| clip_fraction | 0.593 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0753 | -| n_updates | 147960 | -| policy_gradient_loss | 0.105 | -| std | 0.01 | -| value_loss | 3.05e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14798 | -| time_elapsed | 78516 | -| total_timesteps | 1894144 | -| train/ | | -| approx_kl | 0.08501961 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.704 | -| learning_rate | 0.0003 | -| loss | 0.0668 | -| n_updates | 147970 | -| policy_gradient_loss | 0.0463 | -| std | 0.01 | -| value_loss | 0.00518 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14799 | -| time_elapsed | 78521 | -| total_timesteps | 1894272 | -| train/ | | -| approx_kl | 0.02824932 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0195 | -| learning_rate | 0.0003 | -| loss | 0.000188 | -| n_updates | 147980 | -| policy_gradient_loss | 0.00984 | -| std | 0.01 | -| value_loss | 0.00172 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14800 | -| time_elapsed | 78527 | -| total_timesteps | 1894400 | -| train/ | | -| approx_kl | 0.0011673812 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00279 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 147990 | -| policy_gradient_loss | 0.00298 | -| std | 0.01 | -| value_loss | 1.58e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14801 | -| time_elapsed | 78531 | -| total_timesteps | 1894528 | -| train/ | | -| approx_kl | 0.054913454 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 148000 | -| policy_gradient_loss | 0.0545 | -| std | 0.01 | -| value_loss | 7.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14802 | -| time_elapsed | 78536 | -| total_timesteps | 1894656 | -| train/ | | -| approx_kl | 0.012079497 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | 0.00288 | -| n_updates | 148010 | -| policy_gradient_loss | 0.0074 | -| std | 0.01 | -| value_loss | 1.24e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14803 | -| time_elapsed | 78541 | -| total_timesteps | 1894784 | -| train/ | | -| approx_kl | 0.0003815284 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.00195 | -| n_updates | 148020 | -| policy_gradient_loss | 0.000518 | -| std | 0.01 | -| value_loss | 2.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 14804 | -| time_elapsed | 78545 | -| total_timesteps | 1894912 | -| train/ | | -| approx_kl | 0.018708909 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 148030 | -| policy_gradient_loss | 0.00463 | -| std | 0.01 | -| value_loss | 2.35e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14805 | -| time_elapsed | 78549 | -| total_timesteps | 1895040 | -| train/ | | -| approx_kl | 0.0010596379 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | -0.000206 | -| n_updates | 148040 | -| policy_gradient_loss | 0.0147 | -| std | 0.00999 | -| value_loss | 5.85e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14806 | -| time_elapsed | 78560 | -| total_timesteps | 1895168 | -| train/ | | -| approx_kl | 0.001989963 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -2.7 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 148050 | -| policy_gradient_loss | -0.0104 | -| std | 0.00996 | -| value_loss | 0.00196 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14807 | -| time_elapsed | 78565 | -| total_timesteps | 1895296 | -| train/ | | -| approx_kl | 0.15034877 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | 0.0601 | -| n_updates | 148060 | -| policy_gradient_loss | 0.0557 | -| std | 0.00996 | -| value_loss | 0.000179 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14808 | -| time_elapsed | 78569 | -| total_timesteps | 1895424 | -| train/ | | -| approx_kl | 0.023345254 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 148070 | -| policy_gradient_loss | 0.00778 | -| std | 0.00996 | -| value_loss | 7e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14809 | -| time_elapsed | 78573 | -| total_timesteps | 1895552 | -| train/ | | -| approx_kl | 0.0009803595 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.000301 | -| learning_rate | 0.0003 | -| loss | 0.00459 | -| n_updates | 148080 | -| policy_gradient_loss | -0.000247 | -| std | 0.00995 | -| value_loss | 2.21e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14810 | -| time_elapsed | 78578 | -| total_timesteps | 1895680 | -| train/ | | -| approx_kl | 0.019222675 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 148090 | -| policy_gradient_loss | 0.00583 | -| std | 0.00995 | -| value_loss | 1.35e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14811 | -| time_elapsed | 78583 | -| total_timesteps | 1895808 | -| train/ | | -| approx_kl | 0.29007885 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 148100 | -| policy_gradient_loss | 0.0315 | -| std | 0.00995 | -| value_loss | 8.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14812 | -| time_elapsed | 78589 | -| total_timesteps | 1895936 | -| train/ | | -| approx_kl | 0.015778458 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 148110 | -| policy_gradient_loss | -0.00146 | -| std | 0.00995 | -| value_loss | 6.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14813 | -| time_elapsed | 78593 | -| total_timesteps | 1896064 | -| train/ | | -| approx_kl | 0.02123128 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00527 | -| n_updates | 148120 | -| policy_gradient_loss | -0.00302 | -| std | 0.00995 | -| value_loss | 4.49e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14814 | -| time_elapsed | 78599 | -| total_timesteps | 1896192 | -| train/ | | -| approx_kl | 0.0054539507 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.729 | -| learning_rate | 0.0003 | -| loss | -0.000753 | -| n_updates | 148130 | -| policy_gradient_loss | -0.00148 | -| std | 0.00995 | -| value_loss | 0.00428 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14815 | -| time_elapsed | 78604 | -| total_timesteps | 1896320 | -| train/ | | -| approx_kl | 0.010571041 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00022 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 148140 | -| policy_gradient_loss | 0.00148 | -| std | 0.00995 | -| value_loss | 2.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14816 | -| time_elapsed | 78609 | -| total_timesteps | 1896448 | -| train/ | | -| approx_kl | 0.049248412 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0087 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 148150 | -| policy_gradient_loss | -0.0105 | -| std | 0.00995 | -| value_loss | 3.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14817 | -| time_elapsed | 78615 | -| total_timesteps | 1896576 | -| train/ | | -| approx_kl | 0.12797834 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.044 | -| n_updates | 148160 | -| policy_gradient_loss | 0.00454 | -| std | 0.00995 | -| value_loss | 2.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14818 | -| time_elapsed | 78619 | -| total_timesteps | 1896704 | -| train/ | | -| approx_kl | 0.09948816 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.0499 | -| n_updates | 148170 | -| policy_gradient_loss | 0.0213 | -| std | 0.00995 | -| value_loss | 2.61e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14819 | -| time_elapsed | 78623 | -| total_timesteps | 1896832 | -| train/ | | -| approx_kl | 0.030632293 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 148180 | -| policy_gradient_loss | -6.16e-05 | -| std | 0.00996 | -| value_loss | 1.67e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14820 | -| time_elapsed | 78627 | -| total_timesteps | 1896960 | -| train/ | | -| approx_kl | 0.14143915 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00765 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 148190 | -| policy_gradient_loss | 0.07 | -| std | 0.00996 | -| value_loss | 1.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14821 | -| time_elapsed | 78631 | -| total_timesteps | 1897088 | -| train/ | | -| approx_kl | 0.091754824 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.0694 | -| n_updates | 148200 | -| policy_gradient_loss | 0.085 | -| std | 0.00996 | -| value_loss | 6.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14822 | -| time_elapsed | 78640 | -| total_timesteps | 1897216 | -| train/ | | -| approx_kl | 0.10886808 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 148210 | -| policy_gradient_loss | 0.0264 | -| std | 0.00996 | -| value_loss | 0.0049 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14823 | -| time_elapsed | 78645 | -| total_timesteps | 1897344 | -| train/ | | -| approx_kl | 0.03071727 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00476 | -| learning_rate | 0.0003 | -| loss | 0.0091 | -| n_updates | 148220 | -| policy_gradient_loss | 0.0103 | -| std | 0.00996 | -| value_loss | 1.72e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14824 | -| time_elapsed | 78650 | -| total_timesteps | 1897472 | -| train/ | | -| approx_kl | 0.3117024 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0027 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 148230 | -| policy_gradient_loss | 0.037 | -| std | 0.00996 | -| value_loss | 2.22e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14825 | -| time_elapsed | 78655 | -| total_timesteps | 1897600 | -| train/ | | -| approx_kl | 0.005332275 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 148240 | -| policy_gradient_loss | -0.00736 | -| std | 0.00995 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14826 | -| time_elapsed | 78659 | -| total_timesteps | 1897728 | -| train/ | | -| approx_kl | 0.0033348133 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 148250 | -| policy_gradient_loss | -0.0132 | -| std | 0.00995 | -| value_loss | 7.4e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14827 | -| time_elapsed | 78663 | -| total_timesteps | 1897856 | -| train/ | | -| approx_kl | 0.04306844 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00305 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 148260 | -| policy_gradient_loss | 0.0165 | -| std | 0.00995 | -| value_loss | 1.21e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 24 | -| iterations | 14828 | -| time_elapsed | 78669 | -| total_timesteps | 1897984 | -| train/ | | -| approx_kl | 0.050415263 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 148270 | -| policy_gradient_loss | 0.0231 | -| std | 0.00995 | -| value_loss | 4.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14829 | -| time_elapsed | 78675 | -| total_timesteps | 1898112 | -| train/ | | -| approx_kl | 0.18773425 | -| clip_fraction | 0.636 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 148280 | -| policy_gradient_loss | 0.0934 | -| std | 0.00996 | -| value_loss | 2.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14830 | -| time_elapsed | 78687 | -| total_timesteps | 1898240 | -| train/ | | -| approx_kl | 0.018214079 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | -0.03 | -| n_updates | 148290 | -| policy_gradient_loss | -0.0157 | -| std | 0.00996 | -| value_loss | 0.00135 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14831 | -| time_elapsed | 78692 | -| total_timesteps | 1898368 | -| train/ | | -| approx_kl | 0.012135029 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0027 | -| learning_rate | 0.0003 | -| loss | 0.00522 | -| n_updates | 148300 | -| policy_gradient_loss | 0.00246 | -| std | 0.00996 | -| value_loss | 3.61e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14832 | -| time_elapsed | 78696 | -| total_timesteps | 1898496 | -| train/ | | -| approx_kl | 0.0018985649 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0745 | -| learning_rate | 0.0003 | -| loss | -0.00802 | -| n_updates | 148310 | -| policy_gradient_loss | -0.00459 | -| std | 0.00996 | -| value_loss | 7.65e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14833 | -| time_elapsed | 78700 | -| total_timesteps | 1898624 | -| train/ | | -| approx_kl | 0.028660549 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0653 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 148320 | -| policy_gradient_loss | 0.03 | -| std | 0.00997 | -| value_loss | 4.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14834 | -| time_elapsed | 78705 | -| total_timesteps | 1898752 | -| train/ | | -| approx_kl | 0.010882871 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 148330 | -| policy_gradient_loss | 0.00359 | -| std | 0.00997 | -| value_loss | 3.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 24 | -| iterations | 14835 | -| time_elapsed | 78710 | -| total_timesteps | 1898880 | -| train/ | | -| approx_kl | 0.018074991 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 148340 | -| policy_gradient_loss | 0.0395 | -| std | 0.00997 | -| value_loss | 1.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14836 | -| time_elapsed | 78714 | -| total_timesteps | 1899008 | -| train/ | | -| approx_kl | 0.030139672 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 148350 | -| policy_gradient_loss | 0.00355 | -| std | 0.00997 | -| value_loss | 1.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14837 | -| time_elapsed | 78728 | -| total_timesteps | 1899136 | -| train/ | | -| approx_kl | 0.022685029 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.728 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 148360 | -| policy_gradient_loss | -0.00352 | -| std | 0.00997 | -| value_loss | 0.00507 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14838 | -| time_elapsed | 78733 | -| total_timesteps | 1899264 | -| train/ | | -| approx_kl | 0.006341359 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 148370 | -| policy_gradient_loss | 0.00293 | -| std | 0.00997 | -| value_loss | 0.00216 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14839 | -| time_elapsed | 78738 | -| total_timesteps | 1899392 | -| train/ | | -| approx_kl | 0.014444078 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.0025 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 148380 | -| policy_gradient_loss | 0.00975 | -| std | 0.00997 | -| value_loss | 6.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14840 | -| time_elapsed | 78743 | -| total_timesteps | 1899520 | -| train/ | | -| approx_kl | 0.010057006 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00403 | -| learning_rate | 0.0003 | -| loss | 0.00823 | -| n_updates | 148390 | -| policy_gradient_loss | 0.0105 | -| std | 0.00997 | -| value_loss | 7.47e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14841 | -| time_elapsed | 78748 | -| total_timesteps | 1899648 | -| train/ | | -| approx_kl | 0.0010446128 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 148400 | -| policy_gradient_loss | 0.0643 | -| std | 0.00998 | -| value_loss | 0.00107 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14842 | -| time_elapsed | 78752 | -| total_timesteps | 1899776 | -| train/ | | -| approx_kl | 0.05076921 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0456 | -| n_updates | 148410 | -| policy_gradient_loss | 0.098 | -| std | 0.00999 | -| value_loss | 0.000975 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 24 | -| iterations | 14843 | -| time_elapsed | 78758 | -| total_timesteps | 1899904 | -| train/ | | -| approx_kl | 0.040135704 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | 0.00222 | -| n_updates | 148420 | -| policy_gradient_loss | 0.00534 | -| std | 0.01 | -| value_loss | 9.67e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14844 | -| time_elapsed | 78762 | -| total_timesteps | 1900032 | -| train/ | | -| approx_kl | 0.016643655 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.00248 | -| n_updates | 148430 | -| policy_gradient_loss | 0.0105 | -| std | 0.01 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14845 | -| time_elapsed | 78772 | -| total_timesteps | 1900160 | -| train/ | | -| approx_kl | 0.0041849045 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.702 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 148440 | -| policy_gradient_loss | -0.0175 | -| std | 0.01 | -| value_loss | 0.00599 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14846 | -| time_elapsed | 78777 | -| total_timesteps | 1900288 | -| train/ | | -| approx_kl | 0.030418288 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0878 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 148450 | -| policy_gradient_loss | 0.0466 | -| std | 0.01 | -| value_loss | 5.81e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14847 | -| time_elapsed | 78782 | -| total_timesteps | 1900416 | -| train/ | | -| approx_kl | 0.10016018 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00559 | -| learning_rate | 0.0003 | -| loss | 0.057 | -| n_updates | 148460 | -| policy_gradient_loss | 0.0192 | -| std | 0.01 | -| value_loss | 1.85e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14848 | -| time_elapsed | 78789 | -| total_timesteps | 1900544 | -| train/ | | -| approx_kl | 0.027902514 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00744 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 148470 | -| policy_gradient_loss | 0.0356 | -| std | 0.01 | -| value_loss | 9.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14849 | -| time_elapsed | 78795 | -| total_timesteps | 1900672 | -| train/ | | -| approx_kl | 0.10239655 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0615 | -| n_updates | 148480 | -| policy_gradient_loss | 0.02 | -| std | 0.01 | -| value_loss | 5.69e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14850 | -| time_elapsed | 78800 | -| total_timesteps | 1900800 | -| train/ | | -| approx_kl | 0.00037019188 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 148490 | -| policy_gradient_loss | -0.000688 | -| std | 0.01 | -| value_loss | 4.16e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14851 | -| time_elapsed | 78804 | -| total_timesteps | 1900928 | -| train/ | | -| approx_kl | 7.772353e-06 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.000143 | -| n_updates | 148500 | -| policy_gradient_loss | 0.00292 | -| std | 0.01 | -| value_loss | 2.53e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14852 | -| time_elapsed | 78808 | -| total_timesteps | 1901056 | -| train/ | | -| approx_kl | 7.917965e-05 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.000402 | -| n_updates | 148510 | -| policy_gradient_loss | 0.00426 | -| std | 0.01 | -| value_loss | 1.61e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14853 | -| time_elapsed | 78817 | -| total_timesteps | 1901184 | -| train/ | | -| approx_kl | 0.10411187 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.888 | -| learning_rate | 0.0003 | -| loss | 0.00568 | -| n_updates | 148520 | -| policy_gradient_loss | -0.00889 | -| std | 0.01 | -| value_loss | 0.00104 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14854 | -| time_elapsed | 78822 | -| total_timesteps | 1901312 | -| train/ | | -| approx_kl | 0.06451829 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00402 | -| learning_rate | 0.0003 | -| loss | 0.0489 | -| n_updates | 148530 | -| policy_gradient_loss | 0.00772 | -| std | 0.01 | -| value_loss | 1.79e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14855 | -| time_elapsed | 78827 | -| total_timesteps | 1901440 | -| train/ | | -| approx_kl | 0.021600103 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 148540 | -| policy_gradient_loss | -0.00142 | -| std | 0.01 | -| value_loss | 3.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14856 | -| time_elapsed | 78831 | -| total_timesteps | 1901568 | -| train/ | | -| approx_kl | 0.057051983 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0359 | -| n_updates | 148550 | -| policy_gradient_loss | 0.0172 | -| std | 0.01 | -| value_loss | 3.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14857 | -| time_elapsed | 78834 | -| total_timesteps | 1901696 | -| train/ | | -| approx_kl | 0.13577005 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 148560 | -| policy_gradient_loss | 0.00565 | -| std | 0.01 | -| value_loss | 2.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14858 | -| time_elapsed | 78839 | -| total_timesteps | 1901824 | -| train/ | | -| approx_kl | 0.03710684 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 148570 | -| policy_gradient_loss | 0.0153 | -| std | 0.01 | -| value_loss | 1.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 14859 | -| time_elapsed | 78843 | -| total_timesteps | 1901952 | -| train/ | | -| approx_kl | 0.050199177 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 148580 | -| policy_gradient_loss | 0.0167 | -| std | 0.01 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14860 | -| time_elapsed | 78849 | -| total_timesteps | 1902080 | -| train/ | | -| approx_kl | 0.06971747 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 148590 | -| policy_gradient_loss | 0.00468 | -| std | 0.01 | -| value_loss | 7.75e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14861 | -| time_elapsed | 78858 | -| total_timesteps | 1902208 | -| train/ | | -| approx_kl | 0.07436493 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 148600 | -| policy_gradient_loss | -0.0162 | -| std | 0.01 | -| value_loss | 0.00181 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14862 | -| time_elapsed | 78862 | -| total_timesteps | 1902336 | -| train/ | | -| approx_kl | 0.053607795 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -5.29 | -| learning_rate | 0.0003 | -| loss | 0.00953 | -| n_updates | 148610 | -| policy_gradient_loss | 0.00709 | -| std | 0.01 | -| value_loss | 2.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14863 | -| time_elapsed | 78866 | -| total_timesteps | 1902464 | -| train/ | | -| approx_kl | 0.008275241 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | 0.000755 | -| n_updates | 148620 | -| policy_gradient_loss | 0.00468 | -| std | 0.00997 | -| value_loss | 3.08e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14864 | -| time_elapsed | 78872 | -| total_timesteps | 1902592 | -| train/ | | -| approx_kl | 7.267762e-05 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | 0.000441 | -| n_updates | 148630 | -| policy_gradient_loss | -3.58e-05 | -| std | 0.00996 | -| value_loss | 8.73e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14865 | -| time_elapsed | 78876 | -| total_timesteps | 1902720 | -| train/ | | -| approx_kl | 0.0153814275 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.318 | -| learning_rate | 0.0003 | -| loss | 0.0082 | -| n_updates | 148640 | -| policy_gradient_loss | 0.00921 | -| std | 0.00993 | -| value_loss | 1.65e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14866 | -| time_elapsed | 78879 | -| total_timesteps | 1902848 | -| train/ | | -| approx_kl | 0.23230839 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00488 | -| learning_rate | 0.0003 | -| loss | 0.0936 | -| n_updates | 148650 | -| policy_gradient_loss | 0.0265 | -| std | 0.00991 | -| value_loss | 3.61e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 24 | -| iterations | 14867 | -| time_elapsed | 78884 | -| total_timesteps | 1902976 | -| train/ | | -| approx_kl | 0.014260028 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 148660 | -| policy_gradient_loss | 0.0012 | -| std | 0.00991 | -| value_loss | 1.84e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14868 | -| time_elapsed | 78888 | -| total_timesteps | 1903104 | -| train/ | | -| approx_kl | 0.00076518767 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 148670 | -| policy_gradient_loss | -0.00475 | -| std | 0.0099 | -| value_loss | 1.5e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14869 | -| time_elapsed | 78900 | -| total_timesteps | 1903232 | -| train/ | | -| approx_kl | 0.01051497 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.679 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 148680 | -| policy_gradient_loss | -0.0156 | -| std | 0.0099 | -| value_loss | 0.00756 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14870 | -| time_elapsed | 78904 | -| total_timesteps | 1903360 | -| train/ | | -| approx_kl | 0.0005433457 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 148690 | -| policy_gradient_loss | 0.00841 | -| std | 0.0099 | -| value_loss | 6.9e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14871 | -| time_elapsed | 78909 | -| total_timesteps | 1903488 | -| train/ | | -| approx_kl | 0.087184675 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.0496 | -| n_updates | 148700 | -| policy_gradient_loss | 0.0127 | -| std | 0.00989 | -| value_loss | 1.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14872 | -| time_elapsed | 78914 | -| total_timesteps | 1903616 | -| train/ | | -| approx_kl | 0.008258006 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 148710 | -| policy_gradient_loss | 0.00634 | -| std | 0.00989 | -| value_loss | 5.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14873 | -| time_elapsed | 78918 | -| total_timesteps | 1903744 | -| train/ | | -| approx_kl | 0.04871067 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 148720 | -| policy_gradient_loss | 0.0147 | -| std | 0.00989 | -| value_loss | 6.94e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14874 | -| time_elapsed | 78922 | -| total_timesteps | 1903872 | -| train/ | | -| approx_kl | 0.22780885 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 148730 | -| policy_gradient_loss | 0.0245 | -| std | 0.00989 | -| value_loss | 7.57e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14875 | -| time_elapsed | 78926 | -| total_timesteps | 1904000 | -| train/ | | -| approx_kl | 0.016396947 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.000175 | -| learning_rate | 0.0003 | -| loss | 0.00546 | -| n_updates | 148740 | -| policy_gradient_loss | 0.00367 | -| std | 0.00988 | -| value_loss | 1.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14876 | -| time_elapsed | 78931 | -| total_timesteps | 1904128 | -| train/ | | -| approx_kl | 0.022885934 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00335 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 148750 | -| policy_gradient_loss | 0.00798 | -| std | 0.00987 | -| value_loss | 7.8e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14877 | -| time_elapsed | 78942 | -| total_timesteps | 1904256 | -| train/ | | -| approx_kl | 0.0022664545 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.949 | -| learning_rate | 0.0003 | -| loss | -0.0251 | -| n_updates | 148760 | -| policy_gradient_loss | -0.0185 | -| std | 0.00986 | -| value_loss | 0.000364 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14878 | -| time_elapsed | 78948 | -| total_timesteps | 1904384 | -| train/ | | -| approx_kl | 0.020722035 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0013 | -| learning_rate | 0.0003 | -| loss | 0.00714 | -| n_updates | 148770 | -| policy_gradient_loss | 0.0224 | -| std | 0.00985 | -| value_loss | 2.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14879 | -| time_elapsed | 78952 | -| total_timesteps | 1904512 | -| train/ | | -| approx_kl | 0.062020775 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.0492 | -| n_updates | 148780 | -| policy_gradient_loss | 0.0301 | -| std | 0.00985 | -| value_loss | 4.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14880 | -| time_elapsed | 78956 | -| total_timesteps | 1904640 | -| train/ | | -| approx_kl | 0.014084509 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 148790 | -| policy_gradient_loss | 0.00629 | -| std | 0.00985 | -| value_loss | 6.28e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14881 | -| time_elapsed | 78960 | -| total_timesteps | 1904768 | -| train/ | | -| approx_kl | 0.06656094 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | 0.0668 | -| n_updates | 148800 | -| policy_gradient_loss | 0.0325 | -| std | 0.00985 | -| value_loss | 3.02e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 24 | -| iterations | 14882 | -| time_elapsed | 78963 | -| total_timesteps | 1904896 | -| train/ | | -| approx_kl | 0.016645899 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 148810 | -| policy_gradient_loss | 0.0163 | -| std | 0.00985 | -| value_loss | 2.06e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14883 | -| time_elapsed | 78966 | -| total_timesteps | 1905024 | -| train/ | | -| approx_kl | 0.4616128 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 148820 | -| policy_gradient_loss | 0.124 | -| std | 0.00985 | -| value_loss | 1.08e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14884 | -| time_elapsed | 78975 | -| total_timesteps | 1905152 | -| train/ | | -| approx_kl | 0.038557436 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.758 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 148830 | -| policy_gradient_loss | -0.0154 | -| std | 0.00985 | -| value_loss | 0.000592 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14885 | -| time_elapsed | 78981 | -| total_timesteps | 1905280 | -| train/ | | -| approx_kl | 0.06440998 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00063 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 148840 | -| policy_gradient_loss | 0.0121 | -| std | 0.00985 | -| value_loss | 5.37e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14886 | -| time_elapsed | 78984 | -| total_timesteps | 1905408 | -| train/ | | -| approx_kl | 0.17254767 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 148850 | -| policy_gradient_loss | 0.0824 | -| std | 0.00985 | -| value_loss | 8.82e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14887 | -| time_elapsed | 78987 | -| total_timesteps | 1905536 | -| train/ | | -| approx_kl | 0.07790908 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00646 | -| learning_rate | 0.0003 | -| loss | 0.0684 | -| n_updates | 148860 | -| policy_gradient_loss | 0.0709 | -| std | 0.00985 | -| value_loss | 6.99e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14888 | -| time_elapsed | 78991 | -| total_timesteps | 1905664 | -| train/ | | -| approx_kl | 0.07796505 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.000766 | -| learning_rate | 0.0003 | -| loss | 0.0715 | -| n_updates | 148870 | -| policy_gradient_loss | 0.0837 | -| std | 0.00985 | -| value_loss | 5.47e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14889 | -| time_elapsed | 78996 | -| total_timesteps | 1905792 | -| train/ | | -| approx_kl | 0.012136847 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00714 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 148880 | -| policy_gradient_loss | 0.00633 | -| std | 0.00985 | -| value_loss | 4.82e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 14890 | -| time_elapsed | 79002 | -| total_timesteps | 1905920 | -| train/ | | -| approx_kl | 0.28650582 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 148890 | -| policy_gradient_loss | 0.129 | -| std | 0.00985 | -| value_loss | 2.32e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14891 | -| time_elapsed | 79007 | -| total_timesteps | 1906048 | -| train/ | | -| approx_kl | 0.007743491 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 148900 | -| policy_gradient_loss | 0.0117 | -| std | 0.00985 | -| value_loss | 1.8e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14892 | -| time_elapsed | 79016 | -| total_timesteps | 1906176 | -| train/ | | -| approx_kl | 0.03425453 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.783 | -| learning_rate | 0.0003 | -| loss | 0.00548 | -| n_updates | 148910 | -| policy_gradient_loss | 0.00282 | -| std | 0.00985 | -| value_loss | 0.00382 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14893 | -| time_elapsed | 79021 | -| total_timesteps | 1906304 | -| train/ | | -| approx_kl | 0.22470357 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 148920 | -| policy_gradient_loss | 0.0259 | -| std | 0.00984 | -| value_loss | 1.23e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14894 | -| time_elapsed | 79027 | -| total_timesteps | 1906432 | -| train/ | | -| approx_kl | 0.016827377 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00823 | -| learning_rate | 0.0003 | -| loss | 0.00358 | -| n_updates | 148930 | -| policy_gradient_loss | 0.00242 | -| std | 0.00984 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14895 | -| time_elapsed | 79032 | -| total_timesteps | 1906560 | -| train/ | | -| approx_kl | 0.024235215 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 148940 | -| policy_gradient_loss | -0.00311 | -| std | 0.00985 | -| value_loss | 2.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14896 | -| time_elapsed | 79037 | -| total_timesteps | 1906688 | -| train/ | | -| approx_kl | 0.021835858 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -3.45e-05 | -| learning_rate | 0.0003 | -| loss | 0.000581 | -| n_updates | 148950 | -| policy_gradient_loss | 0.000366 | -| std | 0.00985 | -| value_loss | 9.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14897 | -| time_elapsed | 79041 | -| total_timesteps | 1906816 | -| train/ | | -| approx_kl | 0.002816449 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 148960 | -| policy_gradient_loss | 0.00039 | -| std | 0.00985 | -| value_loss | 7.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 24 | -| iterations | 14898 | -| time_elapsed | 79046 | -| total_timesteps | 1906944 | -| train/ | | -| approx_kl | 0.017302865 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 148970 | -| policy_gradient_loss | 0.0467 | -| std | 0.00985 | -| value_loss | 6.64e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14899 | -| time_elapsed | 79050 | -| total_timesteps | 1907072 | -| train/ | | -| approx_kl | 0.04502568 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 148980 | -| policy_gradient_loss | 0.0745 | -| std | 0.00984 | -| value_loss | 8.44e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14900 | -| time_elapsed | 79056 | -| total_timesteps | 1907200 | -| train/ | | -| approx_kl | 0.12608558 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 148990 | -| policy_gradient_loss | 0.0393 | -| std | 0.00984 | -| value_loss | 0.00625 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14901 | -| time_elapsed | 79060 | -| total_timesteps | 1907328 | -| train/ | | -| approx_kl | 0.08562566 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 149000 | -| policy_gradient_loss | 0.0709 | -| std | 0.00984 | -| value_loss | 2.71e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14902 | -| time_elapsed | 79065 | -| total_timesteps | 1907456 | -| train/ | | -| approx_kl | 0.017274253 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.0047 | -| learning_rate | 0.0003 | -| loss | 0.00416 | -| n_updates | 149010 | -| policy_gradient_loss | 0.0097 | -| std | 0.00984 | -| value_loss | 4.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14903 | -| time_elapsed | 79069 | -| total_timesteps | 1907584 | -| train/ | | -| approx_kl | 0.0003286586 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | 0.00272 | -| n_updates | 149020 | -| policy_gradient_loss | 5.09e-05 | -| std | 0.00984 | -| value_loss | 2.49e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14904 | -| time_elapsed | 79074 | -| total_timesteps | 1907712 | -| train/ | | -| approx_kl | 0.021093726 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | 0.00638 | -| n_updates | 149030 | -| policy_gradient_loss | 0.00853 | -| std | 0.00983 | -| value_loss | 4e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14905 | -| time_elapsed | 79079 | -| total_timesteps | 1907840 | -| train/ | | -| approx_kl | 0.00076915184 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 149040 | -| policy_gradient_loss | 0.00122 | -| std | 0.00983 | -| value_loss | 6.1e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 24 | -| iterations | 14906 | -| time_elapsed | 79084 | -| total_timesteps | 1907968 | -| train/ | | -| approx_kl | 0.018768398 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 149050 | -| policy_gradient_loss | 0.00441 | -| std | 0.00983 | -| value_loss | 3.76e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14907 | -| time_elapsed | 79089 | -| total_timesteps | 1908096 | -| train/ | | -| approx_kl | 0.00088648684 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 149060 | -| policy_gradient_loss | 0.0021 | -| std | 0.00982 | -| value_loss | 2.45e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14908 | -| time_elapsed | 79098 | -| total_timesteps | 1908224 | -| train/ | | -| approx_kl | 0.10267651 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.783 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 149070 | -| policy_gradient_loss | 0.023 | -| std | 0.00982 | -| value_loss | 0.00393 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14909 | -| time_elapsed | 79102 | -| total_timesteps | 1908352 | -| train/ | | -| approx_kl | 0.07318091 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | 0.0646 | -| n_updates | 149080 | -| policy_gradient_loss | 0.058 | -| std | 0.00982 | -| value_loss | 3.29e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14910 | -| time_elapsed | 79106 | -| total_timesteps | 1908480 | -| train/ | | -| approx_kl | 0.0727847 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00691 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 149090 | -| policy_gradient_loss | 0.0673 | -| std | 0.00982 | -| value_loss | 6.35e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14911 | -| time_elapsed | 79110 | -| total_timesteps | 1908608 | -| train/ | | -| approx_kl | 0.013724329 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00937 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 149100 | -| policy_gradient_loss | 0.01 | -| std | 0.00982 | -| value_loss | 3.3e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14912 | -| time_elapsed | 79115 | -| total_timesteps | 1908736 | -| train/ | | -| approx_kl | 0.00031723361 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 149110 | -| policy_gradient_loss | 0.00195 | -| std | 0.00982 | -| value_loss | 2.11e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14913 | -| time_elapsed | 79119 | -| total_timesteps | 1908864 | -| train/ | | -| approx_kl | 0.056637667 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0621 | -| n_updates | 149120 | -| policy_gradient_loss | 0.047 | -| std | 0.00982 | -| value_loss | 1.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 24 | -| iterations | 14914 | -| time_elapsed | 79122 | -| total_timesteps | 1908992 | -| train/ | | -| approx_kl | 0.06374339 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 149130 | -| policy_gradient_loss | 0.0713 | -| std | 0.00982 | -| value_loss | 1.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14915 | -| time_elapsed | 79126 | -| total_timesteps | 1909120 | -| train/ | | -| approx_kl | 0.06373744 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0606 | -| n_updates | 149140 | -| policy_gradient_loss | 0.0614 | -| std | 0.00983 | -| value_loss | 8.58e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14916 | -| time_elapsed | 79138 | -| total_timesteps | 1909248 | -| train/ | | -| approx_kl | 0.05887715 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 149150 | -| policy_gradient_loss | 0.0259 | -| std | 0.00983 | -| value_loss | 0.00158 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14917 | -| time_elapsed | 79144 | -| total_timesteps | 1909376 | -| train/ | | -| approx_kl | 0.026045827 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 149160 | -| policy_gradient_loss | 0.00272 | -| std | 0.00983 | -| value_loss | 7.85e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14918 | -| time_elapsed | 79150 | -| total_timesteps | 1909504 | -| train/ | | -| approx_kl | 0.25230098 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00135 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 149170 | -| policy_gradient_loss | 0.0309 | -| std | 0.00982 | -| value_loss | 1.36e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14919 | -| time_elapsed | 79157 | -| total_timesteps | 1909632 | -| train/ | | -| approx_kl | 0.0052226568 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.000534 | -| n_updates | 149180 | -| policy_gradient_loss | 0.0013 | -| std | 0.00983 | -| value_loss | 7.86e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14920 | -| time_elapsed | 79162 | -| total_timesteps | 1909760 | -| train/ | | -| approx_kl | 0.023262307 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00281 | -| learning_rate | 0.0003 | -| loss | 4.46e-05 | -| n_updates | 149190 | -| policy_gradient_loss | -0.00163 | -| std | 0.00984 | -| value_loss | 8.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 24 | -| iterations | 14921 | -| time_elapsed | 79167 | -| total_timesteps | 1909888 | -| train/ | | -| approx_kl | 0.0061087576 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00642 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 149200 | -| policy_gradient_loss | -0.00641 | -| std | 0.00985 | -| value_loss | 1.05e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14922 | -| time_elapsed | 79169 | -| total_timesteps | 1910016 | -| train/ | | -| approx_kl | 0.017996814 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 149210 | -| policy_gradient_loss | 0.00229 | -| std | 0.00985 | -| value_loss | 6.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14923 | -| time_elapsed | 79181 | -| total_timesteps | 1910144 | -| train/ | | -| approx_kl | 0.026630461 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 149220 | -| policy_gradient_loss | -0.0106 | -| std | 0.00984 | -| value_loss | 0.00011 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14924 | -| time_elapsed | 79186 | -| total_timesteps | 1910272 | -| train/ | | -| approx_kl | 0.006395779 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.0288 | -| learning_rate | 0.0003 | -| loss | -0.00468 | -| n_updates | 149230 | -| policy_gradient_loss | 0.0391 | -| std | 0.00984 | -| value_loss | 9.95e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14925 | -| time_elapsed | 79191 | -| total_timesteps | 1910400 | -| train/ | | -| approx_kl | 0.0057495707 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.000692 | -| n_updates | 149240 | -| policy_gradient_loss | 0.0156 | -| std | 0.00984 | -| value_loss | 4.25e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14926 | -| time_elapsed | 79195 | -| total_timesteps | 1910528 | -| train/ | | -| approx_kl | 0.016938385 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.00439 | -| n_updates | 149250 | -| policy_gradient_loss | 0.0225 | -| std | 0.00983 | -| value_loss | 4.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14927 | -| time_elapsed | 79199 | -| total_timesteps | 1910656 | -| train/ | | -| approx_kl | 0.009214805 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0078 | -| n_updates | 149260 | -| policy_gradient_loss | 0.0128 | -| std | 0.00983 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14928 | -| time_elapsed | 79203 | -| total_timesteps | 1910784 | -| train/ | | -| approx_kl | 0.011895468 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.00775 | -| n_updates | 149270 | -| policy_gradient_loss | 0.014 | -| std | 0.00983 | -| value_loss | 1.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 24 | -| iterations | 14929 | -| time_elapsed | 79208 | -| total_timesteps | 1910912 | -| train/ | | -| approx_kl | 0.03707855 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 149280 | -| policy_gradient_loss | 0.00278 | -| std | 0.00982 | -| value_loss | 5.25e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14930 | -| time_elapsed | 79214 | -| total_timesteps | 1911040 | -| train/ | | -| approx_kl | 0.029249325 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 149290 | -| policy_gradient_loss | 0.00512 | -| std | 0.00982 | -| value_loss | 3.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14931 | -| time_elapsed | 79223 | -| total_timesteps | 1911168 | -| train/ | | -| approx_kl | 0.009191007 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.000816 | -| n_updates | 149300 | -| policy_gradient_loss | 0.0222 | -| std | 0.00981 | -| value_loss | 0.00643 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14932 | -| time_elapsed | 79228 | -| total_timesteps | 1911296 | -| train/ | | -| approx_kl | 0.06612548 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 149310 | -| policy_gradient_loss | 0.109 | -| std | 0.00981 | -| value_loss | 2.86e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14933 | -| time_elapsed | 79234 | -| total_timesteps | 1911424 | -| train/ | | -| approx_kl | 0.046991587 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 149320 | -| policy_gradient_loss | 0.0171 | -| std | 0.0098 | -| value_loss | 4.31e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14934 | -| time_elapsed | 79238 | -| total_timesteps | 1911552 | -| train/ | | -| approx_kl | 0.06297581 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0896 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 149330 | -| policy_gradient_loss | 0.0191 | -| std | 0.0098 | -| value_loss | 2.5e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14935 | -| time_elapsed | 79243 | -| total_timesteps | 1911680 | -| train/ | | -| approx_kl | 0.085430816 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 149340 | -| policy_gradient_loss | 0.0124 | -| std | 0.0098 | -| value_loss | 1.66e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14936 | -| time_elapsed | 79247 | -| total_timesteps | 1911808 | -| train/ | | -| approx_kl | 0.11559905 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 149350 | -| policy_gradient_loss | 0.0211 | -| std | 0.0098 | -| value_loss | 1.49e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14937 | -| time_elapsed | 79251 | -| total_timesteps | 1911936 | -| train/ | | -| approx_kl | 0.045480065 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.00775 | -| n_updates | 149360 | -| policy_gradient_loss | 0.0133 | -| std | 0.0098 | -| value_loss | 1.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14938 | -| time_elapsed | 79255 | -| total_timesteps | 1912064 | -| train/ | | -| approx_kl | 0.14108525 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00587 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 149370 | -| policy_gradient_loss | 0.0771 | -| std | 0.0098 | -| value_loss | 6.7e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14939 | -| time_elapsed | 79266 | -| total_timesteps | 1912192 | -| train/ | | -| approx_kl | 0.07081132 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.0262 | -| n_updates | 149380 | -| policy_gradient_loss | -0.0145 | -| std | 0.0098 | -| value_loss | 0.000527 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14940 | -| time_elapsed | 79272 | -| total_timesteps | 1912320 | -| train/ | | -| approx_kl | 0.0029613352 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 149390 | -| policy_gradient_loss | -0.00319 | -| std | 0.0098 | -| value_loss | 1.47e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14941 | -| time_elapsed | 79278 | -| total_timesteps | 1912448 | -| train/ | | -| approx_kl | 1.4187768e-05 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00767 | -| learning_rate | 0.0003 | -| loss | 0.000126 | -| n_updates | 149400 | -| policy_gradient_loss | 0.0048 | -| std | 0.0098 | -| value_loss | 1.78e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14942 | -| time_elapsed | 79282 | -| total_timesteps | 1912576 | -| train/ | | -| approx_kl | 0.00012895279 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 149410 | -| policy_gradient_loss | -0.00226 | -| std | 0.00981 | -| value_loss | 1.29e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14943 | -| time_elapsed | 79286 | -| total_timesteps | 1912704 | -| train/ | | -| approx_kl | 0.031261694 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 149420 | -| policy_gradient_loss | 0.0324 | -| std | 0.00981 | -| value_loss | 8.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14944 | -| time_elapsed | 79290 | -| total_timesteps | 1912832 | -| train/ | | -| approx_kl | 0.009936726 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.000192 | -| n_updates | 149430 | -| policy_gradient_loss | 0.0123 | -| std | 0.00981 | -| value_loss | 4.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14945 | -| time_elapsed | 79294 | -| total_timesteps | 1912960 | -| train/ | | -| approx_kl | 0.013642781 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 149440 | -| policy_gradient_loss | 0.0288 | -| std | 0.00981 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14946 | -| time_elapsed | 79300 | -| total_timesteps | 1913088 | -| train/ | | -| approx_kl | 0.0025205472 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00597 | -| learning_rate | 0.0003 | -| loss | -0.000278 | -| n_updates | 149450 | -| policy_gradient_loss | 0.0447 | -| std | 0.00981 | -| value_loss | 1.58e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14947 | -| time_elapsed | 79310 | -| total_timesteps | 1913216 | -| train/ | | -| approx_kl | 0.021052368 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.763 | -| learning_rate | 0.0003 | -| loss | -0.00595 | -| n_updates | 149460 | -| policy_gradient_loss | -0.00292 | -| std | 0.0098 | -| value_loss | 0.00534 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14948 | -| time_elapsed | 79315 | -| total_timesteps | 1913344 | -| train/ | | -| approx_kl | 0.004657745 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 149470 | -| policy_gradient_loss | 0.0159 | -| std | 0.0098 | -| value_loss | 2.81e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14949 | -| time_elapsed | 79320 | -| total_timesteps | 1913472 | -| train/ | | -| approx_kl | 0.03957802 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 149480 | -| policy_gradient_loss | 0.0188 | -| std | 0.00979 | -| value_loss | 5.35e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14950 | -| time_elapsed | 79324 | -| total_timesteps | 1913600 | -| train/ | | -| approx_kl | 0.07801231 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.444 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 149490 | -| policy_gradient_loss | 0.0215 | -| std | 0.00979 | -| value_loss | 3.35e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14951 | -| time_elapsed | 79328 | -| total_timesteps | 1913728 | -| train/ | | -| approx_kl | 0.07260777 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 149500 | -| policy_gradient_loss | 0.00587 | -| std | 0.00979 | -| value_loss | 1.11e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14952 | -| time_elapsed | 79332 | -| total_timesteps | 1913856 | -| train/ | | -| approx_kl | 0.0007093074 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.000388 | -| n_updates | 149510 | -| policy_gradient_loss | 0.013 | -| std | 0.00979 | -| value_loss | 9.01e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 24 | -| iterations | 14953 | -| time_elapsed | 79336 | -| total_timesteps | 1913984 | -| train/ | | -| approx_kl | 0.00055302214 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 149520 | -| policy_gradient_loss | 0.000615 | -| std | 0.00978 | -| value_loss | 2.18e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14954 | -| time_elapsed | 79340 | -| total_timesteps | 1914112 | -| train/ | | -| approx_kl | 0.08890377 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0609 | -| n_updates | 149530 | -| policy_gradient_loss | 0.0836 | -| std | 0.00978 | -| value_loss | 1.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14955 | -| time_elapsed | 79353 | -| total_timesteps | 1914240 | -| train/ | | -| approx_kl | 0.027968157 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 149540 | -| policy_gradient_loss | -0.000521 | -| std | 0.00978 | -| value_loss | 0.00232 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14956 | -| time_elapsed | 79357 | -| total_timesteps | 1914368 | -| train/ | | -| approx_kl | 0.027274262 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.887 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 149550 | -| policy_gradient_loss | 0.00934 | -| std | 0.00979 | -| value_loss | 4.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14957 | -| time_elapsed | 79362 | -| total_timesteps | 1914496 | -| train/ | | -| approx_kl | 0.07116808 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 149560 | -| policy_gradient_loss | 0.0326 | -| std | 0.00979 | -| value_loss | 4.69e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14958 | -| time_elapsed | 79366 | -| total_timesteps | 1914624 | -| train/ | | -| approx_kl | 0.07181233 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00735 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 149570 | -| policy_gradient_loss | 0.00719 | -| std | 0.00979 | -| value_loss | 2.6e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14959 | -| time_elapsed | 79371 | -| total_timesteps | 1914752 | -| train/ | | -| approx_kl | 0.3082786 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00603 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 149580 | -| policy_gradient_loss | 0.0262 | -| std | 0.00979 | -| value_loss | 1.3e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 24 | -| iterations | 14960 | -| time_elapsed | 79376 | -| total_timesteps | 1914880 | -| train/ | | -| approx_kl | 0.019394914 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | -0.0307 | -| n_updates | 149590 | -| policy_gradient_loss | -0.0108 | -| std | 0.00979 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14961 | -| time_elapsed | 79381 | -| total_timesteps | 1915008 | -| train/ | | -| approx_kl | 0.024324566 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 149600 | -| policy_gradient_loss | 0.000843 | -| std | 0.0098 | -| value_loss | 6.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14962 | -| time_elapsed | 79394 | -| total_timesteps | 1915136 | -| train/ | | -| approx_kl | 0.063215606 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.778 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 149610 | -| policy_gradient_loss | -0.0157 | -| std | 0.0098 | -| value_loss | 0.00191 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14963 | -| time_elapsed | 79399 | -| total_timesteps | 1915264 | -| train/ | | -| approx_kl | 0.009707022 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.0253 | -| learning_rate | 0.0003 | -| loss | 0.00655 | -| n_updates | 149620 | -| policy_gradient_loss | 0.00898 | -| std | 0.00978 | -| value_loss | 0.00105 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14964 | -| time_elapsed | 79403 | -| total_timesteps | 1915392 | -| train/ | | -| approx_kl | 0.10333937 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 149630 | -| policy_gradient_loss | 0.0748 | -| std | 0.00978 | -| value_loss | 1.87e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14965 | -| time_elapsed | 79408 | -| total_timesteps | 1915520 | -| train/ | | -| approx_kl | 0.015731733 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00355 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 149640 | -| policy_gradient_loss | 0.00562 | -| std | 0.00977 | -| value_loss | 7.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14966 | -| time_elapsed | 79412 | -| total_timesteps | 1915648 | -| train/ | | -| approx_kl | 0.30792308 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 149650 | -| policy_gradient_loss | 0.0373 | -| std | 0.00977 | -| value_loss | 3.31e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14967 | -| time_elapsed | 79416 | -| total_timesteps | 1915776 | -| train/ | | -| approx_kl | 0.006616468 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 149660 | -| policy_gradient_loss | 0.00115 | -| std | 0.00976 | -| value_loss | 2.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14968 | -| time_elapsed | 79419 | -| total_timesteps | 1915904 | -| train/ | | -| approx_kl | 0.036926392 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 149670 | -| policy_gradient_loss | 0.00214 | -| std | 0.00976 | -| value_loss | 1.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14969 | -| time_elapsed | 79423 | -| total_timesteps | 1916032 | -| train/ | | -| approx_kl | 0.026262874 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | 0.00961 | -| n_updates | 149680 | -| policy_gradient_loss | 0.0305 | -| std | 0.00976 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14970 | -| time_elapsed | 79432 | -| total_timesteps | 1916160 | -| train/ | | -| approx_kl | 0.07364845 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 149690 | -| policy_gradient_loss | -0.0148 | -| std | 0.00975 | -| value_loss | 0.000214 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14971 | -| time_elapsed | 79436 | -| total_timesteps | 1916288 | -| train/ | | -| approx_kl | 0.1982262 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 149700 | -| policy_gradient_loss | 0.0889 | -| std | 0.00975 | -| value_loss | 3.84e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14972 | -| time_elapsed | 79441 | -| total_timesteps | 1916416 | -| train/ | | -| approx_kl | 0.10654439 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 149710 | -| policy_gradient_loss | 0.0818 | -| std | 0.00975 | -| value_loss | 1.44e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14973 | -| time_elapsed | 79446 | -| total_timesteps | 1916544 | -| train/ | | -| approx_kl | 0.096759036 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 149720 | -| policy_gradient_loss | 0.0962 | -| std | 0.00975 | -| value_loss | 1.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14974 | -| time_elapsed | 79451 | -| total_timesteps | 1916672 | -| train/ | | -| approx_kl | 0.084262885 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | 0.0834 | -| n_updates | 149730 | -| policy_gradient_loss | 0.0847 | -| std | 0.00975 | -| value_loss | 1.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14975 | -| time_elapsed | 79456 | -| total_timesteps | 1916800 | -| train/ | | -| approx_kl | 0.015123019 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 149740 | -| policy_gradient_loss | 0.0127 | -| std | 0.00976 | -| value_loss | 6.9e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 24 | -| iterations | 14976 | -| time_elapsed | 79461 | -| total_timesteps | 1916928 | -| train/ | | -| approx_kl | 0.27399898 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | 0.0915 | -| n_updates | 149750 | -| policy_gradient_loss | 0.028 | -| std | 0.00976 | -| value_loss | 4.41e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14977 | -| time_elapsed | 79467 | -| total_timesteps | 1917056 | -| train/ | | -| approx_kl | 0.023201667 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.00677 | -| n_updates | 149760 | -| policy_gradient_loss | 0.00377 | -| std | 0.00976 | -| value_loss | 2.76e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14978 | -| time_elapsed | 79479 | -| total_timesteps | 1917184 | -| train/ | | -| approx_kl | 0.36876494 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.0057 | -| n_updates | 149770 | -| policy_gradient_loss | -0.0101 | -| std | 0.00975 | -| value_loss | 0.0021 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14979 | -| time_elapsed | 79485 | -| total_timesteps | 1917312 | -| train/ | | -| approx_kl | 0.13971666 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 149780 | -| policy_gradient_loss | 0.017 | -| std | 0.00975 | -| value_loss | 4.78e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14980 | -| time_elapsed | 79491 | -| total_timesteps | 1917440 | -| train/ | | -| approx_kl | 0.1333682 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 149790 | -| policy_gradient_loss | 0.0513 | -| std | 0.00974 | -| value_loss | 3.99e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14981 | -| time_elapsed | 79498 | -| total_timesteps | 1917568 | -| train/ | | -| approx_kl | 0.00087747443 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.000954 | -| n_updates | 149800 | -| policy_gradient_loss | 0.00376 | -| std | 0.00975 | -| value_loss | 2.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14982 | -| time_elapsed | 79505 | -| total_timesteps | 1917696 | -| train/ | | -| approx_kl | 1.97161e-06 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | -4.14e-05 | -| n_updates | 149810 | -| policy_gradient_loss | 0.00547 | -| std | 0.00977 | -| value_loss | 3.99e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14983 | -| time_elapsed | 79511 | -| total_timesteps | 1917824 | -| train/ | | -| approx_kl | 0.00013809279 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.00085 | -| n_updates | 149820 | -| policy_gradient_loss | 0.00638 | -| std | 0.00977 | -| value_loss | 5.57e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 14984 | -| time_elapsed | 79516 | -| total_timesteps | 1917952 | -| train/ | | -| approx_kl | 5.107606e-05 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | -0.000359 | -| n_updates | 149830 | -| policy_gradient_loss | 0.00101 | -| std | 0.00977 | -| value_loss | 9.05e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14985 | -| time_elapsed | 79523 | -| total_timesteps | 1918080 | -| train/ | | -| approx_kl | 9.62317e-05 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 149840 | -| policy_gradient_loss | -0.000963 | -| std | 0.00977 | -| value_loss | 3.94e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14986 | -| time_elapsed | 79535 | -| total_timesteps | 1918208 | -| train/ | | -| approx_kl | 0.5576691 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00679 | -| learning_rate | 0.0003 | -| loss | -0.027 | -| n_updates | 149850 | -| policy_gradient_loss | -0.0209 | -| std | 0.00977 | -| value_loss | 0.00134 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14987 | -| time_elapsed | 79540 | -| total_timesteps | 1918336 | -| train/ | | -| approx_kl | 0.04014556 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -8.92 | -| learning_rate | 0.0003 | -| loss | 0.00902 | -| n_updates | 149860 | -| policy_gradient_loss | 0.00859 | -| std | 0.00976 | -| value_loss | 3.6e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14988 | -| time_elapsed | 79546 | -| total_timesteps | 1918464 | -| train/ | | -| approx_kl | 0.1289216 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -5.31 | -| learning_rate | 0.0003 | -| loss | 0.0957 | -| n_updates | 149870 | -| policy_gradient_loss | 0.0476 | -| std | 0.00976 | -| value_loss | 5.75e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14989 | -| time_elapsed | 79554 | -| total_timesteps | 1918592 | -| train/ | | -| approx_kl | 0.03824972 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 149880 | -| policy_gradient_loss | 0.0127 | -| std | 0.00976 | -| value_loss | 1.72e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14990 | -| time_elapsed | 79560 | -| total_timesteps | 1918720 | -| train/ | | -| approx_kl | 0.31461746 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 149890 | -| policy_gradient_loss | 0.0404 | -| std | 0.00976 | -| value_loss | 1.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14991 | -| time_elapsed | 79565 | -| total_timesteps | 1918848 | -| train/ | | -| approx_kl | 0.019713705 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.0083 | -| learning_rate | 0.0003 | -| loss | 0.000286 | -| n_updates | 149900 | -| policy_gradient_loss | 0.000915 | -| std | 0.00976 | -| value_loss | 5.75e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 14992 | -| time_elapsed | 79574 | -| total_timesteps | 1918976 | -| train/ | | -| approx_kl | 1.3491139e-05 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00875 | -| learning_rate | 0.0003 | -| loss | -0.000915 | -| n_updates | 149910 | -| policy_gradient_loss | -0.00525 | -| std | 0.00976 | -| value_loss | 3.86e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14993 | -| time_elapsed | 79580 | -| total_timesteps | 1919104 | -| train/ | | -| approx_kl | 0.021754615 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 149920 | -| policy_gradient_loss | -0.00853 | -| std | 0.00976 | -| value_loss | 2.4e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14994 | -| time_elapsed | 79597 | -| total_timesteps | 1919232 | -| train/ | | -| approx_kl | 0.15883859 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 149930 | -| policy_gradient_loss | -0.0165 | -| std | 0.00975 | -| value_loss | 0.000202 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14995 | -| time_elapsed | 79603 | -| total_timesteps | 1919360 | -| train/ | | -| approx_kl | 0.0052507226 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | -0.00848 | -| n_updates | 149940 | -| policy_gradient_loss | 0.00763 | -| std | 0.00975 | -| value_loss | 1.71e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14996 | -| time_elapsed | 79609 | -| total_timesteps | 1919488 | -| train/ | | -| approx_kl | 0.29527792 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 149950 | -| policy_gradient_loss | 0.0359 | -| std | 0.00976 | -| value_loss | 1.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14997 | -| time_elapsed | 79617 | -| total_timesteps | 1919616 | -| train/ | | -| approx_kl | 0.018227281 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00219 | -| learning_rate | 0.0003 | -| loss | -0.0076 | -| n_updates | 149960 | -| policy_gradient_loss | -0.00253 | -| std | 0.00976 | -| value_loss | 4.34e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14998 | -| time_elapsed | 79627 | -| total_timesteps | 1919744 | -| train/ | | -| approx_kl | 0.025866091 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00883 | -| learning_rate | 0.0003 | -| loss | -0.00813 | -| n_updates | 149970 | -| policy_gradient_loss | -0.00438 | -| std | 0.00977 | -| value_loss | 9.4e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 24 | -| iterations | 14999 | -| time_elapsed | 79636 | -| total_timesteps | 1919872 | -| train/ | | -| approx_kl | 0.0050877635 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00891 | -| learning_rate | 0.0003 | -| loss | -0.000748 | -| n_updates | 149980 | -| policy_gradient_loss | 0.0037 | -| std | 0.00977 | -| value_loss | 5.69e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15000 | -| time_elapsed | 79651 | -| total_timesteps | 1920000 | -| train/ | | -| approx_kl | 0.037322648 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.00479 | -| n_updates | 149990 | -| policy_gradient_loss | 0.0178 | -| std | 0.00977 | -| value_loss | 3.8e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15001 | -| time_elapsed | 79660 | -| total_timesteps | 1920128 | -| train/ | | -| approx_kl | 0.0477967 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00228 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 150000 | -| policy_gradient_loss | 0.0231 | -| std | 0.00978 | -| value_loss | 1.95e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15002 | -| time_elapsed | 79674 | -| total_timesteps | 1920256 | -| train/ | | -| approx_kl | 0.0010935552 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.689 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 150010 | -| policy_gradient_loss | 0.0043 | -| std | 0.00978 | -| value_loss | 0.00689 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15003 | -| time_elapsed | 79680 | -| total_timesteps | 1920384 | -| train/ | | -| approx_kl | 0.0035523726 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 150020 | -| policy_gradient_loss | -0.00179 | -| std | 0.00977 | -| value_loss | 2.36e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15004 | -| time_elapsed | 79687 | -| total_timesteps | 1920512 | -| train/ | | -| approx_kl | 0.12468647 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | 0.0774 | -| n_updates | 150030 | -| policy_gradient_loss | 0.0248 | -| std | 0.00977 | -| value_loss | 4.86e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15005 | -| time_elapsed | 79694 | -| total_timesteps | 1920640 | -| train/ | | -| approx_kl | 0.018035945 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 150040 | -| policy_gradient_loss | 0.0339 | -| std | 0.00983 | -| value_loss | 2.85e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15006 | -| time_elapsed | 79699 | -| total_timesteps | 1920768 | -| train/ | | -| approx_kl | 0.0030531678 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00815 | -| learning_rate | 0.0003 | -| loss | 0.00809 | -| n_updates | 150050 | -| policy_gradient_loss | 0.00881 | -| std | 0.00986 | -| value_loss | 6.16e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15007 | -| time_elapsed | 79705 | -| total_timesteps | 1920896 | -| train/ | | -| approx_kl | 0.09531789 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00417 | -| learning_rate | 0.0003 | -| loss | 0.0675 | -| n_updates | 150060 | -| policy_gradient_loss | 0.026 | -| std | 0.00987 | -| value_loss | 1.28e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15008 | -| time_elapsed | 79711 | -| total_timesteps | 1921024 | -| train/ | | -| approx_kl | 0.024808265 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 150070 | -| policy_gradient_loss | 0.0426 | -| std | 0.00987 | -| value_loss | 5.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15009 | -| time_elapsed | 79724 | -| total_timesteps | 1921152 | -| train/ | | -| approx_kl | 0.052978575 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 150080 | -| policy_gradient_loss | -0.014 | -| std | 0.00987 | -| value_loss | 0.000231 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15010 | -| time_elapsed | 79727 | -| total_timesteps | 1921280 | -| train/ | | -| approx_kl | 0.12357565 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.12 | -| learning_rate | 0.0003 | -| loss | 0.0861 | -| n_updates | 150090 | -| policy_gradient_loss | 0.0572 | -| std | 0.00987 | -| value_loss | 1.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15011 | -| time_elapsed | 79732 | -| total_timesteps | 1921408 | -| train/ | | -| approx_kl | 0.024994118 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 150100 | -| policy_gradient_loss | 0.0148 | -| std | 0.00988 | -| value_loss | 1.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15012 | -| time_elapsed | 79738 | -| total_timesteps | 1921536 | -| train/ | | -| approx_kl | 0.33728504 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0912 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 150110 | -| policy_gradient_loss | 0.0428 | -| std | 0.00988 | -| value_loss | 3.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15013 | -| time_elapsed | 79743 | -| total_timesteps | 1921664 | -| train/ | | -| approx_kl | 0.018107856 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.00696 | -| n_updates | 150120 | -| policy_gradient_loss | 0.00395 | -| std | 0.00987 | -| value_loss | 2.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15014 | -| time_elapsed | 79748 | -| total_timesteps | 1921792 | -| train/ | | -| approx_kl | 0.039350715 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.000333 | -| n_updates | 150130 | -| policy_gradient_loss | 0.0143 | -| std | 0.00987 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 24 | -| iterations | 15015 | -| time_elapsed | 79753 | -| total_timesteps | 1921920 | -| train/ | | -| approx_kl | 0.053264663 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0646 | -| n_updates | 150140 | -| policy_gradient_loss | 0.0309 | -| std | 0.00986 | -| value_loss | 7.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15016 | -| time_elapsed | 79759 | -| total_timesteps | 1922048 | -| train/ | | -| approx_kl | 0.08278862 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0606 | -| n_updates | 150150 | -| policy_gradient_loss | 0.0152 | -| std | 0.00986 | -| value_loss | 4.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15017 | -| time_elapsed | 79770 | -| total_timesteps | 1922176 | -| train/ | | -| approx_kl | 0.103107914 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 150160 | -| policy_gradient_loss | 0.000855 | -| std | 0.00986 | -| value_loss | 0.00123 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15018 | -| time_elapsed | 79776 | -| total_timesteps | 1922304 | -| train/ | | -| approx_kl | 0.017508393 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 150170 | -| policy_gradient_loss | 0.0344 | -| std | 0.00986 | -| value_loss | 1.06e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15019 | -| time_elapsed | 79781 | -| total_timesteps | 1922432 | -| train/ | | -| approx_kl | 0.37427965 | -| clip_fraction | 0.656 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00279 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 150180 | -| policy_gradient_loss | 0.0931 | -| std | 0.00988 | -| value_loss | 1.18e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15020 | -| time_elapsed | 79785 | -| total_timesteps | 1922560 | -| train/ | | -| approx_kl | 0.0034041335 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 150190 | -| policy_gradient_loss | 0.00783 | -| std | 0.00988 | -| value_loss | 4.5e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15021 | -| time_elapsed | 79791 | -| total_timesteps | 1922688 | -| train/ | | -| approx_kl | 0.00012027752 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.000116 | -| n_updates | 150200 | -| policy_gradient_loss | 0.0161 | -| std | 0.00988 | -| value_loss | 2.4e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15022 | -| time_elapsed | 79795 | -| total_timesteps | 1922816 | -| train/ | | -| approx_kl | 0.25028223 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 150210 | -| policy_gradient_loss | 0.0317 | -| std | 0.00987 | -| value_loss | 1.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 24 | -| iterations | 15023 | -| time_elapsed | 79801 | -| total_timesteps | 1922944 | -| train/ | | -| approx_kl | 0.01810002 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.000473 | -| n_updates | 150220 | -| policy_gradient_loss | 0.000436 | -| std | 0.00986 | -| value_loss | 8.94e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15024 | -| time_elapsed | 79807 | -| total_timesteps | 1923072 | -| train/ | | -| approx_kl | 2.1265354e-05 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0211 | -| learning_rate | 0.0003 | -| loss | -0.000519 | -| n_updates | 150230 | -| policy_gradient_loss | 0.002 | -| std | 0.00985 | -| value_loss | 4.78e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15025 | -| time_elapsed | 79816 | -| total_timesteps | 1923200 | -| train/ | | -| approx_kl | 0.0020270557 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 150240 | -| policy_gradient_loss | -0.013 | -| std | 0.00983 | -| value_loss | 7.29e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15026 | -| time_elapsed | 79822 | -| total_timesteps | 1923328 | -| train/ | | -| approx_kl | 0.0027152738 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 150250 | -| policy_gradient_loss | 0.0128 | -| std | 0.00982 | -| value_loss | 6.08e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15027 | -| time_elapsed | 79827 | -| total_timesteps | 1923456 | -| train/ | | -| approx_kl | 0.106459595 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.000754 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 150260 | -| policy_gradient_loss | 0.0354 | -| std | 0.00979 | -| value_loss | 0.0015 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15028 | -| time_elapsed | 79832 | -| total_timesteps | 1923584 | -| train/ | | -| approx_kl | 0.031544447 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 150270 | -| policy_gradient_loss | 0.042 | -| std | 0.00978 | -| value_loss | 7.48e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15029 | -| time_elapsed | 79837 | -| total_timesteps | 1923712 | -| train/ | | -| approx_kl | 0.09996398 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00541 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 150280 | -| policy_gradient_loss | 0.0162 | -| std | 0.00977 | -| value_loss | 4.07e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15030 | -| time_elapsed | 79843 | -| total_timesteps | 1923840 | -| train/ | | -| approx_kl | 0.028859176 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 150290 | -| policy_gradient_loss | 0.0363 | -| std | 0.00977 | -| value_loss | 2.65e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 24 | -| iterations | 15031 | -| time_elapsed | 79847 | -| total_timesteps | 1923968 | -| train/ | | -| approx_kl | 0.119451195 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 150300 | -| policy_gradient_loss | 0.0212 | -| std | 0.00977 | -| value_loss | 1.53e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15032 | -| time_elapsed | 79852 | -| total_timesteps | 1924096 | -| train/ | | -| approx_kl | 0.0006935885 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 150310 | -| policy_gradient_loss | 0.00219 | -| std | 0.00977 | -| value_loss | 1.12e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15033 | -| time_elapsed | 79862 | -| total_timesteps | 1924224 | -| train/ | | -| approx_kl | 0.0019347351 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | -0.00818 | -| n_updates | 150320 | -| policy_gradient_loss | 0.000659 | -| std | 0.00976 | -| value_loss | 0.00112 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15034 | -| time_elapsed | 79867 | -| total_timesteps | 1924352 | -| train/ | | -| approx_kl | 0.0013443981 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.00116 | -| n_updates | 150330 | -| policy_gradient_loss | 0.00322 | -| std | 0.00976 | -| value_loss | 1.04e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15035 | -| time_elapsed | 79873 | -| total_timesteps | 1924480 | -| train/ | | -| approx_kl | 0.09100693 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.0746 | -| n_updates | 150340 | -| policy_gradient_loss | 0.0672 | -| std | 0.00977 | -| value_loss | 1.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15036 | -| time_elapsed | 79878 | -| total_timesteps | 1924608 | -| train/ | | -| approx_kl | 0.015218416 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00046 | -| n_updates | 150350 | -| policy_gradient_loss | 0.00813 | -| std | 0.00977 | -| value_loss | 1.17e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15037 | -| time_elapsed | 79883 | -| total_timesteps | 1924736 | -| train/ | | -| approx_kl | 0.00042034034 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.000264 | -| n_updates | 150360 | -| policy_gradient_loss | 0.00316 | -| std | 0.00978 | -| value_loss | 1.05e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15038 | -| time_elapsed | 79888 | -| total_timesteps | 1924864 | -| train/ | | -| approx_kl | 0.066795915 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | 0.0618 | -| n_updates | 150370 | -| policy_gradient_loss | 0.0567 | -| std | 0.00978 | -| value_loss | 2.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 24 | -| iterations | 15039 | -| time_elapsed | 79894 | -| total_timesteps | 1924992 | -| train/ | | -| approx_kl | 0.018252008 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00342 | -| learning_rate | 0.0003 | -| loss | -0.0235 | -| n_updates | 150380 | -| policy_gradient_loss | 0.0104 | -| std | 0.00978 | -| value_loss | 8.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15040 | -| time_elapsed | 79899 | -| total_timesteps | 1925120 | -| train/ | | -| approx_kl | 0.25756127 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00962 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 150390 | -| policy_gradient_loss | 0.0282 | -| std | 0.00978 | -| value_loss | 4.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15041 | -| time_elapsed | 79918 | -| total_timesteps | 1925248 | -| train/ | | -| approx_kl | 0.053693146 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 150400 | -| policy_gradient_loss | -0.00858 | -| std | 0.00978 | -| value_loss | 0.000649 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15042 | -| time_elapsed | 79923 | -| total_timesteps | 1925376 | -| train/ | | -| approx_kl | 0.022628605 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.000199 | -| learning_rate | 0.0003 | -| loss | 0.00612 | -| n_updates | 150410 | -| policy_gradient_loss | 0.0388 | -| std | 0.00977 | -| value_loss | 6.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15043 | -| time_elapsed | 79930 | -| total_timesteps | 1925504 | -| train/ | | -| approx_kl | 0.007868964 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00239 | -| learning_rate | 0.0003 | -| loss | -0.00545 | -| n_updates | 150420 | -| policy_gradient_loss | 0.00852 | -| std | 0.00977 | -| value_loss | 1.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15044 | -| time_elapsed | 79939 | -| total_timesteps | 1925632 | -| train/ | | -| approx_kl | 0.078070775 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 150430 | -| policy_gradient_loss | 0.00764 | -| std | 0.00977 | -| value_loss | 9.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15045 | -| time_elapsed | 79948 | -| total_timesteps | 1925760 | -| train/ | | -| approx_kl | 0.023091337 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 150440 | -| policy_gradient_loss | 0.018 | -| std | 0.00977 | -| value_loss | 4.53e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 24 | -| iterations | 15046 | -| time_elapsed | 79955 | -| total_timesteps | 1925888 | -| train/ | | -| approx_kl | 0.16277923 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 150450 | -| policy_gradient_loss | 0.0794 | -| std | 0.00977 | -| value_loss | 2.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15047 | -| time_elapsed | 79960 | -| total_timesteps | 1926016 | -| train/ | | -| approx_kl | 0.026690625 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 150460 | -| policy_gradient_loss | 0.0131 | -| std | 0.00977 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15048 | -| time_elapsed | 79970 | -| total_timesteps | 1926144 | -| train/ | | -| approx_kl | 0.0013058395 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 150470 | -| policy_gradient_loss | -0.00348 | -| std | 0.00976 | -| value_loss | 0.0061 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15049 | -| time_elapsed | 79976 | -| total_timesteps | 1926272 | -| train/ | | -| approx_kl | 0.035701215 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 150480 | -| policy_gradient_loss | 0.0202 | -| std | 0.00976 | -| value_loss | 1.36e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15050 | -| time_elapsed | 79983 | -| total_timesteps | 1926400 | -| train/ | | -| approx_kl | 0.15053307 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.531 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 150490 | -| policy_gradient_loss | 0.0605 | -| std | 0.00976 | -| value_loss | 1.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15051 | -| time_elapsed | 79989 | -| total_timesteps | 1926528 | -| train/ | | -| approx_kl | 0.076053694 | -| clip_fraction | 0.581 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 150500 | -| policy_gradient_loss | 0.0722 | -| std | 0.00976 | -| value_loss | 7.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15052 | -| time_elapsed | 79998 | -| total_timesteps | 1926656 | -| train/ | | -| approx_kl | 0.022244632 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0834 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 150510 | -| policy_gradient_loss | 0.017 | -| std | 0.00976 | -| value_loss | 4.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15053 | -| time_elapsed | 80006 | -| total_timesteps | 1926784 | -| train/ | | -| approx_kl | 0.25481197 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 150520 | -| policy_gradient_loss | 0.0323 | -| std | 0.00976 | -| value_loss | 2.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15054 | -| time_elapsed | 80012 | -| total_timesteps | 1926912 | -| train/ | | -| approx_kl | 0.006258593 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.00697 | -| n_updates | 150530 | -| policy_gradient_loss | 0.00102 | -| std | 0.00976 | -| value_loss | 7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15055 | -| time_elapsed | 80016 | -| total_timesteps | 1927040 | -| train/ | | -| approx_kl | 0.001337653 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 150540 | -| policy_gradient_loss | 0.0029 | -| std | 0.00976 | -| value_loss | 2.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15056 | -| time_elapsed | 80034 | -| total_timesteps | 1927168 | -| train/ | | -| approx_kl | 0.03413053 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0236 | -| n_updates | 150550 | -| policy_gradient_loss | -0.00209 | -| std | 0.00976 | -| value_loss | 0.000373 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15057 | -| time_elapsed | 80042 | -| total_timesteps | 1927296 | -| train/ | | -| approx_kl | 0.012071395 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.477 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 150560 | -| policy_gradient_loss | -0.00532 | -| std | 0.00976 | -| value_loss | 8.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15058 | -| time_elapsed | 80055 | -| total_timesteps | 1927424 | -| train/ | | -| approx_kl | 0.030052654 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.818 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 150570 | -| policy_gradient_loss | -0.00327 | -| std | 0.00976 | -| value_loss | 2.31e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15059 | -| time_elapsed | 80069 | -| total_timesteps | 1927552 | -| train/ | | -| approx_kl | 0.00020620879 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0029 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 150580 | -| policy_gradient_loss | -0.00012 | -| std | 0.00976 | -| value_loss | 1.24e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15060 | -| time_elapsed | 80084 | -| total_timesteps | 1927680 | -| train/ | | -| approx_kl | 0.0041394657 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 150590 | -| policy_gradient_loss | 0.00091 | -| std | 0.00976 | -| value_loss | 7.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15061 | -| time_elapsed | 80092 | -| total_timesteps | 1927808 | -| train/ | | -| approx_kl | 0.0155146085 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00918 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 150600 | -| policy_gradient_loss | 0.0864 | -| std | 0.00976 | -| value_loss | 5.13e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 24 | -| iterations | 15062 | -| time_elapsed | 80104 | -| total_timesteps | 1927936 | -| train/ | | -| approx_kl | 0.050634682 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 150610 | -| policy_gradient_loss | 0.0792 | -| std | 0.00976 | -| value_loss | 5.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15063 | -| time_elapsed | 80114 | -| total_timesteps | 1928064 | -| train/ | | -| approx_kl | 0.010826168 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0771 | -| learning_rate | 0.0003 | -| loss | 0.00457 | -| n_updates | 150620 | -| policy_gradient_loss | 0.0141 | -| std | 0.00976 | -| value_loss | 2.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15064 | -| time_elapsed | 80136 | -| total_timesteps | 1928192 | -| train/ | | -| approx_kl | 0.036805864 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.648 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 150630 | -| policy_gradient_loss | -0.0149 | -| std | 0.00976 | -| value_loss | 0.000762 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15065 | -| time_elapsed | 80144 | -| total_timesteps | 1928320 | -| train/ | | -| approx_kl | 0.032476265 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 150640 | -| policy_gradient_loss | 0.0177 | -| std | 0.00976 | -| value_loss | 7.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15066 | -| time_elapsed | 80152 | -| total_timesteps | 1928448 | -| train/ | | -| approx_kl | 0.048356306 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0776 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 150650 | -| policy_gradient_loss | -0.014 | -| std | 0.00976 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15067 | -| time_elapsed | 80165 | -| total_timesteps | 1928576 | -| train/ | | -| approx_kl | 0.0057228818 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | -0.00769 | -| n_updates | 150660 | -| policy_gradient_loss | 0.0478 | -| std | 0.00976 | -| value_loss | 7.64e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15068 | -| time_elapsed | 80173 | -| total_timesteps | 1928704 | -| train/ | | -| approx_kl | 0.019694569 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 150670 | -| policy_gradient_loss | 0.0297 | -| std | 0.00976 | -| value_loss | 2.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15069 | -| time_elapsed | 80180 | -| total_timesteps | 1928832 | -| train/ | | -| approx_kl | 0.04929963 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0284 | -| n_updates | 150680 | -| policy_gradient_loss | 0.0138 | -| std | 0.00975 | -| value_loss | 1.94e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15070 | -| time_elapsed | 80187 | -| total_timesteps | 1928960 | -| train/ | | -| approx_kl | 0.00014650682 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -6.71e-05 | -| n_updates | 150690 | -| policy_gradient_loss | 0.0148 | -| std | 0.00975 | -| value_loss | 1.22e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15071 | -| time_elapsed | 80196 | -| total_timesteps | 1929088 | -| train/ | | -| approx_kl | 0.08846645 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 150700 | -| policy_gradient_loss | 0.00969 | -| std | 0.00975 | -| value_loss | 8.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15072 | -| time_elapsed | 80212 | -| total_timesteps | 1929216 | -| train/ | | -| approx_kl | 0.027361734 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.764 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 150710 | -| policy_gradient_loss | -0.0174 | -| std | 0.00976 | -| value_loss | 0.00488 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15073 | -| time_elapsed | 80218 | -| total_timesteps | 1929344 | -| train/ | | -| approx_kl | 0.030732738 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 150720 | -| policy_gradient_loss | 0.031 | -| std | 0.00979 | -| value_loss | 1.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15074 | -| time_elapsed | 80224 | -| total_timesteps | 1929472 | -| train/ | | -| approx_kl | 0.058974415 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00511 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 150730 | -| policy_gradient_loss | 0.00634 | -| std | 0.00981 | -| value_loss | 8.13e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15075 | -| time_elapsed | 80231 | -| total_timesteps | 1929600 | -| train/ | | -| approx_kl | 0.0705042 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00725 | -| learning_rate | 0.0003 | -| loss | 0.032 | -| n_updates | 150740 | -| policy_gradient_loss | 0.0236 | -| std | 0.00981 | -| value_loss | 8.18e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15076 | -| time_elapsed | 80239 | -| total_timesteps | 1929728 | -| train/ | | -| approx_kl | 0.06808533 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 150750 | -| policy_gradient_loss | 0.0214 | -| std | 0.00981 | -| value_loss | 4.74e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15077 | -| time_elapsed | 80249 | -| total_timesteps | 1929856 | -| train/ | | -| approx_kl | 0.12905595 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.073 | -| n_updates | 150760 | -| policy_gradient_loss | 0.0222 | -| std | 0.00981 | -| value_loss | 2.75e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 24 | -| iterations | 15078 | -| time_elapsed | 80261 | -| total_timesteps | 1929984 | -| train/ | | -| approx_kl | 0.026969496 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.00778 | -| n_updates | 150770 | -| policy_gradient_loss | 0.0351 | -| std | 0.00981 | -| value_loss | 2.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15079 | -| time_elapsed | 80273 | -| total_timesteps | 1930112 | -| train/ | | -| approx_kl | 0.04868562 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 150780 | -| policy_gradient_loss | 0.0138 | -| std | 0.00979 | -| value_loss | 6.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15080 | -| time_elapsed | 80304 | -| total_timesteps | 1930240 | -| train/ | | -| approx_kl | 0.052460294 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 150790 | -| policy_gradient_loss | -0.0164 | -| std | 0.00979 | -| value_loss | 0.00176 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15081 | -| time_elapsed | 80316 | -| total_timesteps | 1930368 | -| train/ | | -| approx_kl | 0.00011581322 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -6.16e-05 | -| n_updates | 150800 | -| policy_gradient_loss | 0.0051 | -| std | 0.00979 | -| value_loss | 8.72e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15082 | -| time_elapsed | 80328 | -| total_timesteps | 1930496 | -| train/ | | -| approx_kl | 0.032718405 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | -0.000744 | -| n_updates | 150810 | -| policy_gradient_loss | 0.00765 | -| std | 0.0098 | -| value_loss | 5.04e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15083 | -| time_elapsed | 80342 | -| total_timesteps | 1930624 | -| train/ | | -| approx_kl | 0.0015531131 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 150820 | -| policy_gradient_loss | 0.00341 | -| std | 0.0098 | -| value_loss | 1.1e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15084 | -| time_elapsed | 80353 | -| total_timesteps | 1930752 | -| train/ | | -| approx_kl | 0.11552681 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 150830 | -| policy_gradient_loss | 0.0856 | -| std | 0.00979 | -| value_loss | 1.88e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 24 | -| iterations | 15085 | -| time_elapsed | 80364 | -| total_timesteps | 1930880 | -| train/ | | -| approx_kl | 0.06418861 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00395 | -| learning_rate | 0.0003 | -| loss | 0.0339 | -| n_updates | 150840 | -| policy_gradient_loss | 0.0816 | -| std | 0.0098 | -| value_loss | 2.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15086 | -| time_elapsed | 80375 | -| total_timesteps | 1931008 | -| train/ | | -| approx_kl | 0.010553893 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 150850 | -| policy_gradient_loss | 0.00899 | -| std | 0.0098 | -| value_loss | 1.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15087 | -| time_elapsed | 80409 | -| total_timesteps | 1931136 | -| train/ | | -| approx_kl | 0.015880577 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 150860 | -| policy_gradient_loss | 0.000677 | -| std | 0.00979 | -| value_loss | 0.000147 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15088 | -| time_elapsed | 80418 | -| total_timesteps | 1931264 | -| train/ | | -| approx_kl | 0.39069548 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.259 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 150870 | -| policy_gradient_loss | 0.0236 | -| std | 0.00979 | -| value_loss | 3.31e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15089 | -| time_elapsed | 80428 | -| total_timesteps | 1931392 | -| train/ | | -| approx_kl | 0.015175456 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 150880 | -| policy_gradient_loss | 0.000415 | -| std | 0.00979 | -| value_loss | 4.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15090 | -| time_elapsed | 80437 | -| total_timesteps | 1931520 | -| train/ | | -| approx_kl | 0.038579375 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 150890 | -| policy_gradient_loss | 0.0192 | -| std | 0.00979 | -| value_loss | 2.38e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15091 | -| time_elapsed | 80447 | -| total_timesteps | 1931648 | -| train/ | | -| approx_kl | 0.5556175 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.193 | -| n_updates | 150900 | -| policy_gradient_loss | 0.126 | -| std | 0.00979 | -| value_loss | 1.3e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15092 | -| time_elapsed | 80458 | -| total_timesteps | 1931776 | -| train/ | | -| approx_kl | 0.0020974684 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 150910 | -| policy_gradient_loss | 0.00702 | -| std | 0.00979 | -| value_loss | 8.43e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 24 | -| iterations | 15093 | -| time_elapsed | 80470 | -| total_timesteps | 1931904 | -| train/ | | -| approx_kl | 0.07341253 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0548 | -| n_updates | 150920 | -| policy_gradient_loss | 0.0131 | -| std | 0.0098 | -| value_loss | 6.21e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 24 | -| iterations | 15094 | -| time_elapsed | 80483 | -| total_timesteps | 1932032 | -| train/ | | -| approx_kl | 0.010732379 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.00418 | -| n_updates | 150930 | -| policy_gradient_loss | 0.0145 | -| std | 0.0098 | -| value_loss | 3.78e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15095 | -| time_elapsed | 80516 | -| total_timesteps | 1932160 | -| train/ | | -| approx_kl | 0.06905001 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 150940 | -| policy_gradient_loss | -0.014 | -| std | 0.00979 | -| value_loss | 0.000129 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15096 | -| time_elapsed | 80526 | -| total_timesteps | 1932288 | -| train/ | | -| approx_kl | 0.0023467303 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | 0.00523 | -| n_updates | 150950 | -| policy_gradient_loss | 0.00397 | -| std | 0.00979 | -| value_loss | 2.03e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15097 | -| time_elapsed | 80538 | -| total_timesteps | 1932416 | -| train/ | | -| approx_kl | 0.03802808 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | -7.13e-05 | -| n_updates | 150960 | -| policy_gradient_loss | -0.00239 | -| std | 0.0098 | -| value_loss | 5.62e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15098 | -| time_elapsed | 80549 | -| total_timesteps | 1932544 | -| train/ | | -| approx_kl | 0.018660042 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | 0.00375 | -| n_updates | 150970 | -| policy_gradient_loss | 0.00251 | -| std | 0.0098 | -| value_loss | 2.02e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15099 | -| time_elapsed | 80558 | -| total_timesteps | 1932672 | -| train/ | | -| approx_kl | 0.03923138 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00125 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 150980 | -| policy_gradient_loss | 0.0111 | -| std | 0.0098 | -| value_loss | 6.45e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15100 | -| time_elapsed | 80566 | -| total_timesteps | 1932800 | -| train/ | | -| approx_kl | 0.059212863 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0941 | -| learning_rate | 0.0003 | -| loss | 0.0541 | -| n_updates | 150990 | -| policy_gradient_loss | 0.042 | -| std | 0.0098 | -| value_loss | 6.15e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15101 | -| time_elapsed | 80575 | -| total_timesteps | 1932928 | -| train/ | | -| approx_kl | 0.09018008 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.0605 | -| n_updates | 151000 | -| policy_gradient_loss | 0.0163 | -| std | 0.0098 | -| value_loss | 1.87e-11 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15102 | -| time_elapsed | 80585 | -| total_timesteps | 1933056 | -| train/ | | -| approx_kl | 0.00068046525 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 151010 | -| policy_gradient_loss | 4.31e-05 | -| std | 0.0098 | -| value_loss | 7.03e-12 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15103 | -| time_elapsed | 80608 | -| total_timesteps | 1933184 | -| train/ | | -| approx_kl | 0.26348984 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 151020 | -| policy_gradient_loss | 0.00499 | -| std | 0.0098 | -| value_loss | 0.00113 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15104 | -| time_elapsed | 80619 | -| total_timesteps | 1933312 | -| train/ | | -| approx_kl | 0.037279725 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 151030 | -| policy_gradient_loss | 0.0132 | -| std | 0.0098 | -| value_loss | 3.81e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15105 | -| time_elapsed | 80627 | -| total_timesteps | 1933440 | -| train/ | | -| approx_kl | 0.0745406 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00249 | -| learning_rate | 0.0003 | -| loss | 0.0713 | -| n_updates | 151040 | -| policy_gradient_loss | 0.0412 | -| std | 0.0098 | -| value_loss | 4.35e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15106 | -| time_elapsed | 80633 | -| total_timesteps | 1933568 | -| train/ | | -| approx_kl | 0.014219565 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 151050 | -| policy_gradient_loss | 0.0173 | -| std | 0.0098 | -| value_loss | 2.58e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15107 | -| time_elapsed | 80639 | -| total_timesteps | 1933696 | -| train/ | | -| approx_kl | 0.4895651 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.331 | -| n_updates | 151060 | -| policy_gradient_loss | 0.108 | -| std | 0.0098 | -| value_loss | 1.88e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15108 | -| time_elapsed | 80645 | -| total_timesteps | 1933824 | -| train/ | | -| approx_kl | 0.0049694404 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 151070 | -| policy_gradient_loss | 0.0114 | -| std | 0.0098 | -| value_loss | 1.27e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15109 | -| time_elapsed | 80651 | -| total_timesteps | 1933952 | -| train/ | | -| approx_kl | 0.02109259 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 151080 | -| policy_gradient_loss | 0.0066 | -| std | 0.00979 | -| value_loss | 1.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15110 | -| time_elapsed | 80655 | -| total_timesteps | 1934080 | -| train/ | | -| approx_kl | 0.017732013 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 151090 | -| policy_gradient_loss | 0.000903 | -| std | 0.00979 | -| value_loss | 4.71e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15111 | -| time_elapsed | 80665 | -| total_timesteps | 1934208 | -| train/ | | -| approx_kl | 0.1040372 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | 0.0753 | -| n_updates | 151100 | -| policy_gradient_loss | 0.0139 | -| std | 0.0098 | -| value_loss | 0.00112 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15112 | -| time_elapsed | 80669 | -| total_timesteps | 1934336 | -| train/ | | -| approx_kl | 0.03871571 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 151110 | -| policy_gradient_loss | 0.0427 | -| std | 0.00979 | -| value_loss | 3.89e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15113 | -| time_elapsed | 80674 | -| total_timesteps | 1934464 | -| train/ | | -| approx_kl | 4.0104147e-05 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -14.2 | -| learning_rate | 0.0003 | -| loss | -0.0009 | -| n_updates | 151120 | -| policy_gradient_loss | -0.00286 | -| std | 0.00979 | -| value_loss | 1.51e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15114 | -| time_elapsed | 80679 | -| total_timesteps | 1934592 | -| train/ | | -| approx_kl | 0.040083855 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -3.98 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 151130 | -| policy_gradient_loss | -0.00202 | -| std | 0.00978 | -| value_loss | 2.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15115 | -| time_elapsed | 80685 | -| total_timesteps | 1934720 | -| train/ | | -| approx_kl | 0.002810337 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00452 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 151140 | -| policy_gradient_loss | 0.00278 | -| std | 0.00977 | -| value_loss | 1.99e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15116 | -| time_elapsed | 80691 | -| total_timesteps | 1934848 | -| train/ | | -| approx_kl | 0.08412311 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00524 | -| learning_rate | 0.0003 | -| loss | 0.0735 | -| n_updates | 151150 | -| policy_gradient_loss | 0.0601 | -| std | 0.00976 | -| value_loss | 6.23e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 15117 | -| time_elapsed | 80697 | -| total_timesteps | 1934976 | -| train/ | | -| approx_kl | 0.017919516 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00837 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 151160 | -| policy_gradient_loss | 0.00892 | -| std | 0.00976 | -| value_loss | 8.95e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15118 | -| time_elapsed | 80703 | -| total_timesteps | 1935104 | -| train/ | | -| approx_kl | 0.0006690454 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 151170 | -| policy_gradient_loss | 0.00266 | -| std | 0.00976 | -| value_loss | 4.92e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15119 | -| time_elapsed | 80713 | -| total_timesteps | 1935232 | -| train/ | | -| approx_kl | 0.99106735 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | -0.0274 | -| n_updates | 151180 | -| policy_gradient_loss | -0.00596 | -| std | 0.00976 | -| value_loss | 0.000323 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15120 | -| time_elapsed | 80718 | -| total_timesteps | 1935360 | -| train/ | | -| approx_kl | 0.0017907135 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.325 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 151190 | -| policy_gradient_loss | 0.0167 | -| std | 0.00975 | -| value_loss | 1.48e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15121 | -| time_elapsed | 80724 | -| total_timesteps | 1935488 | -| train/ | | -| approx_kl | 0.10071934 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.645 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 151200 | -| policy_gradient_loss | 0.0783 | -| std | 0.00976 | -| value_loss | 6.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15122 | -| time_elapsed | 80729 | -| total_timesteps | 1935616 | -| train/ | | -| approx_kl | 0.020403402 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.00953 | -| n_updates | 151210 | -| policy_gradient_loss | 0.0136 | -| std | 0.00976 | -| value_loss | 5.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15123 | -| time_elapsed | 80736 | -| total_timesteps | 1935744 | -| train/ | | -| approx_kl | 0.098021954 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00777 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 151220 | -| policy_gradient_loss | 0.0126 | -| std | 0.00976 | -| value_loss | 2.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15124 | -| time_elapsed | 80741 | -| total_timesteps | 1935872 | -| train/ | | -| approx_kl | 0.087301806 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.043 | -| n_updates | 151230 | -| policy_gradient_loss | 0.0197 | -| std | 0.00975 | -| value_loss | 1.64e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15125 | -| time_elapsed | 80746 | -| total_timesteps | 1936000 | -| train/ | | -| approx_kl | 0.022802645 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 151240 | -| policy_gradient_loss | 0.00345 | -| std | 0.00975 | -| value_loss | 7.07e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15126 | -| time_elapsed | 80751 | -| total_timesteps | 1936128 | -| train/ | | -| approx_kl | 0.077378385 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00229 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 151250 | -| policy_gradient_loss | 0.0121 | -| std | 0.00975 | -| value_loss | 3.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15127 | -| time_elapsed | 80762 | -| total_timesteps | 1936256 | -| train/ | | -| approx_kl | 0.020928822 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.917 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 151260 | -| policy_gradient_loss | -0.000107 | -| std | 0.00975 | -| value_loss | 0.00089 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15128 | -| time_elapsed | 80767 | -| total_timesteps | 1936384 | -| train/ | | -| approx_kl | 0.093678996 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.032 | -| n_updates | 151270 | -| policy_gradient_loss | 0.00695 | -| std | 0.00974 | -| value_loss | 1.57e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15129 | -| time_elapsed | 80771 | -| total_timesteps | 1936512 | -| train/ | | -| approx_kl | 0.00891209 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.000223 | -| n_updates | 151280 | -| policy_gradient_loss | 0.0133 | -| std | 0.00974 | -| value_loss | 3.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15130 | -| time_elapsed | 80776 | -| total_timesteps | 1936640 | -| train/ | | -| approx_kl | 0.051603436 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0858 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 151290 | -| policy_gradient_loss | 0.014 | -| std | 0.00974 | -| value_loss | 1.52e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15131 | -| time_elapsed | 80781 | -| total_timesteps | 1936768 | -| train/ | | -| approx_kl | 4.564738e-05 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 151300 | -| policy_gradient_loss | 0.0126 | -| std | 0.00974 | -| value_loss | 9.91e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15132 | -| time_elapsed | 80787 | -| total_timesteps | 1936896 | -| train/ | | -| approx_kl | 0.07742423 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 151310 | -| policy_gradient_loss | 0.00705 | -| std | 0.00974 | -| value_loss | 6.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15133 | -| time_elapsed | 80793 | -| total_timesteps | 1937024 | -| train/ | | -| approx_kl | 0.010190805 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 151320 | -| policy_gradient_loss | 0.00809 | -| std | 0.00974 | -| value_loss | 4.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15134 | -| time_elapsed | 80803 | -| total_timesteps | 1937152 | -| train/ | | -| approx_kl | 0.020585144 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.78 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 151330 | -| policy_gradient_loss | -0.0039 | -| std | 0.00974 | -| value_loss | 0.00216 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15135 | -| time_elapsed | 80808 | -| total_timesteps | 1937280 | -| train/ | | -| approx_kl | 0.040200423 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 151340 | -| policy_gradient_loss | 0.00211 | -| std | 0.00974 | -| value_loss | 9.69e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15136 | -| time_elapsed | 80813 | -| total_timesteps | 1937408 | -| train/ | | -| approx_kl | 0.0032775523 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.00341 | -| n_updates | 151350 | -| policy_gradient_loss | 0.00747 | -| std | 0.00975 | -| value_loss | 1.57e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15137 | -| time_elapsed | 80819 | -| total_timesteps | 1937536 | -| train/ | | -| approx_kl | 0.015202681 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 151360 | -| policy_gradient_loss | 0.0138 | -| std | 0.00975 | -| value_loss | 2.48e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15138 | -| time_elapsed | 80824 | -| total_timesteps | 1937664 | -| train/ | | -| approx_kl | 0.06417439 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00742 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 151370 | -| policy_gradient_loss | 0.0304 | -| std | 0.00976 | -| value_loss | 3.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15139 | -| time_elapsed | 80829 | -| total_timesteps | 1937792 | -| train/ | | -| approx_kl | 0.09979483 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 151380 | -| policy_gradient_loss | 0.012 | -| std | 0.00977 | -| value_loss | 1.34e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15140 | -| time_elapsed | 80835 | -| total_timesteps | 1937920 | -| train/ | | -| approx_kl | 0.023752589 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 151390 | -| policy_gradient_loss | -0.00348 | -| std | 0.00978 | -| value_loss | 8.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15141 | -| time_elapsed | 80840 | -| total_timesteps | 1938048 | -| train/ | | -| approx_kl | 0.13178608 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.06 | -| n_updates | 151400 | -| policy_gradient_loss | 0.0226 | -| std | 0.00979 | -| value_loss | 1.83e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15142 | -| time_elapsed | 80851 | -| total_timesteps | 1938176 | -| train/ | | -| approx_kl | 0.0114615355 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 151410 | -| policy_gradient_loss | -0.0098 | -| std | 0.00979 | -| value_loss | 0.00538 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15143 | -| time_elapsed | 80857 | -| total_timesteps | 1938304 | -| train/ | | -| approx_kl | 0.1936375 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 151420 | -| policy_gradient_loss | 0.0851 | -| std | 0.00979 | -| value_loss | 1.81e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15144 | -| time_elapsed | 80862 | -| total_timesteps | 1938432 | -| train/ | | -| approx_kl | 0.02695606 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.00931 | -| n_updates | 151430 | -| policy_gradient_loss | 0.00938 | -| std | 0.00978 | -| value_loss | 3.82e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15145 | -| time_elapsed | 80868 | -| total_timesteps | 1938560 | -| train/ | | -| approx_kl | 0.24060059 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.0749 | -| n_updates | 151440 | -| policy_gradient_loss | 0.0224 | -| std | 0.00978 | -| value_loss | 1.74e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15146 | -| time_elapsed | 80874 | -| total_timesteps | 1938688 | -| train/ | | -| approx_kl | 0.019224675 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 151450 | -| policy_gradient_loss | -0.00232 | -| std | 0.00979 | -| value_loss | 4.57e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15147 | -| time_elapsed | 80880 | -| total_timesteps | 1938816 | -| train/ | | -| approx_kl | 0.0013581612 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.00883 | -| n_updates | 151460 | -| policy_gradient_loss | -0.0094 | -| std | 0.00978 | -| value_loss | 4.46e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 15148 | -| time_elapsed | 80884 | -| total_timesteps | 1938944 | -| train/ | | -| approx_kl | 0.018063247 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 151470 | -| policy_gradient_loss | -0.00139 | -| std | 0.00978 | -| value_loss | 8.51e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15149 | -| time_elapsed | 80890 | -| total_timesteps | 1939072 | -| train/ | | -| approx_kl | 0.024123024 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0893 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 151480 | -| policy_gradient_loss | -6.16e-06 | -| std | 0.00978 | -| value_loss | 4.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15150 | -| time_elapsed | 80902 | -| total_timesteps | 1939200 | -| train/ | | -| approx_kl | 0.097804606 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.778 | -| learning_rate | 0.0003 | -| loss | 0.00388 | -| n_updates | 151490 | -| policy_gradient_loss | -0.00909 | -| std | 0.00978 | -| value_loss | 0.0046 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15151 | -| time_elapsed | 80907 | -| total_timesteps | 1939328 | -| train/ | | -| approx_kl | 0.007554085 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.00436 | -| n_updates | 151500 | -| policy_gradient_loss | 0.000374 | -| std | 0.00979 | -| value_loss | 4.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15152 | -| time_elapsed | 80912 | -| total_timesteps | 1939456 | -| train/ | | -| approx_kl | 0.002242844 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | 0.00702 | -| n_updates | 151510 | -| policy_gradient_loss | -0.00384 | -| std | 0.00979 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15153 | -| time_elapsed | 80919 | -| total_timesteps | 1939584 | -| train/ | | -| approx_kl | 0.048920553 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 151520 | -| policy_gradient_loss | 0.0162 | -| std | 0.00978 | -| value_loss | 3.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15154 | -| time_elapsed | 80923 | -| total_timesteps | 1939712 | -| train/ | | -| approx_kl | 0.040849797 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.367 | -| learning_rate | 0.0003 | -| loss | 0.0296 | -| n_updates | 151530 | -| policy_gradient_loss | 0.0166 | -| std | 0.00978 | -| value_loss | 4.87e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15155 | -| time_elapsed | 80927 | -| total_timesteps | 1939840 | -| train/ | | -| approx_kl | 0.19983613 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -14.9 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 151540 | -| policy_gradient_loss | 1.55e-05 | -| std | 0.00978 | -| value_loss | 1.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15156 | -| time_elapsed | 80932 | -| total_timesteps | 1939968 | -| train/ | | -| approx_kl | 0.11172654 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.094 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 151550 | -| policy_gradient_loss | 0.0034 | -| std | 0.00979 | -| value_loss | 5.31e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15157 | -| time_elapsed | 80937 | -| total_timesteps | 1940096 | -| train/ | | -| approx_kl | 0.008362904 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00766 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 151560 | -| policy_gradient_loss | 0.0137 | -| std | 0.00979 | -| value_loss | 7.28e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15158 | -| time_elapsed | 80946 | -| total_timesteps | 1940224 | -| train/ | | -| approx_kl | 0.04063683 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.808 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 151570 | -| policy_gradient_loss | -0.00194 | -| std | 0.00979 | -| value_loss | 0.00374 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15159 | -| time_elapsed | 80951 | -| total_timesteps | 1940352 | -| train/ | | -| approx_kl | 0.01595635 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 151580 | -| policy_gradient_loss | -0.0053 | -| std | 0.00979 | -| value_loss | 5.73e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15160 | -| time_elapsed | 80956 | -| total_timesteps | 1940480 | -| train/ | | -| approx_kl | 0.003949159 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 151590 | -| policy_gradient_loss | 0.00131 | -| std | 0.00978 | -| value_loss | 9.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15161 | -| time_elapsed | 80960 | -| total_timesteps | 1940608 | -| train/ | | -| approx_kl | 0.038842607 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0971 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 151600 | -| policy_gradient_loss | 0.00316 | -| std | 0.00978 | -| value_loss | 6.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15162 | -| time_elapsed | 80964 | -| total_timesteps | 1940736 | -| train/ | | -| approx_kl | 0.02397145 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | 0.00535 | -| n_updates | 151610 | -| policy_gradient_loss | 0.0181 | -| std | 0.00978 | -| value_loss | 3.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15163 | -| time_elapsed | 80970 | -| total_timesteps | 1940864 | -| train/ | | -| approx_kl | 0.05557303 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 151620 | -| policy_gradient_loss | 0.0313 | -| std | 0.00979 | -| value_loss | 2.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 15164 | -| time_elapsed | 80975 | -| total_timesteps | 1940992 | -| train/ | | -| approx_kl | 0.06841935 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 151630 | -| policy_gradient_loss | 0.00585 | -| std | 0.00979 | -| value_loss | 1.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15165 | -| time_elapsed | 80980 | -| total_timesteps | 1941120 | -| train/ | | -| approx_kl | 0.014752853 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 151640 | -| policy_gradient_loss | 0.00341 | -| std | 0.0098 | -| value_loss | 7.52e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15166 | -| time_elapsed | 80991 | -| total_timesteps | 1941248 | -| train/ | | -| approx_kl | 0.051368225 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.000384 | -| n_updates | 151650 | -| policy_gradient_loss | -0.00241 | -| std | 0.00981 | -| value_loss | 0.000625 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15167 | -| time_elapsed | 80995 | -| total_timesteps | 1941376 | -| train/ | | -| approx_kl | 0.02561108 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.000292 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 151660 | -| policy_gradient_loss | -0.000689 | -| std | 0.00981 | -| value_loss | 1.17e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15168 | -| time_elapsed | 81001 | -| total_timesteps | 1941504 | -| train/ | | -| approx_kl | 0.004852558 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 151670 | -| policy_gradient_loss | 0.00361 | -| std | 0.00982 | -| value_loss | 3.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15169 | -| time_elapsed | 81006 | -| total_timesteps | 1941632 | -| train/ | | -| approx_kl | 0.033607073 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 151680 | -| policy_gradient_loss | 0.00495 | -| std | 0.00982 | -| value_loss | 1.92e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15170 | -| time_elapsed | 81011 | -| total_timesteps | 1941760 | -| train/ | | -| approx_kl | 0.0053007663 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 151690 | -| policy_gradient_loss | 0.00225 | -| std | 0.00982 | -| value_loss | 1.34e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15171 | -| time_elapsed | 81016 | -| total_timesteps | 1941888 | -| train/ | | -| approx_kl | 0.025805198 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -0.00983 | -| n_updates | 151700 | -| policy_gradient_loss | -0.0066 | -| std | 0.00982 | -| value_loss | 1.64e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15172 | -| time_elapsed | 81020 | -| total_timesteps | 1942016 | -| train/ | | -| approx_kl | 0.02083805 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.00074 | -| n_updates | 151710 | -| policy_gradient_loss | 0.000756 | -| std | 0.00981 | -| value_loss | 5.1e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15173 | -| time_elapsed | 81030 | -| total_timesteps | 1942144 | -| train/ | | -| approx_kl | 0.00029876595 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 151720 | -| policy_gradient_loss | -0.00599 | -| std | 0.0098 | -| value_loss | 0.000602 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15174 | -| time_elapsed | 81037 | -| total_timesteps | 1942272 | -| train/ | | -| approx_kl | 0.0058248923 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.271 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 151730 | -| policy_gradient_loss | 0.0189 | -| std | 0.00978 | -| value_loss | 1.53e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15175 | -| time_elapsed | 81042 | -| total_timesteps | 1942400 | -| train/ | | -| approx_kl | 0.08485734 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -92.1 | -| learning_rate | 0.0003 | -| loss | 0.0754 | -| n_updates | 151740 | -| policy_gradient_loss | 0.017 | -| std | 0.00977 | -| value_loss | 3.74e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15176 | -| time_elapsed | 81047 | -| total_timesteps | 1942528 | -| train/ | | -| approx_kl | 0.030203478 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00755 | -| n_updates | 151750 | -| policy_gradient_loss | -0.00696 | -| std | 0.00977 | -| value_loss | 1.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15177 | -| time_elapsed | 81052 | -| total_timesteps | 1942656 | -| train/ | | -| approx_kl | 0.05030907 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.244 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 151760 | -| policy_gradient_loss | 0.0103 | -| std | 0.00977 | -| value_loss | 6.46e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15178 | -| time_elapsed | 81058 | -| total_timesteps | 1942784 | -| train/ | | -| approx_kl | 0.0027134996 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.00477 | -| n_updates | 151770 | -| policy_gradient_loss | 0.00404 | -| std | 0.00977 | -| value_loss | 1.82e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15179 | -| time_elapsed | 81063 | -| total_timesteps | 1942912 | -| train/ | | -| approx_kl | 0.021620562 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0917 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 151780 | -| policy_gradient_loss | 0.00738 | -| std | 0.00977 | -| value_loss | 7.91e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15180 | -| time_elapsed | 81068 | -| total_timesteps | 1943040 | -| train/ | | -| approx_kl | 0.4029827 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | 0.0832 | -| n_updates | 151790 | -| policy_gradient_loss | 0.0255 | -| std | 0.00976 | -| value_loss | 9.75e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15181 | -| time_elapsed | 81077 | -| total_timesteps | 1943168 | -| train/ | | -| approx_kl | 0.018222619 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 151800 | -| policy_gradient_loss | -0.00328 | -| std | 0.00976 | -| value_loss | 0.000706 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15182 | -| time_elapsed | 81082 | -| total_timesteps | 1943296 | -| train/ | | -| approx_kl | 0.00011880463 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | -0.000925 | -| n_updates | 151810 | -| policy_gradient_loss | 0.000799 | -| std | 0.00976 | -| value_loss | 8.1e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15183 | -| time_elapsed | 81086 | -| total_timesteps | 1943424 | -| train/ | | -| approx_kl | 0.02121641 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 151820 | -| policy_gradient_loss | -0.00634 | -| std | 0.00976 | -| value_loss | 2.9e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15184 | -| time_elapsed | 81091 | -| total_timesteps | 1943552 | -| train/ | | -| approx_kl | 0.023503382 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 151830 | -| policy_gradient_loss | 0.00528 | -| std | 0.00976 | -| value_loss | 3.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15185 | -| time_elapsed | 81095 | -| total_timesteps | 1943680 | -| train/ | | -| approx_kl | 0.024192305 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.00603 | -| n_updates | 151840 | -| policy_gradient_loss | 0.00285 | -| std | 0.00976 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15186 | -| time_elapsed | 81100 | -| total_timesteps | 1943808 | -| train/ | | -| approx_kl | 0.0038469988 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 151850 | -| policy_gradient_loss | 0.000708 | -| std | 0.00976 | -| value_loss | 7e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15187 | -| time_elapsed | 81104 | -| total_timesteps | 1943936 | -| train/ | | -| approx_kl | 0.00012238044 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.000278 | -| n_updates | 151860 | -| policy_gradient_loss | 0.0161 | -| std | 0.00976 | -| value_loss | 1.79e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15188 | -| time_elapsed | 81108 | -| total_timesteps | 1944064 | -| train/ | | -| approx_kl | 0.30307496 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.216 | -| n_updates | 151870 | -| policy_gradient_loss | 0.0827 | -| std | 0.00976 | -| value_loss | 3.25e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15189 | -| time_elapsed | 81117 | -| total_timesteps | 1944192 | -| train/ | | -| approx_kl | 0.024096597 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | 0.00107 | -| n_updates | 151880 | -| policy_gradient_loss | 0.00413 | -| std | 0.00976 | -| value_loss | 0.000238 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15190 | -| time_elapsed | 81123 | -| total_timesteps | 1944320 | -| train/ | | -| approx_kl | 0.02359616 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 151890 | -| policy_gradient_loss | 0.0108 | -| std | 0.00976 | -| value_loss | 8.46e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15191 | -| time_elapsed | 81128 | -| total_timesteps | 1944448 | -| train/ | | -| approx_kl | 0.014264883 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 151900 | -| policy_gradient_loss | 0.00975 | -| std | 0.00975 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15192 | -| time_elapsed | 81133 | -| total_timesteps | 1944576 | -| train/ | | -| approx_kl | 0.0029909476 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 151910 | -| policy_gradient_loss | 0.02 | -| std | 0.00975 | -| value_loss | 1.04e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15193 | -| time_elapsed | 81139 | -| total_timesteps | 1944704 | -| train/ | | -| approx_kl | 0.042290017 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 151920 | -| policy_gradient_loss | 0.0158 | -| std | 0.00976 | -| value_loss | 2.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15194 | -| time_elapsed | 81145 | -| total_timesteps | 1944832 | -| train/ | | -| approx_kl | 0.17637604 | -| clip_fraction | 0.61 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00509 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 151930 | -| policy_gradient_loss | 0.0941 | -| std | 0.00976 | -| value_loss | 6.98e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15195 | -| time_elapsed | 81150 | -| total_timesteps | 1944960 | -| train/ | | -| approx_kl | 0.022744186 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 151940 | -| policy_gradient_loss | 0.00974 | -| std | 0.00976 | -| value_loss | 8.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15196 | -| time_elapsed | 81154 | -| total_timesteps | 1945088 | -| train/ | | -| approx_kl | 0.31603473 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 151950 | -| policy_gradient_loss | 0.0316 | -| std | 0.00976 | -| value_loss | 8.45e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15197 | -| time_elapsed | 81163 | -| total_timesteps | 1945216 | -| train/ | | -| approx_kl | 0.025735933 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.756 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 151960 | -| policy_gradient_loss | -0.00692 | -| std | 0.00976 | -| value_loss | 0.0065 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15198 | -| time_elapsed | 81169 | -| total_timesteps | 1945344 | -| train/ | | -| approx_kl | 0.058271732 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 151970 | -| policy_gradient_loss | 0.0508 | -| std | 0.0098 | -| value_loss | 0.00192 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15199 | -| time_elapsed | 81173 | -| total_timesteps | 1945472 | -| train/ | | -| approx_kl | 0.07373676 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 151980 | -| policy_gradient_loss | 0.000788 | -| std | 0.00982 | -| value_loss | 0.000794 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15200 | -| time_elapsed | 81178 | -| total_timesteps | 1945600 | -| train/ | | -| approx_kl | 0.016243473 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00867 | -| learning_rate | 0.0003 | -| loss | 0.00499 | -| n_updates | 151990 | -| policy_gradient_loss | 0.00434 | -| std | 0.00982 | -| value_loss | 0.000147 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15201 | -| time_elapsed | 81183 | -| total_timesteps | 1945728 | -| train/ | | -| approx_kl | 0.026255038 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0808 | -| learning_rate | 0.0003 | -| loss | 0.00776 | -| n_updates | 152000 | -| policy_gradient_loss | 0.00255 | -| std | 0.00983 | -| value_loss | 0.0001 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15202 | -| time_elapsed | 81188 | -| total_timesteps | 1945856 | -| train/ | | -| approx_kl | 0.01768475 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00221 | -| learning_rate | 0.0003 | -| loss | 0.00567 | -| n_updates | 152010 | -| policy_gradient_loss | 0.00283 | -| std | 0.00984 | -| value_loss | 1.66e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15203 | -| time_elapsed | 81193 | -| total_timesteps | 1945984 | -| train/ | | -| approx_kl | 0.0040964545 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.00988 | -| learning_rate | 0.0003 | -| loss | -0.00284 | -| n_updates | 152020 | -| policy_gradient_loss | 0.00141 | -| std | 0.00986 | -| value_loss | 3.11e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15204 | -| time_elapsed | 81198 | -| total_timesteps | 1946112 | -| train/ | | -| approx_kl | 0.01660844 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 152030 | -| policy_gradient_loss | 0.0576 | -| std | 0.00987 | -| value_loss | 1.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15205 | -| time_elapsed | 81210 | -| total_timesteps | 1946240 | -| train/ | | -| approx_kl | 0.054692414 | -| clip_fraction | 0.599 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | 0.0462 | -| n_updates | 152040 | -| policy_gradient_loss | 0.0816 | -| std | 0.00987 | -| value_loss | 0.00031 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15206 | -| time_elapsed | 81214 | -| total_timesteps | 1946368 | -| train/ | | -| approx_kl | 0.008663596 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.000435 | -| n_updates | 152050 | -| policy_gradient_loss | 0.00965 | -| std | 0.00987 | -| value_loss | 1.29e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15207 | -| time_elapsed | 81219 | -| total_timesteps | 1946496 | -| train/ | | -| approx_kl | 0.0004921723 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | -0.000305 | -| n_updates | 152060 | -| policy_gradient_loss | 0.00148 | -| std | 0.0099 | -| value_loss | 3.93e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15208 | -| time_elapsed | 81224 | -| total_timesteps | 1946624 | -| train/ | | -| approx_kl | 0.028371412 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00807 | -| learning_rate | 0.0003 | -| loss | 0.00364 | -| n_updates | 152070 | -| policy_gradient_loss | 0.00764 | -| std | 0.00992 | -| value_loss | 2.2e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15209 | -| time_elapsed | 81228 | -| total_timesteps | 1946752 | -| train/ | | -| approx_kl | 0.12659183 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.00848 | -| learning_rate | 0.0003 | -| loss | 0.000336 | -| n_updates | 152080 | -| policy_gradient_loss | -0.0138 | -| std | 0.00992 | -| value_loss | 1.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15210 | -| time_elapsed | 81233 | -| total_timesteps | 1946880 | -| train/ | | -| approx_kl | 0.046294786 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0064 | -| n_updates | 152090 | -| policy_gradient_loss | 0.0105 | -| std | 0.00992 | -| value_loss | 1.3e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15211 | -| time_elapsed | 81238 | -| total_timesteps | 1947008 | -| train/ | | -| approx_kl | 0.0023896755 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 152100 | -| policy_gradient_loss | 0.00198 | -| std | 0.00996 | -| value_loss | 0.000883 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15212 | -| time_elapsed | 81253 | -| total_timesteps | 1947136 | -| train/ | | -| approx_kl | 0.030894876 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.429 | -| learning_rate | 0.0003 | -| loss | -0.00965 | -| n_updates | 152110 | -| policy_gradient_loss | -0.00656 | -| std | 0.00999 | -| value_loss | 0.00294 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15213 | -| time_elapsed | 81259 | -| total_timesteps | 1947264 | -| train/ | | -| approx_kl | 0.03203041 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.535 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 152120 | -| policy_gradient_loss | 0.0382 | -| std | 0.00999 | -| value_loss | 2.8e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15214 | -| time_elapsed | 81264 | -| total_timesteps | 1947392 | -| train/ | | -| approx_kl | 0.0477364 | -| clip_fraction | 0.524 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.00527 | -| learning_rate | 0.0003 | -| loss | 0.0621 | -| n_updates | 152130 | -| policy_gradient_loss | 0.0612 | -| std | 0.01 | -| value_loss | 6.69e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15215 | -| time_elapsed | 81269 | -| total_timesteps | 1947520 | -| train/ | | -| approx_kl | 0.06398473 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 152140 | -| policy_gradient_loss | 0.0985 | -| std | 0.01 | -| value_loss | 6.23e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15216 | -| time_elapsed | 81275 | -| total_timesteps | 1947648 | -| train/ | | -| approx_kl | 0.011472459 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -4.05 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 152150 | -| policy_gradient_loss | 0.00792 | -| std | 0.01 | -| value_loss | 3.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15217 | -| time_elapsed | 81279 | -| total_timesteps | 1947776 | -| train/ | | -| approx_kl | 0.028856358 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -2.27 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 152160 | -| policy_gradient_loss | -0.000422 | -| std | 0.01 | -| value_loss | 2.13e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15218 | -| time_elapsed | 81284 | -| total_timesteps | 1947904 | -| train/ | | -| approx_kl | 0.32352924 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 152170 | -| policy_gradient_loss | 0.0206 | -| std | 0.01 | -| value_loss | 5.54e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15219 | -| time_elapsed | 81289 | -| total_timesteps | 1948032 | -| train/ | | -| approx_kl | 0.0015034643 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 152180 | -| policy_gradient_loss | -0.00232 | -| std | 0.01 | -| value_loss | 1.06e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15220 | -| time_elapsed | 81300 | -| total_timesteps | 1948160 | -| train/ | | -| approx_kl | 0.100257635 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | 0.869 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 152190 | -| policy_gradient_loss | -0.0136 | -| std | 0.01 | -| value_loss | 0.000508 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15221 | -| time_elapsed | 81306 | -| total_timesteps | 1948288 | -| train/ | | -| approx_kl | 0.1157319 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 152200 | -| policy_gradient_loss | -0.00922 | -| std | 0.01 | -| value_loss | 1.65e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15222 | -| time_elapsed | 81310 | -| total_timesteps | 1948416 | -| train/ | | -| approx_kl | 0.012292491 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 152210 | -| policy_gradient_loss | 0.0137 | -| std | 0.01 | -| value_loss | 2.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15223 | -| time_elapsed | 81316 | -| total_timesteps | 1948544 | -| train/ | | -| approx_kl | 0.020652184 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.498 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 152220 | -| policy_gradient_loss | -0.009 | -| std | 0.01 | -| value_loss | 1.4e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15224 | -| time_elapsed | 81320 | -| total_timesteps | 1948672 | -| train/ | | -| approx_kl | 0.0879849 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.0881 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 152230 | -| policy_gradient_loss | 0.00726 | -| std | 0.01 | -| value_loss | 5.5e-09 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15225 | -| time_elapsed | 81326 | -| total_timesteps | 1948800 | -| train/ | | -| approx_kl | 0.00022429228 | -| clip_fraction | 0.00234 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | -0.000361 | -| n_updates | 152240 | -| policy_gradient_loss | 6.03e-05 | -| std | 0.00997 | -| value_loss | 6.36e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15226 | -| time_elapsed | 81330 | -| total_timesteps | 1948928 | -| train/ | | -| approx_kl | 0.06302761 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.19 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 152250 | -| policy_gradient_loss | -0.00303 | -| std | 0.00992 | -| value_loss | 3.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15227 | -| time_elapsed | 81334 | -| total_timesteps | 1949056 | -| train/ | | -| approx_kl | 0.052343823 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.613 | -| learning_rate | 0.0003 | -| loss | 0.00463 | -| n_updates | 152260 | -| policy_gradient_loss | 0.0134 | -| std | 0.0099 | -| value_loss | 8.39e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15228 | -| time_elapsed | 81343 | -| total_timesteps | 1949184 | -| train/ | | -| approx_kl | 0.17709112 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.0899 | -| n_updates | 152270 | -| policy_gradient_loss | 0.0225 | -| std | 0.00989 | -| value_loss | 3.71e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15229 | -| time_elapsed | 81347 | -| total_timesteps | 1949312 | -| train/ | | -| approx_kl | 0.025191298 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 152280 | -| policy_gradient_loss | -0.00569 | -| std | 0.00989 | -| value_loss | 6.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15230 | -| time_elapsed | 81353 | -| total_timesteps | 1949440 | -| train/ | | -| approx_kl | 0.022900876 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.00747 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 152290 | -| policy_gradient_loss | -0.00522 | -| std | 0.00989 | -| value_loss | 1.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15231 | -| time_elapsed | 81358 | -| total_timesteps | 1949568 | -| train/ | | -| approx_kl | 0.01776753 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.000452 | -| n_updates | 152300 | -| policy_gradient_loss | 3.53e-05 | -| std | 0.00989 | -| value_loss | 5.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15232 | -| time_elapsed | 81362 | -| total_timesteps | 1949696 | -| train/ | | -| approx_kl | 0.022912076 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.00823 | -| n_updates | 152310 | -| policy_gradient_loss | 0.0041 | -| std | 0.00987 | -| value_loss | 4.23e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15233 | -| time_elapsed | 81367 | -| total_timesteps | 1949824 | -| train/ | | -| approx_kl | 1.6454142e-05 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.448 | -| learning_rate | 0.0003 | -| loss | -0.000885 | -| n_updates | 152320 | -| policy_gradient_loss | 0.00266 | -| std | 0.00985 | -| value_loss | 6.87e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15234 | -| time_elapsed | 81372 | -| total_timesteps | 1949952 | -| train/ | | -| approx_kl | 0.022444582 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.00973 | -| n_updates | 152330 | -| policy_gradient_loss | -0.00503 | -| std | 0.00983 | -| value_loss | 0.000119 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15235 | -| time_elapsed | 81379 | -| total_timesteps | 1950080 | -| train/ | | -| approx_kl | 0.047374967 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.00429 | -| n_updates | 152340 | -| policy_gradient_loss | 0.0168 | -| std | 0.00982 | -| value_loss | 2.14e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15236 | -| time_elapsed | 81386 | -| total_timesteps | 1950208 | -| train/ | | -| approx_kl | 0.44690472 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0813 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 152350 | -| policy_gradient_loss | 0.0295 | -| std | 0.00981 | -| value_loss | 0.00192 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15237 | -| time_elapsed | 81391 | -| total_timesteps | 1950336 | -| train/ | | -| approx_kl | 0.0074839843 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 152360 | -| policy_gradient_loss | 0.00862 | -| std | 0.00981 | -| value_loss | 3.12e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15238 | -| time_elapsed | 81397 | -| total_timesteps | 1950464 | -| train/ | | -| approx_kl | 0.04554091 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00192 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 152370 | -| policy_gradient_loss | 0.0144 | -| std | 0.00981 | -| value_loss | 3.07e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15239 | -| time_elapsed | 81401 | -| total_timesteps | 1950592 | -| train/ | | -| approx_kl | 0.259252 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.000399 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 152380 | -| policy_gradient_loss | 0.0326 | -| std | 0.00981 | -| value_loss | 1.52e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15240 | -| time_elapsed | 81404 | -| total_timesteps | 1950720 | -| train/ | | -| approx_kl | 0.020398745 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00495 | -| n_updates | 152390 | -| policy_gradient_loss | -0.000694 | -| std | 0.00981 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15241 | -| time_elapsed | 81409 | -| total_timesteps | 1950848 | -| train/ | | -| approx_kl | 0.026709344 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.00554 | -| n_updates | 152400 | -| policy_gradient_loss | 0.00202 | -| std | 0.00981 | -| value_loss | 8.58e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15242 | -| time_elapsed | 81414 | -| total_timesteps | 1950976 | -| train/ | | -| approx_kl | 0.004233891 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 152410 | -| policy_gradient_loss | 0.00186 | -| std | 0.0098 | -| value_loss | 5.31e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15243 | -| time_elapsed | 81418 | -| total_timesteps | 1951104 | -| train/ | | -| approx_kl | 0.03833186 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 152420 | -| policy_gradient_loss | 0.00614 | -| std | 0.0098 | -| value_loss | 6.73e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15244 | -| time_elapsed | 81428 | -| total_timesteps | 1951232 | -| train/ | | -| approx_kl | 0.050062127 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | 0.0013 | -| n_updates | 152430 | -| policy_gradient_loss | -0.000467 | -| std | 0.0098 | -| value_loss | 0.0017 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15245 | -| time_elapsed | 81434 | -| total_timesteps | 1951360 | -| train/ | | -| approx_kl | 0.00095145265 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00974 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 152440 | -| policy_gradient_loss | 0.00433 | -| std | 0.0098 | -| value_loss | 2.56e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15246 | -| time_elapsed | 81440 | -| total_timesteps | 1951488 | -| train/ | | -| approx_kl | 8.852687e-06 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.869 | -| learning_rate | 0.0003 | -| loss | 1.85e-05 | -| n_updates | 152450 | -| policy_gradient_loss | 0.00419 | -| std | 0.00981 | -| value_loss | 6.84e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15247 | -| time_elapsed | 81445 | -| total_timesteps | 1951616 | -| train/ | | -| approx_kl | 0.0026570144 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 152460 | -| policy_gradient_loss | 0.00451 | -| std | 0.0098 | -| value_loss | 5.63e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15248 | -| time_elapsed | 81448 | -| total_timesteps | 1951744 | -| train/ | | -| approx_kl | 0.015050809 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0965 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 152470 | -| policy_gradient_loss | 0.0183 | -| std | 0.0098 | -| value_loss | 3.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15249 | -| time_elapsed | 81453 | -| total_timesteps | 1951872 | -| train/ | | -| approx_kl | 0.06699584 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 152480 | -| policy_gradient_loss | 0.0309 | -| std | 0.0098 | -| value_loss | 1.44e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15250 | -| time_elapsed | 81457 | -| total_timesteps | 1952000 | -| train/ | | -| approx_kl | 0.0206476 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 152490 | -| policy_gradient_loss | 0.0153 | -| std | 0.0098 | -| value_loss | 8.3e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15251 | -| time_elapsed | 81463 | -| total_timesteps | 1952128 | -| train/ | | -| approx_kl | 0.33350676 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 152500 | -| policy_gradient_loss | 0.0872 | -| std | 0.0098 | -| value_loss | 4.07e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15252 | -| time_elapsed | 81475 | -| total_timesteps | 1952256 | -| train/ | | -| approx_kl | 0.009881081 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.0071 | -| n_updates | 152510 | -| policy_gradient_loss | -0.00184 | -| std | 0.00979 | -| value_loss | 8.66e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15253 | -| time_elapsed | 81481 | -| total_timesteps | 1952384 | -| train/ | | -| approx_kl | 0.0013661664 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 152520 | -| policy_gradient_loss | 0.00556 | -| std | 0.00979 | -| value_loss | 2.06e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15254 | -| time_elapsed | 81485 | -| total_timesteps | 1952512 | -| train/ | | -| approx_kl | 0.04852083 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 152530 | -| policy_gradient_loss | -0.00721 | -| std | 0.00979 | -| value_loss | 9.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15255 | -| time_elapsed | 81491 | -| total_timesteps | 1952640 | -| train/ | | -| approx_kl | 0.008952854 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.061 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 152540 | -| policy_gradient_loss | 0.000218 | -| std | 0.00979 | -| value_loss | 6.77e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15256 | -| time_elapsed | 81496 | -| total_timesteps | 1952768 | -| train/ | | -| approx_kl | 0.0033373842 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 152550 | -| policy_gradient_loss | 0.0091 | -| std | 0.00979 | -| value_loss | 4.2e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15257 | -| time_elapsed | 81501 | -| total_timesteps | 1952896 | -| train/ | | -| approx_kl | 0.0018761926 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | -0.00015 | -| n_updates | 152560 | -| policy_gradient_loss | 0.00459 | -| std | 0.00978 | -| value_loss | 3.78e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15258 | -| time_elapsed | 81506 | -| total_timesteps | 1953024 | -| train/ | | -| approx_kl | 0.030174235 | -| clip_fraction | 0.575 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00502 | -| learning_rate | 0.0003 | -| loss | 0.0374 | -| n_updates | 152570 | -| policy_gradient_loss | 0.0742 | -| std | 0.00977 | -| value_loss | 1.87e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15259 | -| time_elapsed | 81517 | -| total_timesteps | 1953152 | -| train/ | | -| approx_kl | 0.0004703179 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.857 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 152580 | -| policy_gradient_loss | -0.014 | -| std | 0.00976 | -| value_loss | 0.00261 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15260 | -| time_elapsed | 81521 | -| total_timesteps | 1953280 | -| train/ | | -| approx_kl | 0.008565461 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.0247 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 152590 | -| policy_gradient_loss | 0.00101 | -| std | 0.00975 | -| value_loss | 0.000209 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15261 | -| time_elapsed | 81527 | -| total_timesteps | 1953408 | -| train/ | | -| approx_kl | 0.033883296 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0901 | -| learning_rate | 0.0003 | -| loss | 0.0532 | -| n_updates | 152600 | -| policy_gradient_loss | 0.0719 | -| std | 0.00975 | -| value_loss | 9.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15262 | -| time_elapsed | 81531 | -| total_timesteps | 1953536 | -| train/ | | -| approx_kl | 0.04915484 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 152610 | -| policy_gradient_loss | 0.0689 | -| std | 0.00975 | -| value_loss | 0.00027 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15263 | -| time_elapsed | 81535 | -| total_timesteps | 1953664 | -| train/ | | -| approx_kl | 0.011634314 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 152620 | -| policy_gradient_loss | 0.00852 | -| std | 0.00975 | -| value_loss | 1.31e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15264 | -| time_elapsed | 81539 | -| total_timesteps | 1953792 | -| train/ | | -| approx_kl | 0.13405867 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00521 | -| learning_rate | 0.0003 | -| loss | 0.09 | -| n_updates | 152630 | -| policy_gradient_loss | 0.03 | -| std | 0.00975 | -| value_loss | 1.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15265 | -| time_elapsed | 81543 | -| total_timesteps | 1953920 | -| train/ | | -| approx_kl | 0.03977152 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 152640 | -| policy_gradient_loss | 0.00972 | -| std | 0.00976 | -| value_loss | 1.7e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15266 | -| time_elapsed | 81548 | -| total_timesteps | 1954048 | -| train/ | | -| approx_kl | 0.0072813174 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.000788 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 152650 | -| policy_gradient_loss | 0.000404 | -| std | 0.00977 | -| value_loss | 3.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15267 | -| time_elapsed | 81559 | -| total_timesteps | 1954176 | -| train/ | | -| approx_kl | 0.017261896 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 152660 | -| policy_gradient_loss | 0.0842 | -| std | 0.0098 | -| value_loss | 0.000317 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15268 | -| time_elapsed | 81564 | -| total_timesteps | 1954304 | -| train/ | | -| approx_kl | 0.07737653 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.362 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 152670 | -| policy_gradient_loss | -0.00308 | -| std | 0.00981 | -| value_loss | 2.26e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15269 | -| time_elapsed | 81570 | -| total_timesteps | 1954432 | -| train/ | | -| approx_kl | 0.09408274 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.0056 | -| learning_rate | 0.0003 | -| loss | 0.085 | -| n_updates | 152680 | -| policy_gradient_loss | 0.0167 | -| std | 0.00981 | -| value_loss | 2.49e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15270 | -| time_elapsed | 81574 | -| total_timesteps | 1954560 | -| train/ | | -| approx_kl | 0.24205303 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.0661 | -| n_updates | 152690 | -| policy_gradient_loss | 0.0191 | -| std | 0.00981 | -| value_loss | 1.96e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15271 | -| time_elapsed | 81580 | -| total_timesteps | 1954688 | -| train/ | | -| approx_kl | 0.005114699 | -| clip_fraction | 0.0656 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 152700 | -| policy_gradient_loss | -0.000295 | -| std | 0.00981 | -| value_loss | 1.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15272 | -| time_elapsed | 81585 | -| total_timesteps | 1954816 | -| train/ | | -| approx_kl | 0.020097744 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | -0.00982 | -| n_updates | 152710 | -| policy_gradient_loss | 0.00204 | -| std | 0.0098 | -| value_loss | 7.3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15273 | -| time_elapsed | 81591 | -| total_timesteps | 1954944 | -| train/ | | -| approx_kl | 0.03575271 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 152720 | -| policy_gradient_loss | 0.0741 | -| std | 0.0098 | -| value_loss | 4.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15274 | -| time_elapsed | 81595 | -| total_timesteps | 1955072 | -| train/ | | -| approx_kl | 0.007086153 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.000427 | -| n_updates | 152730 | -| policy_gradient_loss | 0.00683 | -| std | 0.0098 | -| value_loss | 7.8e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15275 | -| time_elapsed | 81606 | -| total_timesteps | 1955200 | -| train/ | | -| approx_kl | 0.0011303299 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 152740 | -| policy_gradient_loss | -0.0108 | -| std | 0.0098 | -| value_loss | 0.000921 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15276 | -| time_elapsed | 81611 | -| total_timesteps | 1955328 | -| train/ | | -| approx_kl | 0.022647196 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00327 | -| learning_rate | 0.0003 | -| loss | 0.00778 | -| n_updates | 152750 | -| policy_gradient_loss | 0.0297 | -| std | 0.00979 | -| value_loss | 1.98e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15277 | -| time_elapsed | 81615 | -| total_timesteps | 1955456 | -| train/ | | -| approx_kl | 0.0899535 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | 0.0524 | -| n_updates | 152760 | -| policy_gradient_loss | 0.0213 | -| std | 0.00979 | -| value_loss | 1.07e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15278 | -| time_elapsed | 81620 | -| total_timesteps | 1955584 | -| train/ | | -| approx_kl | 0.0017260322 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 152770 | -| policy_gradient_loss | 0.00499 | -| std | 0.0098 | -| value_loss | 7.55e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15279 | -| time_elapsed | 81624 | -| total_timesteps | 1955712 | -| train/ | | -| approx_kl | 8.753035e-06 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.000211 | -| n_updates | 152780 | -| policy_gradient_loss | 0.00176 | -| std | 0.0098 | -| value_loss | 4.65e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15280 | -| time_elapsed | 81630 | -| total_timesteps | 1955840 | -| train/ | | -| approx_kl | 0.0001361128 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | -0.000453 | -| n_updates | 152790 | -| policy_gradient_loss | 0.00311 | -| std | 0.00979 | -| value_loss | 2.99e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15281 | -| time_elapsed | 81633 | -| total_timesteps | 1955968 | -| train/ | | -| approx_kl | 0.032608934 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 152800 | -| policy_gradient_loss | 0.0367 | -| std | 0.00979 | -| value_loss | 2.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15282 | -| time_elapsed | 81638 | -| total_timesteps | 1956096 | -| train/ | | -| approx_kl | 0.10805705 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.0478 | -| n_updates | 152810 | -| policy_gradient_loss | 0.0206 | -| std | 0.00979 | -| value_loss | 1.8e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15283 | -| time_elapsed | 81649 | -| total_timesteps | 1956224 | -| train/ | | -| approx_kl | 0.06788451 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 152820 | -| policy_gradient_loss | -0.0157 | -| std | 0.00979 | -| value_loss | 0.000411 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15284 | -| time_elapsed | 81654 | -| total_timesteps | 1956352 | -| train/ | | -| approx_kl | 0.054567724 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 152830 | -| policy_gradient_loss | 0.0239 | -| std | 0.00978 | -| value_loss | 4.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15285 | -| time_elapsed | 81659 | -| total_timesteps | 1956480 | -| train/ | | -| approx_kl | 0.016457116 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | 0.00437 | -| n_updates | 152840 | -| policy_gradient_loss | 0.0099 | -| std | 0.00978 | -| value_loss | 2.37e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15286 | -| time_elapsed | 81665 | -| total_timesteps | 1956608 | -| train/ | | -| approx_kl | 0.014915477 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 152850 | -| policy_gradient_loss | 0.0147 | -| std | 0.00978 | -| value_loss | 8.22e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15287 | -| time_elapsed | 81670 | -| total_timesteps | 1956736 | -| train/ | | -| approx_kl | 0.12510961 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.0594 | -| n_updates | 152860 | -| policy_gradient_loss | 0.0297 | -| std | 0.00978 | -| value_loss | 4.27e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15288 | -| time_elapsed | 81676 | -| total_timesteps | 1956864 | -| train/ | | -| approx_kl | 0.022437666 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00683 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 152870 | -| policy_gradient_loss | 0.0355 | -| std | 0.00979 | -| value_loss | 2.27e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 15289 | -| time_elapsed | 81680 | -| total_timesteps | 1956992 | -| train/ | | -| approx_kl | 0.116772205 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00768 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 152880 | -| policy_gradient_loss | 0.018 | -| std | 0.00979 | -| value_loss | 1.75e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15290 | -| time_elapsed | 81686 | -| total_timesteps | 1957120 | -| train/ | | -| approx_kl | 0.00039991876 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.000899 | -| n_updates | 152890 | -| policy_gradient_loss | 0.00278 | -| std | 0.00978 | -| value_loss | 1.1e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15291 | -| time_elapsed | 81700 | -| total_timesteps | 1957248 | -| train/ | | -| approx_kl | 0.03276811 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | 0.00404 | -| n_updates | 152900 | -| policy_gradient_loss | 0.0182 | -| std | 0.00978 | -| value_loss | 0.000441 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15292 | -| time_elapsed | 81706 | -| total_timesteps | 1957376 | -| train/ | | -| approx_kl | 0.021283787 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | -0.00686 | -| n_updates | 152910 | -| policy_gradient_loss | 0.00755 | -| std | 0.00978 | -| value_loss | 1.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15293 | -| time_elapsed | 81710 | -| total_timesteps | 1957504 | -| train/ | | -| approx_kl | 0.14643501 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 152920 | -| policy_gradient_loss | 0.0102 | -| std | 0.00978 | -| value_loss | 2.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15294 | -| time_elapsed | 81714 | -| total_timesteps | 1957632 | -| train/ | | -| approx_kl | 0.030222196 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0542 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 152930 | -| policy_gradient_loss | 0.0311 | -| std | 0.00978 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15295 | -| time_elapsed | 81719 | -| total_timesteps | 1957760 | -| train/ | | -| approx_kl | 5.848706e-07 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | -6.05e-05 | -| n_updates | 152940 | -| policy_gradient_loss | 0.0548 | -| std | 0.00978 | -| value_loss | 8.73e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15296 | -| time_elapsed | 81725 | -| total_timesteps | 1957888 | -| train/ | | -| approx_kl | 0.0099400915 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 152950 | -| policy_gradient_loss | 0.0214 | -| std | 0.00979 | -| value_loss | 1.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15297 | -| time_elapsed | 81729 | -| total_timesteps | 1958016 | -| train/ | | -| approx_kl | 0.13846424 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.285 | -| learning_rate | 0.0003 | -| loss | 0.0876 | -| n_updates | 152960 | -| policy_gradient_loss | 0.0817 | -| std | 0.0098 | -| value_loss | 4.83e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15298 | -| time_elapsed | 81740 | -| total_timesteps | 1958144 | -| train/ | | -| approx_kl | 0.1492756 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | 0.0565 | -| n_updates | 152970 | -| policy_gradient_loss | 0.059 | -| std | 0.0098 | -| value_loss | 0.0004 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15299 | -| time_elapsed | 81744 | -| total_timesteps | 1958272 | -| train/ | | -| approx_kl | 0.12544659 | -| clip_fraction | 0.608 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00573 | -| learning_rate | 0.0003 | -| loss | 0.055 | -| n_updates | 152980 | -| policy_gradient_loss | 0.0469 | -| std | 0.00981 | -| value_loss | 8.94e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15300 | -| time_elapsed | 81749 | -| total_timesteps | 1958400 | -| train/ | | -| approx_kl | 0.02446749 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.0068 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 152990 | -| policy_gradient_loss | 0.0113 | -| std | 0.00981 | -| value_loss | 2.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15301 | -| time_elapsed | 81753 | -| total_timesteps | 1958528 | -| train/ | | -| approx_kl | 0.06732023 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 153000 | -| policy_gradient_loss | 0.00936 | -| std | 0.00981 | -| value_loss | 1.19e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15302 | -| time_elapsed | 81756 | -| total_timesteps | 1958656 | -| train/ | | -| approx_kl | 0.0064578485 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 153010 | -| policy_gradient_loss | 0.000515 | -| std | 0.00982 | -| value_loss | 8.46e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15303 | -| time_elapsed | 81760 | -| total_timesteps | 1958784 | -| train/ | | -| approx_kl | 0.07657004 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 153020 | -| policy_gradient_loss | 0.0166 | -| std | 0.00982 | -| value_loss | 4.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 15304 | -| time_elapsed | 81764 | -| total_timesteps | 1958912 | -| train/ | | -| approx_kl | 0.025877051 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 153030 | -| policy_gradient_loss | 0.0144 | -| std | 0.00981 | -| value_loss | 1.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15305 | -| time_elapsed | 81769 | -| total_timesteps | 1959040 | -| train/ | | -| approx_kl | 0.06432157 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 153040 | -| policy_gradient_loss | 0.0238 | -| std | 0.00981 | -| value_loss | 8.84e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15306 | -| time_elapsed | 81778 | -| total_timesteps | 1959168 | -| train/ | | -| approx_kl | 0.0011858363 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 153050 | -| policy_gradient_loss | -0.00852 | -| std | 0.00981 | -| value_loss | 0.00339 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15307 | -| time_elapsed | 81784 | -| total_timesteps | 1959296 | -| train/ | | -| approx_kl | 0.039464984 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 153060 | -| policy_gradient_loss | -0.0128 | -| std | 0.00981 | -| value_loss | 3.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15308 | -| time_elapsed | 81790 | -| total_timesteps | 1959424 | -| train/ | | -| approx_kl | 0.055612043 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | 0.0607 | -| n_updates | 153070 | -| policy_gradient_loss | 0.0757 | -| std | 0.0098 | -| value_loss | 2.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15309 | -| time_elapsed | 81795 | -| total_timesteps | 1959552 | -| train/ | | -| approx_kl | 0.061445795 | -| clip_fraction | 0.607 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 153080 | -| policy_gradient_loss | 0.0625 | -| std | 0.0098 | -| value_loss | 1.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15310 | -| time_elapsed | 81801 | -| total_timesteps | 1959680 | -| train/ | | -| approx_kl | 0.011202317 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.00496 | -| n_updates | 153090 | -| policy_gradient_loss | 0.011 | -| std | 0.00981 | -| value_loss | 3.34e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15311 | -| time_elapsed | 81806 | -| total_timesteps | 1959808 | -| train/ | | -| approx_kl | 0.2910251 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.0943 | -| n_updates | 153100 | -| policy_gradient_loss | 0.0309 | -| std | 0.00982 | -| value_loss | 6.66e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 15312 | -| time_elapsed | 81811 | -| total_timesteps | 1959936 | -| train/ | | -| approx_kl | 0.00027914112 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 153110 | -| policy_gradient_loss | -0.00125 | -| std | 0.00982 | -| value_loss | 3.73e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15313 | -| time_elapsed | 81817 | -| total_timesteps | 1960064 | -| train/ | | -| approx_kl | 0.024167709 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | -0.0094 | -| n_updates | 153120 | -| policy_gradient_loss | -0.00444 | -| std | 0.00982 | -| value_loss | 2.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15314 | -| time_elapsed | 81828 | -| total_timesteps | 1960192 | -| train/ | | -| approx_kl | 0.0031266944 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.2 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 153130 | -| policy_gradient_loss | -0.00317 | -| std | 0.00981 | -| value_loss | 0.000593 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15315 | -| time_elapsed | 81833 | -| total_timesteps | 1960320 | -| train/ | | -| approx_kl | 0.0012392984 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00302 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 153140 | -| policy_gradient_loss | -0.00324 | -| std | 0.00981 | -| value_loss | 4.76e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15316 | -| time_elapsed | 81838 | -| total_timesteps | 1960448 | -| train/ | | -| approx_kl | 0.0062393467 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 153150 | -| policy_gradient_loss | -0.00206 | -| std | 0.0098 | -| value_loss | 7.37e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15317 | -| time_elapsed | 81843 | -| total_timesteps | 1960576 | -| train/ | | -| approx_kl | 0.014035832 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.452 | -| learning_rate | 0.0003 | -| loss | 0.00421 | -| n_updates | 153160 | -| policy_gradient_loss | 0.0551 | -| std | 0.0098 | -| value_loss | 5.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15318 | -| time_elapsed | 81849 | -| total_timesteps | 1960704 | -| train/ | | -| approx_kl | 0.046941817 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 153170 | -| policy_gradient_loss | 0.0875 | -| std | 0.0098 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15319 | -| time_elapsed | 81853 | -| total_timesteps | 1960832 | -| train/ | | -| approx_kl | 0.011046906 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | -0.000509 | -| n_updates | 153180 | -| policy_gradient_loss | 0.014 | -| std | 0.0098 | -| value_loss | 6.98e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 15320 | -| time_elapsed | 81857 | -| total_timesteps | 1960960 | -| train/ | | -| approx_kl | 0.19315572 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.0625 | -| n_updates | 153190 | -| policy_gradient_loss | 0.0206 | -| std | 0.0098 | -| value_loss | 3.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15321 | -| time_elapsed | 81862 | -| total_timesteps | 1961088 | -| train/ | | -| approx_kl | 0.019486709 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | 0.000782 | -| n_updates | 153200 | -| policy_gradient_loss | 0.000586 | -| std | 0.0098 | -| value_loss | 1.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15322 | -| time_elapsed | 81871 | -| total_timesteps | 1961216 | -| train/ | | -| approx_kl | 0.0045444267 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.283 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 153210 | -| policy_gradient_loss | -0.008 | -| std | 0.0098 | -| value_loss | 0.00181 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15323 | -| time_elapsed | 81875 | -| total_timesteps | 1961344 | -| train/ | | -| approx_kl | 0.071285225 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -25.4 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 153220 | -| policy_gradient_loss | 0.0121 | -| std | 0.0098 | -| value_loss | 2.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15324 | -| time_elapsed | 81880 | -| total_timesteps | 1961472 | -| train/ | | -| approx_kl | 0.009813651 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -2.17 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 153230 | -| policy_gradient_loss | -0.00323 | -| std | 0.0098 | -| value_loss | 5.6e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15325 | -| time_elapsed | 81885 | -| total_timesteps | 1961600 | -| train/ | | -| approx_kl | 0.00034063216 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0535 | -| learning_rate | 0.0003 | -| loss | -0.000164 | -| n_updates | 153240 | -| policy_gradient_loss | 0.00429 | -| std | 0.00978 | -| value_loss | 1.97e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15326 | -| time_elapsed | 81890 | -| total_timesteps | 1961728 | -| train/ | | -| approx_kl | 0.037997745 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0877 | -| learning_rate | 0.0003 | -| loss | 0.00411 | -| n_updates | 153250 | -| policy_gradient_loss | -0.0012 | -| std | 0.00976 | -| value_loss | 8.6e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15327 | -| time_elapsed | 81895 | -| total_timesteps | 1961856 | -| train/ | | -| approx_kl | 0.16122994 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | 0.0417 | -| n_updates | 153260 | -| policy_gradient_loss | -0.00194 | -| std | 0.00975 | -| value_loss | 1.41e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 15328 | -| time_elapsed | 81900 | -| total_timesteps | 1961984 | -| train/ | | -| approx_kl | 0.09909745 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -27.8 | -| learning_rate | 0.0003 | -| loss | 0.0035 | -| n_updates | 153270 | -| policy_gradient_loss | -0.000133 | -| std | 0.00974 | -| value_loss | 2.58e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15329 | -| time_elapsed | 81905 | -| total_timesteps | 1962112 | -| train/ | | -| approx_kl | 0.03431137 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.00763 | -| n_updates | 153280 | -| policy_gradient_loss | 0.0103 | -| std | 0.00974 | -| value_loss | 6.23e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15330 | -| time_elapsed | 81917 | -| total_timesteps | 1962240 | -| train/ | | -| approx_kl | 0.005857982 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -4.58 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 153290 | -| policy_gradient_loss | -0.0145 | -| std | 0.00974 | -| value_loss | 0.00404 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15331 | -| time_elapsed | 81922 | -| total_timesteps | 1962368 | -| train/ | | -| approx_kl | 0.014779674 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.00687 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 153300 | -| policy_gradient_loss | 0.0127 | -| std | 0.00974 | -| value_loss | 2.8e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15332 | -| time_elapsed | 81926 | -| total_timesteps | 1962496 | -| train/ | | -| approx_kl | 0.00030706404 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.0028 | -| n_updates | 153310 | -| policy_gradient_loss | 0.000551 | -| std | 0.00974 | -| value_loss | 8.84e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15333 | -| time_elapsed | 81930 | -| total_timesteps | 1962624 | -| train/ | | -| approx_kl | 0.07065641 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0909 | -| n_updates | 153320 | -| policy_gradient_loss | 0.0633 | -| std | 0.00973 | -| value_loss | 5.85e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15334 | -| time_elapsed | 81934 | -| total_timesteps | 1962752 | -| train/ | | -| approx_kl | 0.0680733 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 153330 | -| policy_gradient_loss | 0.076 | -| std | 0.00973 | -| value_loss | 3.42e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 15335 | -| time_elapsed | 81939 | -| total_timesteps | 1962880 | -| train/ | | -| approx_kl | 0.05404382 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.047 | -| n_updates | 153340 | -| policy_gradient_loss | 0.0506 | -| std | 0.00973 | -| value_loss | 2.69e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15336 | -| time_elapsed | 81944 | -| total_timesteps | 1963008 | -| train/ | | -| approx_kl | 0.05678058 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0447 | -| n_updates | 153350 | -| policy_gradient_loss | 0.0408 | -| std | 0.00974 | -| value_loss | 1.75e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15337 | -| time_elapsed | 81956 | -| total_timesteps | 1963136 | -| train/ | | -| approx_kl | 0.12382402 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.00209 | -| n_updates | 153360 | -| policy_gradient_loss | 0.00357 | -| std | 0.00974 | -| value_loss | 0.00205 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15338 | -| time_elapsed | 81962 | -| total_timesteps | 1963264 | -| train/ | | -| approx_kl | 0.048675105 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.478 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 153370 | -| policy_gradient_loss | 0.0094 | -| std | 0.00974 | -| value_loss | 2.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15339 | -| time_elapsed | 81968 | -| total_timesteps | 1963392 | -| train/ | | -| approx_kl | 0.06791773 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0957 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 153380 | -| policy_gradient_loss | 0.0161 | -| std | 0.00975 | -| value_loss | 3.66e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15340 | -| time_elapsed | 81973 | -| total_timesteps | 1963520 | -| train/ | | -| approx_kl | 0.16087238 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 153390 | -| policy_gradient_loss | 0.109 | -| std | 0.00975 | -| value_loss | 2.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15341 | -| time_elapsed | 81979 | -| total_timesteps | 1963648 | -| train/ | | -| approx_kl | 0.023798168 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 153400 | -| policy_gradient_loss | 0.0024 | -| std | 0.00975 | -| value_loss | 2.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15342 | -| time_elapsed | 81984 | -| total_timesteps | 1963776 | -| train/ | | -| approx_kl | 0.27444375 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 153410 | -| policy_gradient_loss | 0.0269 | -| std | 0.00975 | -| value_loss | 1.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15343 | -| time_elapsed | 81989 | -| total_timesteps | 1963904 | -| train/ | | -| approx_kl | 0.019093951 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 153420 | -| policy_gradient_loss | -0.000228 | -| std | 0.00976 | -| value_loss | 8.71e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15344 | -| time_elapsed | 81995 | -| total_timesteps | 1964032 | -| train/ | | -| approx_kl | 1.2761448e-05 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.000236 | -| n_updates | 153430 | -| policy_gradient_loss | 0.000681 | -| std | 0.00976 | -| value_loss | 5.76e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15345 | -| time_elapsed | 82005 | -| total_timesteps | 1964160 | -| train/ | | -| approx_kl | 0.029882254 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.000719 | -| n_updates | 153440 | -| policy_gradient_loss | -0.00543 | -| std | 0.00977 | -| value_loss | 4.34e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15346 | -| time_elapsed | 82009 | -| total_timesteps | 1964288 | -| train/ | | -| approx_kl | 0.0018376219 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -7.07 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 153450 | -| policy_gradient_loss | -0.0106 | -| std | 0.00977 | -| value_loss | 2.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15347 | -| time_elapsed | 82014 | -| total_timesteps | 1964416 | -| train/ | | -| approx_kl | 0.040843587 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 153460 | -| policy_gradient_loss | 0.0342 | -| std | 0.00977 | -| value_loss | 2.25e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15348 | -| time_elapsed | 82018 | -| total_timesteps | 1964544 | -| train/ | | -| approx_kl | 0.09795633 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.525 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 153470 | -| policy_gradient_loss | 0.015 | -| std | 0.00977 | -| value_loss | 8.61e-10 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15349 | -| time_elapsed | 82023 | -| total_timesteps | 1964672 | -| train/ | | -| approx_kl | 0.00060969964 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0923 | -| learning_rate | 0.0003 | -| loss | -0.000647 | -| n_updates | 153480 | -| policy_gradient_loss | 0.00426 | -| std | 0.00977 | -| value_loss | 4.69e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15350 | -| time_elapsed | 82029 | -| total_timesteps | 1964800 | -| train/ | | -| approx_kl | 0.035116136 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 153490 | -| policy_gradient_loss | 0.033 | -| std | 0.00977 | -| value_loss | 1.09e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15351 | -| time_elapsed | 82034 | -| total_timesteps | 1964928 | -| train/ | | -| approx_kl | 0.01189615 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.00455 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 153500 | -| policy_gradient_loss | 0.000726 | -| std | 0.00977 | -| value_loss | 3.62e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15352 | -| time_elapsed | 82039 | -| total_timesteps | 1965056 | -| train/ | | -| approx_kl | 0.08944024 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0483 | -| n_updates | 153510 | -| policy_gradient_loss | 0.00613 | -| std | 0.00977 | -| value_loss | 1.81e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15353 | -| time_elapsed | 82049 | -| total_timesteps | 1965184 | -| train/ | | -| approx_kl | 0.15565085 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 153520 | -| policy_gradient_loss | 0.00886 | -| std | 0.00976 | -| value_loss | 0.00311 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15354 | -| time_elapsed | 82054 | -| total_timesteps | 1965312 | -| train/ | | -| approx_kl | 0.024108123 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.21 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 153530 | -| policy_gradient_loss | 0.00405 | -| std | 0.00971 | -| value_loss | 5.59e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15355 | -| time_elapsed | 82058 | -| total_timesteps | 1965440 | -| train/ | | -| approx_kl | 0.0042610182 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.0054 | -| learning_rate | 0.0003 | -| loss | -0.00391 | -| n_updates | 153540 | -| policy_gradient_loss | 0.00633 | -| std | 0.00968 | -| value_loss | 0.000338 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15356 | -| time_elapsed | 82064 | -| total_timesteps | 1965568 | -| train/ | | -| approx_kl | 0.03963112 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.00185 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 153550 | -| policy_gradient_loss | 0.0397 | -| std | 0.00967 | -| value_loss | 5.13e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15357 | -| time_elapsed | 82069 | -| total_timesteps | 1965696 | -| train/ | | -| approx_kl | 0.0133366035 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 153560 | -| policy_gradient_loss | 0.00212 | -| std | 0.00967 | -| value_loss | 3.24e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15358 | -| time_elapsed | 82074 | -| total_timesteps | 1965824 | -| train/ | | -| approx_kl | 0.0148606 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 153570 | -| policy_gradient_loss | 0.0216 | -| std | 0.00967 | -| value_loss | 2.64e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15359 | -| time_elapsed | 82080 | -| total_timesteps | 1965952 | -| train/ | | -| approx_kl | 0.040695406 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.000743 | -| n_updates | 153580 | -| policy_gradient_loss | -0.00242 | -| std | 0.00967 | -| value_loss | 1.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15360 | -| time_elapsed | 82084 | -| total_timesteps | 1966080 | -| train/ | | -| approx_kl | 0.005828827 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.000205 | -| n_updates | 153590 | -| policy_gradient_loss | 0.0364 | -| std | 0.00967 | -| value_loss | 1.19e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15361 | -| time_elapsed | 82092 | -| total_timesteps | 1966208 | -| train/ | | -| approx_kl | 0.0012075659 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.00647 | -| n_updates | 153600 | -| policy_gradient_loss | 0.000522 | -| std | 0.00967 | -| value_loss | 0.000621 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15362 | -| time_elapsed | 82097 | -| total_timesteps | 1966336 | -| train/ | | -| approx_kl | 0.009849152 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 153610 | -| policy_gradient_loss | 0.0132 | -| std | 0.00967 | -| value_loss | 6.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15363 | -| time_elapsed | 82102 | -| total_timesteps | 1966464 | -| train/ | | -| approx_kl | 0.04631635 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 153620 | -| policy_gradient_loss | 0.0112 | -| std | 0.00967 | -| value_loss | 6.06e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15364 | -| time_elapsed | 82107 | -| total_timesteps | 1966592 | -| train/ | | -| approx_kl | 0.24616708 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.00569 | -| learning_rate | 0.0003 | -| loss | 0.0811 | -| n_updates | 153630 | -| policy_gradient_loss | 0.0222 | -| std | 0.00967 | -| value_loss | 4.26e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15365 | -| time_elapsed | 82111 | -| total_timesteps | 1966720 | -| train/ | | -| approx_kl | 3.6813784e-05 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 153640 | -| policy_gradient_loss | -0.00978 | -| std | 0.00967 | -| value_loss | 9.59e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15366 | -| time_elapsed | 82116 | -| total_timesteps | 1966848 | -| train/ | | -| approx_kl | 0.009087919 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 153650 | -| policy_gradient_loss | -0.000213 | -| std | 0.00967 | -| value_loss | 8.2e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15367 | -| time_elapsed | 82120 | -| total_timesteps | 1966976 | -| train/ | | -| approx_kl | 0.027706077 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 153660 | -| policy_gradient_loss | 0.00421 | -| std | 0.00967 | -| value_loss | 5.23e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15368 | -| time_elapsed | 82125 | -| total_timesteps | 1967104 | -| train/ | | -| approx_kl | 0.00024672644 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.00476 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 153670 | -| policy_gradient_loss | -0.00666 | -| std | 0.00967 | -| value_loss | 3.79e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15369 | -| time_elapsed | 82136 | -| total_timesteps | 1967232 | -| train/ | | -| approx_kl | 0.071748115 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 153680 | -| policy_gradient_loss | -0.00069 | -| std | 0.00966 | -| value_loss | 1.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15370 | -| time_elapsed | 82141 | -| total_timesteps | 1967360 | -| train/ | | -| approx_kl | 0.006419485 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 8.25e-05 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 153690 | -| policy_gradient_loss | 0.0191 | -| std | 0.00965 | -| value_loss | 3.33e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15371 | -| time_elapsed | 82146 | -| total_timesteps | 1967488 | -| train/ | | -| approx_kl | 0.0675354 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0699 | -| n_updates | 153700 | -| policy_gradient_loss | 0.0283 | -| std | 0.00965 | -| value_loss | 2.41e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15372 | -| time_elapsed | 82150 | -| total_timesteps | 1967616 | -| train/ | | -| approx_kl | 0.10292944 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 153710 | -| policy_gradient_loss | 0.0203 | -| std | 0.00965 | -| value_loss | 1.43e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15373 | -| time_elapsed | 82155 | -| total_timesteps | 1967744 | -| train/ | | -| approx_kl | 0.0004387903 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.000122 | -| n_updates | 153720 | -| policy_gradient_loss | 0.0118 | -| std | 0.00964 | -| value_loss | 4.31e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15374 | -| time_elapsed | 82161 | -| total_timesteps | 1967872 | -| train/ | | -| approx_kl | 0.028625231 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.0654 | -| n_updates | 153730 | -| policy_gradient_loss | -0.00694 | -| std | 0.00963 | -| value_loss | 2.58e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15375 | -| time_elapsed | 82165 | -| total_timesteps | 1968000 | -| train/ | | -| approx_kl | 0.0003709728 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.00204 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 153740 | -| policy_gradient_loss | 0.0091 | -| std | 0.00963 | -| value_loss | 4.31e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15376 | -| time_elapsed | 82170 | -| total_timesteps | 1968128 | -| train/ | | -| approx_kl | 0.016318843 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.00512 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 153750 | -| policy_gradient_loss | -0.00281 | -| std | 0.00963 | -| value_loss | 1.49e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15377 | -| time_elapsed | 82181 | -| total_timesteps | 1968256 | -| train/ | | -| approx_kl | 0.09653849 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 153760 | -| policy_gradient_loss | 0.0223 | -| std | 0.00963 | -| value_loss | 0.000616 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15378 | -| time_elapsed | 82186 | -| total_timesteps | 1968384 | -| train/ | | -| approx_kl | 0.12023428 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0609 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 153770 | -| policy_gradient_loss | 0.0763 | -| std | 0.00963 | -| value_loss | 2.45e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15379 | -| time_elapsed | 82192 | -| total_timesteps | 1968512 | -| train/ | | -| approx_kl | 0.08035983 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.00672 | -| learning_rate | 0.0003 | -| loss | 0.0817 | -| n_updates | 153780 | -| policy_gradient_loss | 0.0877 | -| std | 0.00963 | -| value_loss | 4.18e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15380 | -| time_elapsed | 82197 | -| total_timesteps | 1968640 | -| train/ | | -| approx_kl | 0.01729578 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.00549 | -| n_updates | 153790 | -| policy_gradient_loss | 0.0111 | -| std | 0.00963 | -| value_loss | 3.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15381 | -| time_elapsed | 82202 | -| total_timesteps | 1968768 | -| train/ | | -| approx_kl | 0.22207919 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.0984 | -| n_updates | 153800 | -| policy_gradient_loss | 0.0258 | -| std | 0.00963 | -| value_loss | 7.41e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15382 | -| time_elapsed | 82207 | -| total_timesteps | 1968896 | -| train/ | | -| approx_kl | 0.021974226 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 153810 | -| policy_gradient_loss | 0.00123 | -| std | 0.00963 | -| value_loss | 4.99e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15383 | -| time_elapsed | 82212 | -| total_timesteps | 1969024 | -| train/ | | -| approx_kl | 0.0033704578 | -| clip_fraction | 0.0766 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | -0.000779 | -| n_updates | 153820 | -| policy_gradient_loss | 0.00195 | -| std | 0.00963 | -| value_loss | 3.77e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15384 | -| time_elapsed | 82222 | -| total_timesteps | 1969152 | -| train/ | | -| approx_kl | 0.06074404 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | 0.00653 | -| n_updates | 153830 | -| policy_gradient_loss | 0.00667 | -| std | 0.00963 | -| value_loss | 0.00293 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15385 | -| time_elapsed | 82227 | -| total_timesteps | 1969280 | -| train/ | | -| approx_kl | 0.103707395 | -| clip_fraction | 0.599 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.0635 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 153840 | -| policy_gradient_loss | 0.0511 | -| std | 0.00963 | -| value_loss | 3.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15386 | -| time_elapsed | 82231 | -| total_timesteps | 1969408 | -| train/ | | -| approx_kl | 0.024449296 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.00475 | -| n_updates | 153850 | -| policy_gradient_loss | 0.0159 | -| std | 0.00963 | -| value_loss | 2.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15387 | -| time_elapsed | 82235 | -| total_timesteps | 1969536 | -| train/ | | -| approx_kl | 0.024453823 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 153860 | -| policy_gradient_loss | 0.00624 | -| std | 0.00963 | -| value_loss | 2.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15388 | -| time_elapsed | 82242 | -| total_timesteps | 1969664 | -| train/ | | -| approx_kl | 0.11880827 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 153870 | -| policy_gradient_loss | 0.00831 | -| std | 0.00963 | -| value_loss | 1.69e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15389 | -| time_elapsed | 82247 | -| total_timesteps | 1969792 | -| train/ | | -| approx_kl | 0.038068127 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 153880 | -| policy_gradient_loss | 0.0178 | -| std | 0.00963 | -| value_loss | 7.29e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15390 | -| time_elapsed | 82252 | -| total_timesteps | 1969920 | -| train/ | | -| approx_kl | 0.07190843 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 153890 | -| policy_gradient_loss | 0.0181 | -| std | 0.00963 | -| value_loss | 1.54e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15391 | -| time_elapsed | 82257 | -| total_timesteps | 1970048 | -| train/ | | -| approx_kl | 0.17150739 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0589 | -| n_updates | 153900 | -| policy_gradient_loss | 0.0539 | -| std | 0.00965 | -| value_loss | 6.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15392 | -| time_elapsed | 82265 | -| total_timesteps | 1970176 | -| train/ | | -| approx_kl | 0.005841764 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 153910 | -| policy_gradient_loss | -0.004 | -| std | 0.00965 | -| value_loss | 4.22e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15393 | -| time_elapsed | 82270 | -| total_timesteps | 1970304 | -| train/ | | -| approx_kl | 0.03087267 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | 0.0365 | -| n_updates | 153920 | -| policy_gradient_loss | 0.0458 | -| std | 0.00966 | -| value_loss | 1.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15394 | -| time_elapsed | 82274 | -| total_timesteps | 1970432 | -| train/ | | -| approx_kl | 0.007835051 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 153930 | -| policy_gradient_loss | 0.0087 | -| std | 0.00966 | -| value_loss | 6.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15395 | -| time_elapsed | 82278 | -| total_timesteps | 1970560 | -| train/ | | -| approx_kl | 0.015847486 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 153940 | -| policy_gradient_loss | -0.00675 | -| std | 0.00966 | -| value_loss | 4.16e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15396 | -| time_elapsed | 82283 | -| total_timesteps | 1970688 | -| train/ | | -| approx_kl | 0.0055106063 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.000212 | -| n_updates | 153950 | -| policy_gradient_loss | 0.00851 | -| std | 0.00965 | -| value_loss | 6.52e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15397 | -| time_elapsed | 82289 | -| total_timesteps | 1970816 | -| train/ | | -| approx_kl | 2.0897482e-05 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.000301 | -| n_updates | 153960 | -| policy_gradient_loss | 0.000297 | -| std | 0.00965 | -| value_loss | 4.95e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15398 | -| time_elapsed | 82294 | -| total_timesteps | 1970944 | -| train/ | | -| approx_kl | 0.06892863 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 153970 | -| policy_gradient_loss | 0.0571 | -| std | 0.00965 | -| value_loss | 2.31e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15399 | -| time_elapsed | 82300 | -| total_timesteps | 1971072 | -| train/ | | -| approx_kl | 0.014878282 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.00457 | -| learning_rate | 0.0003 | -| loss | -0.00215 | -| n_updates | 153980 | -| policy_gradient_loss | 0.00913 | -| std | 0.00965 | -| value_loss | 4.85e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15400 | -| time_elapsed | 82308 | -| total_timesteps | 1971200 | -| train/ | | -| approx_kl | 0.0463361 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 153990 | -| policy_gradient_loss | -0.0119 | -| std | 0.00965 | -| value_loss | 9.02e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15401 | -| time_elapsed | 82313 | -| total_timesteps | 1971328 | -| train/ | | -| approx_kl | 0.002091168 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.00655 | -| n_updates | 154000 | -| policy_gradient_loss | 0.0488 | -| std | 0.00965 | -| value_loss | 1.75e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15402 | -| time_elapsed | 82319 | -| total_timesteps | 1971456 | -| train/ | | -| approx_kl | 0.0495553 | -| clip_fraction | 0.579 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.00783 | -| learning_rate | 0.0003 | -| loss | 0.0671 | -| n_updates | 154010 | -| policy_gradient_loss | 0.104 | -| std | 0.00965 | -| value_loss | 6.88e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15403 | -| time_elapsed | 82324 | -| total_timesteps | 1971584 | -| train/ | | -| approx_kl | 0.041749764 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.002 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 154020 | -| policy_gradient_loss | 0.0197 | -| std | 0.00965 | -| value_loss | 2.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15404 | -| time_elapsed | 82329 | -| total_timesteps | 1971712 | -| train/ | | -| approx_kl | 0.019623091 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 154030 | -| policy_gradient_loss | 0.0122 | -| std | 0.00964 | -| value_loss | 8.33e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15405 | -| time_elapsed | 82334 | -| total_timesteps | 1971840 | -| train/ | | -| approx_kl | 0.16585183 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.0597 | -| n_updates | 154040 | -| policy_gradient_loss | 0.0145 | -| std | 0.00964 | -| value_loss | 3.79e-10 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15406 | -| time_elapsed | 82338 | -| total_timesteps | 1971968 | -| train/ | | -| approx_kl | 1.1366792e-05 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | -0.000274 | -| n_updates | 154050 | -| policy_gradient_loss | 0.00524 | -| std | 0.00965 | -| value_loss | 2.28e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15407 | -| time_elapsed | 82343 | -| total_timesteps | 1972096 | -| train/ | | -| approx_kl | 0.023875423 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.000114 | -| n_updates | 154060 | -| policy_gradient_loss | 0.0222 | -| std | 0.00965 | -| value_loss | 1.53e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15408 | -| time_elapsed | 82354 | -| total_timesteps | 1972224 | -| train/ | | -| approx_kl | 0.0049958033 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 154070 | -| policy_gradient_loss | -0.017 | -| std | 0.00965 | -| value_loss | 0.00187 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15409 | -| time_elapsed | 82358 | -| total_timesteps | 1972352 | -| train/ | | -| approx_kl | 0.00020651007 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.000233 | -| n_updates | 154080 | -| policy_gradient_loss | 0.00386 | -| std | 0.00965 | -| value_loss | 8.25e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15410 | -| time_elapsed | 82363 | -| total_timesteps | 1972480 | -| train/ | | -| approx_kl | 0.00028079003 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.00275 | -| n_updates | 154090 | -| policy_gradient_loss | -0.000372 | -| std | 0.00966 | -| value_loss | 6.05e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15411 | -| time_elapsed | 82367 | -| total_timesteps | 1972608 | -| train/ | | -| approx_kl | 2.9091723e-05 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | -0.000818 | -| n_updates | 154100 | -| policy_gradient_loss | -0.00331 | -| std | 0.00966 | -| value_loss | 2.8e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15412 | -| time_elapsed | 82371 | -| total_timesteps | 1972736 | -| train/ | | -| approx_kl | 7.545203e-05 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | -0.000722 | -| n_updates | 154110 | -| policy_gradient_loss | -0.000228 | -| std | 0.00966 | -| value_loss | 1.68e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15413 | -| time_elapsed | 82375 | -| total_timesteps | 1972864 | -| train/ | | -| approx_kl | 0.028310219 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | 0.00218 | -| n_updates | 154120 | -| policy_gradient_loss | 0.0248 | -| std | 0.00966 | -| value_loss | 9.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15414 | -| time_elapsed | 82378 | -| total_timesteps | 1972992 | -| train/ | | -| approx_kl | 0.010379794 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 154130 | -| policy_gradient_loss | 0.00166 | -| std | 0.00966 | -| value_loss | 6.76e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15415 | -| time_elapsed | 82382 | -| total_timesteps | 1973120 | -| train/ | | -| approx_kl | 0.08676906 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.0505 | -| n_updates | 154140 | -| policy_gradient_loss | 0.00746 | -| std | 0.00966 | -| value_loss | 6.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15416 | -| time_elapsed | 82393 | -| total_timesteps | 1973248 | -| train/ | | -| approx_kl | 0.047527038 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | 0.00521 | -| n_updates | 154150 | -| policy_gradient_loss | 0.00371 | -| std | 0.00966 | -| value_loss | 0.0022 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15417 | -| time_elapsed | 82398 | -| total_timesteps | 1973376 | -| train/ | | -| approx_kl | 0.0584485 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.0481 | -| n_updates | 154160 | -| policy_gradient_loss | 0.0322 | -| std | 0.00966 | -| value_loss | 1.92e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15418 | -| time_elapsed | 82402 | -| total_timesteps | 1973504 | -| train/ | | -| approx_kl | 0.07708988 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0411 | -| n_updates | 154170 | -| policy_gradient_loss | 0.0164 | -| std | 0.00966 | -| value_loss | 1.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15419 | -| time_elapsed | 82407 | -| total_timesteps | 1973632 | -| train/ | | -| approx_kl | 0.029931918 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 154180 | -| policy_gradient_loss | 0.00318 | -| std | 0.00963 | -| value_loss | 0.000198 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15420 | -| time_elapsed | 82413 | -| total_timesteps | 1973760 | -| train/ | | -| approx_kl | 0.015098319 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.22 | -| explained_variance | -0.309 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 154190 | -| policy_gradient_loss | -0.00255 | -| std | 0.00961 | -| value_loss | 0.00207 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 15421 | -| time_elapsed | 82418 | -| total_timesteps | 1973888 | -| train/ | | -| approx_kl | 0.117048286 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.556 | -| learning_rate | 0.0003 | -| loss | 0.0922 | -| n_updates | 154200 | -| policy_gradient_loss | 0.036 | -| std | 0.0096 | -| value_loss | 0.00149 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15422 | -| time_elapsed | 82423 | -| total_timesteps | 1974016 | -| train/ | | -| approx_kl | 0.026481774 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.413 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 154210 | -| policy_gradient_loss | 0.0264 | -| std | 0.0096 | -| value_loss | 2.91e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15423 | -| time_elapsed | 82436 | -| total_timesteps | 1974144 | -| train/ | | -| approx_kl | 0.0045995526 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 154220 | -| policy_gradient_loss | 0.00727 | -| std | 0.00959 | -| value_loss | 0.000297 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15424 | -| time_elapsed | 82441 | -| total_timesteps | 1974272 | -| train/ | | -| approx_kl | 0.07348016 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.0569 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 154230 | -| policy_gradient_loss | 0.0361 | -| std | 0.00959 | -| value_loss | 5.39e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15425 | -| time_elapsed | 82446 | -| total_timesteps | 1974400 | -| train/ | | -| approx_kl | 1.2712553e-07 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | -3.65e-05 | -| n_updates | 154240 | -| policy_gradient_loss | 0.00497 | -| std | 0.00959 | -| value_loss | 3.07e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15426 | -| time_elapsed | 82450 | -| total_timesteps | 1974528 | -| train/ | | -| approx_kl | 0.00012373133 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 154250 | -| policy_gradient_loss | -0.00791 | -| std | 0.00959 | -| value_loss | 2.87e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15427 | -| time_elapsed | 82455 | -| total_timesteps | 1974656 | -| train/ | | -| approx_kl | 4.571909e-05 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.000851 | -| n_updates | 154260 | -| policy_gradient_loss | -0.00252 | -| std | 0.00959 | -| value_loss | 2.25e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15428 | -| time_elapsed | 82460 | -| total_timesteps | 1974784 | -| train/ | | -| approx_kl | 0.03490235 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 154270 | -| policy_gradient_loss | 0.0391 | -| std | 0.00959 | -| value_loss | 1.68e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 15429 | -| time_elapsed | 82465 | -| total_timesteps | 1974912 | -| train/ | | -| approx_kl | 0.12461729 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 154280 | -| policy_gradient_loss | 0.018 | -| std | 0.00959 | -| value_loss | 1.29e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15430 | -| time_elapsed | 82471 | -| total_timesteps | 1975040 | -| train/ | | -| approx_kl | 0.029157054 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0542 | -| learning_rate | 0.0003 | -| loss | 0.00761 | -| n_updates | 154290 | -| policy_gradient_loss | 0.0413 | -| std | 0.00959 | -| value_loss | 5.11e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15431 | -| time_elapsed | 82482 | -| total_timesteps | 1975168 | -| train/ | | -| approx_kl | 0.13175415 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | 0.0438 | -| n_updates | 154300 | -| policy_gradient_loss | 0.0144 | -| std | 0.00959 | -| value_loss | 0.00125 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15432 | -| time_elapsed | 82486 | -| total_timesteps | 1975296 | -| train/ | | -| approx_kl | 0.0048496234 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 154310 | -| policy_gradient_loss | -0.0106 | -| std | 0.00959 | -| value_loss | 1.38e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15433 | -| time_elapsed | 82491 | -| total_timesteps | 1975424 | -| train/ | | -| approx_kl | 0.033870466 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.00646 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 154320 | -| policy_gradient_loss | 0.0297 | -| std | 0.00959 | -| value_loss | 4.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15434 | -| time_elapsed | 82496 | -| total_timesteps | 1975552 | -| train/ | | -| approx_kl | 0.019933075 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 154330 | -| policy_gradient_loss | 0.0193 | -| std | 0.00959 | -| value_loss | 2.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15435 | -| time_elapsed | 82501 | -| total_timesteps | 1975680 | -| train/ | | -| approx_kl | 0.04084924 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 154340 | -| policy_gradient_loss | -0.00069 | -| std | 0.00959 | -| value_loss | 1.05e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15436 | -| time_elapsed | 82505 | -| total_timesteps | 1975808 | -| train/ | | -| approx_kl | 0.06648311 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.0385 | -| n_updates | 154350 | -| policy_gradient_loss | 0.0205 | -| std | 0.0096 | -| value_loss | 1.1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 15437 | -| time_elapsed | 82512 | -| total_timesteps | 1975936 | -| train/ | | -| approx_kl | 0.014230686 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 154360 | -| policy_gradient_loss | 0.0329 | -| std | 0.0096 | -| value_loss | 2.54e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15438 | -| time_elapsed | 82517 | -| total_timesteps | 1976064 | -| train/ | | -| approx_kl | 0.11737671 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.00711 | -| learning_rate | 0.0003 | -| loss | 0.0519 | -| n_updates | 154370 | -| policy_gradient_loss | 0.0175 | -| std | 0.0096 | -| value_loss | 9.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15439 | -| time_elapsed | 82526 | -| total_timesteps | 1976192 | -| train/ | | -| approx_kl | 0.07092545 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.0999 | -| learning_rate | 0.0003 | -| loss | -0.00993 | -| n_updates | 154380 | -| policy_gradient_loss | -0.0101 | -| std | 0.0096 | -| value_loss | 0.00183 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15440 | -| time_elapsed | 82531 | -| total_timesteps | 1976320 | -| train/ | | -| approx_kl | 0.073819846 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 154390 | -| policy_gradient_loss | 0.00835 | -| std | 0.00957 | -| value_loss | 1.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15441 | -| time_elapsed | 82536 | -| total_timesteps | 1976448 | -| train/ | | -| approx_kl | 0.020971656 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.477 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 154400 | -| policy_gradient_loss | -0.0031 | -| std | 0.00956 | -| value_loss | 2.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15442 | -| time_elapsed | 82542 | -| total_timesteps | 1976576 | -| train/ | | -| approx_kl | 0.007183585 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.00615 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 154410 | -| policy_gradient_loss | 0.0109 | -| std | 0.00955 | -| value_loss | 8.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15443 | -| time_elapsed | 82546 | -| total_timesteps | 1976704 | -| train/ | | -| approx_kl | 0.038544737 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.00793 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 154420 | -| policy_gradient_loss | -0.00167 | -| std | 0.00955 | -| value_loss | 8.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15444 | -| time_elapsed | 82551 | -| total_timesteps | 1976832 | -| train/ | | -| approx_kl | 0.30048954 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 154430 | -| policy_gradient_loss | 0.0309 | -| std | 0.00955 | -| value_loss | 6.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 15445 | -| time_elapsed | 82556 | -| total_timesteps | 1976960 | -| train/ | | -| approx_kl | 0.019000415 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.00066 | -| n_updates | 154440 | -| policy_gradient_loss | 0.00152 | -| std | 0.00954 | -| value_loss | 4.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15446 | -| time_elapsed | 82562 | -| total_timesteps | 1977088 | -| train/ | | -| approx_kl | 0.022862878 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 154450 | -| policy_gradient_loss | 0.00131 | -| std | 0.00954 | -| value_loss | 3.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15447 | -| time_elapsed | 82571 | -| total_timesteps | 1977216 | -| train/ | | -| approx_kl | 0.04745197 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.000933 | -| n_updates | 154460 | -| policy_gradient_loss | -0.00445 | -| std | 0.00954 | -| value_loss | 0.00298 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15448 | -| time_elapsed | 82577 | -| total_timesteps | 1977344 | -| train/ | | -| approx_kl | 0.0126513075 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0899 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 154470 | -| policy_gradient_loss | -0.002 | -| std | 0.00954 | -| value_loss | 1.85e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15449 | -| time_elapsed | 82582 | -| total_timesteps | 1977472 | -| train/ | | -| approx_kl | 0.002530775 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.00525 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 154480 | -| policy_gradient_loss | 0.00149 | -| std | 0.00954 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15450 | -| time_elapsed | 82586 | -| total_timesteps | 1977600 | -| train/ | | -| approx_kl | 0.016194738 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 154490 | -| policy_gradient_loss | 0.0681 | -| std | 0.00954 | -| value_loss | 7.31e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15451 | -| time_elapsed | 82592 | -| total_timesteps | 1977728 | -| train/ | | -| approx_kl | 0.0054912507 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 154500 | -| policy_gradient_loss | 0.0132 | -| std | 0.00954 | -| value_loss | 5.85e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15452 | -| time_elapsed | 82596 | -| total_timesteps | 1977856 | -| train/ | | -| approx_kl | 0.035392568 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 154510 | -| policy_gradient_loss | 0.0809 | -| std | 0.00952 | -| value_loss | 2.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 15453 | -| time_elapsed | 82601 | -| total_timesteps | 1977984 | -| train/ | | -| approx_kl | 0.050233185 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.453 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 154520 | -| policy_gradient_loss | 0.0626 | -| std | 0.00949 | -| value_loss | 6.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15454 | -| time_elapsed | 82606 | -| total_timesteps | 1978112 | -| train/ | | -| approx_kl | 0.06541341 | -| clip_fraction | 0.589 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -2.28 | -| learning_rate | 0.0003 | -| loss | 0.0483 | -| n_updates | 154530 | -| policy_gradient_loss | 0.0578 | -| std | 0.00948 | -| value_loss | 6.04e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15455 | -| time_elapsed | 82619 | -| total_timesteps | 1978240 | -| train/ | | -| approx_kl | 0.12805124 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -7.4 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 154540 | -| policy_gradient_loss | 0.00822 | -| std | 0.00948 | -| value_loss | 0.00417 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15456 | -| time_elapsed | 82624 | -| total_timesteps | 1978368 | -| train/ | | -| approx_kl | 0.0934743 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.00367 | -| learning_rate | 0.0003 | -| loss | 0.0672 | -| n_updates | 154550 | -| policy_gradient_loss | 0.0254 | -| std | 0.00948 | -| value_loss | 2.77e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15457 | -| time_elapsed | 82629 | -| total_timesteps | 1978496 | -| train/ | | -| approx_kl | 0.024595765 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0632 | -| learning_rate | 0.0003 | -| loss | 0.00815 | -| n_updates | 154560 | -| policy_gradient_loss | 0.000271 | -| std | 0.00946 | -| value_loss | 3.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15458 | -| time_elapsed | 82634 | -| total_timesteps | 1978624 | -| train/ | | -| approx_kl | 0.009903021 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | -0.000247 | -| n_updates | 154570 | -| policy_gradient_loss | -0.000472 | -| std | 0.00946 | -| value_loss | 5.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15459 | -| time_elapsed | 82639 | -| total_timesteps | 1978752 | -| train/ | | -| approx_kl | 0.00816777 | -| clip_fraction | 0.0539 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0975 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 154580 | -| policy_gradient_loss | -0.00632 | -| std | 0.00946 | -| value_loss | 2.91e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15460 | -| time_elapsed | 82644 | -| total_timesteps | 1978880 | -| train/ | | -| approx_kl | 0.010306537 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 154590 | -| policy_gradient_loss | -0.000545 | -| std | 0.00946 | -| value_loss | 1.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15461 | -| time_elapsed | 82647 | -| total_timesteps | 1979008 | -| train/ | | -| approx_kl | 0.36562234 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.00845 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 154600 | -| policy_gradient_loss | 0.0307 | -| std | 0.00946 | -| value_loss | 3.58e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15462 | -| time_elapsed | 82657 | -| total_timesteps | 1979136 | -| train/ | | -| approx_kl | 0.060074862 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.652 | -| learning_rate | 0.0003 | -| loss | -0.00999 | -| n_updates | 154610 | -| policy_gradient_loss | -0.00488 | -| std | 0.00947 | -| value_loss | 0.00102 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15463 | -| time_elapsed | 82663 | -| total_timesteps | 1979264 | -| train/ | | -| approx_kl | 0.0072641964 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.36 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 154620 | -| policy_gradient_loss | 0.000547 | -| std | 0.00947 | -| value_loss | 3.11e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15464 | -| time_elapsed | 82668 | -| total_timesteps | 1979392 | -| train/ | | -| approx_kl | 0.07990885 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 154630 | -| policy_gradient_loss | 0.0291 | -| std | 0.00947 | -| value_loss | 1.13e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15465 | -| time_elapsed | 82673 | -| total_timesteps | 1979520 | -| train/ | | -| approx_kl | 0.0016711112 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 154640 | -| policy_gradient_loss | 0.0016 | -| std | 0.00947 | -| value_loss | 8.82e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15466 | -| time_elapsed | 82678 | -| total_timesteps | 1979648 | -| train/ | | -| approx_kl | 6.5667555e-06 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.000501 | -| n_updates | 154650 | -| policy_gradient_loss | -0.00297 | -| std | 0.00947 | -| value_loss | 6.66e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15467 | -| time_elapsed | 82683 | -| total_timesteps | 1979776 | -| train/ | | -| approx_kl | 0.029692601 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 154660 | -| policy_gradient_loss | 0.0244 | -| std | 0.00947 | -| value_loss | 4.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15468 | -| time_elapsed | 82687 | -| total_timesteps | 1979904 | -| train/ | | -| approx_kl | 0.013723233 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 154670 | -| policy_gradient_loss | 0.00466 | -| std | 0.00947 | -| value_loss | 4.44e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15469 | -| time_elapsed | 82691 | -| total_timesteps | 1980032 | -| train/ | | -| approx_kl | 0.07413027 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 154680 | -| policy_gradient_loss | 0.00447 | -| std | 0.00947 | -| value_loss | 2.9e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15470 | -| time_elapsed | 82704 | -| total_timesteps | 1980160 | -| train/ | | -| approx_kl | 0.015965953 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.00901 | -| n_updates | 154690 | -| policy_gradient_loss | -0.0116 | -| std | 0.00947 | -| value_loss | 0.00253 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15471 | -| time_elapsed | 82708 | -| total_timesteps | 1980288 | -| train/ | | -| approx_kl | 0.0840818 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00274 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 154700 | -| policy_gradient_loss | 0.0206 | -| std | 0.00947 | -| value_loss | 3.63e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15472 | -| time_elapsed | 82712 | -| total_timesteps | 1980416 | -| train/ | | -| approx_kl | 0.08290824 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 154710 | -| policy_gradient_loss | 0.017 | -| std | 0.00947 | -| value_loss | 2.71e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15473 | -| time_elapsed | 82717 | -| total_timesteps | 1980544 | -| train/ | | -| approx_kl | 0.1316844 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.0924 | -| n_updates | 154720 | -| policy_gradient_loss | 0.0335 | -| std | 0.00947 | -| value_loss | 2.16e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15474 | -| time_elapsed | 82723 | -| total_timesteps | 1980672 | -| train/ | | -| approx_kl | 0.02112075 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 154730 | -| policy_gradient_loss | 0.0407 | -| std | 0.00947 | -| value_loss | 1.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15475 | -| time_elapsed | 82727 | -| total_timesteps | 1980800 | -| train/ | | -| approx_kl | 0.013707801 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 154740 | -| policy_gradient_loss | 0.00921 | -| std | 0.00947 | -| value_loss | 1.34e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15476 | -| time_elapsed | 82734 | -| total_timesteps | 1980928 | -| train/ | | -| approx_kl | 0.09335606 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 154750 | -| policy_gradient_loss | 0.0217 | -| std | 0.00947 | -| value_loss | 9.06e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15477 | -| time_elapsed | 82740 | -| total_timesteps | 1981056 | -| train/ | | -| approx_kl | 0.00047893077 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 154760 | -| policy_gradient_loss | -0.000414 | -| std | 0.00947 | -| value_loss | 6.53e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15478 | -| time_elapsed | 82751 | -| total_timesteps | 1981184 | -| train/ | | -| approx_kl | 0.008534338 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | -0.000284 | -| n_updates | 154770 | -| policy_gradient_loss | 0.0225 | -| std | 0.00947 | -| value_loss | 0.00539 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15479 | -| time_elapsed | 82756 | -| total_timesteps | 1981312 | -| train/ | | -| approx_kl | 0.15287608 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.0691 | -| n_updates | 154780 | -| policy_gradient_loss | 0.0214 | -| std | 0.00947 | -| value_loss | 1.93e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15480 | -| time_elapsed | 82761 | -| total_timesteps | 1981440 | -| train/ | | -| approx_kl | 0.029825388 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00282 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 154790 | -| policy_gradient_loss | 0.0381 | -| std | 0.00947 | -| value_loss | 3.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15481 | -| time_elapsed | 82765 | -| total_timesteps | 1981568 | -| train/ | | -| approx_kl | 0.009382535 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00567 | -| learning_rate | 0.0003 | -| loss | 0.000184 | -| n_updates | 154800 | -| policy_gradient_loss | 0.011 | -| std | 0.00947 | -| value_loss | 1.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15482 | -| time_elapsed | 82772 | -| total_timesteps | 1981696 | -| train/ | | -| approx_kl | 0.08899969 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.0472 | -| n_updates | 154810 | -| policy_gradient_loss | 0.00627 | -| std | 0.00946 | -| value_loss | 6.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15483 | -| time_elapsed | 82776 | -| total_timesteps | 1981824 | -| train/ | | -| approx_kl | 0.025294414 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 154820 | -| policy_gradient_loss | 0.0488 | -| std | 0.00948 | -| value_loss | 5.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 15484 | -| time_elapsed | 82780 | -| total_timesteps | 1981952 | -| train/ | | -| approx_kl | 0.0022597918 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.00078 | -| n_updates | 154830 | -| policy_gradient_loss | 0.0129 | -| std | 0.00949 | -| value_loss | 3.3e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15485 | -| time_elapsed | 82783 | -| total_timesteps | 1982080 | -| train/ | | -| approx_kl | 0.15651955 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 154840 | -| policy_gradient_loss | 0.0826 | -| std | 0.00949 | -| value_loss | 2.27e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15486 | -| time_elapsed | 82791 | -| total_timesteps | 1982208 | -| train/ | | -| approx_kl | 0.1959292 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 154850 | -| policy_gradient_loss | 0.00562 | -| std | 0.0095 | -| value_loss | 0.000397 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15487 | -| time_elapsed | 82796 | -| total_timesteps | 1982336 | -| train/ | | -| approx_kl | 0.14002913 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00262 | -| learning_rate | 0.0003 | -| loss | 0.0739 | -| n_updates | 154860 | -| policy_gradient_loss | 0.0223 | -| std | 0.0095 | -| value_loss | 1.85e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15488 | -| time_elapsed | 82802 | -| total_timesteps | 1982464 | -| train/ | | -| approx_kl | 0.20247701 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0937 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 154870 | -| policy_gradient_loss | 0.0216 | -| std | 0.0095 | -| value_loss | 1.34e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15489 | -| time_elapsed | 82807 | -| total_timesteps | 1982592 | -| train/ | | -| approx_kl | 0.0312771 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.00613 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 154880 | -| policy_gradient_loss | 0.0101 | -| std | 0.00951 | -| value_loss | 1.04e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15490 | -| time_elapsed | 82813 | -| total_timesteps | 1982720 | -| train/ | | -| approx_kl | 0.013948195 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 154890 | -| policy_gradient_loss | 0.0106 | -| std | 0.00951 | -| value_loss | 2.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15491 | -| time_elapsed | 82819 | -| total_timesteps | 1982848 | -| train/ | | -| approx_kl | 0.039620634 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | 0.0427 | -| n_updates | 154900 | -| policy_gradient_loss | 0.0108 | -| std | 0.00951 | -| value_loss | 2.11e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15492 | -| time_elapsed | 82823 | -| total_timesteps | 1982976 | -| train/ | | -| approx_kl | 0.026549842 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0916 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 154910 | -| policy_gradient_loss | 0.0294 | -| std | 0.00951 | -| value_loss | 5e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15493 | -| time_elapsed | 82828 | -| total_timesteps | 1983104 | -| train/ | | -| approx_kl | 0.10727073 | -| clip_fraction | 0.6 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 154920 | -| policy_gradient_loss | 0.0663 | -| std | 0.00951 | -| value_loss | 4.09e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15494 | -| time_elapsed | 82840 | -| total_timesteps | 1983232 | -| train/ | | -| approx_kl | 0.1108231 | -| clip_fraction | 0.575 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -3.99 | -| learning_rate | 0.0003 | -| loss | -0.00439 | -| n_updates | 154930 | -| policy_gradient_loss | 0.000912 | -| std | 0.00952 | -| value_loss | 0.00327 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15495 | -| time_elapsed | 82845 | -| total_timesteps | 1983360 | -| train/ | | -| approx_kl | 0.011258226 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00822 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 154940 | -| policy_gradient_loss | 0.00909 | -| std | 0.00952 | -| value_loss | 4.97e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15496 | -| time_elapsed | 82850 | -| total_timesteps | 1983488 | -| train/ | | -| approx_kl | 0.06848924 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 154950 | -| policy_gradient_loss | 0.0061 | -| std | 0.00952 | -| value_loss | 3.62e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15497 | -| time_elapsed | 82853 | -| total_timesteps | 1983616 | -| train/ | | -| approx_kl | 0.09205367 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.0329 | -| n_updates | 154960 | -| policy_gradient_loss | 0.0139 | -| std | 0.00952 | -| value_loss | 2.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15498 | -| time_elapsed | 82858 | -| total_timesteps | 1983744 | -| train/ | | -| approx_kl | 0.042012364 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 154970 | -| policy_gradient_loss | -0.00951 | -| std | 0.00952 | -| value_loss | 1.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 15499 | -| time_elapsed | 82864 | -| total_timesteps | 1983872 | -| train/ | | -| approx_kl | 0.010497627 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.00319 | -| n_updates | 154980 | -| policy_gradient_loss | 0.0134 | -| std | 0.00955 | -| value_loss | 9.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15500 | -| time_elapsed | 82869 | -| total_timesteps | 1984000 | -| train/ | | -| approx_kl | 0.05744673 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 154990 | -| policy_gradient_loss | 0.0113 | -| std | 0.00956 | -| value_loss | 4.84e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15501 | -| time_elapsed | 82874 | -| total_timesteps | 1984128 | -| train/ | | -| approx_kl | 0.06493068 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 155000 | -| policy_gradient_loss | 0.0266 | -| std | 0.00957 | -| value_loss | 1.21e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15502 | -| time_elapsed | 82885 | -| total_timesteps | 1984256 | -| train/ | | -| approx_kl | 0.024750516 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | -0.00935 | -| n_updates | 155010 | -| policy_gradient_loss | -0.00414 | -| std | 0.00957 | -| value_loss | 0.00187 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15503 | -| time_elapsed | 82891 | -| total_timesteps | 1984384 | -| train/ | | -| approx_kl | 0.0810791 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -54.5 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 155020 | -| policy_gradient_loss | -0.00269 | -| std | 0.00957 | -| value_loss | 1.3e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15504 | -| time_elapsed | 82896 | -| total_timesteps | 1984512 | -| train/ | | -| approx_kl | 0.0025961027 | -| clip_fraction | 0.00937 | -| clip_range | 0.2 | -| entropy_loss | 3.23 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | 6.48e-05 | -| n_updates | 155030 | -| policy_gradient_loss | 7.03e-05 | -| std | 0.00953 | -| value_loss | 2.69e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15505 | -| time_elapsed | 82903 | -| total_timesteps | 1984640 | -| train/ | | -| approx_kl | 0.0052992837 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -5.04e-05 | -| n_updates | 155040 | -| policy_gradient_loss | 0.016 | -| std | 0.00949 | -| value_loss | 3.13e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15506 | -| time_elapsed | 82908 | -| total_timesteps | 1984768 | -| train/ | | -| approx_kl | 0.037432935 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -5.05 | -| learning_rate | 0.0003 | -| loss | 0.00634 | -| n_updates | 155050 | -| policy_gradient_loss | 0.00377 | -| std | 0.00948 | -| value_loss | 3.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 15507 | -| time_elapsed | 82913 | -| total_timesteps | 1984896 | -| train/ | | -| approx_kl | 0.13155772 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00418 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 155060 | -| policy_gradient_loss | 0.00287 | -| std | 0.00949 | -| value_loss | 2.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15508 | -| time_elapsed | 82920 | -| total_timesteps | 1985024 | -| train/ | | -| approx_kl | 0.005110963 | -| clip_fraction | 0.0258 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.000237 | -| learning_rate | 0.0003 | -| loss | 6.08e-05 | -| n_updates | 155070 | -| policy_gradient_loss | 0.000637 | -| std | 0.00945 | -| value_loss | 4.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15509 | -| time_elapsed | 82934 | -| total_timesteps | 1985152 | -| train/ | | -| approx_kl | 0.11176523 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 155080 | -| policy_gradient_loss | -0.00473 | -| std | 0.00941 | -| value_loss | 0.00141 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15510 | -| time_elapsed | 82940 | -| total_timesteps | 1985280 | -| train/ | | -| approx_kl | 0.06546834 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | 0.0373 | -| n_updates | 155090 | -| policy_gradient_loss | 0.0197 | -| std | 0.0094 | -| value_loss | 4.55e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15511 | -| time_elapsed | 82944 | -| total_timesteps | 1985408 | -| train/ | | -| approx_kl | 0.023297582 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00127 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 155100 | -| policy_gradient_loss | 0.0148 | -| std | 0.0094 | -| value_loss | 4.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15512 | -| time_elapsed | 82949 | -| total_timesteps | 1985536 | -| train/ | | -| approx_kl | 0.074674256 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 155110 | -| policy_gradient_loss | 0.021 | -| std | 0.00939 | -| value_loss | 3.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15513 | -| time_elapsed | 82954 | -| total_timesteps | 1985664 | -| train/ | | -| approx_kl | 0.07990409 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 155120 | -| policy_gradient_loss | -0.00146 | -| std | 0.00939 | -| value_loss | 2.63e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15514 | -| time_elapsed | 82958 | -| total_timesteps | 1985792 | -| train/ | | -| approx_kl | 0.0009694444 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 155130 | -| policy_gradient_loss | 0.0142 | -| std | 0.00939 | -| value_loss | 2.1e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15515 | -| time_elapsed | 82963 | -| total_timesteps | 1985920 | -| train/ | | -| approx_kl | 0.25563014 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 155140 | -| policy_gradient_loss | 0.0308 | -| std | 0.00939 | -| value_loss | 1.48e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15516 | -| time_elapsed | 82968 | -| total_timesteps | 1986048 | -| train/ | | -| approx_kl | 0.006160162 | -| clip_fraction | 0.0953 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | -0.00377 | -| n_updates | 155150 | -| policy_gradient_loss | 0.00281 | -| std | 0.00939 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15517 | -| time_elapsed | 82979 | -| total_timesteps | 1986176 | -| train/ | | -| approx_kl | 0.030417018 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0249 | -| n_updates | 155160 | -| policy_gradient_loss | -0.0152 | -| std | 0.00939 | -| value_loss | 0.00042 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15518 | -| time_elapsed | 82983 | -| total_timesteps | 1986304 | -| train/ | | -| approx_kl | 9.718677e-05 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 155170 | -| policy_gradient_loss | 0.00256 | -| std | 0.00938 | -| value_loss | 3.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15519 | -| time_elapsed | 82988 | -| total_timesteps | 1986432 | -| train/ | | -| approx_kl | 0.046307918 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00279 | -| learning_rate | 0.0003 | -| loss | 0.00428 | -| n_updates | 155180 | -| policy_gradient_loss | 0.0165 | -| std | 0.00938 | -| value_loss | 4.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15520 | -| time_elapsed | 82993 | -| total_timesteps | 1986560 | -| train/ | | -| approx_kl | 0.04461415 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0884 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 155190 | -| policy_gradient_loss | 0.0275 | -| std | 0.00938 | -| value_loss | 2.08e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15521 | -| time_elapsed | 82999 | -| total_timesteps | 1986688 | -| train/ | | -| approx_kl | 0.020196095 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00527 | -| n_updates | 155200 | -| policy_gradient_loss | 0.0278 | -| std | 0.00938 | -| value_loss | 1.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15522 | -| time_elapsed | 83004 | -| total_timesteps | 1986816 | -| train/ | | -| approx_kl | 0.34085327 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 155210 | -| policy_gradient_loss | 0.103 | -| std | 0.00938 | -| value_loss | 8.02e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 15523 | -| time_elapsed | 83009 | -| total_timesteps | 1986944 | -| train/ | | -| approx_kl | 0.019050978 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 155220 | -| policy_gradient_loss | -0.00982 | -| std | 0.00938 | -| value_loss | 6.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15524 | -| time_elapsed | 83014 | -| total_timesteps | 1987072 | -| train/ | | -| approx_kl | 0.009356892 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 155230 | -| policy_gradient_loss | -0.00421 | -| std | 0.00937 | -| value_loss | 1.23e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15525 | -| time_elapsed | 83022 | -| total_timesteps | 1987200 | -| train/ | | -| approx_kl | 0.2330341 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.512 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 155240 | -| policy_gradient_loss | -0.00851 | -| std | 0.00938 | -| value_loss | 0.00206 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15526 | -| time_elapsed | 83027 | -| total_timesteps | 1987328 | -| train/ | | -| approx_kl | 0.044275105 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 7.57e-05 | -| n_updates | 155250 | -| policy_gradient_loss | 0.00978 | -| std | 0.00939 | -| value_loss | 2.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15527 | -| time_elapsed | 83034 | -| total_timesteps | 1987456 | -| train/ | | -| approx_kl | 0.011639969 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -9.66 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 155260 | -| policy_gradient_loss | 0.023 | -| std | 0.00939 | -| value_loss | 6.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15528 | -| time_elapsed | 83039 | -| total_timesteps | 1987584 | -| train/ | | -| approx_kl | 0.013232538 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 155270 | -| policy_gradient_loss | 0.047 | -| std | 0.00939 | -| value_loss | 5.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15529 | -| time_elapsed | 83045 | -| total_timesteps | 1987712 | -| train/ | | -| approx_kl | 0.004576132 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.0071 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 155280 | -| policy_gradient_loss | 0.0125 | -| std | 0.00938 | -| value_loss | 4.08e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15530 | -| time_elapsed | 83051 | -| total_timesteps | 1987840 | -| train/ | | -| approx_kl | 0.00035895547 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00361 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 155290 | -| policy_gradient_loss | 0.000212 | -| std | 0.00936 | -| value_loss | 3.14e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15531 | -| time_elapsed | 83056 | -| total_timesteps | 1987968 | -| train/ | | -| approx_kl | 0.024112985 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 155300 | -| policy_gradient_loss | 0.0123 | -| std | 0.00935 | -| value_loss | 1.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15532 | -| time_elapsed | 83062 | -| total_timesteps | 1988096 | -| train/ | | -| approx_kl | 0.34906033 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 155310 | -| policy_gradient_loss | 0.0415 | -| std | 0.00934 | -| value_loss | 9.8e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15533 | -| time_elapsed | 83073 | -| total_timesteps | 1988224 | -| train/ | | -| approx_kl | 0.04204586 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | 0.000815 | -| n_updates | 155320 | -| policy_gradient_loss | -0.00431 | -| std | 0.00934 | -| value_loss | 0.00223 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15534 | -| time_elapsed | 83077 | -| total_timesteps | 1988352 | -| train/ | | -| approx_kl | 0.00961778 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.000616 | -| n_updates | 155330 | -| policy_gradient_loss | 0.00223 | -| std | 0.00934 | -| value_loss | 4.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15535 | -| time_elapsed | 83081 | -| total_timesteps | 1988480 | -| train/ | | -| approx_kl | 0.028999565 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00381 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 155340 | -| policy_gradient_loss | -0.00225 | -| std | 0.00934 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15536 | -| time_elapsed | 83085 | -| total_timesteps | 1988608 | -| train/ | | -| approx_kl | 0.021158807 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 155350 | -| policy_gradient_loss | -0.00855 | -| std | 0.00934 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15537 | -| time_elapsed | 83090 | -| total_timesteps | 1988736 | -| train/ | | -| approx_kl | 0.026787788 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 155360 | -| policy_gradient_loss | 0.0031 | -| std | 0.00934 | -| value_loss | 7.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15538 | -| time_elapsed | 83094 | -| total_timesteps | 1988864 | -| train/ | | -| approx_kl | 0.027609147 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.00418 | -| n_updates | 155370 | -| policy_gradient_loss | -0.00196 | -| std | 0.00934 | -| value_loss | 6.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 15539 | -| time_elapsed | 83099 | -| total_timesteps | 1988992 | -| train/ | | -| approx_kl | 0.057810638 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.00671 | -| n_updates | 155380 | -| policy_gradient_loss | 0.0193 | -| std | 0.00934 | -| value_loss | 5.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15540 | -| time_elapsed | 83104 | -| total_timesteps | 1989120 | -| train/ | | -| approx_kl | 0.049572024 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 155390 | -| policy_gradient_loss | 0.0307 | -| std | 0.00934 | -| value_loss | 2.14e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15541 | -| time_elapsed | 83118 | -| total_timesteps | 1989248 | -| train/ | | -| approx_kl | 0.0051614684 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 155400 | -| policy_gradient_loss | -0.012 | -| std | 0.00934 | -| value_loss | 0.000255 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15542 | -| time_elapsed | 83121 | -| total_timesteps | 1989376 | -| train/ | | -| approx_kl | 2.771616e-06 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | 6.86e-05 | -| n_updates | 155410 | -| policy_gradient_loss | 0.0188 | -| std | 0.00934 | -| value_loss | 2.25e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15543 | -| time_elapsed | 83125 | -| total_timesteps | 1989504 | -| train/ | | -| approx_kl | 0.42972475 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.309 | -| learning_rate | 0.0003 | -| loss | 0.226 | -| n_updates | 155420 | -| policy_gradient_loss | 0.113 | -| std | 0.00934 | -| value_loss | 9.76e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15544 | -| time_elapsed | 83130 | -| total_timesteps | 1989632 | -| train/ | | -| approx_kl | 0.110400885 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00425 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 155430 | -| policy_gradient_loss | 0.0188 | -| std | 0.00934 | -| value_loss | 7.52e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15545 | -| time_elapsed | 83133 | -| total_timesteps | 1989760 | -| train/ | | -| approx_kl | 0.04361683 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00446 | -| learning_rate | 0.0003 | -| loss | 0.0318 | -| n_updates | 155440 | -| policy_gradient_loss | 0.0265 | -| std | 0.00934 | -| value_loss | 5.47e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 15546 | -| time_elapsed | 83138 | -| total_timesteps | 1989888 | -| train/ | | -| approx_kl | 0.1688453 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0096 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 155450 | -| policy_gradient_loss | 0.0869 | -| std | 0.00934 | -| value_loss | 4.15e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15547 | -| time_elapsed | 83142 | -| total_timesteps | 1990016 | -| train/ | | -| approx_kl | 0.11597815 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0997 | -| n_updates | 155460 | -| policy_gradient_loss | 0.108 | -| std | 0.00934 | -| value_loss | 3.31e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15548 | -| time_elapsed | 83156 | -| total_timesteps | 1990144 | -| train/ | | -| approx_kl | 0.02083702 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 155470 | -| policy_gradient_loss | 0.00289 | -| std | 0.00934 | -| value_loss | 0.000127 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15549 | -| time_elapsed | 83161 | -| total_timesteps | 1990272 | -| train/ | | -| approx_kl | 0.14761582 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 155480 | -| policy_gradient_loss | 0.0077 | -| std | 0.00934 | -| value_loss | 4.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15550 | -| time_elapsed | 83165 | -| total_timesteps | 1990400 | -| train/ | | -| approx_kl | 0.048513874 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00248 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 155490 | -| policy_gradient_loss | 0.0152 | -| std | 0.00934 | -| value_loss | 4.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15551 | -| time_elapsed | 83171 | -| total_timesteps | 1990528 | -| train/ | | -| approx_kl | 0.01126247 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 155500 | -| policy_gradient_loss | 0.0143 | -| std | 0.00933 | -| value_loss | 3.03e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15552 | -| time_elapsed | 83177 | -| total_timesteps | 1990656 | -| train/ | | -| approx_kl | 0.0023487946 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.952 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 155510 | -| policy_gradient_loss | 0.0161 | -| std | 0.00932 | -| value_loss | 1.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15553 | -| time_elapsed | 83182 | -| total_timesteps | 1990784 | -| train/ | | -| approx_kl | 0.03655769 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 155520 | -| policy_gradient_loss | 0.0183 | -| std | 0.00932 | -| value_loss | 1.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15554 | -| time_elapsed | 83188 | -| total_timesteps | 1990912 | -| train/ | | -| approx_kl | 0.021668287 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.547 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 155530 | -| policy_gradient_loss | 0.0137 | -| std | 0.00932 | -| value_loss | 1.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15555 | -| time_elapsed | 83193 | -| total_timesteps | 1991040 | -| train/ | | -| approx_kl | 0.21150477 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.0049 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 155540 | -| policy_gradient_loss | 0.0144 | -| std | 0.00932 | -| value_loss | 3.55e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15556 | -| time_elapsed | 83201 | -| total_timesteps | 1991168 | -| train/ | | -| approx_kl | 0.05896108 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 155550 | -| policy_gradient_loss | 0.0201 | -| std | 0.00932 | -| value_loss | 0.000422 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15557 | -| time_elapsed | 83206 | -| total_timesteps | 1991296 | -| train/ | | -| approx_kl | 0.13491556 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.0617 | -| n_updates | 155560 | -| policy_gradient_loss | 0.0236 | -| std | 0.00932 | -| value_loss | 1.06e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15558 | -| time_elapsed | 83211 | -| total_timesteps | 1991424 | -| train/ | | -| approx_kl | 0.00050630374 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.00464 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 155570 | -| policy_gradient_loss | -0.00704 | -| std | 0.00932 | -| value_loss | 1.53e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15559 | -| time_elapsed | 83217 | -| total_timesteps | 1991552 | -| train/ | | -| approx_kl | 0.03751302 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 155580 | -| policy_gradient_loss | 0.0418 | -| std | 0.00932 | -| value_loss | 6.31e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15560 | -| time_elapsed | 83221 | -| total_timesteps | 1991680 | -| train/ | | -| approx_kl | 0.012760009 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 155590 | -| policy_gradient_loss | -0.00361 | -| std | 0.00932 | -| value_loss | 6.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15561 | -| time_elapsed | 83226 | -| total_timesteps | 1991808 | -| train/ | | -| approx_kl | 0.10675253 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 155600 | -| policy_gradient_loss | 0.00534 | -| std | 0.00932 | -| value_loss | 4.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 15562 | -| time_elapsed | 83231 | -| total_timesteps | 1991936 | -| train/ | | -| approx_kl | 0.023506429 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.00371 | -| n_updates | 155610 | -| policy_gradient_loss | 0.0112 | -| std | 0.00932 | -| value_loss | 3.26e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15563 | -| time_elapsed | 83235 | -| total_timesteps | 1992064 | -| train/ | | -| approx_kl | 0.17556584 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 155620 | -| policy_gradient_loss | 0.0963 | -| std | 0.00932 | -| value_loss | 2.2e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15564 | -| time_elapsed | 83243 | -| total_timesteps | 1992192 | -| train/ | | -| approx_kl | 0.33439162 | -| clip_fraction | 0.589 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.741 | -| learning_rate | 0.0003 | -| loss | 0.063 | -| n_updates | 155630 | -| policy_gradient_loss | 0.0483 | -| std | 0.00932 | -| value_loss | 0.00644 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15565 | -| time_elapsed | 83247 | -| total_timesteps | 1992320 | -| train/ | | -| approx_kl | 0.04552997 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 155640 | -| policy_gradient_loss | 0.0108 | -| std | 0.00932 | -| value_loss | 3.41e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15566 | -| time_elapsed | 83250 | -| total_timesteps | 1992448 | -| train/ | | -| approx_kl | 0.00015443005 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.00517 | -| learning_rate | 0.0003 | -| loss | -0.000259 | -| n_updates | 155650 | -| policy_gradient_loss | 0.0144 | -| std | 0.00933 | -| value_loss | 4.99e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15567 | -| time_elapsed | 83255 | -| total_timesteps | 1992576 | -| train/ | | -| approx_kl | 0.030878792 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.00385 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 155660 | -| policy_gradient_loss | 0.00851 | -| std | 0.00934 | -| value_loss | 3.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15568 | -| time_elapsed | 83261 | -| total_timesteps | 1992704 | -| train/ | | -| approx_kl | 0.028806716 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00307 | -| learning_rate | 0.0003 | -| loss | 0.00714 | -| n_updates | 155670 | -| policy_gradient_loss | -0.00175 | -| std | 0.00934 | -| value_loss | 6.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15569 | -| time_elapsed | 83270 | -| total_timesteps | 1992832 | -| train/ | | -| approx_kl | 0.009865524 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 155680 | -| policy_gradient_loss | -0.0019 | -| std | 0.00934 | -| value_loss | 7.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 15570 | -| time_elapsed | 83276 | -| total_timesteps | 1992960 | -| train/ | | -| approx_kl | 0.009011304 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.000553 | -| n_updates | 155690 | -| policy_gradient_loss | 0.0128 | -| std | 0.00936 | -| value_loss | 5.45e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15571 | -| time_elapsed | 83281 | -| total_timesteps | 1993088 | -| train/ | | -| approx_kl | 0.01387264 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 155700 | -| policy_gradient_loss | -0.0114 | -| std | 0.00937 | -| value_loss | 9.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15572 | -| time_elapsed | 83291 | -| total_timesteps | 1993216 | -| train/ | | -| approx_kl | 0.087801665 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.735 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 155710 | -| policy_gradient_loss | 0.0115 | -| std | 0.00936 | -| value_loss | 0.00569 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15573 | -| time_elapsed | 83300 | -| total_timesteps | 1993344 | -| train/ | | -| approx_kl | 0.02544598 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 155720 | -| policy_gradient_loss | 0.00999 | -| std | 0.00936 | -| value_loss | 7.68e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15574 | -| time_elapsed | 83306 | -| total_timesteps | 1993472 | -| train/ | | -| approx_kl | 0.07570762 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.000835 | -| learning_rate | 0.0003 | -| loss | 0.0505 | -| n_updates | 155730 | -| policy_gradient_loss | 0.0338 | -| std | 0.00936 | -| value_loss | 1.21e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15575 | -| time_elapsed | 83310 | -| total_timesteps | 1993600 | -| train/ | | -| approx_kl | 0.09188595 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0377 | -| n_updates | 155740 | -| policy_gradient_loss | 0.0151 | -| std | 0.00936 | -| value_loss | 8.08e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15576 | -| time_elapsed | 83316 | -| total_timesteps | 1993728 | -| train/ | | -| approx_kl | 0.11176487 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 155750 | -| policy_gradient_loss | 0.0106 | -| std | 0.00936 | -| value_loss | 5.75e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15577 | -| time_elapsed | 83321 | -| total_timesteps | 1993856 | -| train/ | | -| approx_kl | 0.040112715 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 155760 | -| policy_gradient_loss | 0.0166 | -| std | 0.00936 | -| value_loss | 9.63e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 15578 | -| time_elapsed | 83327 | -| total_timesteps | 1993984 | -| train/ | | -| approx_kl | 0.02320167 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0077 | -| n_updates | 155770 | -| policy_gradient_loss | 0.016 | -| std | 0.00935 | -| value_loss | 1.37e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15579 | -| time_elapsed | 83334 | -| total_timesteps | 1994112 | -| train/ | | -| approx_kl | 0.0021994356 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.00229 | -| n_updates | 155780 | -| policy_gradient_loss | 0.013 | -| std | 0.00935 | -| value_loss | 9e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15580 | -| time_elapsed | 83347 | -| total_timesteps | 1994240 | -| train/ | | -| approx_kl | 0.09067443 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 155790 | -| policy_gradient_loss | 0.0101 | -| std | 0.00935 | -| value_loss | 0.000321 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15581 | -| time_elapsed | 83351 | -| total_timesteps | 1994368 | -| train/ | | -| approx_kl | 0.0041500586 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00673 | -| learning_rate | 0.0003 | -| loss | -0.000802 | -| n_updates | 155800 | -| policy_gradient_loss | 0.0111 | -| std | 0.00937 | -| value_loss | 9.48e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15582 | -| time_elapsed | 83355 | -| total_timesteps | 1994496 | -| train/ | | -| approx_kl | 0.008772985 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.000212 | -| learning_rate | 0.0003 | -| loss | 0.000925 | -| n_updates | 155810 | -| policy_gradient_loss | 0.0508 | -| std | 0.0094 | -| value_loss | 0.00011 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15583 | -| time_elapsed | 83360 | -| total_timesteps | 1994624 | -| train/ | | -| approx_kl | 0.0064210347 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00785 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 155820 | -| policy_gradient_loss | -0.00141 | -| std | 0.00941 | -| value_loss | 1.72e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15584 | -| time_elapsed | 83364 | -| total_timesteps | 1994752 | -| train/ | | -| approx_kl | 0.03619674 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 155830 | -| policy_gradient_loss | 0.0118 | -| std | 0.00941 | -| value_loss | 6.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15585 | -| time_elapsed | 83369 | -| total_timesteps | 1994880 | -| train/ | | -| approx_kl | 0.070948645 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | 0.0431 | -| n_updates | 155840 | -| policy_gradient_loss | 0.0293 | -| std | 0.00941 | -| value_loss | 2.11e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15586 | -| time_elapsed | 83376 | -| total_timesteps | 1995008 | -| train/ | | -| approx_kl | 0.08852835 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0197 | -| n_updates | 155850 | -| policy_gradient_loss | 0.00762 | -| std | 0.00941 | -| value_loss | 1.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15587 | -| time_elapsed | 83389 | -| total_timesteps | 1995136 | -| train/ | | -| approx_kl | 0.07492916 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 155860 | -| policy_gradient_loss | 0.00229 | -| std | 0.00941 | -| value_loss | 8.94e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15588 | -| time_elapsed | 83395 | -| total_timesteps | 1995264 | -| train/ | | -| approx_kl | 0.028417557 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.182 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 155870 | -| policy_gradient_loss | 0.00831 | -| std | 0.00941 | -| value_loss | 1.17e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15589 | -| time_elapsed | 83403 | -| total_timesteps | 1995392 | -| train/ | | -| approx_kl | 0.07852041 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 155880 | -| policy_gradient_loss | 0.0174 | -| std | 0.00941 | -| value_loss | 1.35e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15590 | -| time_elapsed | 83409 | -| total_timesteps | 1995520 | -| train/ | | -| approx_kl | 0.07881864 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.0286 | -| n_updates | 155890 | -| policy_gradient_loss | 0.0108 | -| std | 0.00941 | -| value_loss | 7.34e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15591 | -| time_elapsed | 83415 | -| total_timesteps | 1995648 | -| train/ | | -| approx_kl | 0.017918043 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 155900 | -| policy_gradient_loss | 0.00086 | -| std | 0.00941 | -| value_loss | 3.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15592 | -| time_elapsed | 83420 | -| total_timesteps | 1995776 | -| train/ | | -| approx_kl | 0.009766231 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 155910 | -| policy_gradient_loss | -0.00173 | -| std | 0.00941 | -| value_loss | 4.18e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 15593 | -| time_elapsed | 83425 | -| total_timesteps | 1995904 | -| train/ | | -| approx_kl | 0.0051709157 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 155920 | -| policy_gradient_loss | 0.0156 | -| std | 0.00941 | -| value_loss | 2.19e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15594 | -| time_elapsed | 83430 | -| total_timesteps | 1996032 | -| train/ | | -| approx_kl | 0.3422787 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 155930 | -| policy_gradient_loss | 0.115 | -| std | 0.00941 | -| value_loss | 1.27e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15595 | -| time_elapsed | 83441 | -| total_timesteps | 1996160 | -| train/ | | -| approx_kl | 0.029285528 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 155940 | -| policy_gradient_loss | -0.00525 | -| std | 0.00941 | -| value_loss | 0.0034 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15596 | -| time_elapsed | 83446 | -| total_timesteps | 1996288 | -| train/ | | -| approx_kl | 0.1753956 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0838 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 155950 | -| policy_gradient_loss | 0.0872 | -| std | 0.00941 | -| value_loss | 2.98e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15597 | -| time_elapsed | 83450 | -| total_timesteps | 1996416 | -| train/ | | -| approx_kl | 0.098362215 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00559 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 155960 | -| policy_gradient_loss | 0.0755 | -| std | 0.00941 | -| value_loss | 6.78e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15598 | -| time_elapsed | 83456 | -| total_timesteps | 1996544 | -| train/ | | -| approx_kl | 0.081148654 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00474 | -| learning_rate | 0.0003 | -| loss | 0.0684 | -| n_updates | 155970 | -| policy_gradient_loss | 0.0924 | -| std | 0.00941 | -| value_loss | 3.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15599 | -| time_elapsed | 83461 | -| total_timesteps | 1996672 | -| train/ | | -| approx_kl | 0.014924383 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 155980 | -| policy_gradient_loss | 0.0111 | -| std | 0.00941 | -| value_loss | 1.99e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15600 | -| time_elapsed | 83468 | -| total_timesteps | 1996800 | -| train/ | | -| approx_kl | 0.28644523 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 155990 | -| policy_gradient_loss | 0.0411 | -| std | 0.00941 | -| value_loss | 1.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 15601 | -| time_elapsed | 83473 | -| total_timesteps | 1996928 | -| train/ | | -| approx_kl | 0.023449317 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 156000 | -| policy_gradient_loss | -0.000498 | -| std | 0.00941 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15602 | -| time_elapsed | 83480 | -| total_timesteps | 1997056 | -| train/ | | -| approx_kl | 0.058760002 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.00332 | -| n_updates | 156010 | -| policy_gradient_loss | 0.0192 | -| std | 0.0094 | -| value_loss | 6.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15603 | -| time_elapsed | 83488 | -| total_timesteps | 1997184 | -| train/ | | -| approx_kl | 0.024658106 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | 0.0385 | -| n_updates | 156020 | -| policy_gradient_loss | 0.0102 | -| std | 0.0094 | -| value_loss | 0.00465 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15604 | -| time_elapsed | 83492 | -| total_timesteps | 1997312 | -| train/ | | -| approx_kl | 0.12413384 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.0623 | -| n_updates | 156030 | -| policy_gradient_loss | 0.0109 | -| std | 0.0094 | -| value_loss | 1.29e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15605 | -| time_elapsed | 83498 | -| total_timesteps | 1997440 | -| train/ | | -| approx_kl | 0.0043593296 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00751 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 156040 | -| policy_gradient_loss | 0.00728 | -| std | 0.0094 | -| value_loss | 1.61e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15606 | -| time_elapsed | 83504 | -| total_timesteps | 1997568 | -| train/ | | -| approx_kl | 0.30463436 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 156050 | -| policy_gradient_loss | 0.0362 | -| std | 0.0094 | -| value_loss | 9.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15607 | -| time_elapsed | 83511 | -| total_timesteps | 1997696 | -| train/ | | -| approx_kl | 0.01799414 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.00792 | -| n_updates | 156060 | -| policy_gradient_loss | 0.00442 | -| std | 0.0094 | -| value_loss | 7.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15608 | -| time_elapsed | 83518 | -| total_timesteps | 1997824 | -| train/ | | -| approx_kl | 0.027589282 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 156070 | -| policy_gradient_loss | -0.00119 | -| std | 0.0094 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 15609 | -| time_elapsed | 83523 | -| total_timesteps | 1997952 | -| train/ | | -| approx_kl | 0.0038362443 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.000701 | -| learning_rate | 0.0003 | -| loss | -0.00212 | -| n_updates | 156080 | -| policy_gradient_loss | 0.00186 | -| std | 0.00941 | -| value_loss | 4.93e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15610 | -| time_elapsed | 83527 | -| total_timesteps | 1998080 | -| train/ | | -| approx_kl | 0.029437726 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0715 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 156090 | -| policy_gradient_loss | -0.00532 | -| std | 0.00941 | -| value_loss | 2.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15611 | -| time_elapsed | 83537 | -| total_timesteps | 1998208 | -| train/ | | -| approx_kl | 0.009723786 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.371 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 156100 | -| policy_gradient_loss | -0.014 | -| std | 0.00942 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15612 | -| time_elapsed | 83542 | -| total_timesteps | 1998336 | -| train/ | | -| approx_kl | 0.020537011 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -143 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 156110 | -| policy_gradient_loss | -0.00422 | -| std | 0.00942 | -| value_loss | 4.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15613 | -| time_elapsed | 83548 | -| total_timesteps | 1998464 | -| train/ | | -| approx_kl | 0.0020383224 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | -0.000659 | -| n_updates | 156120 | -| policy_gradient_loss | 0.0105 | -| std | 0.00941 | -| value_loss | 2.28e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15614 | -| time_elapsed | 83553 | -| total_timesteps | 1998592 | -| train/ | | -| approx_kl | 0.33492452 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 156130 | -| policy_gradient_loss | 0.0363 | -| std | 0.00941 | -| value_loss | 8.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15615 | -| time_elapsed | 83557 | -| total_timesteps | 1998720 | -| train/ | | -| approx_kl | 0.02070548 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 156140 | -| policy_gradient_loss | -0.00167 | -| std | 0.0094 | -| value_loss | 1.39e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15616 | -| time_elapsed | 83562 | -| total_timesteps | 1998848 | -| train/ | | -| approx_kl | 0.0038051982 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00461 | -| learning_rate | 0.0003 | -| loss | -0.00083 | -| n_updates | 156150 | -| policy_gradient_loss | 0.00233 | -| std | 0.0094 | -| value_loss | 4.43e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 15617 | -| time_elapsed | 83567 | -| total_timesteps | 1998976 | -| train/ | | -| approx_kl | 0.038125407 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00248 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 156160 | -| policy_gradient_loss | 0.00282 | -| std | 0.0094 | -| value_loss | 1.31e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15618 | -| time_elapsed | 83573 | -| total_timesteps | 1999104 | -| train/ | | -| approx_kl | 0.01916029 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | 0.000488 | -| n_updates | 156170 | -| policy_gradient_loss | 0.0268 | -| std | 0.00938 | -| value_loss | 9.04e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15619 | -| time_elapsed | 83584 | -| total_timesteps | 1999232 | -| train/ | | -| approx_kl | 0.0021578325 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.815 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 156180 | -| policy_gradient_loss | -0.00298 | -| std | 0.00937 | -| value_loss | 0.000605 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15620 | -| time_elapsed | 83590 | -| total_timesteps | 1999360 | -| train/ | | -| approx_kl | 0.06748552 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.258 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 156190 | -| policy_gradient_loss | 0.0636 | -| std | 0.00937 | -| value_loss | 0.000118 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15621 | -| time_elapsed | 83594 | -| total_timesteps | 1999488 | -| train/ | | -| approx_kl | 0.011031523 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00484 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 156200 | -| policy_gradient_loss | 0.00473 | -| std | 0.00937 | -| value_loss | 1.33e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15622 | -| time_elapsed | 83598 | -| total_timesteps | 1999616 | -| train/ | | -| approx_kl | 0.084335625 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 156210 | -| policy_gradient_loss | 0.00919 | -| std | 0.00937 | -| value_loss | 4.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15623 | -| time_elapsed | 83603 | -| total_timesteps | 1999744 | -| train/ | | -| approx_kl | 0.011484349 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 156220 | -| policy_gradient_loss | 0.00774 | -| std | 0.00937 | -| value_loss | 3.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 15624 | -| time_elapsed | 83608 | -| total_timesteps | 1999872 | -| train/ | | -| approx_kl | 0.13061893 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 156230 | -| policy_gradient_loss | 0.0957 | -| std | 0.00936 | -| value_loss | 2.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15625 | -| time_elapsed | 83613 | -| total_timesteps | 2000000 | -| train/ | | -| approx_kl | 0.077190116 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0678 | -| n_updates | 156240 | -| policy_gradient_loss | 0.0818 | -| std | 0.00936 | -| value_loss | 1.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15626 | -| time_elapsed | 83618 | -| total_timesteps | 2000128 | -| train/ | | -| approx_kl | 0.071228825 | -| clip_fraction | 0.583 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00256 | -| learning_rate | 0.0003 | -| loss | 0.091 | -| n_updates | 156250 | -| policy_gradient_loss | 0.0681 | -| std | 0.00937 | -| value_loss | 1.04e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15627 | -| time_elapsed | 83632 | -| total_timesteps | 2000256 | -| train/ | | -| approx_kl | 0.14207937 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | 0.00335 | -| n_updates | 156260 | -| policy_gradient_loss | -0.000805 | -| std | 0.00937 | -| value_loss | 0.00042 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15628 | -| time_elapsed | 83638 | -| total_timesteps | 2000384 | -| train/ | | -| approx_kl | 0.10066123 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | 0.0492 | -| n_updates | 156270 | -| policy_gradient_loss | 0.0196 | -| std | 0.00937 | -| value_loss | 5.03e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15629 | -| time_elapsed | 83644 | -| total_timesteps | 2000512 | -| train/ | | -| approx_kl | 0.00041864114 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | -0.000361 | -| n_updates | 156280 | -| policy_gradient_loss | 0.00717 | -| std | 0.00938 | -| value_loss | 3.51e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15630 | -| time_elapsed | 83649 | -| total_timesteps | 2000640 | -| train/ | | -| approx_kl | 0.084327266 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | 0.0596 | -| n_updates | 156290 | -| policy_gradient_loss | 0.016 | -| std | 0.00939 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15631 | -| time_elapsed | 83654 | -| total_timesteps | 2000768 | -| train/ | | -| approx_kl | 0.07201097 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00878 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 156300 | -| policy_gradient_loss | 0.0172 | -| std | 0.00939 | -| value_loss | 8.65e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 15632 | -| time_elapsed | 83659 | -| total_timesteps | 2000896 | -| train/ | | -| approx_kl | 0.05386323 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 156310 | -| policy_gradient_loss | 0.0314 | -| std | 0.00939 | -| value_loss | 4.33e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15633 | -| time_elapsed | 83663 | -| total_timesteps | 2001024 | -| train/ | | -| approx_kl | 0.074139744 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.0462 | -| n_updates | 156320 | -| policy_gradient_loss | 0.0193 | -| std | 0.00939 | -| value_loss | 3.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15634 | -| time_elapsed | 83674 | -| total_timesteps | 2001152 | -| train/ | | -| approx_kl | 0.030035587 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 156330 | -| policy_gradient_loss | -0.00316 | -| std | 0.00939 | -| value_loss | 0.000831 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15635 | -| time_elapsed | 83679 | -| total_timesteps | 2001280 | -| train/ | | -| approx_kl | 0.2621008 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.741 | -| learning_rate | 0.0003 | -| loss | 0.0577 | -| n_updates | 156340 | -| policy_gradient_loss | 0.0168 | -| std | 0.00939 | -| value_loss | 2.51e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15636 | -| time_elapsed | 83684 | -| total_timesteps | 2001408 | -| train/ | | -| approx_kl | 0.16823968 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.0871 | -| n_updates | 156350 | -| policy_gradient_loss | 0.0189 | -| std | 0.00942 | -| value_loss | 1.95e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15637 | -| time_elapsed | 83689 | -| total_timesteps | 2001536 | -| train/ | | -| approx_kl | 0.21080819 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.0754 | -| n_updates | 156360 | -| policy_gradient_loss | 0.0256 | -| std | 0.00945 | -| value_loss | 7.04e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15638 | -| time_elapsed | 83693 | -| total_timesteps | 2001664 | -| train/ | | -| approx_kl | 0.0041552647 | -| clip_fraction | 0.0961 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.000469 | -| n_updates | 156370 | -| policy_gradient_loss | 0.00218 | -| std | 0.00945 | -| value_loss | 2.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15639 | -| time_elapsed | 83698 | -| total_timesteps | 2001792 | -| train/ | | -| approx_kl | 0.032168366 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 156380 | -| policy_gradient_loss | 0.00939 | -| std | 0.00946 | -| value_loss | 5.56e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15640 | -| time_elapsed | 83702 | -| total_timesteps | 2001920 | -| train/ | | -| approx_kl | 0.0053712064 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 156390 | -| policy_gradient_loss | 0.00231 | -| std | 0.00946 | -| value_loss | 2.59e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15641 | -| time_elapsed | 83707 | -| total_timesteps | 2002048 | -| train/ | | -| approx_kl | 0.034097373 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 156400 | -| policy_gradient_loss | 0.00762 | -| std | 0.00946 | -| value_loss | 1.94e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15642 | -| time_elapsed | 83716 | -| total_timesteps | 2002176 | -| train/ | | -| approx_kl | 0.0277766 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.803 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 156410 | -| policy_gradient_loss | 0.00737 | -| std | 0.00946 | -| value_loss | 0.000878 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15643 | -| time_elapsed | 83721 | -| total_timesteps | 2002304 | -| train/ | | -| approx_kl | 0.41358343 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.231 | -| n_updates | 156420 | -| policy_gradient_loss | 0.121 | -| std | 0.00946 | -| value_loss | 2.07e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15644 | -| time_elapsed | 83725 | -| total_timesteps | 2002432 | -| train/ | | -| approx_kl | 0.3631614 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.00808 | -| learning_rate | 0.0003 | -| loss | 0.0491 | -| n_updates | 156430 | -| policy_gradient_loss | 0.0114 | -| std | 0.00946 | -| value_loss | 3.68e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15645 | -| time_elapsed | 83730 | -| total_timesteps | 2002560 | -| train/ | | -| approx_kl | 0.009714757 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 156440 | -| policy_gradient_loss | -0.00154 | -| std | 0.00946 | -| value_loss | 1.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15646 | -| time_elapsed | 83735 | -| total_timesteps | 2002688 | -| train/ | | -| approx_kl | 0.01948231 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 156450 | -| policy_gradient_loss | -0.000477 | -| std | 0.00946 | -| value_loss | 1.11e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15647 | -| time_elapsed | 83738 | -| total_timesteps | 2002816 | -| train/ | | -| approx_kl | 0.0043961112 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 156460 | -| policy_gradient_loss | -0.000248 | -| std | 0.00946 | -| value_loss | 7.51e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 15648 | -| time_elapsed | 83744 | -| total_timesteps | 2002944 | -| train/ | | -| approx_kl | 0.0340243 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.00719 | -| n_updates | 156470 | -| policy_gradient_loss | 0.0199 | -| std | 0.00946 | -| value_loss | 4.9e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15649 | -| time_elapsed | 83749 | -| total_timesteps | 2003072 | -| train/ | | -| approx_kl | 0.048897956 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.0384 | -| n_updates | 156480 | -| policy_gradient_loss | 0.0297 | -| std | 0.00946 | -| value_loss | 3.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15650 | -| time_elapsed | 83756 | -| total_timesteps | 2003200 | -| train/ | | -| approx_kl | 0.010672447 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.84 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 156490 | -| policy_gradient_loss | -0.00953 | -| std | 0.00946 | -| value_loss | 0.00179 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15651 | -| time_elapsed | 83761 | -| total_timesteps | 2003328 | -| train/ | | -| approx_kl | 0.06731094 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0842 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 156500 | -| policy_gradient_loss | 0.0433 | -| std | 0.00946 | -| value_loss | 0.000103 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15652 | -| time_elapsed | 83766 | -| total_timesteps | 2003456 | -| train/ | | -| approx_kl | 0.10917267 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.00824 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 156510 | -| policy_gradient_loss | 0.0194 | -| std | 0.00946 | -| value_loss | 2.07e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15653 | -| time_elapsed | 83770 | -| total_timesteps | 2003584 | -| train/ | | -| approx_kl | 0.026609786 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.00837 | -| n_updates | 156520 | -| policy_gradient_loss | 0.0399 | -| std | 0.00946 | -| value_loss | 7.49e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15654 | -| time_elapsed | 83775 | -| total_timesteps | 2003712 | -| train/ | | -| approx_kl | 0.10790647 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.0499 | -| n_updates | 156530 | -| policy_gradient_loss | 0.0204 | -| std | 0.00946 | -| value_loss | 6.47e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15655 | -| time_elapsed | 83781 | -| total_timesteps | 2003840 | -| train/ | | -| approx_kl | 0.00082761934 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 156540 | -| policy_gradient_loss | 0.015 | -| std | 0.00944 | -| value_loss | 0.00174 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 15656 | -| time_elapsed | 83786 | -| total_timesteps | 2003968 | -| train/ | | -| approx_kl | 0.076989576 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.097 | -| n_updates | 156550 | -| policy_gradient_loss | 0.0343 | -| std | 0.00943 | -| value_loss | 0.00795 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15657 | -| time_elapsed | 83792 | -| total_timesteps | 2004096 | -| train/ | | -| approx_kl | 0.16342962 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.452 | -| learning_rate | 0.0003 | -| loss | 0.0513 | -| n_updates | 156560 | -| policy_gradient_loss | 0.00708 | -| std | 0.00943 | -| value_loss | 0.00075 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15658 | -| time_elapsed | 83802 | -| total_timesteps | 2004224 | -| train/ | | -| approx_kl | 0.06330097 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.971 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 156570 | -| policy_gradient_loss | 0.0241 | -| std | 0.00943 | -| value_loss | 0.00318 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15659 | -| time_elapsed | 83806 | -| total_timesteps | 2004352 | -| train/ | | -| approx_kl | 0.0007298663 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 156580 | -| policy_gradient_loss | 0.0899 | -| std | 0.00943 | -| value_loss | 5.94e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15660 | -| time_elapsed | 83811 | -| total_timesteps | 2004480 | -| train/ | | -| approx_kl | 0.039205156 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.0605 | -| n_updates | 156590 | -| policy_gradient_loss | 0.0624 | -| std | 0.00943 | -| value_loss | 6.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15661 | -| time_elapsed | 83817 | -| total_timesteps | 2004608 | -| train/ | | -| approx_kl | 0.006516953 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 156600 | -| policy_gradient_loss | 0.00819 | -| std | 0.00943 | -| value_loss | 3.78e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15662 | -| time_elapsed | 83822 | -| total_timesteps | 2004736 | -| train/ | | -| approx_kl | 0.07883068 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 156610 | -| policy_gradient_loss | 0.00513 | -| std | 0.00943 | -| value_loss | 2.77e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15663 | -| time_elapsed | 83827 | -| total_timesteps | 2004864 | -| train/ | | -| approx_kl | 0.010184109 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 156620 | -| policy_gradient_loss | 0.00541 | -| std | 0.00943 | -| value_loss | 1.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 15664 | -| time_elapsed | 83831 | -| total_timesteps | 2004992 | -| train/ | | -| approx_kl | 0.012900457 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 156630 | -| policy_gradient_loss | -0.00662 | -| std | 0.00943 | -| value_loss | 1.17e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15665 | -| time_elapsed | 83837 | -| total_timesteps | 2005120 | -| train/ | | -| approx_kl | 0.22753023 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 156640 | -| policy_gradient_loss | 0.0473 | -| std | 0.00942 | -| value_loss | 6.67e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15666 | -| time_elapsed | 83847 | -| total_timesteps | 2005248 | -| train/ | | -| approx_kl | 0.0374374 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.00798 | -| n_updates | 156650 | -| policy_gradient_loss | -0.0092 | -| std | 0.00941 | -| value_loss | 0.000177 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15667 | -| time_elapsed | 83852 | -| total_timesteps | 2005376 | -| train/ | | -| approx_kl | 0.007058925 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00585 | -| n_updates | 156660 | -| policy_gradient_loss | -2.88e-05 | -| std | 0.00941 | -| value_loss | 1.99e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15668 | -| time_elapsed | 83856 | -| total_timesteps | 2005504 | -| train/ | | -| approx_kl | 0.03853302 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 156670 | -| policy_gradient_loss | 0.0343 | -| std | 0.00941 | -| value_loss | 1.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15669 | -| time_elapsed | 83860 | -| total_timesteps | 2005632 | -| train/ | | -| approx_kl | 0.015477978 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00544 | -| n_updates | 156680 | -| policy_gradient_loss | 0.00814 | -| std | 0.00942 | -| value_loss | 1.31e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15670 | -| time_elapsed | 83865 | -| total_timesteps | 2005760 | -| train/ | | -| approx_kl | 0.11412108 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 156690 | -| policy_gradient_loss | 0.0416 | -| std | 0.00942 | -| value_loss | 9.98e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15671 | -| time_elapsed | 83870 | -| total_timesteps | 2005888 | -| train/ | | -| approx_kl | 0.00038825534 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 156700 | -| policy_gradient_loss | -0.00384 | -| std | 0.00942 | -| value_loss | 8.85e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15672 | -| time_elapsed | 83875 | -| total_timesteps | 2006016 | -| train/ | | -| approx_kl | 0.038379453 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.00357 | -| n_updates | 156710 | -| policy_gradient_loss | 0.0347 | -| std | 0.00942 | -| value_loss | 7.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15673 | -| time_elapsed | 83889 | -| total_timesteps | 2006144 | -| train/ | | -| approx_kl | 0.014595137 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 156720 | -| policy_gradient_loss | -0.00885 | -| std | 0.00942 | -| value_loss | 0.00232 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15674 | -| time_elapsed | 83896 | -| total_timesteps | 2006272 | -| train/ | | -| approx_kl | 0.014422433 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.0323 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 156730 | -| policy_gradient_loss | 0.00128 | -| std | 0.00942 | -| value_loss | 4.85e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15675 | -| time_elapsed | 83901 | -| total_timesteps | 2006400 | -| train/ | | -| approx_kl | 0.0017314288 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0966 | -| learning_rate | 0.0003 | -| loss | 0.00995 | -| n_updates | 156740 | -| policy_gradient_loss | -0.00831 | -| std | 0.00942 | -| value_loss | 3.78e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15676 | -| time_elapsed | 83907 | -| total_timesteps | 2006528 | -| train/ | | -| approx_kl | 0.0058977054 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00581 | -| n_updates | 156750 | -| policy_gradient_loss | 0.000356 | -| std | 0.00942 | -| value_loss | 1.79e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15677 | -| time_elapsed | 83912 | -| total_timesteps | 2006656 | -| train/ | | -| approx_kl | 0.017280608 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 156760 | -| policy_gradient_loss | 0.0536 | -| std | 0.00942 | -| value_loss | 2.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15678 | -| time_elapsed | 83918 | -| total_timesteps | 2006784 | -| train/ | | -| approx_kl | 0.0042452277 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 156770 | -| policy_gradient_loss | 0.00712 | -| std | 0.00943 | -| value_loss | 1.21e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15679 | -| time_elapsed | 83923 | -| total_timesteps | 2006912 | -| train/ | | -| approx_kl | 0.37757182 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 156780 | -| policy_gradient_loss | 0.131 | -| std | 0.00943 | -| value_loss | 9.3e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15680 | -| time_elapsed | 83928 | -| total_timesteps | 2007040 | -| train/ | | -| approx_kl | 0.0063182837 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 156790 | -| policy_gradient_loss | -0.00341 | -| std | 0.00943 | -| value_loss | 8.53e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15681 | -| time_elapsed | 83937 | -| total_timesteps | 2007168 | -| train/ | | -| approx_kl | 0.007992759 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 156800 | -| policy_gradient_loss | -0.0108 | -| std | 0.00944 | -| value_loss | 0.000104 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15682 | -| time_elapsed | 83942 | -| total_timesteps | 2007296 | -| train/ | | -| approx_kl | 0.0038079307 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -15.6 | -| learning_rate | 0.0003 | -| loss | 0.00266 | -| n_updates | 156810 | -| policy_gradient_loss | 0.00196 | -| std | 0.00944 | -| value_loss | 2.21e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15683 | -| time_elapsed | 83948 | -| total_timesteps | 2007424 | -| train/ | | -| approx_kl | 0.0015365728 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -2.63 | -| learning_rate | 0.0003 | -| loss | 0.00918 | -| n_updates | 156820 | -| policy_gradient_loss | -0.00768 | -| std | 0.00943 | -| value_loss | 6.69e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15684 | -| time_elapsed | 83954 | -| total_timesteps | 2007552 | -| train/ | | -| approx_kl | 0.057283916 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.613 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 156830 | -| policy_gradient_loss | -0.0157 | -| std | 0.00943 | -| value_loss | 3.97e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15685 | -| time_elapsed | 83959 | -| total_timesteps | 2007680 | -| train/ | | -| approx_kl | 0.015121976 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | -0.000352 | -| n_updates | 156840 | -| policy_gradient_loss | 0.00104 | -| std | 0.00944 | -| value_loss | 9.55e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15686 | -| time_elapsed | 83963 | -| total_timesteps | 2007808 | -| train/ | | -| approx_kl | 0.024856854 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.000896 | -| n_updates | 156850 | -| policy_gradient_loss | -0.000245 | -| std | 0.00945 | -| value_loss | 4.16e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15687 | -| time_elapsed | 83967 | -| total_timesteps | 2007936 | -| train/ | | -| approx_kl | 0.00016157748 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | -0.000806 | -| n_updates | 156860 | -| policy_gradient_loss | 0.000622 | -| std | 0.00945 | -| value_loss | 3.25e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15688 | -| time_elapsed | 83971 | -| total_timesteps | 2008064 | -| train/ | | -| approx_kl | 0.0044770148 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | -9.75e-05 | -| n_updates | 156870 | -| policy_gradient_loss | 0.00309 | -| std | 0.00945 | -| value_loss | 4.33e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15689 | -| time_elapsed | 83979 | -| total_timesteps | 2008192 | -| train/ | | -| approx_kl | 0.01554336 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 156880 | -| policy_gradient_loss | -0.016 | -| std | 0.00945 | -| value_loss | 7.69e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15690 | -| time_elapsed | 83985 | -| total_timesteps | 2008320 | -| train/ | | -| approx_kl | 0.0003363127 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.000717 | -| n_updates | 156890 | -| policy_gradient_loss | 0.00263 | -| std | 0.00945 | -| value_loss | 5.68e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15691 | -| time_elapsed | 83989 | -| total_timesteps | 2008448 | -| train/ | | -| approx_kl | 0.026312277 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.00289 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 156900 | -| policy_gradient_loss | 0.00608 | -| std | 0.00946 | -| value_loss | 2.75e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15692 | -| time_elapsed | 83994 | -| total_timesteps | 2008576 | -| train/ | | -| approx_kl | 0.024800263 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 156910 | -| policy_gradient_loss | 0.00361 | -| std | 0.00946 | -| value_loss | 2.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15693 | -| time_elapsed | 83999 | -| total_timesteps | 2008704 | -| train/ | | -| approx_kl | 0.028944377 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.00271 | -| n_updates | 156920 | -| policy_gradient_loss | 0.00111 | -| std | 0.00946 | -| value_loss | 1.79e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15694 | -| time_elapsed | 84003 | -| total_timesteps | 2008832 | -| train/ | | -| approx_kl | 0.026049944 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 156930 | -| policy_gradient_loss | 0.006 | -| std | 0.00946 | -| value_loss | 1.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15695 | -| time_elapsed | 84007 | -| total_timesteps | 2008960 | -| train/ | | -| approx_kl | 0.019096054 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | -0.00728 | -| n_updates | 156940 | -| policy_gradient_loss | -0.00358 | -| std | 0.00946 | -| value_loss | 7.97e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15696 | -| time_elapsed | 84013 | -| total_timesteps | 2009088 | -| train/ | | -| approx_kl | 0.0044630263 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | -0.00815 | -| n_updates | 156950 | -| policy_gradient_loss | 0.00127 | -| std | 0.00945 | -| value_loss | 6.69e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15697 | -| time_elapsed | 84022 | -| total_timesteps | 2009216 | -| train/ | | -| approx_kl | 0.24926724 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 156960 | -| policy_gradient_loss | 0.00768 | -| std | 0.00945 | -| value_loss | 0.000148 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15698 | -| time_elapsed | 84027 | -| total_timesteps | 2009344 | -| train/ | | -| approx_kl | 0.012694436 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0961 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 156970 | -| policy_gradient_loss | 0.00532 | -| std | 0.00945 | -| value_loss | 1.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15699 | -| time_elapsed | 84032 | -| total_timesteps | 2009472 | -| train/ | | -| approx_kl | 0.086116455 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.000296 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 156980 | -| policy_gradient_loss | 0.00571 | -| std | 0.00945 | -| value_loss | 2.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15700 | -| time_elapsed | 84039 | -| total_timesteps | 2009600 | -| train/ | | -| approx_kl | 0.004304423 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00744 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 156990 | -| policy_gradient_loss | 0.0147 | -| std | 0.00945 | -| value_loss | 1.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15701 | -| time_elapsed | 84044 | -| total_timesteps | 2009728 | -| train/ | | -| approx_kl | 0.013502888 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 157000 | -| policy_gradient_loss | 0.00128 | -| std | 0.00945 | -| value_loss | 1.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15702 | -| time_elapsed | 84050 | -| total_timesteps | 2009856 | -| train/ | | -| approx_kl | 0.010275278 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 157010 | -| policy_gradient_loss | 0.0115 | -| std | 0.00945 | -| value_loss | 9.08e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 15703 | -| time_elapsed | 84056 | -| total_timesteps | 2009984 | -| train/ | | -| approx_kl | 0.10679319 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0647 | -| n_updates | 157020 | -| policy_gradient_loss | 0.0616 | -| std | 0.00945 | -| value_loss | 7.23e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15704 | -| time_elapsed | 84059 | -| total_timesteps | 2010112 | -| train/ | | -| approx_kl | 0.028593251 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 157030 | -| policy_gradient_loss | 0.0154 | -| std | 0.00945 | -| value_loss | 6.33e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15705 | -| time_elapsed | 84071 | -| total_timesteps | 2010240 | -| train/ | | -| approx_kl | 0.025003318 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.917 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 157040 | -| policy_gradient_loss | -0.000529 | -| std | 0.00945 | -| value_loss | 0.000886 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15706 | -| time_elapsed | 84076 | -| total_timesteps | 2010368 | -| train/ | | -| approx_kl | 0.031227186 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 157050 | -| policy_gradient_loss | -0.00801 | -| std | 0.00945 | -| value_loss | 8.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15707 | -| time_elapsed | 84081 | -| total_timesteps | 2010496 | -| train/ | | -| approx_kl | 0.011108821 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 157060 | -| policy_gradient_loss | -0.00186 | -| std | 0.00944 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15708 | -| time_elapsed | 84087 | -| total_timesteps | 2010624 | -| train/ | | -| approx_kl | 0.010169106 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | -0.00594 | -| n_updates | 157070 | -| policy_gradient_loss | 0.00888 | -| std | 0.00944 | -| value_loss | 1.39e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15709 | -| time_elapsed | 84092 | -| total_timesteps | 2010752 | -| train/ | | -| approx_kl | 0.05897955 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.00781 | -| n_updates | 157080 | -| policy_gradient_loss | 0.00906 | -| std | 0.00944 | -| value_loss | 1.26e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 15710 | -| time_elapsed | 84098 | -| total_timesteps | 2010880 | -| train/ | | -| approx_kl | 0.3087293 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 157090 | -| policy_gradient_loss | 0.0369 | -| std | 0.00944 | -| value_loss | 7.92e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15711 | -| time_elapsed | 84104 | -| total_timesteps | 2011008 | -| train/ | | -| approx_kl | 0.008426245 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 157100 | -| policy_gradient_loss | 0.00231 | -| std | 0.00944 | -| value_loss | 5.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15712 | -| time_elapsed | 84116 | -| total_timesteps | 2011136 | -| train/ | | -| approx_kl | 0.021317115 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 157110 | -| policy_gradient_loss | -0.00521 | -| std | 0.00945 | -| value_loss | 0.00138 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15713 | -| time_elapsed | 84122 | -| total_timesteps | 2011264 | -| train/ | | -| approx_kl | 0.0656686 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.399 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 157120 | -| policy_gradient_loss | 0.00544 | -| std | 0.00945 | -| value_loss | 2.3e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15714 | -| time_elapsed | 84126 | -| total_timesteps | 2011392 | -| train/ | | -| approx_kl | 0.030585917 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 157130 | -| policy_gradient_loss | 0.000745 | -| std | 0.00945 | -| value_loss | 1.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15715 | -| time_elapsed | 84131 | -| total_timesteps | 2011520 | -| train/ | | -| approx_kl | 0.08077743 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0934 | -| learning_rate | 0.0003 | -| loss | 0.0294 | -| n_updates | 157140 | -| policy_gradient_loss | 0.0209 | -| std | 0.00945 | -| value_loss | 1.32e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15716 | -| time_elapsed | 84137 | -| total_timesteps | 2011648 | -| train/ | | -| approx_kl | 0.08642054 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.0405 | -| n_updates | 157150 | -| policy_gradient_loss | 0.0159 | -| std | 0.00945 | -| value_loss | 1.05e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15717 | -| time_elapsed | 84143 | -| total_timesteps | 2011776 | -| train/ | | -| approx_kl | 0.0010481649 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 157160 | -| policy_gradient_loss | 0.0131 | -| std | 0.00945 | -| value_loss | 8.3e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15718 | -| time_elapsed | 84147 | -| total_timesteps | 2011904 | -| train/ | | -| approx_kl | 0.07907609 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 157170 | -| policy_gradient_loss | 0.0136 | -| std | 0.00945 | -| value_loss | 5.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15719 | -| time_elapsed | 84151 | -| total_timesteps | 2012032 | -| train/ | | -| approx_kl | 0.011846049 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 157180 | -| policy_gradient_loss | 0.0144 | -| std | 0.00945 | -| value_loss | 3.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15720 | -| time_elapsed | 84163 | -| total_timesteps | 2012160 | -| train/ | | -| approx_kl | 0.005077455 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.00513 | -| n_updates | 157190 | -| policy_gradient_loss | -0.00668 | -| std | 0.00945 | -| value_loss | 0.00114 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15721 | -| time_elapsed | 84168 | -| total_timesteps | 2012288 | -| train/ | | -| approx_kl | 0.0046612453 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.715 | -| learning_rate | 0.0003 | -| loss | 0.00505 | -| n_updates | 157200 | -| policy_gradient_loss | 0.00552 | -| std | 0.00943 | -| value_loss | 2.97e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15722 | -| time_elapsed | 84171 | -| total_timesteps | 2012416 | -| train/ | | -| approx_kl | 0.016490111 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.588 | -| learning_rate | 0.0003 | -| loss | 0.0436 | -| n_updates | 157210 | -| policy_gradient_loss | 0.0339 | -| std | 0.00941 | -| value_loss | 5.92e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15723 | -| time_elapsed | 84176 | -| total_timesteps | 2012544 | -| train/ | | -| approx_kl | 0.01161897 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 157220 | -| policy_gradient_loss | 0.00212 | -| std | 0.0094 | -| value_loss | 1.1e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15724 | -| time_elapsed | 84181 | -| total_timesteps | 2012672 | -| train/ | | -| approx_kl | 0.002382719 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00637 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 157230 | -| policy_gradient_loss | 0.0105 | -| std | 0.0094 | -| value_loss | 3.16e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15725 | -| time_elapsed | 84184 | -| total_timesteps | 2012800 | -| train/ | | -| approx_kl | 0.4078832 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.307 | -| n_updates | 157240 | -| policy_gradient_loss | 0.155 | -| std | 0.0094 | -| value_loss | 1.35e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 15726 | -| time_elapsed | 84189 | -| total_timesteps | 2012928 | -| train/ | | -| approx_kl | 0.012741527 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.00242 | -| n_updates | 157250 | -| policy_gradient_loss | -0.000408 | -| std | 0.0094 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15727 | -| time_elapsed | 84194 | -| total_timesteps | 2013056 | -| train/ | | -| approx_kl | 0.010032791 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.000515 | -| n_updates | 157260 | -| policy_gradient_loss | 0.0111 | -| std | 0.0094 | -| value_loss | 6.44e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15728 | -| time_elapsed | 84204 | -| total_timesteps | 2013184 | -| train/ | | -| approx_kl | 0.0035744878 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.00613 | -| n_updates | 157270 | -| policy_gradient_loss | 0.00844 | -| std | 0.0094 | -| value_loss | 0.00245 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15729 | -| time_elapsed | 84209 | -| total_timesteps | 2013312 | -| train/ | | -| approx_kl | 0.022429347 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -1.71 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 157280 | -| policy_gradient_loss | -0.000834 | -| std | 0.00939 | -| value_loss | 6.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15730 | -| time_elapsed | 84215 | -| total_timesteps | 2013440 | -| train/ | | -| approx_kl | 0.071286865 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 157290 | -| policy_gradient_loss | 0.0346 | -| std | 0.00939 | -| value_loss | 2.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15731 | -| time_elapsed | 84218 | -| total_timesteps | 2013568 | -| train/ | | -| approx_kl | 0.09758468 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -38.2 | -| learning_rate | 0.0003 | -| loss | -0.0096 | -| n_updates | 157300 | -| policy_gradient_loss | -0.00358 | -| std | 0.00939 | -| value_loss | 1.04e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15732 | -| time_elapsed | 84224 | -| total_timesteps | 2013696 | -| train/ | | -| approx_kl | 0.0067930147 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -18.1 | -| learning_rate | 0.0003 | -| loss | 0.00143 | -| n_updates | 157310 | -| policy_gradient_loss | 0.00379 | -| std | 0.00939 | -| value_loss | 1.14e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15733 | -| time_elapsed | 84229 | -| total_timesteps | 2013824 | -| train/ | | -| approx_kl | 0.02754717 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.884 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 157320 | -| policy_gradient_loss | 0.0161 | -| std | 0.00936 | -| value_loss | 1.96e-11 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 15734 | -| time_elapsed | 84234 | -| total_timesteps | 2013952 | -| train/ | | -| approx_kl | 0.232199 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0811 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 157330 | -| policy_gradient_loss | 0.0357 | -| std | 0.00934 | -| value_loss | 1.31e-11 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15735 | -| time_elapsed | 84239 | -| total_timesteps | 2014080 | -| train/ | | -| approx_kl | 0.006173234 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 157340 | -| policy_gradient_loss | 0.000431 | -| std | 0.00934 | -| value_loss | 6.03e-12 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15736 | -| time_elapsed | 84247 | -| total_timesteps | 2014208 | -| train/ | | -| approx_kl | 0.26154065 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | 0.0481 | -| n_updates | 157350 | -| policy_gradient_loss | -0.00506 | -| std | 0.00934 | -| value_loss | 0.00225 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15737 | -| time_elapsed | 84253 | -| total_timesteps | 2014336 | -| train/ | | -| approx_kl | 0.052064102 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.086 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 157360 | -| policy_gradient_loss | 0.00455 | -| std | 0.00934 | -| value_loss | 9.93e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15738 | -| time_elapsed | 84259 | -| total_timesteps | 2014464 | -| train/ | | -| approx_kl | 0.0073450636 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00562 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 157370 | -| policy_gradient_loss | 0.00305 | -| std | 0.00934 | -| value_loss | 1.66e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15739 | -| time_elapsed | 84264 | -| total_timesteps | 2014592 | -| train/ | | -| approx_kl | 0.03358346 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 157380 | -| policy_gradient_loss | -0.00474 | -| std | 0.00934 | -| value_loss | 1.1e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15740 | -| time_elapsed | 84268 | -| total_timesteps | 2014720 | -| train/ | | -| approx_kl | 0.021068659 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0054 | -| n_updates | 157390 | -| policy_gradient_loss | 0.00307 | -| std | 0.00934 | -| value_loss | 7.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15741 | -| time_elapsed | 84273 | -| total_timesteps | 2014848 | -| train/ | | -| approx_kl | 0.023579622 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.000236 | -| n_updates | 157400 | -| policy_gradient_loss | -0.000382 | -| std | 0.00934 | -| value_loss | 5.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 15742 | -| time_elapsed | 84277 | -| total_timesteps | 2014976 | -| train/ | | -| approx_kl | 0.0051120743 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.0051 | -| n_updates | 157410 | -| policy_gradient_loss | 0.00185 | -| std | 0.00934 | -| value_loss | 4.15e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15743 | -| time_elapsed | 84282 | -| total_timesteps | 2015104 | -| train/ | | -| approx_kl | 0.03057734 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 157420 | -| policy_gradient_loss | -8.08e-05 | -| std | 0.00934 | -| value_loss | 2.88e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15744 | -| time_elapsed | 84292 | -| total_timesteps | 2015232 | -| train/ | | -| approx_kl | 0.0025164378 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 157430 | -| policy_gradient_loss | -0.00682 | -| std | 0.00934 | -| value_loss | 0.00457 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15745 | -| time_elapsed | 84297 | -| total_timesteps | 2015360 | -| train/ | | -| approx_kl | 0.049057454 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00154 | -| learning_rate | 0.0003 | -| loss | -0.00684 | -| n_updates | 157440 | -| policy_gradient_loss | 0.00346 | -| std | 0.00934 | -| value_loss | 4.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15746 | -| time_elapsed | 84300 | -| total_timesteps | 2015488 | -| train/ | | -| approx_kl | 0.05720838 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0541 | -| n_updates | 157450 | -| policy_gradient_loss | 0.046 | -| std | 0.00934 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15747 | -| time_elapsed | 84304 | -| total_timesteps | 2015616 | -| train/ | | -| approx_kl | 0.05211998 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0813 | -| learning_rate | 0.0003 | -| loss | 0.00888 | -| n_updates | 157460 | -| policy_gradient_loss | -0.00295 | -| std | 0.00934 | -| value_loss | 7.42e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15748 | -| time_elapsed | 84308 | -| total_timesteps | 2015744 | -| train/ | | -| approx_kl | 0.18693501 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 157470 | -| policy_gradient_loss | 0.0223 | -| std | 0.00937 | -| value_loss | 7.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 15749 | -| time_elapsed | 84314 | -| total_timesteps | 2015872 | -| train/ | | -| approx_kl | 0.10280295 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 157480 | -| policy_gradient_loss | 0.00447 | -| std | 0.0094 | -| value_loss | 1.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15750 | -| time_elapsed | 84320 | -| total_timesteps | 2016000 | -| train/ | | -| approx_kl | 0.086461686 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00433 | -| learning_rate | 0.0003 | -| loss | 0.00814 | -| n_updates | 157490 | -| policy_gradient_loss | 0.00138 | -| std | 0.00941 | -| value_loss | 5.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15751 | -| time_elapsed | 84325 | -| total_timesteps | 2016128 | -| train/ | | -| approx_kl | 0.033685658 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00168 | -| learning_rate | 0.0003 | -| loss | -0.00822 | -| n_updates | 157500 | -| policy_gradient_loss | 0.006 | -| std | 0.00941 | -| value_loss | 2.67e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15752 | -| time_elapsed | 84335 | -| total_timesteps | 2016256 | -| train/ | | -| approx_kl | 0.11681175 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 157510 | -| policy_gradient_loss | 0.0223 | -| std | 0.00941 | -| value_loss | 9.71e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15753 | -| time_elapsed | 84340 | -| total_timesteps | 2016384 | -| train/ | | -| approx_kl | 0.27130133 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00753 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 157520 | -| policy_gradient_loss | 0.112 | -| std | 0.00941 | -| value_loss | 1.6e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15754 | -| time_elapsed | 84344 | -| total_timesteps | 2016512 | -| train/ | | -| approx_kl | 0.08374125 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00558 | -| learning_rate | 0.0003 | -| loss | 0.0887 | -| n_updates | 157530 | -| policy_gradient_loss | 0.0779 | -| std | 0.00941 | -| value_loss | 8.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15755 | -| time_elapsed | 84349 | -| total_timesteps | 2016640 | -| train/ | | -| approx_kl | 0.088076234 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00412 | -| learning_rate | 0.0003 | -| loss | 0.0753 | -| n_updates | 157540 | -| policy_gradient_loss | 0.0842 | -| std | 0.00941 | -| value_loss | 5.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15756 | -| time_elapsed | 84354 | -| total_timesteps | 2016768 | -| train/ | | -| approx_kl | 0.06872132 | -| clip_fraction | 0.593 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0773 | -| n_updates | 157550 | -| policy_gradient_loss | 0.0656 | -| std | 0.00941 | -| value_loss | 4.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 15757 | -| time_elapsed | 84359 | -| total_timesteps | 2016896 | -| train/ | | -| approx_kl | 0.06777122 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 157560 | -| policy_gradient_loss | 0.0819 | -| std | 0.00941 | -| value_loss | 2.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15758 | -| time_elapsed | 84363 | -| total_timesteps | 2017024 | -| train/ | | -| approx_kl | 0.058394734 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.0689 | -| n_updates | 157570 | -| policy_gradient_loss | 0.0616 | -| std | 0.00941 | -| value_loss | 2.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15759 | -| time_elapsed | 84374 | -| total_timesteps | 2017152 | -| train/ | | -| approx_kl | 0.13978148 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | 0.0395 | -| n_updates | 157580 | -| policy_gradient_loss | 0.0461 | -| std | 0.00941 | -| value_loss | 0.000674 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15760 | -| time_elapsed | 84378 | -| total_timesteps | 2017280 | -| train/ | | -| approx_kl | 0.0329134 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 157590 | -| policy_gradient_loss | 0.0058 | -| std | 0.00941 | -| value_loss | 1.28e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15761 | -| time_elapsed | 84383 | -| total_timesteps | 2017408 | -| train/ | | -| approx_kl | 0.0014686608 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00186 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 157600 | -| policy_gradient_loss | -0.00218 | -| std | 0.00941 | -| value_loss | 9.25e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15762 | -| time_elapsed | 84388 | -| total_timesteps | 2017536 | -| train/ | | -| approx_kl | 0.116860256 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00563 | -| learning_rate | 0.0003 | -| loss | 0.0948 | -| n_updates | 157610 | -| policy_gradient_loss | 0.0971 | -| std | 0.00941 | -| value_loss | 9.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15763 | -| time_elapsed | 84391 | -| total_timesteps | 2017664 | -| train/ | | -| approx_kl | 0.084096245 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.0017 | -| learning_rate | 0.0003 | -| loss | 0.0775 | -| n_updates | 157620 | -| policy_gradient_loss | 0.0864 | -| std | 0.00942 | -| value_loss | 3.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15764 | -| time_elapsed | 84395 | -| total_timesteps | 2017792 | -| train/ | | -| approx_kl | 0.017996322 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00328 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 157630 | -| policy_gradient_loss | 0.0149 | -| std | 0.00942 | -| value_loss | 1.78e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 15765 | -| time_elapsed | 84401 | -| total_timesteps | 2017920 | -| train/ | | -| approx_kl | 0.26181558 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00778 | -| learning_rate | 0.0003 | -| loss | 0.0943 | -| n_updates | 157640 | -| policy_gradient_loss | 0.028 | -| std | 0.00942 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15766 | -| time_elapsed | 84405 | -| total_timesteps | 2018048 | -| train/ | | -| approx_kl | 0.027744032 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 157650 | -| policy_gradient_loss | 0.0075 | -| std | 0.00941 | -| value_loss | 6.2e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15767 | -| time_elapsed | 84416 | -| total_timesteps | 2018176 | -| train/ | | -| approx_kl | 0.0012864037 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 157660 | -| policy_gradient_loss | -0.00388 | -| std | 0.0094 | -| value_loss | 0.00218 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15768 | -| time_elapsed | 84421 | -| total_timesteps | 2018304 | -| train/ | | -| approx_kl | 2.8084964e-05 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | -0.000891 | -| n_updates | 157670 | -| policy_gradient_loss | -0.00486 | -| std | 0.0094 | -| value_loss | 1.78e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15769 | -| time_elapsed | 84425 | -| total_timesteps | 2018432 | -| train/ | | -| approx_kl | 0.008813048 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00337 | -| learning_rate | 0.0003 | -| loss | -0.000417 | -| n_updates | 157680 | -| policy_gradient_loss | 0.00168 | -| std | 0.0094 | -| value_loss | 2.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15770 | -| time_elapsed | 84429 | -| total_timesteps | 2018560 | -| train/ | | -| approx_kl | 0.03356631 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 157690 | -| policy_gradient_loss | 0.00483 | -| std | 0.0094 | -| value_loss | 1.74e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15771 | -| time_elapsed | 84433 | -| total_timesteps | 2018688 | -| train/ | | -| approx_kl | 0.027295176 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 157700 | -| policy_gradient_loss | 0.00582 | -| std | 0.00939 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15772 | -| time_elapsed | 84437 | -| total_timesteps | 2018816 | -| train/ | | -| approx_kl | 0.004318517 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 157710 | -| policy_gradient_loss | 0.00355 | -| std | 0.00938 | -| value_loss | 6.86e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 15773 | -| time_elapsed | 84440 | -| total_timesteps | 2018944 | -| train/ | | -| approx_kl | 0.00050165365 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 157720 | -| policy_gradient_loss | 0.00265 | -| std | 0.00937 | -| value_loss | 5.44e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15774 | -| time_elapsed | 84445 | -| total_timesteps | 2019072 | -| train/ | | -| approx_kl | 5.736947e-07 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -6.98e-05 | -| n_updates | 157730 | -| policy_gradient_loss | 0.00507 | -| std | 0.00937 | -| value_loss | 3.53e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15775 | -| time_elapsed | 84454 | -| total_timesteps | 2019200 | -| train/ | | -| approx_kl | 0.0019146879 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | -0.0049 | -| n_updates | 157740 | -| policy_gradient_loss | -0.000846 | -| std | 0.00936 | -| value_loss | 0.00344 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15776 | -| time_elapsed | 84460 | -| total_timesteps | 2019328 | -| train/ | | -| approx_kl | 0.021692522 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | -0.000643 | -| n_updates | 157750 | -| policy_gradient_loss | 0.000254 | -| std | 0.00936 | -| value_loss | 2.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15777 | -| time_elapsed | 84465 | -| total_timesteps | 2019456 | -| train/ | | -| approx_kl | 0.022121496 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00273 | -| learning_rate | 0.0003 | -| loss | -0.00851 | -| n_updates | 157760 | -| policy_gradient_loss | -0.00436 | -| std | 0.00935 | -| value_loss | 6.81e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15778 | -| time_elapsed | 84470 | -| total_timesteps | 2019584 | -| train/ | | -| approx_kl | 9.0476125e-05 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 157770 | -| policy_gradient_loss | 0.000978 | -| std | 0.00935 | -| value_loss | 4.03e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15779 | -| time_elapsed | 84474 | -| total_timesteps | 2019712 | -| train/ | | -| approx_kl | 0.023940906 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 157780 | -| policy_gradient_loss | 0.00183 | -| std | 0.00935 | -| value_loss | 2.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15780 | -| time_elapsed | 84477 | -| total_timesteps | 2019840 | -| train/ | | -| approx_kl | 0.027787626 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.00782 | -| n_updates | 157790 | -| policy_gradient_loss | 0.00353 | -| std | 0.00935 | -| value_loss | 1.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 15781 | -| time_elapsed | 84484 | -| total_timesteps | 2019968 | -| train/ | | -| approx_kl | 0.024708703 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | 0.00896 | -| n_updates | 157800 | -| policy_gradient_loss | 0.00422 | -| std | 0.00934 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15782 | -| time_elapsed | 84487 | -| total_timesteps | 2020096 | -| train/ | | -| approx_kl | 0.020947345 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.00335 | -| n_updates | 157810 | -| policy_gradient_loss | 0.0015 | -| std | 0.00934 | -| value_loss | 8.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15783 | -| time_elapsed | 84498 | -| total_timesteps | 2020224 | -| train/ | | -| approx_kl | 0.015598778 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.788 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 157820 | -| policy_gradient_loss | -0.0177 | -| std | 0.00934 | -| value_loss | 0.000616 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15784 | -| time_elapsed | 84503 | -| total_timesteps | 2020352 | -| train/ | | -| approx_kl | 0.003973319 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00985 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 157830 | -| policy_gradient_loss | 0.0148 | -| std | 0.00934 | -| value_loss | 3.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15785 | -| time_elapsed | 84506 | -| total_timesteps | 2020480 | -| train/ | | -| approx_kl | 0.10170286 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | 0.0253 | -| n_updates | 157840 | -| policy_gradient_loss | 0.00457 | -| std | 0.00934 | -| value_loss | 7.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15786 | -| time_elapsed | 84508 | -| total_timesteps | 2020608 | -| train/ | | -| approx_kl | 0.008447794 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 157850 | -| policy_gradient_loss | 0.000665 | -| std | 0.00934 | -| value_loss | 3.59e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15787 | -| time_elapsed | 84512 | -| total_timesteps | 2020736 | -| train/ | | -| approx_kl | 0.2719293 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00719 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 157860 | -| policy_gradient_loss | 0.0283 | -| std | 0.00934 | -| value_loss | 2.69e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15788 | -| time_elapsed | 84516 | -| total_timesteps | 2020864 | -| train/ | | -| approx_kl | 0.0005381014 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00118 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 157870 | -| policy_gradient_loss | -0.00183 | -| std | 0.00934 | -| value_loss | 1.88e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 15789 | -| time_elapsed | 84519 | -| total_timesteps | 2020992 | -| train/ | | -| approx_kl | 0.0053792694 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 157880 | -| policy_gradient_loss | 0.00237 | -| std | 0.00937 | -| value_loss | 1.21e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15790 | -| time_elapsed | 84524 | -| total_timesteps | 2021120 | -| train/ | | -| approx_kl | 0.0412403 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 157890 | -| policy_gradient_loss | 0.00287 | -| std | 0.00939 | -| value_loss | 9.53e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15791 | -| time_elapsed | 84536 | -| total_timesteps | 2021248 | -| train/ | | -| approx_kl | 0.034963485 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 157900 | -| policy_gradient_loss | 0.0165 | -| std | 0.0094 | -| value_loss | 0.000237 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15792 | -| time_elapsed | 84542 | -| total_timesteps | 2021376 | -| train/ | | -| approx_kl | 0.013705928 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 157910 | -| policy_gradient_loss | 0.0448 | -| std | 0.0094 | -| value_loss | 1.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15793 | -| time_elapsed | 84547 | -| total_timesteps | 2021504 | -| train/ | | -| approx_kl | 0.004917236 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00633 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 157920 | -| policy_gradient_loss | 0.0186 | -| std | 0.00941 | -| value_loss | 3.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15794 | -| time_elapsed | 84553 | -| total_timesteps | 2021632 | -| train/ | | -| approx_kl | 0.08938365 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00161 | -| learning_rate | 0.0003 | -| loss | 0.068 | -| n_updates | 157930 | -| policy_gradient_loss | 0.029 | -| std | 0.00941 | -| value_loss | 1.6e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15795 | -| time_elapsed | 84558 | -| total_timesteps | 2021760 | -| train/ | | -| approx_kl | 0.05003726 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 157940 | -| policy_gradient_loss | 0.00286 | -| std | 0.00941 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.958 | -| time/ | | -| fps | 23 | -| iterations | 15796 | -| time_elapsed | 84563 | -| total_timesteps | 2021888 | -| train/ | | -| approx_kl | 0.014968148 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 157950 | -| policy_gradient_loss | -0.00232 | -| std | 0.0094 | -| value_loss | 7.76e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15797 | -| time_elapsed | 84568 | -| total_timesteps | 2022016 | -| train/ | | -| approx_kl | 0.21921365 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.0914 | -| n_updates | 157960 | -| policy_gradient_loss | 0.0179 | -| std | 0.00944 | -| value_loss | 4.98e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15798 | -| time_elapsed | 84579 | -| total_timesteps | 2022144 | -| train/ | | -| approx_kl | 0.0007159491 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.685 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 157970 | -| policy_gradient_loss | -0.00647 | -| std | 0.00946 | -| value_loss | 0.000751 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15799 | -| time_elapsed | 84583 | -| total_timesteps | 2022272 | -| train/ | | -| approx_kl | 0.09071448 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.0742 | -| learning_rate | 0.0003 | -| loss | 0.00563 | -| n_updates | 157980 | -| policy_gradient_loss | 0.0069 | -| std | 0.00947 | -| value_loss | 8.48e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15800 | -| time_elapsed | 84586 | -| total_timesteps | 2022400 | -| train/ | | -| approx_kl | 0.00021339022 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000249 | -| n_updates | 157990 | -| policy_gradient_loss | 0.0717 | -| std | 0.00947 | -| value_loss | 1.1e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15801 | -| time_elapsed | 84592 | -| total_timesteps | 2022528 | -| train/ | | -| approx_kl | 0.012802233 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -23.6 | -| learning_rate | 0.0003 | -| loss | -0.00089 | -| n_updates | 158000 | -| policy_gradient_loss | 0.00508 | -| std | 0.00946 | -| value_loss | 1.78e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15802 | -| time_elapsed | 84597 | -| total_timesteps | 2022656 | -| train/ | | -| approx_kl | 0.029190945 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -4.82 | -| learning_rate | 0.0003 | -| loss | 0.00405 | -| n_updates | 158010 | -| policy_gradient_loss | 0.00914 | -| std | 0.00945 | -| value_loss | 1.02e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15803 | -| time_elapsed | 84602 | -| total_timesteps | 2022784 | -| train/ | | -| approx_kl | 0.05152775 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -25 | -| learning_rate | 0.0003 | -| loss | 0.00588 | -| n_updates | 158020 | -| policy_gradient_loss | 0.0035 | -| std | 0.00945 | -| value_loss | 9.23e-13 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 15804 | -| time_elapsed | 84607 | -| total_timesteps | 2022912 | -| train/ | | -| approx_kl | 0.0033312533 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -2.59 | -| learning_rate | 0.0003 | -| loss | 0.00555 | -| n_updates | 158030 | -| policy_gradient_loss | 0.00163 | -| std | 0.00944 | -| value_loss | 2.02e-13 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15805 | -| time_elapsed | 84612 | -| total_timesteps | 2023040 | -| train/ | | -| approx_kl | 0.03396701 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.497 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 158040 | -| policy_gradient_loss | 0.00849 | -| std | 0.00944 | -| value_loss | 1.47e-13 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15806 | -| time_elapsed | 84623 | -| total_timesteps | 2023168 | -| train/ | | -| approx_kl | 0.045560364 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 158050 | -| policy_gradient_loss | -0.0114 | -| std | 0.00944 | -| value_loss | 7.89e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15807 | -| time_elapsed | 84628 | -| total_timesteps | 2023296 | -| train/ | | -| approx_kl | 0.018485436 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.722 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 158060 | -| policy_gradient_loss | 0.00985 | -| std | 0.00944 | -| value_loss | 1.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15808 | -| time_elapsed | 84633 | -| total_timesteps | 2023424 | -| train/ | | -| approx_kl | 0.014278426 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.000822 | -| n_updates | 158070 | -| policy_gradient_loss | 0.0144 | -| std | 0.00944 | -| value_loss | 2.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15809 | -| time_elapsed | 84638 | -| total_timesteps | 2023552 | -| train/ | | -| approx_kl | 0.13511704 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.00465 | -| learning_rate | 0.0003 | -| loss | 0.0703 | -| n_updates | 158080 | -| policy_gradient_loss | 0.017 | -| std | 0.00944 | -| value_loss | 1.29e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15810 | -| time_elapsed | 84643 | -| total_timesteps | 2023680 | -| train/ | | -| approx_kl | 0.032395184 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.00932 | -| n_updates | 158090 | -| policy_gradient_loss | 0.0331 | -| std | 0.00944 | -| value_loss | 9.8e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15811 | -| time_elapsed | 84648 | -| total_timesteps | 2023808 | -| train/ | | -| approx_kl | 0.009340588 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -0.000695 | -| n_updates | 158100 | -| policy_gradient_loss | 0.0125 | -| std | 0.00944 | -| value_loss | 2.92e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15812 | -| time_elapsed | 84655 | -| total_timesteps | 2023936 | -| train/ | | -| approx_kl | 0.0188651 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.24 | -| explained_variance | 0.000678 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 158110 | -| policy_gradient_loss | 0.0237 | -| std | 0.00943 | -| value_loss | 8.44e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15813 | -| time_elapsed | 84660 | -| total_timesteps | 2024064 | -| train/ | | -| approx_kl | 0.002058378 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00422 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 158120 | -| policy_gradient_loss | 0.0592 | -| std | 0.00942 | -| value_loss | 5.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15814 | -| time_elapsed | 84668 | -| total_timesteps | 2024192 | -| train/ | | -| approx_kl | 0.015586853 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 158130 | -| policy_gradient_loss | -0.000273 | -| std | 0.00942 | -| value_loss | 0.00242 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15815 | -| time_elapsed | 84673 | -| total_timesteps | 2024320 | -| train/ | | -| approx_kl | 0.12973648 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | 0.0648 | -| n_updates | 158140 | -| policy_gradient_loss | 0.0253 | -| std | 0.00942 | -| value_loss | 1.37e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15816 | -| time_elapsed | 84679 | -| total_timesteps | 2024448 | -| train/ | | -| approx_kl | 0.0007307087 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00127 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 158150 | -| policy_gradient_loss | 0.00497 | -| std | 0.00941 | -| value_loss | 1.04e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15817 | -| time_elapsed | 84684 | -| total_timesteps | 2024576 | -| train/ | | -| approx_kl | 0.03784127 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 158160 | -| policy_gradient_loss | 0.0402 | -| std | 0.00941 | -| value_loss | 6.61e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15818 | -| time_elapsed | 84690 | -| total_timesteps | 2024704 | -| train/ | | -| approx_kl | 0.024089795 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 158170 | -| policy_gradient_loss | 0.0172 | -| std | 0.00941 | -| value_loss | 5.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15819 | -| time_elapsed | 84695 | -| total_timesteps | 2024832 | -| train/ | | -| approx_kl | 0.116152555 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.0654 | -| n_updates | 158180 | -| policy_gradient_loss | 0.0242 | -| std | 0.00942 | -| value_loss | 6.74e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15820 | -| time_elapsed | 84698 | -| total_timesteps | 2024960 | -| train/ | | -| approx_kl | 0.00066116964 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0941 | -| learning_rate | 0.0003 | -| loss | -0.00029 | -| n_updates | 158190 | -| policy_gradient_loss | 0.00592 | -| std | 0.00941 | -| value_loss | 1.47e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15821 | -| time_elapsed | 84704 | -| total_timesteps | 2025088 | -| train/ | | -| approx_kl | 0.034167722 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 158200 | -| policy_gradient_loss | 0.0408 | -| std | 0.00939 | -| value_loss | 3.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15822 | -| time_elapsed | 84713 | -| total_timesteps | 2025216 | -| train/ | | -| approx_kl | 0.006922948 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 158210 | -| policy_gradient_loss | -0.00304 | -| std | 0.00939 | -| value_loss | 0.000697 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15823 | -| time_elapsed | 84717 | -| total_timesteps | 2025344 | -| train/ | | -| approx_kl | 0.007431769 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.0058 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 158220 | -| policy_gradient_loss | 0.0088 | -| std | 0.00938 | -| value_loss | 2.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15824 | -| time_elapsed | 84722 | -| total_timesteps | 2025472 | -| train/ | | -| approx_kl | 0.016809655 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | -0.00308 | -| n_updates | 158230 | -| policy_gradient_loss | 0.0266 | -| std | 0.00938 | -| value_loss | 2.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15825 | -| time_elapsed | 84728 | -| total_timesteps | 2025600 | -| train/ | | -| approx_kl | 0.03859971 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 158240 | -| policy_gradient_loss | 0.00366 | -| std | 0.00937 | -| value_loss | 8.64e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15826 | -| time_elapsed | 84733 | -| total_timesteps | 2025728 | -| train/ | | -| approx_kl | 0.014710696 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.52 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 158250 | -| policy_gradient_loss | -0.00837 | -| std | 0.00937 | -| value_loss | 3.14e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15827 | -| time_elapsed | 84739 | -| total_timesteps | 2025856 | -| train/ | | -| approx_kl | 0.0066309455 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | -0.000705 | -| n_updates | 158260 | -| policy_gradient_loss | 0.0542 | -| std | 0.00936 | -| value_loss | 3e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 15828 | -| time_elapsed | 84743 | -| total_timesteps | 2025984 | -| train/ | | -| approx_kl | 0.15661682 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.0799 | -| n_updates | 158270 | -| policy_gradient_loss | 0.0244 | -| std | 0.00936 | -| value_loss | 3.1e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15829 | -| time_elapsed | 84748 | -| total_timesteps | 2026112 | -| train/ | | -| approx_kl | 0.00018412014 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00363 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 158280 | -| policy_gradient_loss | -0.00407 | -| std | 0.00936 | -| value_loss | 1.88e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15830 | -| time_elapsed | 84762 | -| total_timesteps | 2026240 | -| train/ | | -| approx_kl | 0.032995626 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 158290 | -| policy_gradient_loss | -0.0113 | -| std | 0.00937 | -| value_loss | 0.000213 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15831 | -| time_elapsed | 84767 | -| total_timesteps | 2026368 | -| train/ | | -| approx_kl | 0.055583823 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 158300 | -| policy_gradient_loss | 0.0436 | -| std | 0.00937 | -| value_loss | 1.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15832 | -| time_elapsed | 84772 | -| total_timesteps | 2026496 | -| train/ | | -| approx_kl | 0.110024594 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00109 | -| learning_rate | 0.0003 | -| loss | 0.0479 | -| n_updates | 158310 | -| policy_gradient_loss | 0.0249 | -| std | 0.00937 | -| value_loss | 9.87e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15833 | -| time_elapsed | 84777 | -| total_timesteps | 2026624 | -| train/ | | -| approx_kl | 0.029775977 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00814 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 158320 | -| policy_gradient_loss | 0.0446 | -| std | 0.00937 | -| value_loss | 7.51e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15834 | -| time_elapsed | 84783 | -| total_timesteps | 2026752 | -| train/ | | -| approx_kl | 0.15585124 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00322 | -| learning_rate | 0.0003 | -| loss | 0.0918 | -| n_updates | 158330 | -| policy_gradient_loss | 0.0276 | -| std | 0.00937 | -| value_loss | 5.84e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 15835 | -| time_elapsed | 84789 | -| total_timesteps | 2026880 | -| train/ | | -| approx_kl | 0.00043297 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 158340 | -| policy_gradient_loss | 0.0027 | -| std | 0.00937 | -| value_loss | 3.53e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15836 | -| time_elapsed | 84794 | -| total_timesteps | 2027008 | -| train/ | | -| approx_kl | 0.045471244 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 158350 | -| policy_gradient_loss | 0.0484 | -| std | 0.00937 | -| value_loss | 1.98e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15837 | -| time_elapsed | 84804 | -| total_timesteps | 2027136 | -| train/ | | -| approx_kl | 0.05855945 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 1 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 158360 | -| policy_gradient_loss | -0.012 | -| std | 0.00937 | -| value_loss | 1.48e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15838 | -| time_elapsed | 84809 | -| total_timesteps | 2027264 | -| train/ | | -| approx_kl | 0.026898753 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.38 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 158370 | -| policy_gradient_loss | -0.0112 | -| std | 0.00937 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15839 | -| time_elapsed | 84814 | -| total_timesteps | 2027392 | -| train/ | | -| approx_kl | 0.0033168136 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00419 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 158380 | -| policy_gradient_loss | 0.0512 | -| std | 0.00937 | -| value_loss | 3.64e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15840 | -| time_elapsed | 84819 | -| total_timesteps | 2027520 | -| train/ | | -| approx_kl | 0.013588591 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00581 | -| learning_rate | 0.0003 | -| loss | 0.000242 | -| n_updates | 158390 | -| policy_gradient_loss | 0.0138 | -| std | 0.00937 | -| value_loss | 3.94e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15841 | -| time_elapsed | 84824 | -| total_timesteps | 2027648 | -| train/ | | -| approx_kl | 0.020698508 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.009 | -| n_updates | 158400 | -| policy_gradient_loss | 0.0158 | -| std | 0.00936 | -| value_loss | 3.68e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15842 | -| time_elapsed | 84829 | -| total_timesteps | 2027776 | -| train/ | | -| approx_kl | 0.05469133 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 158410 | -| policy_gradient_loss | 0.0167 | -| std | 0.00936 | -| value_loss | 9.75e-10 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15843 | -| time_elapsed | 84834 | -| total_timesteps | 2027904 | -| train/ | | -| approx_kl | 0.00021804776 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 158420 | -| policy_gradient_loss | 0.0181 | -| std | 0.00936 | -| value_loss | 5.84e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15844 | -| time_elapsed | 84839 | -| total_timesteps | 2028032 | -| train/ | | -| approx_kl | 0.08835392 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 158430 | -| policy_gradient_loss | 0.00842 | -| std | 0.00936 | -| value_loss | 4.36e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15845 | -| time_elapsed | 84850 | -| total_timesteps | 2028160 | -| train/ | | -| approx_kl | 0.0019742087 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 158440 | -| policy_gradient_loss | -0.00642 | -| std | 0.00936 | -| value_loss | 0.00237 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15846 | -| time_elapsed | 84855 | -| total_timesteps | 2028288 | -| train/ | | -| approx_kl | 0.0038647046 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.0458 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 158450 | -| policy_gradient_loss | 0.0169 | -| std | 0.00938 | -| value_loss | 2.86e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15847 | -| time_elapsed | 84860 | -| total_timesteps | 2028416 | -| train/ | | -| approx_kl | 0.08132998 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -4.8 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 158460 | -| policy_gradient_loss | 0.00425 | -| std | 0.00938 | -| value_loss | 1.57e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15848 | -| time_elapsed | 84865 | -| total_timesteps | 2028544 | -| train/ | | -| approx_kl | 0.027162364 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 158470 | -| policy_gradient_loss | -0.00144 | -| std | 0.00939 | -| value_loss | 3.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15849 | -| time_elapsed | 84870 | -| total_timesteps | 2028672 | -| train/ | | -| approx_kl | 0.076645106 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 158480 | -| policy_gradient_loss | 0.0195 | -| std | 0.00939 | -| value_loss | 7.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15850 | -| time_elapsed | 84875 | -| total_timesteps | 2028800 | -| train/ | | -| approx_kl | 0.014740143 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 158490 | -| policy_gradient_loss | -0.00353 | -| std | 0.00938 | -| value_loss | 3.99e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15851 | -| time_elapsed | 84880 | -| total_timesteps | 2028928 | -| train/ | | -| approx_kl | 0.06439396 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00196 | -| learning_rate | 0.0003 | -| loss | 0.098 | -| n_updates | 158500 | -| policy_gradient_loss | 0.0552 | -| std | 0.00937 | -| value_loss | 1.94e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15852 | -| time_elapsed | 84885 | -| total_timesteps | 2029056 | -| train/ | | -| approx_kl | 0.023905715 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 158510 | -| policy_gradient_loss | 0.00418 | -| std | 0.00937 | -| value_loss | 1.28e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15853 | -| time_elapsed | 84896 | -| total_timesteps | 2029184 | -| train/ | | -| approx_kl | 0.006206306 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.79 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 158520 | -| policy_gradient_loss | -0.00707 | -| std | 0.00937 | -| value_loss | 0.00421 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15854 | -| time_elapsed | 84900 | -| total_timesteps | 2029312 | -| train/ | | -| approx_kl | 0.004827058 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 158530 | -| policy_gradient_loss | 0.0185 | -| std | 0.00937 | -| value_loss | 8.57e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15855 | -| time_elapsed | 84905 | -| total_timesteps | 2029440 | -| train/ | | -| approx_kl | 0.03820807 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 158540 | -| policy_gradient_loss | 0.0251 | -| std | 0.00939 | -| value_loss | 8.2e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15856 | -| time_elapsed | 84909 | -| total_timesteps | 2029568 | -| train/ | | -| approx_kl | 0.07981849 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.75 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 158550 | -| policy_gradient_loss | 0.0146 | -| std | 0.0094 | -| value_loss | 4.58e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15857 | -| time_elapsed | 84913 | -| total_timesteps | 2029696 | -| train/ | | -| approx_kl | 0.000377601 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 158560 | -| policy_gradient_loss | 0.013 | -| std | 0.0094 | -| value_loss | 3.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15858 | -| time_elapsed | 84917 | -| total_timesteps | 2029824 | -| train/ | | -| approx_kl | 0.29439166 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 158570 | -| policy_gradient_loss | 0.0247 | -| std | 0.0094 | -| value_loss | 2.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15859 | -| time_elapsed | 84922 | -| total_timesteps | 2029952 | -| train/ | | -| approx_kl | 0.004685391 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | -0.00697 | -| n_updates | 158580 | -| policy_gradient_loss | -0.000358 | -| std | 0.0094 | -| value_loss | 7.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15860 | -| time_elapsed | 84926 | -| total_timesteps | 2030080 | -| train/ | | -| approx_kl | 0.024956912 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 158590 | -| policy_gradient_loss | 0.00368 | -| std | 0.0094 | -| value_loss | 4.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15861 | -| time_elapsed | 84935 | -| total_timesteps | 2030208 | -| train/ | | -| approx_kl | 0.05217877 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -5.25 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 158600 | -| policy_gradient_loss | -0.00898 | -| std | 0.0094 | -| value_loss | 0.00305 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15862 | -| time_elapsed | 84940 | -| total_timesteps | 2030336 | -| train/ | | -| approx_kl | 0.013352678 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.000497 | -| learning_rate | 0.0003 | -| loss | -0.000197 | -| n_updates | 158610 | -| policy_gradient_loss | 0.0124 | -| std | 0.0094 | -| value_loss | 2.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15863 | -| time_elapsed | 84944 | -| total_timesteps | 2030464 | -| train/ | | -| approx_kl | 0.113594644 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.0657 | -| n_updates | 158620 | -| policy_gradient_loss | 0.0324 | -| std | 0.00939 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15864 | -| time_elapsed | 84949 | -| total_timesteps | 2030592 | -| train/ | | -| approx_kl | 0.027905628 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.529 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 158630 | -| policy_gradient_loss | 0.0409 | -| std | 0.00939 | -| value_loss | 1.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15865 | -| time_elapsed | 84953 | -| total_timesteps | 2030720 | -| train/ | | -| approx_kl | 0.012598757 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 158640 | -| policy_gradient_loss | -7.06e-05 | -| std | 0.00939 | -| value_loss | 2.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15866 | -| time_elapsed | 84959 | -| total_timesteps | 2030848 | -| train/ | | -| approx_kl | 0.014557341 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.000586 | -| n_updates | 158650 | -| policy_gradient_loss | 0.0206 | -| std | 0.0094 | -| value_loss | 2.33e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15867 | -| time_elapsed | 84964 | -| total_timesteps | 2030976 | -| train/ | | -| approx_kl | 0.0024771574 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 158660 | -| policy_gradient_loss | 0.053 | -| std | 0.0094 | -| value_loss | 1.6e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15868 | -| time_elapsed | 84968 | -| total_timesteps | 2031104 | -| train/ | | -| approx_kl | 0.06191367 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.00038 | -| n_updates | 158670 | -| policy_gradient_loss | 0.0624 | -| std | 0.0094 | -| value_loss | 1.45e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15869 | -| time_elapsed | 84978 | -| total_timesteps | 2031232 | -| train/ | | -| approx_kl | 0.24149959 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.864 | -| learning_rate | 0.0003 | -| loss | 0.0925 | -| n_updates | 158680 | -| policy_gradient_loss | 0.0352 | -| std | 0.0094 | -| value_loss | 0.00203 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15870 | -| time_elapsed | 84984 | -| total_timesteps | 2031360 | -| train/ | | -| approx_kl | 8.456409e-07 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -1.48e-05 | -| n_updates | 158690 | -| policy_gradient_loss | 0.0203 | -| std | 0.0094 | -| value_loss | 3.74e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15871 | -| time_elapsed | 84989 | -| total_timesteps | 2031488 | -| train/ | | -| approx_kl | 0.067173645 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | 0.0754 | -| n_updates | 158700 | -| policy_gradient_loss | 0.0552 | -| std | 0.00939 | -| value_loss | 9.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15872 | -| time_elapsed | 84993 | -| total_timesteps | 2031616 | -| train/ | | -| approx_kl | 0.026561325 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 158710 | -| policy_gradient_loss | 0.00533 | -| std | 0.00939 | -| value_loss | 4.38e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15873 | -| time_elapsed | 84998 | -| total_timesteps | 2031744 | -| train/ | | -| approx_kl | 0.0045591258 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.248 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 158720 | -| policy_gradient_loss | 0.0131 | -| std | 0.00938 | -| value_loss | 4.04e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 15874 | -| time_elapsed | 85003 | -| total_timesteps | 2031872 | -| train/ | | -| approx_kl | 0.10780932 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 158730 | -| policy_gradient_loss | 0.0078 | -| std | 0.00938 | -| value_loss | 5.79e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15875 | -| time_elapsed | 85008 | -| total_timesteps | 2032000 | -| train/ | | -| approx_kl | 0.09092099 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 158740 | -| policy_gradient_loss | 0.00599 | -| std | 0.00937 | -| value_loss | 2.31e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15876 | -| time_elapsed | 85013 | -| total_timesteps | 2032128 | -| train/ | | -| approx_kl | 0.050607856 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.00293 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 158750 | -| policy_gradient_loss | 0.0249 | -| std | 0.00937 | -| value_loss | 1.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15877 | -| time_elapsed | 85025 | -| total_timesteps | 2032256 | -| train/ | | -| approx_kl | 0.038674418 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 158760 | -| policy_gradient_loss | -0.00889 | -| std | 0.00937 | -| value_loss | 0.00113 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15878 | -| time_elapsed | 85028 | -| total_timesteps | 2032384 | -| train/ | | -| approx_kl | 0.041104592 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.00844 | -| n_updates | 158770 | -| policy_gradient_loss | 0.00111 | -| std | 0.00937 | -| value_loss | 2.32e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15879 | -| time_elapsed | 85033 | -| total_timesteps | 2032512 | -| train/ | | -| approx_kl | 0.0059840456 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.00343 | -| n_updates | 158780 | -| policy_gradient_loss | 0.0411 | -| std | 0.00937 | -| value_loss | 1.97e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15880 | -| time_elapsed | 85036 | -| total_timesteps | 2032640 | -| train/ | | -| approx_kl | 0.041726585 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 158790 | -| policy_gradient_loss | 0.0537 | -| std | 0.00938 | -| value_loss | 3.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15881 | -| time_elapsed | 85041 | -| total_timesteps | 2032768 | -| train/ | | -| approx_kl | 0.0010179868 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0055 | -| learning_rate | 0.0003 | -| loss | 0.00536 | -| n_updates | 158800 | -| policy_gradient_loss | 0.024 | -| std | 0.00938 | -| value_loss | 1.71e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15882 | -| time_elapsed | 85045 | -| total_timesteps | 2032896 | -| train/ | | -| approx_kl | 0.13932773 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 158810 | -| policy_gradient_loss | 0.0886 | -| std | 0.00938 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15883 | -| time_elapsed | 85049 | -| total_timesteps | 2033024 | -| train/ | | -| approx_kl | 0.020613391 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.00784 | -| n_updates | 158820 | -| policy_gradient_loss | 0.0105 | -| std | 0.00937 | -| value_loss | 6.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15884 | -| time_elapsed | 85056 | -| total_timesteps | 2033152 | -| train/ | | -| approx_kl | 0.030142065 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 158830 | -| policy_gradient_loss | -0.00798 | -| std | 0.00936 | -| value_loss | 0.000399 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15885 | -| time_elapsed | 85060 | -| total_timesteps | 2033280 | -| train/ | | -| approx_kl | 0.09201739 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.00426 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 158840 | -| policy_gradient_loss | 0.0106 | -| std | 0.00935 | -| value_loss | 3.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15886 | -| time_elapsed | 85064 | -| total_timesteps | 2033408 | -| train/ | | -| approx_kl | 0.008470645 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 158850 | -| policy_gradient_loss | 0.00592 | -| std | 0.00935 | -| value_loss | 1.9e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15887 | -| time_elapsed | 85068 | -| total_timesteps | 2033536 | -| train/ | | -| approx_kl | 0.17264244 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 158860 | -| policy_gradient_loss | 0.11 | -| std | 0.00935 | -| value_loss | 1.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15888 | -| time_elapsed | 85072 | -| total_timesteps | 2033664 | -| train/ | | -| approx_kl | 0.09775356 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 158870 | -| policy_gradient_loss | 0.0787 | -| std | 0.00935 | -| value_loss | 1.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15889 | -| time_elapsed | 85077 | -| total_timesteps | 2033792 | -| train/ | | -| approx_kl | 0.016540952 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.00526 | -| n_updates | 158880 | -| policy_gradient_loss | 0.0115 | -| std | 0.00934 | -| value_loss | 7.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 15890 | -| time_elapsed | 85082 | -| total_timesteps | 2033920 | -| train/ | | -| approx_kl | 0.026137553 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.25 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 158890 | -| policy_gradient_loss | -0.00451 | -| std | 0.00934 | -| value_loss | 3.78e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15891 | -| time_elapsed | 85087 | -| total_timesteps | 2034048 | -| train/ | | -| approx_kl | 0.0074171633 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00843 | -| n_updates | 158900 | -| policy_gradient_loss | 0.00697 | -| std | 0.00932 | -| value_loss | 4.4e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15892 | -| time_elapsed | 85096 | -| total_timesteps | 2034176 | -| train/ | | -| approx_kl | 0.007940728 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 158910 | -| policy_gradient_loss | 0.00916 | -| std | 0.00931 | -| value_loss | 1.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15893 | -| time_elapsed | 85100 | -| total_timesteps | 2034304 | -| train/ | | -| approx_kl | 0.20886329 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.00865 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 158920 | -| policy_gradient_loss | 0.0309 | -| std | 0.00931 | -| value_loss | 5.76e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15894 | -| time_elapsed | 85105 | -| total_timesteps | 2034432 | -| train/ | | -| approx_kl | 0.02643379 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 158930 | -| policy_gradient_loss | 0.00709 | -| std | 0.00931 | -| value_loss | 1.26e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15895 | -| time_elapsed | 85111 | -| total_timesteps | 2034560 | -| train/ | | -| approx_kl | 0.004048798 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | -2.14e-05 | -| n_updates | 158940 | -| policy_gradient_loss | 0.00213 | -| std | 0.00931 | -| value_loss | 1.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15896 | -| time_elapsed | 85114 | -| total_timesteps | 2034688 | -| train/ | | -| approx_kl | 0.04805781 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 158950 | -| policy_gradient_loss | -0.015 | -| std | 0.0093 | -| value_loss | 1.28e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15897 | -| time_elapsed | 85119 | -| total_timesteps | 2034816 | -| train/ | | -| approx_kl | 0.005324273 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.00901 | -| learning_rate | 0.0003 | -| loss | 6.93e-05 | -| n_updates | 158960 | -| policy_gradient_loss | 0.0201 | -| std | 0.00929 | -| value_loss | 5.1e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15898 | -| time_elapsed | 85124 | -| total_timesteps | 2034944 | -| train/ | | -| approx_kl | 0.42164052 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 158970 | -| policy_gradient_loss | 0.157 | -| std | 0.00929 | -| value_loss | 2.6e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15899 | -| time_elapsed | 85128 | -| total_timesteps | 2035072 | -| train/ | | -| approx_kl | 0.0063298605 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | -0.000745 | -| n_updates | 158980 | -| policy_gradient_loss | 0.0171 | -| std | 0.00929 | -| value_loss | 1.45e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15900 | -| time_elapsed | 85136 | -| total_timesteps | 2035200 | -| train/ | | -| approx_kl | 0.36379477 | -| clip_fraction | 0.603 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 158990 | -| policy_gradient_loss | 0.015 | -| std | 0.00928 | -| value_loss | 0.000597 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15901 | -| time_elapsed | 85140 | -| total_timesteps | 2035328 | -| train/ | | -| approx_kl | 0.051249642 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.0737 | -| learning_rate | 0.0003 | -| loss | 0.00902 | -| n_updates | 159000 | -| policy_gradient_loss | 0.0224 | -| std | 0.00928 | -| value_loss | 6.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15902 | -| time_elapsed | 85146 | -| total_timesteps | 2035456 | -| train/ | | -| approx_kl | 0.043855786 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -0.00083 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 159010 | -| policy_gradient_loss | 0.0285 | -| std | 0.00927 | -| value_loss | 1.9e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15903 | -| time_elapsed | 85152 | -| total_timesteps | 2035584 | -| train/ | | -| approx_kl | 0.04189177 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.26 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | 0.00825 | -| n_updates | 159020 | -| policy_gradient_loss | 0.00882 | -| std | 0.00926 | -| value_loss | 1.6e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15904 | -| time_elapsed | 85158 | -| total_timesteps | 2035712 | -| train/ | | -| approx_kl | 0.0063539958 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | 0.00138 | -| n_updates | 159030 | -| policy_gradient_loss | 0.00138 | -| std | 0.00921 | -| value_loss | 2.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15905 | -| time_elapsed | 85163 | -| total_timesteps | 2035840 | -| train/ | | -| approx_kl | 0.017979689 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | 0.00703 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 159040 | -| policy_gradient_loss | 0.0237 | -| std | 0.00919 | -| value_loss | 2.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 15906 | -| time_elapsed | 85168 | -| total_timesteps | 2035968 | -| train/ | | -| approx_kl | 0.055608455 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 159050 | -| policy_gradient_loss | 0.0102 | -| std | 0.00918 | -| value_loss | 5.45e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15907 | -| time_elapsed | 85172 | -| total_timesteps | 2036096 | -| train/ | | -| approx_kl | 0.0042110994 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 159060 | -| policy_gradient_loss | 0.00372 | -| std | 0.00918 | -| value_loss | 4.02e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15908 | -| time_elapsed | 85183 | -| total_timesteps | 2036224 | -| train/ | | -| approx_kl | 0.045617398 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 159070 | -| policy_gradient_loss | 0.0205 | -| std | 0.00917 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15909 | -| time_elapsed | 85188 | -| total_timesteps | 2036352 | -| train/ | | -| approx_kl | 0.015968192 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 159080 | -| policy_gradient_loss | 0.0136 | -| std | 0.00917 | -| value_loss | 3.94e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15910 | -| time_elapsed | 85192 | -| total_timesteps | 2036480 | -| train/ | | -| approx_kl | 0.2677698 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.00661 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 159090 | -| policy_gradient_loss | 0.0338 | -| std | 0.00917 | -| value_loss | 1.75e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15911 | -| time_elapsed | 85196 | -| total_timesteps | 2036608 | -| train/ | | -| approx_kl | 0.0003125728 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 159100 | -| policy_gradient_loss | -0.00617 | -| std | 0.00917 | -| value_loss | 1.05e-08 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15912 | -| time_elapsed | 85201 | -| total_timesteps | 2036736 | -| train/ | | -| approx_kl | 0.000106158666 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 159110 | -| policy_gradient_loss | -0.000697 | -| std | 0.00917 | -| value_loss | 6.88e-09 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15913 | -| time_elapsed | 85206 | -| total_timesteps | 2036864 | -| train/ | | -| approx_kl | 0.024462275 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | -0.000224 | -| n_updates | 159120 | -| policy_gradient_loss | -0.000174 | -| std | 0.00917 | -| value_loss | 3.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 15914 | -| time_elapsed | 85212 | -| total_timesteps | 2036992 | -| train/ | | -| approx_kl | 0.017716063 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 159130 | -| policy_gradient_loss | -0.00135 | -| std | 0.00917 | -| value_loss | 2.37e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15915 | -| time_elapsed | 85216 | -| total_timesteps | 2037120 | -| train/ | | -| approx_kl | 0.02439716 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 3.14e-05 | -| n_updates | 159140 | -| policy_gradient_loss | -8.84e-05 | -| std | 0.00917 | -| value_loss | 1.64e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15916 | -| time_elapsed | 85229 | -| total_timesteps | 2037248 | -| train/ | | -| approx_kl | 0.26063937 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | 0.167 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 159150 | -| policy_gradient_loss | -0.0195 | -| std | 0.00917 | -| value_loss | 0.00138 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15917 | -| time_elapsed | 85233 | -| total_timesteps | 2037376 | -| train/ | | -| approx_kl | 0.0012378446 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.000888 | -| n_updates | 159160 | -| policy_gradient_loss | 0.0122 | -| std | 0.00917 | -| value_loss | 8.44e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15918 | -| time_elapsed | 85237 | -| total_timesteps | 2037504 | -| train/ | | -| approx_kl | 0.26397592 | -| clip_fraction | 0.599 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.825 | -| learning_rate | 0.0003 | -| loss | 0.205 | -| n_updates | 159170 | -| policy_gradient_loss | 0.107 | -| std | 0.00917 | -| value_loss | 1.79e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15919 | -| time_elapsed | 85242 | -| total_timesteps | 2037632 | -| train/ | | -| approx_kl | 0.09310699 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -4.35 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 159180 | -| policy_gradient_loss | 0.0428 | -| std | 0.00917 | -| value_loss | 5.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15920 | -| time_elapsed | 85247 | -| total_timesteps | 2037760 | -| train/ | | -| approx_kl | 0.021962743 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0752 | -| learning_rate | 0.0003 | -| loss | 0.00382 | -| n_updates | 159190 | -| policy_gradient_loss | 0.0141 | -| std | 0.00917 | -| value_loss | 2.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15921 | -| time_elapsed | 85253 | -| total_timesteps | 2037888 | -| train/ | | -| approx_kl | 0.09528861 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.00386 | -| learning_rate | 0.0003 | -| loss | 0.0707 | -| n_updates | 159200 | -| policy_gradient_loss | 0.0156 | -| std | 0.00917 | -| value_loss | 1.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15922 | -| time_elapsed | 85258 | -| total_timesteps | 2038016 | -| train/ | | -| approx_kl | 0.009908574 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 159210 | -| policy_gradient_loss | 0.00889 | -| std | 0.00917 | -| value_loss | 7.36e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15923 | -| time_elapsed | 85270 | -| total_timesteps | 2038144 | -| train/ | | -| approx_kl | 0.29288962 | -| clip_fraction | 0.61 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 159220 | -| policy_gradient_loss | 0.0139 | -| std | 0.00917 | -| value_loss | 5.01e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15924 | -| time_elapsed | 85275 | -| total_timesteps | 2038272 | -| train/ | | -| approx_kl | 0.07120555 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | 0.251 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 159230 | -| policy_gradient_loss | 0.0108 | -| std | 0.00917 | -| value_loss | 4.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15925 | -| time_elapsed | 85280 | -| total_timesteps | 2038400 | -| train/ | | -| approx_kl | 0.15455881 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.0774 | -| n_updates | 159240 | -| policy_gradient_loss | 0.0262 | -| std | 0.00916 | -| value_loss | 8.23e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15926 | -| time_elapsed | 85285 | -| total_timesteps | 2038528 | -| train/ | | -| approx_kl | 0.000562557 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.27 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.0039 | -| n_updates | 159250 | -| policy_gradient_loss | 0.00839 | -| std | 0.00915 | -| value_loss | 2.45e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15927 | -| time_elapsed | 85289 | -| total_timesteps | 2038656 | -| train/ | | -| approx_kl | 0.0004411796 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.343 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 159260 | -| policy_gradient_loss | 0.0139 | -| std | 0.00914 | -| value_loss | 9.55e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15928 | -| time_elapsed | 85293 | -| total_timesteps | 2038784 | -| train/ | | -| approx_kl | 0.044458214 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 159270 | -| policy_gradient_loss | 0.0193 | -| std | 0.00914 | -| value_loss | 5.21e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 15929 | -| time_elapsed | 85297 | -| total_timesteps | 2038912 | -| train/ | | -| approx_kl | 0.062803894 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0419 | -| n_updates | 159280 | -| policy_gradient_loss | 0.0288 | -| std | 0.00914 | -| value_loss | 2.15e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15930 | -| time_elapsed | 85301 | -| total_timesteps | 2039040 | -| train/ | | -| approx_kl | 0.085233256 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 159290 | -| policy_gradient_loss | 0.0075 | -| std | 0.00914 | -| value_loss | 9.5e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15931 | -| time_elapsed | 85312 | -| total_timesteps | 2039168 | -| train/ | | -| approx_kl | 0.0063151517 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | 0.791 | -| learning_rate | 0.0003 | -| loss | -0.00868 | -| n_updates | 159300 | -| policy_gradient_loss | -0.00998 | -| std | 0.00913 | -| value_loss | 0.00418 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15932 | -| time_elapsed | 85316 | -| total_timesteps | 2039296 | -| train/ | | -| approx_kl | 0.124342024 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.082 | -| n_updates | 159310 | -| policy_gradient_loss | 0.0261 | -| std | 0.00913 | -| value_loss | 6.89e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15933 | -| time_elapsed | 85321 | -| total_timesteps | 2039424 | -| train/ | | -| approx_kl | 0.01984342 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 159320 | -| policy_gradient_loss | 0.0215 | -| std | 0.00913 | -| value_loss | 2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15934 | -| time_elapsed | 85326 | -| total_timesteps | 2039552 | -| train/ | | -| approx_kl | 0.010467907 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 159330 | -| policy_gradient_loss | 0.0107 | -| std | 0.00913 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15935 | -| time_elapsed | 85331 | -| total_timesteps | 2039680 | -| train/ | | -| approx_kl | 0.103828385 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 159340 | -| policy_gradient_loss | 0.022 | -| std | 0.00913 | -| value_loss | 9.96e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15936 | -| time_elapsed | 85335 | -| total_timesteps | 2039808 | -| train/ | | -| approx_kl | 0.0014051837 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | -0.00734 | -| n_updates | 159350 | -| policy_gradient_loss | -0.00385 | -| std | 0.00913 | -| value_loss | 5.75e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 15937 | -| time_elapsed | 85340 | -| total_timesteps | 2039936 | -| train/ | | -| approx_kl | 0.044732973 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.00974 | -| n_updates | 159360 | -| policy_gradient_loss | 0.0398 | -| std | 0.00913 | -| value_loss | 3.71e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15938 | -| time_elapsed | 85344 | -| total_timesteps | 2040064 | -| train/ | | -| approx_kl | 0.1154263 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.0653 | -| n_updates | 159370 | -| policy_gradient_loss | 0.023 | -| std | 0.00913 | -| value_loss | 2.41e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15939 | -| time_elapsed | 85350 | -| total_timesteps | 2040192 | -| train/ | | -| approx_kl | 0.011168762 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 159380 | -| policy_gradient_loss | -0.00509 | -| std | 0.00913 | -| value_loss | 0.00653 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15940 | -| time_elapsed | 85356 | -| total_timesteps | 2040320 | -| train/ | | -| approx_kl | 0.0003204504 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | -0.000656 | -| n_updates | 159390 | -| policy_gradient_loss | 0.00436 | -| std | 0.00912 | -| value_loss | 5.95e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15941 | -| time_elapsed | 85361 | -| total_timesteps | 2040448 | -| train/ | | -| approx_kl | 0.038608894 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00772 | -| n_updates | 159400 | -| policy_gradient_loss | 0.0395 | -| std | 0.00912 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15942 | -| time_elapsed | 85368 | -| total_timesteps | 2040576 | -| train/ | | -| approx_kl | 0.16800718 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0672 | -| n_updates | 159410 | -| policy_gradient_loss | 0.03 | -| std | 0.00912 | -| value_loss | 2.77e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15943 | -| time_elapsed | 85374 | -| total_timesteps | 2040704 | -| train/ | | -| approx_kl | 6.0474034e-05 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | -0.000745 | -| n_updates | 159420 | -| policy_gradient_loss | 0.00571 | -| std | 0.00908 | -| value_loss | 2.15e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15944 | -| time_elapsed | 85380 | -| total_timesteps | 2040832 | -| train/ | | -| approx_kl | 0.028188542 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.28 | -| explained_variance | 0.00561 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 159430 | -| policy_gradient_loss | 0.0369 | -| std | 0.00905 | -| value_loss | 0.000229 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 15945 | -| time_elapsed | 85386 | -| total_timesteps | 2040960 | -| train/ | | -| approx_kl | 0.11146477 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 159440 | -| policy_gradient_loss | 0.0133 | -| std | 0.00904 | -| value_loss | 5.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15946 | -| time_elapsed | 85392 | -| total_timesteps | 2041088 | -| train/ | | -| approx_kl | 0.030385457 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.00147 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 159450 | -| policy_gradient_loss | 0.0334 | -| std | 0.00903 | -| value_loss | 6.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15947 | -| time_elapsed | 85401 | -| total_timesteps | 2041216 | -| train/ | | -| approx_kl | 0.16548039 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 159460 | -| policy_gradient_loss | 0.00134 | -| std | 0.00903 | -| value_loss | 0.00469 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15948 | -| time_elapsed | 85407 | -| total_timesteps | 2041344 | -| train/ | | -| approx_kl | 0.054829434 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 159470 | -| policy_gradient_loss | 0.0383 | -| std | 0.00903 | -| value_loss | 0.000137 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15949 | -| time_elapsed | 85413 | -| total_timesteps | 2041472 | -| train/ | | -| approx_kl | 0.12234744 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.00688 | -| learning_rate | 0.0003 | -| loss | 0.0652 | -| n_updates | 159480 | -| policy_gradient_loss | 0.0262 | -| std | 0.00903 | -| value_loss | 1.67e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15950 | -| time_elapsed | 85418 | -| total_timesteps | 2041600 | -| train/ | | -| approx_kl | 0.0010606404 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 159490 | -| policy_gradient_loss | 0.00791 | -| std | 0.00903 | -| value_loss | 8.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15951 | -| time_elapsed | 85423 | -| total_timesteps | 2041728 | -| train/ | | -| approx_kl | 0.041058738 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 159500 | -| policy_gradient_loss | 0.036 | -| std | 0.00903 | -| value_loss | 6.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15952 | -| time_elapsed | 85429 | -| total_timesteps | 2041856 | -| train/ | | -| approx_kl | 0.028045973 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 159510 | -| policy_gradient_loss | 0.0234 | -| std | 0.00903 | -| value_loss | 5.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15953 | -| time_elapsed | 85435 | -| total_timesteps | 2041984 | -| train/ | | -| approx_kl | 0.11088615 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | 0.0521 | -| n_updates | 159520 | -| policy_gradient_loss | 0.0199 | -| std | 0.00903 | -| value_loss | 3.76e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15954 | -| time_elapsed | 85439 | -| total_timesteps | 2042112 | -| train/ | | -| approx_kl | 0.028348923 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0891 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 159530 | -| policy_gradient_loss | 0.0387 | -| std | 0.00903 | -| value_loss | 2.41e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15955 | -| time_elapsed | 85450 | -| total_timesteps | 2042240 | -| train/ | | -| approx_kl | 0.0180797 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 159540 | -| policy_gradient_loss | -0.0192 | -| std | 0.00903 | -| value_loss | 0.000897 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15956 | -| time_elapsed | 85456 | -| total_timesteps | 2042368 | -| train/ | | -| approx_kl | 0.038640548 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.00649 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 159550 | -| policy_gradient_loss | 0.0468 | -| std | 0.00903 | -| value_loss | 2.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15957 | -| time_elapsed | 85462 | -| total_timesteps | 2042496 | -| train/ | | -| approx_kl | 0.02697345 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 159560 | -| policy_gradient_loss | 0.0177 | -| std | 0.00902 | -| value_loss | 1.1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15958 | -| time_elapsed | 85467 | -| total_timesteps | 2042624 | -| train/ | | -| approx_kl | 0.019752733 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 159570 | -| policy_gradient_loss | 0.015 | -| std | 0.00902 | -| value_loss | 4.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15959 | -| time_elapsed | 85471 | -| total_timesteps | 2042752 | -| train/ | | -| approx_kl | 0.017664913 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 159580 | -| policy_gradient_loss | 0.0192 | -| std | 0.00902 | -| value_loss | 4.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 15960 | -| time_elapsed | 85475 | -| total_timesteps | 2042880 | -| train/ | | -| approx_kl | 0.104269505 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.0535 | -| n_updates | 159590 | -| policy_gradient_loss | 0.0227 | -| std | 0.00902 | -| value_loss | 2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15961 | -| time_elapsed | 85480 | -| total_timesteps | 2043008 | -| train/ | | -| approx_kl | 0.029796157 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.00496 | -| n_updates | 159600 | -| policy_gradient_loss | 0.0445 | -| std | 0.00902 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15962 | -| time_elapsed | 85491 | -| total_timesteps | 2043136 | -| train/ | | -| approx_kl | 0.012629569 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 159610 | -| policy_gradient_loss | -0.0156 | -| std | 0.00902 | -| value_loss | 0.00295 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15963 | -| time_elapsed | 85495 | -| total_timesteps | 2043264 | -| train/ | | -| approx_kl | 0.0041298266 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.0553 | -| learning_rate | 0.0003 | -| loss | -5.69e-05 | -| n_updates | 159620 | -| policy_gradient_loss | 0.0207 | -| std | 0.00902 | -| value_loss | 0.000302 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15964 | -| time_elapsed | 85500 | -| total_timesteps | 2043392 | -| train/ | | -| approx_kl | 0.07340427 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | 0.00424 | -| learning_rate | 0.0003 | -| loss | 0.0841 | -| n_updates | 159630 | -| policy_gradient_loss | 0.0296 | -| std | 0.00901 | -| value_loss | 3.86e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15965 | -| time_elapsed | 85505 | -| total_timesteps | 2043520 | -| train/ | | -| approx_kl | 0.0032479358 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 3.29 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | -0.000275 | -| n_updates | 159640 | -| policy_gradient_loss | 8.43e-05 | -| std | 0.00897 | -| value_loss | 0.000115 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15966 | -| time_elapsed | 85509 | -| total_timesteps | 2043648 | -| train/ | | -| approx_kl | 0.005128045 | -| clip_fraction | 0.0305 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 159650 | -| policy_gradient_loss | -0.00244 | -| std | 0.00894 | -| value_loss | 0.000335 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15967 | -| time_elapsed | 85515 | -| total_timesteps | 2043776 | -| train/ | | -| approx_kl | 0.011345424 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 159660 | -| policy_gradient_loss | 0.00182 | -| std | 0.00894 | -| value_loss | 8.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 15968 | -| time_elapsed | 85521 | -| total_timesteps | 2043904 | -| train/ | | -| approx_kl | 0.015168939 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 159670 | -| policy_gradient_loss | 0.00127 | -| std | 0.00893 | -| value_loss | 3.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15969 | -| time_elapsed | 85526 | -| total_timesteps | 2044032 | -| train/ | | -| approx_kl | 0.114917725 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 159680 | -| policy_gradient_loss | 0.00721 | -| std | 0.00892 | -| value_loss | 1.72e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15970 | -| time_elapsed | 85538 | -| total_timesteps | 2044160 | -| train/ | | -| approx_kl | 0.13432685 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 159690 | -| policy_gradient_loss | -0.00402 | -| std | 0.00892 | -| value_loss | 2.89e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15971 | -| time_elapsed | 85544 | -| total_timesteps | 2044288 | -| train/ | | -| approx_kl | 0.03457378 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -2.12 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 159700 | -| policy_gradient_loss | 0.0174 | -| std | 0.0089 | -| value_loss | 2.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15972 | -| time_elapsed | 85549 | -| total_timesteps | 2044416 | -| train/ | | -| approx_kl | 0.13245246 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 159710 | -| policy_gradient_loss | 0.0102 | -| std | 0.00887 | -| value_loss | 1.58e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15973 | -| time_elapsed | 85553 | -| total_timesteps | 2044544 | -| train/ | | -| approx_kl | 0.10973249 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.00822 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 159720 | -| policy_gradient_loss | 0.00508 | -| std | 0.00886 | -| value_loss | 3.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15974 | -| time_elapsed | 85558 | -| total_timesteps | 2044672 | -| train/ | | -| approx_kl | 0.041800644 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 159730 | -| policy_gradient_loss | 0.0177 | -| std | 0.00886 | -| value_loss | 1.98e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15975 | -| time_elapsed | 85563 | -| total_timesteps | 2044800 | -| train/ | | -| approx_kl | 0.0784182 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.00876 | -| n_updates | 159740 | -| policy_gradient_loss | 0.00499 | -| std | 0.00886 | -| value_loss | 1.48e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 15976 | -| time_elapsed | 85567 | -| total_timesteps | 2044928 | -| train/ | | -| approx_kl | 0.018824833 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 159750 | -| policy_gradient_loss | -0.000188 | -| std | 0.00886 | -| value_loss | 8.9e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15977 | -| time_elapsed | 85572 | -| total_timesteps | 2045056 | -| train/ | | -| approx_kl | 0.0009404798 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.00369 | -| n_updates | 159760 | -| policy_gradient_loss | 0.000199 | -| std | 0.00886 | -| value_loss | 4.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15978 | -| time_elapsed | 85580 | -| total_timesteps | 2045184 | -| train/ | | -| approx_kl | 0.021303853 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 159770 | -| policy_gradient_loss | -0.0123 | -| std | 0.00887 | -| value_loss | 0.00039 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15979 | -| time_elapsed | 85585 | -| total_timesteps | 2045312 | -| train/ | | -| approx_kl | 0.057801373 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | 0.0374 | -| n_updates | 159780 | -| policy_gradient_loss | 0.0288 | -| std | 0.00887 | -| value_loss | 4.74e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15980 | -| time_elapsed | 85590 | -| total_timesteps | 2045440 | -| train/ | | -| approx_kl | 0.1545322 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 159790 | -| policy_gradient_loss | 0.0108 | -| std | 0.00887 | -| value_loss | 3.79e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15981 | -| time_elapsed | 85595 | -| total_timesteps | 2045568 | -| train/ | | -| approx_kl | 0.024106985 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 159800 | -| policy_gradient_loss | 0.00218 | -| std | 0.00887 | -| value_loss | 2.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15982 | -| time_elapsed | 85600 | -| total_timesteps | 2045696 | -| train/ | | -| approx_kl | 0.010005849 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 159810 | -| policy_gradient_loss | 0.00599 | -| std | 0.00888 | -| value_loss | 1.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15983 | -| time_elapsed | 85606 | -| total_timesteps | 2045824 | -| train/ | | -| approx_kl | 0.048342653 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0999 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 159820 | -| policy_gradient_loss | 0.0642 | -| std | 0.00888 | -| value_loss | 5.75e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 15984 | -| time_elapsed | 85612 | -| total_timesteps | 2045952 | -| train/ | | -| approx_kl | 0.06695749 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | 0.0329 | -| n_updates | 159830 | -| policy_gradient_loss | 0.0554 | -| std | 0.00888 | -| value_loss | 3.73e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15985 | -| time_elapsed | 85617 | -| total_timesteps | 2046080 | -| train/ | | -| approx_kl | 0.07074693 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 159840 | -| policy_gradient_loss | 0.0789 | -| std | 0.00888 | -| value_loss | 2.27e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15986 | -| time_elapsed | 85625 | -| total_timesteps | 2046208 | -| train/ | | -| approx_kl | 0.6083554 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -7.55 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 159850 | -| policy_gradient_loss | 0.00704 | -| std | 0.00888 | -| value_loss | 0.00414 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15987 | -| time_elapsed | 85631 | -| total_timesteps | 2046336 | -| train/ | | -| approx_kl | 0.079087526 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.00914 | -| learning_rate | 0.0003 | -| loss | 0.0567 | -| n_updates | 159860 | -| policy_gradient_loss | 0.0159 | -| std | 0.00888 | -| value_loss | 3.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15988 | -| time_elapsed | 85636 | -| total_timesteps | 2046464 | -| train/ | | -| approx_kl | 0.011603303 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0928 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 159870 | -| policy_gradient_loss | 0.00734 | -| std | 0.00888 | -| value_loss | 4.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15989 | -| time_elapsed | 85641 | -| total_timesteps | 2046592 | -| train/ | | -| approx_kl | 0.16530645 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.0924 | -| n_updates | 159880 | -| policy_gradient_loss | 0.062 | -| std | 0.00888 | -| value_loss | 3.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15990 | -| time_elapsed | 85647 | -| total_timesteps | 2046720 | -| train/ | | -| approx_kl | 0.11884469 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0892 | -| n_updates | 159890 | -| policy_gradient_loss | 0.0917 | -| std | 0.00888 | -| value_loss | 2.35e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15991 | -| time_elapsed | 85652 | -| total_timesteps | 2046848 | -| train/ | | -| approx_kl | 0.09441829 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0899 | -| n_updates | 159900 | -| policy_gradient_loss | 0.097 | -| std | 0.00888 | -| value_loss | 2.02e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 15992 | -| time_elapsed | 85658 | -| total_timesteps | 2046976 | -| train/ | | -| approx_kl | 0.016302243 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.00311 | -| n_updates | 159910 | -| policy_gradient_loss | 0.0114 | -| std | 0.00889 | -| value_loss | 1.11e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15993 | -| time_elapsed | 85663 | -| total_timesteps | 2047104 | -| train/ | | -| approx_kl | 0.27057582 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.055 | -| learning_rate | 0.0003 | -| loss | 0.0773 | -| n_updates | 159920 | -| policy_gradient_loss | 0.0211 | -| std | 0.0089 | -| value_loss | 1.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15994 | -| time_elapsed | 85675 | -| total_timesteps | 2047232 | -| train/ | | -| approx_kl | 0.054057963 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 159930 | -| policy_gradient_loss | -0.0103 | -| std | 0.0089 | -| value_loss | 0.00231 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15995 | -| time_elapsed | 85680 | -| total_timesteps | 2047360 | -| train/ | | -| approx_kl | 0.053195953 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 159940 | -| policy_gradient_loss | 0.00447 | -| std | 0.0089 | -| value_loss | 8.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15996 | -| time_elapsed | 85685 | -| total_timesteps | 2047488 | -| train/ | | -| approx_kl | 0.19637349 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | 0.0703 | -| n_updates | 159950 | -| policy_gradient_loss | 0.00924 | -| std | 0.0089 | -| value_loss | 1.55e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15997 | -| time_elapsed | 85689 | -| total_timesteps | 2047616 | -| train/ | | -| approx_kl | 0.1227544 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | 0.0559 | -| n_updates | 159960 | -| policy_gradient_loss | 0.0213 | -| std | 0.0089 | -| value_loss | 5.69e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15998 | -| time_elapsed | 85693 | -| total_timesteps | 2047744 | -| train/ | | -| approx_kl | 0.056990243 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | 0.0374 | -| n_updates | 159970 | -| policy_gradient_loss | 0.0296 | -| std | 0.0089 | -| value_loss | 1.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 15999 | -| time_elapsed | 85699 | -| total_timesteps | 2047872 | -| train/ | | -| approx_kl | 0.17571391 | -| clip_fraction | 0.586 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 159980 | -| policy_gradient_loss | 0.0889 | -| std | 0.0089 | -| value_loss | 9.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16000 | -| time_elapsed | 85706 | -| total_timesteps | 2048000 | -| train/ | | -| approx_kl | 0.098725125 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.0859 | -| n_updates | 159990 | -| policy_gradient_loss | 0.085 | -| std | 0.0089 | -| value_loss | 7.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16001 | -| time_elapsed | 85711 | -| total_timesteps | 2048128 | -| train/ | | -| approx_kl | 0.085050255 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.00284 | -| learning_rate | 0.0003 | -| loss | 0.0544 | -| n_updates | 160000 | -| policy_gradient_loss | 0.068 | -| std | 0.0089 | -| value_loss | 3.93e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16002 | -| time_elapsed | 85724 | -| total_timesteps | 2048256 | -| train/ | | -| approx_kl | 0.08094397 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 160010 | -| policy_gradient_loss | 0.0299 | -| std | 0.0089 | -| value_loss | 0.00162 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16003 | -| time_elapsed | 85729 | -| total_timesteps | 2048384 | -| train/ | | -| approx_kl | 0.14754377 | -| clip_fraction | 0.646 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 160020 | -| policy_gradient_loss | 0.081 | -| std | 0.00889 | -| value_loss | 5.48e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16004 | -| time_elapsed | 85735 | -| total_timesteps | 2048512 | -| train/ | | -| approx_kl | 0.10744661 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -1.91 | -| learning_rate | 0.0003 | -| loss | 0.0501 | -| n_updates | 160030 | -| policy_gradient_loss | 0.0546 | -| std | 0.00888 | -| value_loss | 2.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16005 | -| time_elapsed | 85743 | -| total_timesteps | 2048640 | -| train/ | | -| approx_kl | 0.018291796 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.00864 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 160040 | -| policy_gradient_loss | 0.00702 | -| std | 0.00888 | -| value_loss | 4.02e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16006 | -| time_elapsed | 85749 | -| total_timesteps | 2048768 | -| train/ | | -| approx_kl | 0.270549 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0826 | -| n_updates | 160050 | -| policy_gradient_loss | 0.023 | -| std | 0.00888 | -| value_loss | 2.81e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 16007 | -| time_elapsed | 85755 | -| total_timesteps | 2048896 | -| train/ | | -| approx_kl | 0.058526576 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 160060 | -| policy_gradient_loss | 0.00792 | -| std | 0.00889 | -| value_loss | 9.75e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16008 | -| time_elapsed | 85761 | -| total_timesteps | 2049024 | -| train/ | | -| approx_kl | 0.5172669 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.381 | -| n_updates | 160070 | -| policy_gradient_loss | 0.125 | -| std | 0.00889 | -| value_loss | 6.3e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16009 | -| time_elapsed | 85774 | -| total_timesteps | 2049152 | -| train/ | | -| approx_kl | 0.087390505 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | 0.00667 | -| n_updates | 160080 | -| policy_gradient_loss | 0.00574 | -| std | 0.00889 | -| value_loss | 0.00245 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16010 | -| time_elapsed | 85780 | -| total_timesteps | 2049280 | -| train/ | | -| approx_kl | 0.069123924 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | 0.0494 | -| n_updates | 160090 | -| policy_gradient_loss | 0.0358 | -| std | 0.00888 | -| value_loss | 2.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16011 | -| time_elapsed | 85785 | -| total_timesteps | 2049408 | -| train/ | | -| approx_kl | 0.21288952 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 160100 | -| policy_gradient_loss | 0.0891 | -| std | 0.00888 | -| value_loss | 3.34e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16012 | -| time_elapsed | 85789 | -| total_timesteps | 2049536 | -| train/ | | -| approx_kl | 0.1261376 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.789 | -| learning_rate | 0.0003 | -| loss | 0.0783 | -| n_updates | 160110 | -| policy_gradient_loss | 0.0705 | -| std | 0.00888 | -| value_loss | 1.12e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16013 | -| time_elapsed | 85794 | -| total_timesteps | 2049664 | -| train/ | | -| approx_kl | 0.08536088 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0793 | -| n_updates | 160120 | -| policy_gradient_loss | 0.0757 | -| std | 0.00887 | -| value_loss | 4.36e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16014 | -| time_elapsed | 85799 | -| total_timesteps | 2049792 | -| train/ | | -| approx_kl | 0.0006846669 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 160130 | -| policy_gradient_loss | 0.00354 | -| std | 0.00889 | -| value_loss | 0.00122 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16015 | -| time_elapsed | 85804 | -| total_timesteps | 2049920 | -| train/ | | -| approx_kl | 0.035095204 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.21 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 160140 | -| policy_gradient_loss | 0.0429 | -| std | 0.0089 | -| value_loss | 0.00154 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16016 | -| time_elapsed | 85810 | -| total_timesteps | 2050048 | -| train/ | | -| approx_kl | 0.009762925 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -7.12 | -| learning_rate | 0.0003 | -| loss | 0.00071 | -| n_updates | 160150 | -| policy_gradient_loss | 0.00704 | -| std | 0.0089 | -| value_loss | 4.45e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16017 | -| time_elapsed | 85820 | -| total_timesteps | 2050176 | -| train/ | | -| approx_kl | 0.13738035 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.927 | -| learning_rate | 0.0003 | -| loss | -0.00532 | -| n_updates | 160160 | -| policy_gradient_loss | -0.0137 | -| std | 0.0089 | -| value_loss | 0.00101 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16018 | -| time_elapsed | 85825 | -| total_timesteps | 2050304 | -| train/ | | -| approx_kl | 0.03858614 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0853 | -| learning_rate | 0.0003 | -| loss | 0.00612 | -| n_updates | 160170 | -| policy_gradient_loss | 0.0107 | -| std | 0.0089 | -| value_loss | 8.82e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16019 | -| time_elapsed | 85830 | -| total_timesteps | 2050432 | -| train/ | | -| approx_kl | 0.01962632 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 160180 | -| policy_gradient_loss | 0.0149 | -| std | 0.00889 | -| value_loss | 7.18e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16020 | -| time_elapsed | 85835 | -| total_timesteps | 2050560 | -| train/ | | -| approx_kl | 0.26982617 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | 0.182 | -| n_updates | 160190 | -| policy_gradient_loss | 0.113 | -| std | 0.00888 | -| value_loss | 7.89e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16021 | -| time_elapsed | 85839 | -| total_timesteps | 2050688 | -| train/ | | -| approx_kl | 0.12512076 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0929 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 160200 | -| policy_gradient_loss | 0.0788 | -| std | 0.00888 | -| value_loss | 5.34e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16022 | -| time_elapsed | 85845 | -| total_timesteps | 2050816 | -| train/ | | -| approx_kl | 0.089019574 | -| clip_fraction | 0.576 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 160210 | -| policy_gradient_loss | 0.1 | -| std | 0.00887 | -| value_loss | 4.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 16023 | -| time_elapsed | 85851 | -| total_timesteps | 2050944 | -| train/ | | -| approx_kl | 0.07949916 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.0755 | -| n_updates | 160220 | -| policy_gradient_loss | 0.0674 | -| std | 0.00887 | -| value_loss | 3.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16024 | -| time_elapsed | 85857 | -| total_timesteps | 2051072 | -| train/ | | -| approx_kl | 0.013381857 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.00237 | -| n_updates | 160230 | -| policy_gradient_loss | 0.0102 | -| std | 0.00887 | -| value_loss | 1.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16025 | -| time_elapsed | 85867 | -| total_timesteps | 2051200 | -| train/ | | -| approx_kl | 0.11037576 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 160240 | -| policy_gradient_loss | -0.0128 | -| std | 0.00888 | -| value_loss | 0.000712 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16026 | -| time_elapsed | 85872 | -| total_timesteps | 2051328 | -| train/ | | -| approx_kl | 0.17956051 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -19.8 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 160250 | -| policy_gradient_loss | 0.0044 | -| std | 0.00888 | -| value_loss | 1.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16027 | -| time_elapsed | 85877 | -| total_timesteps | 2051456 | -| train/ | | -| approx_kl | 0.032867037 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 160260 | -| policy_gradient_loss | 0.0125 | -| std | 0.00888 | -| value_loss | 1.44e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16028 | -| time_elapsed | 85881 | -| total_timesteps | 2051584 | -| train/ | | -| approx_kl | 0.163765 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | 0.0952 | -| n_updates | 160270 | -| policy_gradient_loss | 0.0457 | -| std | 0.00888 | -| value_loss | 1.11e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16029 | -| time_elapsed | 85888 | -| total_timesteps | 2051712 | -| train/ | | -| approx_kl | 0.027530843 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 160280 | -| policy_gradient_loss | 0.0126 | -| std | 0.00888 | -| value_loss | 5.14e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16030 | -| time_elapsed | 85892 | -| total_timesteps | 2051840 | -| train/ | | -| approx_kl | 0.023729976 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 160290 | -| policy_gradient_loss | -0.00798 | -| std | 0.00888 | -| value_loss | 2.68e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16031 | -| time_elapsed | 85897 | -| total_timesteps | 2051968 | -| train/ | | -| approx_kl | 0.001809787 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | -0.00079 | -| n_updates | 160300 | -| policy_gradient_loss | 0.00952 | -| std | 0.00888 | -| value_loss | 1.56e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16032 | -| time_elapsed | 85903 | -| total_timesteps | 2052096 | -| train/ | | -| approx_kl | 0.0008745198 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0668 | -| learning_rate | 0.0003 | -| loss | 0.00582 | -| n_updates | 160310 | -| policy_gradient_loss | -7.32e-05 | -| std | 0.00888 | -| value_loss | 1.31e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16033 | -| time_elapsed | 85913 | -| total_timesteps | 2052224 | -| train/ | | -| approx_kl | 0.08977763 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 160320 | -| policy_gradient_loss | 0.0318 | -| std | 0.00888 | -| value_loss | 0.00356 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16034 | -| time_elapsed | 85918 | -| total_timesteps | 2052352 | -| train/ | | -| approx_kl | 0.39845502 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 160330 | -| policy_gradient_loss | 0.0554 | -| std | 0.00889 | -| value_loss | 1.3e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16035 | -| time_elapsed | 85924 | -| total_timesteps | 2052480 | -| train/ | | -| approx_kl | 0.0087703 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 160340 | -| policy_gradient_loss | 0.0547 | -| std | 0.00889 | -| value_loss | 1.34e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16036 | -| time_elapsed | 85928 | -| total_timesteps | 2052608 | -| train/ | | -| approx_kl | 0.005823157 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.00807 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 160350 | -| policy_gradient_loss | 0.008 | -| std | 0.00889 | -| value_loss | 8.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16037 | -| time_elapsed | 85934 | -| total_timesteps | 2052736 | -| train/ | | -| approx_kl | 0.042095587 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0628 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 160360 | -| policy_gradient_loss | 0.0192 | -| std | 0.00889 | -| value_loss | 1.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16038 | -| time_elapsed | 85938 | -| total_timesteps | 2052864 | -| train/ | | -| approx_kl | 0.14712384 | -| clip_fraction | 0.607 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 160370 | -| policy_gradient_loss | 0.0773 | -| std | 0.00889 | -| value_loss | 5.48e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 16039 | -| time_elapsed | 85944 | -| total_timesteps | 2052992 | -| train/ | | -| approx_kl | 0.09358693 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0886 | -| n_updates | 160380 | -| policy_gradient_loss | 0.0793 | -| std | 0.00889 | -| value_loss | 4.63e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16040 | -| time_elapsed | 85948 | -| total_timesteps | 2053120 | -| train/ | | -| approx_kl | 0.08838986 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0692 | -| n_updates | 160390 | -| policy_gradient_loss | 0.0938 | -| std | 0.00889 | -| value_loss | 3.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16041 | -| time_elapsed | 85960 | -| total_timesteps | 2053248 | -| train/ | | -| approx_kl | 0.030801386 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 160400 | -| policy_gradient_loss | -0.00579 | -| std | 0.00889 | -| value_loss | 0.000442 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16042 | -| time_elapsed | 85966 | -| total_timesteps | 2053376 | -| train/ | | -| approx_kl | 0.045705374 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.00527 | -| learning_rate | 0.0003 | -| loss | 0.0554 | -| n_updates | 160410 | -| policy_gradient_loss | 0.0208 | -| std | 0.00889 | -| value_loss | 1.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16043 | -| time_elapsed | 85971 | -| total_timesteps | 2053504 | -| train/ | | -| approx_kl | 0.016925886 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.00621 | -| learning_rate | 0.0003 | -| loss | -0.00946 | -| n_updates | 160420 | -| policy_gradient_loss | 0.015 | -| std | 0.00889 | -| value_loss | 4.62e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16044 | -| time_elapsed | 85975 | -| total_timesteps | 2053632 | -| train/ | | -| approx_kl | 0.41019493 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.202 | -| n_updates | 160430 | -| policy_gradient_loss | 0.0972 | -| std | 0.00889 | -| value_loss | 3.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16045 | -| time_elapsed | 85981 | -| total_timesteps | 2053760 | -| train/ | | -| approx_kl | 0.003522769 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 160440 | -| policy_gradient_loss | 0.0113 | -| std | 0.00889 | -| value_loss | 2.01e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 16046 | -| time_elapsed | 85985 | -| total_timesteps | 2053888 | -| train/ | | -| approx_kl | 0.0421239 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 160450 | -| policy_gradient_loss | 0.0098 | -| std | 0.00889 | -| value_loss | 1.61e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16047 | -| time_elapsed | 85990 | -| total_timesteps | 2054016 | -| train/ | | -| approx_kl | 0.047177438 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 2.97e-05 | -| n_updates | 160460 | -| policy_gradient_loss | 0.00487 | -| std | 0.00889 | -| value_loss | 6.08e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16048 | -| time_elapsed | 85999 | -| total_timesteps | 2054144 | -| train/ | | -| approx_kl | 0.0053030755 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 160470 | -| policy_gradient_loss | 0.00823 | -| std | 0.00889 | -| value_loss | 7.79e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16049 | -| time_elapsed | 86003 | -| total_timesteps | 2054272 | -| train/ | | -| approx_kl | 0.025317403 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.3 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.00959 | -| n_updates | 160480 | -| policy_gradient_loss | 0.0166 | -| std | 0.00889 | -| value_loss | 7.55e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16050 | -| time_elapsed | 86006 | -| total_timesteps | 2054400 | -| train/ | | -| approx_kl | 0.045909 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 160490 | -| policy_gradient_loss | 0.0131 | -| std | 0.00886 | -| value_loss | 1.08e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16051 | -| time_elapsed | 86009 | -| total_timesteps | 2054528 | -| train/ | | -| approx_kl | 0.12011585 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.00593 | -| learning_rate | 0.0003 | -| loss | 0.0467 | -| n_updates | 160500 | -| policy_gradient_loss | 0.0181 | -| std | 0.00885 | -| value_loss | 2.3e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16052 | -| time_elapsed | 86013 | -| total_timesteps | 2054656 | -| train/ | | -| approx_kl | 0.031891856 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.0053 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 160510 | -| policy_gradient_loss | 0.0165 | -| std | 0.00884 | -| value_loss | 1.01e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16053 | -| time_elapsed | 86017 | -| total_timesteps | 2054784 | -| train/ | | -| approx_kl | 0.17371841 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.376 | -| learning_rate | 0.0003 | -| loss | 0.0663 | -| n_updates | 160520 | -| policy_gradient_loss | 0.015 | -| std | 0.00884 | -| value_loss | 6.39e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16054 | -| time_elapsed | 86021 | -| total_timesteps | 2054912 | -| train/ | | -| approx_kl | 9.969808e-06 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | 0.000474 | -| n_updates | 160530 | -| policy_gradient_loss | -0.00248 | -| std | 0.00884 | -| value_loss | 6.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16055 | -| time_elapsed | 86026 | -| total_timesteps | 2055040 | -| train/ | | -| approx_kl | 0.00015939353 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.00882 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 160540 | -| policy_gradient_loss | -0.00398 | -| std | 0.00884 | -| value_loss | 2.98e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16056 | -| time_elapsed | 86036 | -| total_timesteps | 2055168 | -| train/ | | -| approx_kl | 0.03622215 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.593 | -| learning_rate | 0.0003 | -| loss | -0.0257 | -| n_updates | 160550 | -| policy_gradient_loss | 0.00233 | -| std | 0.00884 | -| value_loss | 0.00126 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16057 | -| time_elapsed | 86040 | -| total_timesteps | 2055296 | -| train/ | | -| approx_kl | 0.0040051052 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -19.6 | -| learning_rate | 0.0003 | -| loss | 0.00813 | -| n_updates | 160560 | -| policy_gradient_loss | -0.00866 | -| std | 0.00884 | -| value_loss | 7.96e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16058 | -| time_elapsed | 86044 | -| total_timesteps | 2055424 | -| train/ | | -| approx_kl | 0.049975544 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.416 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 160570 | -| policy_gradient_loss | -0.00143 | -| std | 0.00884 | -| value_loss | 3.31e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16059 | -| time_elapsed | 86051 | -| total_timesteps | 2055552 | -| train/ | | -| approx_kl | 0.0747508 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0192 | -| n_updates | 160580 | -| policy_gradient_loss | 0.00891 | -| std | 0.00884 | -| value_loss | 3.87e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16060 | -| time_elapsed | 86056 | -| total_timesteps | 2055680 | -| train/ | | -| approx_kl | 0.3559365 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0024 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 160590 | -| policy_gradient_loss | 0.0289 | -| std | 0.00884 | -| value_loss | 2.19e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16061 | -| time_elapsed | 86060 | -| total_timesteps | 2055808 | -| train/ | | -| approx_kl | 0.0072803725 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 160600 | -| policy_gradient_loss | -0.000146 | -| std | 0.00884 | -| value_loss | 1.34e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16062 | -| time_elapsed | 86066 | -| total_timesteps | 2055936 | -| train/ | | -| approx_kl | 0.038442433 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 160610 | -| policy_gradient_loss | 0.0045 | -| std | 0.00884 | -| value_loss | 9.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16063 | -| time_elapsed | 86071 | -| total_timesteps | 2056064 | -| train/ | | -| approx_kl | 0.006594512 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.00814 | -| n_updates | 160620 | -| policy_gradient_loss | 0.00108 | -| std | 0.00884 | -| value_loss | 6.93e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16064 | -| time_elapsed | 86080 | -| total_timesteps | 2056192 | -| train/ | | -| approx_kl | 0.0516136 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.0455 | -| n_updates | 160630 | -| policy_gradient_loss | 0.0409 | -| std | 0.00883 | -| value_loss | 9.45e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16065 | -| time_elapsed | 86086 | -| total_timesteps | 2056320 | -| train/ | | -| approx_kl | 0.021016885 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.0019 | -| learning_rate | 0.0003 | -| loss | 0.00993 | -| n_updates | 160640 | -| policy_gradient_loss | 0.0109 | -| std | 0.00883 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16066 | -| time_elapsed | 86091 | -| total_timesteps | 2056448 | -| train/ | | -| approx_kl | 0.025490701 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 160650 | -| policy_gradient_loss | -0.00876 | -| std | 0.00883 | -| value_loss | 3.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16067 | -| time_elapsed | 86096 | -| total_timesteps | 2056576 | -| train/ | | -| approx_kl | 0.009655559 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.061 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 160660 | -| policy_gradient_loss | 0.0177 | -| std | 0.00883 | -| value_loss | 2.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16068 | -| time_elapsed | 86100 | -| total_timesteps | 2056704 | -| train/ | | -| approx_kl | 0.28063902 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 160670 | -| policy_gradient_loss | 0.0359 | -| std | 0.00882 | -| value_loss | 9.24e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16069 | -| time_elapsed | 86104 | -| total_timesteps | 2056832 | -| train/ | | -| approx_kl | 0.02417165 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 160680 | -| policy_gradient_loss | 0.00582 | -| std | 0.00882 | -| value_loss | 6.31e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16070 | -| time_elapsed | 86107 | -| total_timesteps | 2056960 | -| train/ | | -| approx_kl | 0.029211283 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.0071 | -| n_updates | 160690 | -| policy_gradient_loss | 0.00313 | -| std | 0.00882 | -| value_loss | 7.09e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16071 | -| time_elapsed | 86111 | -| total_timesteps | 2057088 | -| train/ | | -| approx_kl | 0.0052270843 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 160700 | -| policy_gradient_loss | 0.00102 | -| std | 0.00882 | -| value_loss | 3.97e-09 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16072 | -| time_elapsed | 86120 | -| total_timesteps | 2057216 | -| train/ | | -| approx_kl | 0.020318 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | 0.00051 | -| n_updates | 160710 | -| policy_gradient_loss | 0.0155 | -| std | 0.00882 | -| value_loss | 1.56e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16073 | -| time_elapsed | 86126 | -| total_timesteps | 2057344 | -| train/ | | -| approx_kl | 0.072494894 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.0104 | -| learning_rate | 0.0003 | -| loss | 0.0545 | -| n_updates | 160720 | -| policy_gradient_loss | 0.0745 | -| std | 0.00882 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16074 | -| time_elapsed | 86130 | -| total_timesteps | 2057472 | -| train/ | | -| approx_kl | 0.013535045 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.00734 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 160730 | -| policy_gradient_loss | 0.0105 | -| std | 0.00882 | -| value_loss | 6.14e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16075 | -| time_elapsed | 86134 | -| total_timesteps | 2057600 | -| train/ | | -| approx_kl | 0.0006632167 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 160740 | -| policy_gradient_loss | 0.00243 | -| std | 0.00881 | -| value_loss | 2.59e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16076 | -| time_elapsed | 86139 | -| total_timesteps | 2057728 | -| train/ | | -| approx_kl | 0.12570128 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -2.29 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 160750 | -| policy_gradient_loss | 0.0508 | -| std | 0.0088 | -| value_loss | 1.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16077 | -| time_elapsed | 86143 | -| total_timesteps | 2057856 | -| train/ | | -| approx_kl | 0.070282795 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -15.8 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 160760 | -| policy_gradient_loss | 0.0246 | -| std | 0.0088 | -| value_loss | 2.27e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 16078 | -| time_elapsed | 86147 | -| total_timesteps | 2057984 | -| train/ | | -| approx_kl | 0.012826396 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.00602 | -| learning_rate | 0.0003 | -| loss | -0.00964 | -| n_updates | 160770 | -| policy_gradient_loss | 0.00723 | -| std | 0.0088 | -| value_loss | 9.38e-12 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16079 | -| time_elapsed | 86152 | -| total_timesteps | 2058112 | -| train/ | | -| approx_kl | 0.00029673055 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | 0.00293 | -| n_updates | 160780 | -| policy_gradient_loss | -0.000909 | -| std | 0.0088 | -| value_loss | 1.54e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16080 | -| time_elapsed | 86164 | -| total_timesteps | 2058240 | -| train/ | | -| approx_kl | 0.044886157 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.00975 | -| n_updates | 160790 | -| policy_gradient_loss | -0.0113 | -| std | 0.0088 | -| value_loss | 8.09e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16081 | -| time_elapsed | 86168 | -| total_timesteps | 2058368 | -| train/ | | -| approx_kl | 0.024551796 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0973 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 160800 | -| policy_gradient_loss | 0.0275 | -| std | 0.0088 | -| value_loss | 3.92e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16082 | -| time_elapsed | 86173 | -| total_timesteps | 2058496 | -| train/ | | -| approx_kl | 0.5636334 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.309 | -| n_updates | 160810 | -| policy_gradient_loss | 0.125 | -| std | 0.0088 | -| value_loss | 8.56e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16083 | -| time_elapsed | 86179 | -| total_timesteps | 2058624 | -| train/ | | -| approx_kl | 0.0055194087 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 160820 | -| policy_gradient_loss | 0.0194 | -| std | 0.0088 | -| value_loss | 6.05e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16084 | -| time_elapsed | 86185 | -| total_timesteps | 2058752 | -| train/ | | -| approx_kl | 0.04801692 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 160830 | -| policy_gradient_loss | 0.0137 | -| std | 0.0088 | -| value_loss | 3.02e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 16085 | -| time_elapsed | 86189 | -| total_timesteps | 2058880 | -| train/ | | -| approx_kl | 0.0028256397 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | 0.00446 | -| n_updates | 160840 | -| policy_gradient_loss | 0.00412 | -| std | 0.00879 | -| value_loss | 2.07e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16086 | -| time_elapsed | 86194 | -| total_timesteps | 2059008 | -| train/ | | -| approx_kl | 0.027074508 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.31 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 160850 | -| policy_gradient_loss | 0.0141 | -| std | 0.00879 | -| value_loss | 1.6e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16087 | -| time_elapsed | 86209 | -| total_timesteps | 2059136 | -| train/ | | -| approx_kl | 0.0006778706 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 160860 | -| policy_gradient_loss | -0.00455 | -| std | 0.00879 | -| value_loss | 0.00205 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16088 | -| time_elapsed | 86215 | -| total_timesteps | 2059264 | -| train/ | | -| approx_kl | 0.004305878 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.0597 | -| learning_rate | 0.0003 | -| loss | -0.000634 | -| n_updates | 160870 | -| policy_gradient_loss | 0.0572 | -| std | 0.00878 | -| value_loss | 0.000244 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16089 | -| time_elapsed | 86220 | -| total_timesteps | 2059392 | -| train/ | | -| approx_kl | 0.060020827 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00468 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 160880 | -| policy_gradient_loss | 0.0751 | -| std | 0.00877 | -| value_loss | 1.55e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16090 | -| time_elapsed | 86224 | -| total_timesteps | 2059520 | -| train/ | | -| approx_kl | 0.00073641306 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 160890 | -| policy_gradient_loss | 0.0161 | -| std | 0.00877 | -| value_loss | 1.14e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16091 | -| time_elapsed | 86228 | -| total_timesteps | 2059648 | -| train/ | | -| approx_kl | 0.12013114 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 160900 | -| policy_gradient_loss | 0.0909 | -| std | 0.00877 | -| value_loss | 8.96e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16092 | -| time_elapsed | 86232 | -| total_timesteps | 2059776 | -| train/ | | -| approx_kl | 0.021063324 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 160910 | -| policy_gradient_loss | 0.0144 | -| std | 0.00877 | -| value_loss | 5.88e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16093 | -| time_elapsed | 86238 | -| total_timesteps | 2059904 | -| train/ | | -| approx_kl | 0.3274017 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 160920 | -| policy_gradient_loss | 0.0358 | -| std | 0.00877 | -| value_loss | 4.35e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16094 | -| time_elapsed | 86242 | -| total_timesteps | 2060032 | -| train/ | | -| approx_kl | 0.019116012 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 160930 | -| policy_gradient_loss | -0.00667 | -| std | 0.00877 | -| value_loss | 3.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16095 | -| time_elapsed | 86253 | -| total_timesteps | 2060160 | -| train/ | | -| approx_kl | 0.023589946 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.364 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 160940 | -| policy_gradient_loss | -0.0201 | -| std | 0.00877 | -| value_loss | 0.00251 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16096 | -| time_elapsed | 86258 | -| total_timesteps | 2060288 | -| train/ | | -| approx_kl | 0.045072585 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 160950 | -| policy_gradient_loss | 0.057 | -| std | 0.00877 | -| value_loss | 8.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16097 | -| time_elapsed | 86263 | -| total_timesteps | 2060416 | -| train/ | | -| approx_kl | 0.065181814 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.438 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 160960 | -| policy_gradient_loss | 0.0837 | -| std | 0.00877 | -| value_loss | 6.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16098 | -| time_elapsed | 86268 | -| total_timesteps | 2060544 | -| train/ | | -| approx_kl | 0.070027635 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.0723 | -| n_updates | 160970 | -| policy_gradient_loss | 0.0846 | -| std | 0.00877 | -| value_loss | 3.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16099 | -| time_elapsed | 86272 | -| total_timesteps | 2060672 | -| train/ | | -| approx_kl | 0.062449176 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | 0.0461 | -| n_updates | 160980 | -| policy_gradient_loss | 0.0522 | -| std | 0.00877 | -| value_loss | 2.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16100 | -| time_elapsed | 86276 | -| total_timesteps | 2060800 | -| train/ | | -| approx_kl | 0.013110888 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 160990 | -| policy_gradient_loss | 0.0128 | -| std | 0.00877 | -| value_loss | 1.64e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 16101 | -| time_elapsed | 86281 | -| total_timesteps | 2060928 | -| train/ | | -| approx_kl | 0.3116538 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.0932 | -| n_updates | 161000 | -| policy_gradient_loss | 0.0282 | -| std | 0.00877 | -| value_loss | 1.17e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16102 | -| time_elapsed | 86287 | -| total_timesteps | 2061056 | -| train/ | | -| approx_kl | 0.02107679 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 161010 | -| policy_gradient_loss | -0.00288 | -| std | 0.00877 | -| value_loss | 9.04e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16103 | -| time_elapsed | 86295 | -| total_timesteps | 2061184 | -| train/ | | -| approx_kl | 0.031210728 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 161020 | -| policy_gradient_loss | -0.00162 | -| std | 0.00877 | -| value_loss | 0.000179 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16104 | -| time_elapsed | 86299 | -| total_timesteps | 2061312 | -| train/ | | -| approx_kl | 0.023310624 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 161030 | -| policy_gradient_loss | -0.00942 | -| std | 0.00877 | -| value_loss | 2.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16105 | -| time_elapsed | 86302 | -| total_timesteps | 2061440 | -| train/ | | -| approx_kl | 0.021644948 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 161040 | -| policy_gradient_loss | 0.00489 | -| std | 0.00876 | -| value_loss | 8.85e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16106 | -| time_elapsed | 86307 | -| total_timesteps | 2061568 | -| train/ | | -| approx_kl | 0.0040242733 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 161050 | -| policy_gradient_loss | 0.000913 | -| std | 0.00876 | -| value_loss | 3.66e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16107 | -| time_elapsed | 86311 | -| total_timesteps | 2061696 | -| train/ | | -| approx_kl | 0.019977028 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.00735 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 161060 | -| policy_gradient_loss | 0.0827 | -| std | 0.00876 | -| value_loss | 5.64e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16108 | -| time_elapsed | 86316 | -| total_timesteps | 2061824 | -| train/ | | -| approx_kl | 0.0057600453 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | -0.00467 | -| n_updates | 161070 | -| policy_gradient_loss | 0.017 | -| std | 0.00876 | -| value_loss | 3.51e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 16109 | -| time_elapsed | 86320 | -| total_timesteps | 2061952 | -| train/ | | -| approx_kl | 0.2874356 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0973 | -| n_updates | 161080 | -| policy_gradient_loss | 0.0301 | -| std | 0.00876 | -| value_loss | 7.07e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16110 | -| time_elapsed | 86323 | -| total_timesteps | 2062080 | -| train/ | | -| approx_kl | 0.020425037 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 161090 | -| policy_gradient_loss | -0.00578 | -| std | 0.00876 | -| value_loss | 1.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16111 | -| time_elapsed | 86331 | -| total_timesteps | 2062208 | -| train/ | | -| approx_kl | 0.024058271 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 161100 | -| policy_gradient_loss | 0.0137 | -| std | 0.00876 | -| value_loss | 0.000354 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16112 | -| time_elapsed | 86337 | -| total_timesteps | 2062336 | -| train/ | | -| approx_kl | 0.07945347 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0728 | -| n_updates | 161110 | -| policy_gradient_loss | 0.0373 | -| std | 0.00876 | -| value_loss | 8.41e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16113 | -| time_elapsed | 86347 | -| total_timesteps | 2062464 | -| train/ | | -| approx_kl | 0.06598466 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00601 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 161120 | -| policy_gradient_loss | 0.00765 | -| std | 0.00876 | -| value_loss | 1.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16114 | -| time_elapsed | 86352 | -| total_timesteps | 2062592 | -| train/ | | -| approx_kl | 0.008137081 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 161130 | -| policy_gradient_loss | 0.00345 | -| std | 0.00877 | -| value_loss | 5.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16115 | -| time_elapsed | 86356 | -| total_timesteps | 2062720 | -| train/ | | -| approx_kl | 0.02782045 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 161140 | -| policy_gradient_loss | 0.00547 | -| std | 0.00878 | -| value_loss | 4.07e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16116 | -| time_elapsed | 86361 | -| total_timesteps | 2062848 | -| train/ | | -| approx_kl | 0.0055613616 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.00603 | -| n_updates | 161150 | -| policy_gradient_loss | 0.000495 | -| std | 0.00877 | -| value_loss | 1.92e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 16117 | -| time_elapsed | 86366 | -| total_timesteps | 2062976 | -| train/ | | -| approx_kl | 0.043321803 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 161160 | -| policy_gradient_loss | 0.00609 | -| std | 0.00877 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16118 | -| time_elapsed | 86371 | -| total_timesteps | 2063104 | -| train/ | | -| approx_kl | 0.061315026 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 161170 | -| policy_gradient_loss | 0.00271 | -| std | 0.00876 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16119 | -| time_elapsed | 86383 | -| total_timesteps | 2063232 | -| train/ | | -| approx_kl | 0.065497495 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.533 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 161180 | -| policy_gradient_loss | -0.0174 | -| std | 0.00876 | -| value_loss | 0.00131 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16120 | -| time_elapsed | 86388 | -| total_timesteps | 2063360 | -| train/ | | -| approx_kl | 0.0718855 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 161190 | -| policy_gradient_loss | -0.000214 | -| std | 0.00876 | -| value_loss | 5.52e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16121 | -| time_elapsed | 86393 | -| total_timesteps | 2063488 | -| train/ | | -| approx_kl | 0.056690108 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -7.8 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 161200 | -| policy_gradient_loss | -0.00409 | -| std | 0.00876 | -| value_loss | 6.16e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16122 | -| time_elapsed | 86399 | -| total_timesteps | 2063616 | -| train/ | | -| approx_kl | 0.05942926 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -1.52 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 161210 | -| policy_gradient_loss | 0.0119 | -| std | 0.00875 | -| value_loss | 2.54e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16123 | -| time_elapsed | 86405 | -| total_timesteps | 2063744 | -| train/ | | -| approx_kl | 0.06223588 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.581 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 161220 | -| policy_gradient_loss | 0.0361 | -| std | 0.00876 | -| value_loss | 1.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16124 | -| time_elapsed | 86409 | -| total_timesteps | 2063872 | -| train/ | | -| approx_kl | 0.07656113 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 161230 | -| policy_gradient_loss | 0.00126 | -| std | 0.00876 | -| value_loss | 2.66e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16125 | -| time_elapsed | 86413 | -| total_timesteps | 2064000 | -| train/ | | -| approx_kl | 0.012401815 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0786 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 161240 | -| policy_gradient_loss | 0.00238 | -| std | 0.00876 | -| value_loss | 4.32e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16126 | -| time_elapsed | 86417 | -| total_timesteps | 2064128 | -| train/ | | -| approx_kl | 0.002140441 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.0023 | -| learning_rate | 0.0003 | -| loss | -0.000769 | -| n_updates | 161250 | -| policy_gradient_loss | 0.0029 | -| std | 0.00876 | -| value_loss | 1.16e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16127 | -| time_elapsed | 86429 | -| total_timesteps | 2064256 | -| train/ | | -| approx_kl | 0.31945536 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | 0.0042 | -| n_updates | 161260 | -| policy_gradient_loss | -0.00943 | -| std | 0.00876 | -| value_loss | 0.00142 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16128 | -| time_elapsed | 86434 | -| total_timesteps | 2064384 | -| train/ | | -| approx_kl | 0.028826844 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 161270 | -| policy_gradient_loss | 0.000998 | -| std | 0.00876 | -| value_loss | 3.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16129 | -| time_elapsed | 86439 | -| total_timesteps | 2064512 | -| train/ | | -| approx_kl | 0.05375898 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.268 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 161280 | -| policy_gradient_loss | 0.0229 | -| std | 0.00875 | -| value_loss | 1.95e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16130 | -| time_elapsed | 86444 | -| total_timesteps | 2064640 | -| train/ | | -| approx_kl | 0.5707127 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 161290 | -| policy_gradient_loss | 0.107 | -| std | 0.00875 | -| value_loss | 9.85e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16131 | -| time_elapsed | 86449 | -| total_timesteps | 2064768 | -| train/ | | -| approx_kl | 0.0024617058 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 161300 | -| policy_gradient_loss | 0.00652 | -| std | 0.00875 | -| value_loss | 7.85e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 16132 | -| time_elapsed | 86455 | -| total_timesteps | 2064896 | -| train/ | | -| approx_kl | 0.35307696 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 161310 | -| policy_gradient_loss | 0.0305 | -| std | 0.00875 | -| value_loss | 4.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16133 | -| time_elapsed | 86462 | -| total_timesteps | 2065024 | -| train/ | | -| approx_kl | 0.016185727 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.00428 | -| n_updates | 161320 | -| policy_gradient_loss | 0.00259 | -| std | 0.00875 | -| value_loss | 3.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16134 | -| time_elapsed | 86472 | -| total_timesteps | 2065152 | -| train/ | | -| approx_kl | 0.035379753 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | 0.00619 | -| n_updates | 161330 | -| policy_gradient_loss | 0.00293 | -| std | 0.00875 | -| value_loss | 0.00101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16135 | -| time_elapsed | 86477 | -| total_timesteps | 2065280 | -| train/ | | -| approx_kl | 0.006764991 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 161340 | -| policy_gradient_loss | 0.0266 | -| std | 0.00873 | -| value_loss | 6.62e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16136 | -| time_elapsed | 86483 | -| total_timesteps | 2065408 | -| train/ | | -| approx_kl | 0.10756813 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | 0.0993 | -| n_updates | 161350 | -| policy_gradient_loss | 0.0429 | -| std | 0.00873 | -| value_loss | 0.000276 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16137 | -| time_elapsed | 86488 | -| total_timesteps | 2065536 | -| train/ | | -| approx_kl | 0.05696965 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.00341 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 161360 | -| policy_gradient_loss | -7.43e-05 | -| std | 0.00872 | -| value_loss | 3.51e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16138 | -| time_elapsed | 86493 | -| total_timesteps | 2065664 | -| train/ | | -| approx_kl | 0.009595264 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 161370 | -| policy_gradient_loss | 0.00119 | -| std | 0.00872 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16139 | -| time_elapsed | 86498 | -| total_timesteps | 2065792 | -| train/ | | -| approx_kl | 0.032474376 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 161380 | -| policy_gradient_loss | 0.00795 | -| std | 0.00873 | -| value_loss | 8.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 16140 | -| time_elapsed | 86503 | -| total_timesteps | 2065920 | -| train/ | | -| approx_kl | 0.03872808 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 161390 | -| policy_gradient_loss | 0.0148 | -| std | 0.00872 | -| value_loss | 4.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16141 | -| time_elapsed | 86509 | -| total_timesteps | 2066048 | -| train/ | | -| approx_kl | 0.029480351 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 161400 | -| policy_gradient_loss | 7.34e-05 | -| std | 0.00871 | -| value_loss | 3.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16142 | -| time_elapsed | 86518 | -| total_timesteps | 2066176 | -| train/ | | -| approx_kl | 0.113761194 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 161410 | -| policy_gradient_loss | -0.00667 | -| std | 0.00871 | -| value_loss | 0.00299 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16143 | -| time_elapsed | 86524 | -| total_timesteps | 2066304 | -| train/ | | -| approx_kl | 0.14282523 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.851 | -| learning_rate | 0.0003 | -| loss | 0.0435 | -| n_updates | 161420 | -| policy_gradient_loss | 0.0054 | -| std | 0.00871 | -| value_loss | 5.42e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16144 | -| time_elapsed | 86529 | -| total_timesteps | 2066432 | -| train/ | | -| approx_kl | 0.0070221317 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.412 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 161430 | -| policy_gradient_loss | 0.0182 | -| std | 0.00871 | -| value_loss | 6.43e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16145 | -| time_elapsed | 86535 | -| total_timesteps | 2066560 | -| train/ | | -| approx_kl | 0.13424611 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 161440 | -| policy_gradient_loss | 0.0975 | -| std | 0.00871 | -| value_loss | 2.29e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16146 | -| time_elapsed | 86541 | -| total_timesteps | 2066688 | -| train/ | | -| approx_kl | 0.020720616 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00562 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 161450 | -| policy_gradient_loss | 0.00872 | -| std | 0.00871 | -| value_loss | 1.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16147 | -| time_elapsed | 86547 | -| total_timesteps | 2066816 | -| train/ | | -| approx_kl | 0.075614475 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 161460 | -| policy_gradient_loss | 0.013 | -| std | 0.0087 | -| value_loss | 1.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 16148 | -| time_elapsed | 86553 | -| total_timesteps | 2066944 | -| train/ | | -| approx_kl | 0.00673696 | -| clip_fraction | 0.0375 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00892 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 161470 | -| policy_gradient_loss | -0.000672 | -| std | 0.00869 | -| value_loss | 5.11e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16149 | -| time_elapsed | 86557 | -| total_timesteps | 2067072 | -| train/ | | -| approx_kl | 0.010586135 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 161480 | -| policy_gradient_loss | 0.006 | -| std | 0.00869 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16150 | -| time_elapsed | 86568 | -| total_timesteps | 2067200 | -| train/ | | -| approx_kl | 0.020602338 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -4.09 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 161490 | -| policy_gradient_loss | -0.013 | -| std | 0.00869 | -| value_loss | 0.00391 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16151 | -| time_elapsed | 86573 | -| total_timesteps | 2067328 | -| train/ | | -| approx_kl | 0.005148126 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 161500 | -| policy_gradient_loss | 0.00324 | -| std | 0.00869 | -| value_loss | 6.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16152 | -| time_elapsed | 86578 | -| total_timesteps | 2067456 | -| train/ | | -| approx_kl | 0.08234523 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.521 | -| learning_rate | 0.0003 | -| loss | 0.0638 | -| n_updates | 161510 | -| policy_gradient_loss | 0.0127 | -| std | 0.00869 | -| value_loss | 3.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16153 | -| time_elapsed | 86584 | -| total_timesteps | 2067584 | -| train/ | | -| approx_kl | 0.002229191 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -8.11e-05 | -| n_updates | 161520 | -| policy_gradient_loss | 0.0271 | -| std | 0.00867 | -| value_loss | 3.2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16154 | -| time_elapsed | 86590 | -| total_timesteps | 2067712 | -| train/ | | -| approx_kl | 0.29855052 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 161530 | -| policy_gradient_loss | 0.0106 | -| std | 0.00866 | -| value_loss | 7.97e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16155 | -| time_elapsed | 86595 | -| total_timesteps | 2067840 | -| train/ | | -| approx_kl | 0.0047215843 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 161540 | -| policy_gradient_loss | 0.00178 | -| std | 0.00866 | -| value_loss | 1.23e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 16156 | -| time_elapsed | 86599 | -| total_timesteps | 2067968 | -| train/ | | -| approx_kl | 0.050274707 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0701 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 161550 | -| policy_gradient_loss | 0.00205 | -| std | 0.00865 | -| value_loss | 2.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16157 | -| time_elapsed | 86604 | -| total_timesteps | 2068096 | -| train/ | | -| approx_kl | 0.028281467 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 161560 | -| policy_gradient_loss | 0.0209 | -| std | 0.00866 | -| value_loss | 5.79e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16158 | -| time_elapsed | 86615 | -| total_timesteps | 2068224 | -| train/ | | -| approx_kl | 0.76843274 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -7.19 | -| learning_rate | 0.0003 | -| loss | 0.047 | -| n_updates | 161570 | -| policy_gradient_loss | 0.0135 | -| std | 0.00866 | -| value_loss | 0.00414 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16159 | -| time_elapsed | 86620 | -| total_timesteps | 2068352 | -| train/ | | -| approx_kl | 0.07646414 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 161580 | -| policy_gradient_loss | 0.00692 | -| std | 0.00866 | -| value_loss | 2.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16160 | -| time_elapsed | 86625 | -| total_timesteps | 2068480 | -| train/ | | -| approx_kl | 0.011694056 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 161590 | -| policy_gradient_loss | 0.00955 | -| std | 0.00866 | -| value_loss | 1.14e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16161 | -| time_elapsed | 86631 | -| total_timesteps | 2068608 | -| train/ | | -| approx_kl | 0.05591284 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.51 | -| learning_rate | 0.0003 | -| loss | 0.00095 | -| n_updates | 161600 | -| policy_gradient_loss | 0.00463 | -| std | 0.00866 | -| value_loss | 7.86e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16162 | -| time_elapsed | 86637 | -| total_timesteps | 2068736 | -| train/ | | -| approx_kl | 0.0030052075 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.000222 | -| n_updates | 161610 | -| policy_gradient_loss | 0.0148 | -| std | 0.00865 | -| value_loss | 2.88e-06 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16163 | -| time_elapsed | 86643 | -| total_timesteps | 2068864 | -| train/ | | -| approx_kl | 0.275919 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00737 | -| learning_rate | 0.0003 | -| loss | 0.0862 | -| n_updates | 161620 | -| policy_gradient_loss | 0.0306 | -| std | 0.00864 | -| value_loss | 4.53e-06 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 16164 | -| time_elapsed | 86649 | -| total_timesteps | 2068992 | -| train/ | | -| approx_kl | 0.0007060715 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -36.4 | -| learning_rate | 0.0003 | -| loss | 0.00573 | -| n_updates | 161630 | -| policy_gradient_loss | -0.0123 | -| std | 0.00864 | -| value_loss | 2.35e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16165 | -| time_elapsed | 86655 | -| total_timesteps | 2069120 | -| train/ | | -| approx_kl | 0.008046162 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 161640 | -| policy_gradient_loss | 0.00316 | -| std | 0.00864 | -| value_loss | 1.45e-09 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16166 | -| time_elapsed | 86669 | -| total_timesteps | 2069248 | -| train/ | | -| approx_kl | 0.279142 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 161650 | -| policy_gradient_loss | -0.00474 | -| std | 0.00865 | -| value_loss | 0.00189 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16167 | -| time_elapsed | 86676 | -| total_timesteps | 2069376 | -| train/ | | -| approx_kl | 0.018168626 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00402 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 161660 | -| policy_gradient_loss | -0.000484 | -| std | 0.00865 | -| value_loss | 2.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16168 | -| time_elapsed | 86681 | -| total_timesteps | 2069504 | -| train/ | | -| approx_kl | 0.048866853 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 161670 | -| policy_gradient_loss | 0.0112 | -| std | 0.00865 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16169 | -| time_elapsed | 86687 | -| total_timesteps | 2069632 | -| train/ | | -| approx_kl | 0.048728272 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.0577 | -| n_updates | 161680 | -| policy_gradient_loss | 0.0423 | -| std | 0.00865 | -| value_loss | 9.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16170 | -| time_elapsed | 86692 | -| total_timesteps | 2069760 | -| train/ | | -| approx_kl | 0.017483763 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.00795 | -| n_updates | 161690 | -| policy_gradient_loss | 0.0223 | -| std | 0.00865 | -| value_loss | 5.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 16171 | -| time_elapsed | 86697 | -| total_timesteps | 2069888 | -| train/ | | -| approx_kl | 0.063417934 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0597 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 161700 | -| policy_gradient_loss | 0.0323 | -| std | 0.00865 | -| value_loss | 3.54e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16172 | -| time_elapsed | 86704 | -| total_timesteps | 2070016 | -| train/ | | -| approx_kl | 0.0034069628 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.00955 | -| n_updates | 161710 | -| policy_gradient_loss | -0.00273 | -| std | 0.00865 | -| value_loss | 2.52e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16173 | -| time_elapsed | 86718 | -| total_timesteps | 2070144 | -| train/ | | -| approx_kl | 0.08929273 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -2.06 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 161720 | -| policy_gradient_loss | -0.0136 | -| std | 0.00866 | -| value_loss | 0.0028 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16174 | -| time_elapsed | 86722 | -| total_timesteps | 2070272 | -| train/ | | -| approx_kl | 0.0016941684 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.0571 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 161730 | -| policy_gradient_loss | 0.00885 | -| std | 0.00866 | -| value_loss | 6.51e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16175 | -| time_elapsed | 86728 | -| total_timesteps | 2070400 | -| train/ | | -| approx_kl | 0.009120299 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.00312 | -| n_updates | 161740 | -| policy_gradient_loss | 0.0219 | -| std | 0.00868 | -| value_loss | 7.81e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16176 | -| time_elapsed | 86732 | -| total_timesteps | 2070528 | -| train/ | | -| approx_kl | 0.0021165279 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.259 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 161750 | -| policy_gradient_loss | 0.0118 | -| std | 0.00869 | -| value_loss | 1.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16177 | -| time_elapsed | 86737 | -| total_timesteps | 2070656 | -| train/ | | -| approx_kl | 0.048582323 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 161760 | -| policy_gradient_loss | 0.0233 | -| std | 0.00869 | -| value_loss | 8.19e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16178 | -| time_elapsed | 86742 | -| total_timesteps | 2070784 | -| train/ | | -| approx_kl | 0.0891596 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 161770 | -| policy_gradient_loss | -0.00315 | -| std | 0.00869 | -| value_loss | 6.71e-08 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 16179 | -| time_elapsed | 86748 | -| total_timesteps | 2070912 | -| train/ | | -| approx_kl | 0.00053977966 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 161780 | -| policy_gradient_loss | 0.0145 | -| std | 0.0087 | -| value_loss | 4.79e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16180 | -| time_elapsed | 86753 | -| total_timesteps | 2071040 | -| train/ | | -| approx_kl | 0.10870602 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0662 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 161790 | -| policy_gradient_loss | 0.00873 | -| std | 0.0087 | -| value_loss | 4.61e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16181 | -| time_elapsed | 86765 | -| total_timesteps | 2071168 | -| train/ | | -| approx_kl | 0.1230291 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.658 | -| learning_rate | 0.0003 | -| loss | -0.0241 | -| n_updates | 161800 | -| policy_gradient_loss | -0.0162 | -| std | 0.0087 | -| value_loss | 0.000881 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16182 | -| time_elapsed | 86769 | -| total_timesteps | 2071296 | -| train/ | | -| approx_kl | 0.00078268955 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00608 | -| learning_rate | 0.0003 | -| loss | 0.00174 | -| n_updates | 161810 | -| policy_gradient_loss | -0.000124 | -| std | 0.0087 | -| value_loss | 2.28e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16183 | -| time_elapsed | 86775 | -| total_timesteps | 2071424 | -| train/ | | -| approx_kl | 0.04489986 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | 0.00275 | -| n_updates | 161820 | -| policy_gradient_loss | 0.035 | -| std | 0.00871 | -| value_loss | 1.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16184 | -| time_elapsed | 86780 | -| total_timesteps | 2071552 | -| train/ | | -| approx_kl | 0.023958538 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 161830 | -| policy_gradient_loss | 0.0163 | -| std | 0.00871 | -| value_loss | 8.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16185 | -| time_elapsed | 86787 | -| total_timesteps | 2071680 | -| train/ | | -| approx_kl | 0.117760405 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.0466 | -| n_updates | 161840 | -| policy_gradient_loss | 0.0209 | -| std | 0.00871 | -| value_loss | 4.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16186 | -| time_elapsed | 86795 | -| total_timesteps | 2071808 | -| train/ | | -| approx_kl | 0.028378034 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 161850 | -| policy_gradient_loss | 0.0391 | -| std | 0.00871 | -| value_loss | 7.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 16187 | -| time_elapsed | 86800 | -| total_timesteps | 2071936 | -| train/ | | -| approx_kl | 0.013009728 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -8.28 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 161860 | -| policy_gradient_loss | 0.00619 | -| std | 0.00871 | -| value_loss | 1.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16188 | -| time_elapsed | 86805 | -| total_timesteps | 2072064 | -| train/ | | -| approx_kl | 0.11442949 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 161870 | -| policy_gradient_loss | 0.0167 | -| std | 0.00869 | -| value_loss | 6.22e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16189 | -| time_elapsed | 86815 | -| total_timesteps | 2072192 | -| train/ | | -| approx_kl | 0.009652113 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -5.26 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 161880 | -| policy_gradient_loss | -0.0152 | -| std | 0.00867 | -| value_loss | 0.00322 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16190 | -| time_elapsed | 86822 | -| total_timesteps | 2072320 | -| train/ | | -| approx_kl | 0.11620843 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 161890 | -| policy_gradient_loss | 0.0881 | -| std | 0.00867 | -| value_loss | 3.37e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16191 | -| time_elapsed | 86828 | -| total_timesteps | 2072448 | -| train/ | | -| approx_kl | 0.08405809 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 161900 | -| policy_gradient_loss | 0.0933 | -| std | 0.00867 | -| value_loss | 8.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16192 | -| time_elapsed | 86833 | -| total_timesteps | 2072576 | -| train/ | | -| approx_kl | 0.08910183 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 161910 | -| policy_gradient_loss | 0.112 | -| std | 0.00867 | -| value_loss | 4.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16193 | -| time_elapsed | 86838 | -| total_timesteps | 2072704 | -| train/ | | -| approx_kl | 0.08594765 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 161920 | -| policy_gradient_loss | 0.0719 | -| std | 0.00867 | -| value_loss | 3.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16194 | -| time_elapsed | 86843 | -| total_timesteps | 2072832 | -| train/ | | -| approx_kl | 0.012305275 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.00618 | -| n_updates | 161930 | -| policy_gradient_loss | 0.0137 | -| std | 0.00865 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 16195 | -| time_elapsed | 86849 | -| total_timesteps | 2072960 | -| train/ | | -| approx_kl | 0.112193935 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 161940 | -| policy_gradient_loss | 0.0145 | -| std | 0.00864 | -| value_loss | 6.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16196 | -| time_elapsed | 86855 | -| total_timesteps | 2073088 | -| train/ | | -| approx_kl | 0.007034552 | -| clip_fraction | 0.0352 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00732 | -| learning_rate | 0.0003 | -| loss | -0.000628 | -| n_updates | 161950 | -| policy_gradient_loss | -0.000495 | -| std | 0.00864 | -| value_loss | 1.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16197 | -| time_elapsed | 86868 | -| total_timesteps | 2073216 | -| train/ | | -| approx_kl | 0.17221323 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 161960 | -| policy_gradient_loss | -0.0113 | -| std | 0.00864 | -| value_loss | 8.27e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16198 | -| time_elapsed | 86872 | -| total_timesteps | 2073344 | -| train/ | | -| approx_kl | 0.11511466 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.253 | -| learning_rate | 0.0003 | -| loss | 0.0622 | -| n_updates | 161970 | -| policy_gradient_loss | 0.0345 | -| std | 0.00863 | -| value_loss | 2.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16199 | -| time_elapsed | 86877 | -| total_timesteps | 2073472 | -| train/ | | -| approx_kl | 0.022725835 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 161980 | -| policy_gradient_loss | 0.0332 | -| std | 0.00863 | -| value_loss | 6.26e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16200 | -| time_elapsed | 86881 | -| total_timesteps | 2073600 | -| train/ | | -| approx_kl | 0.009326016 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 161990 | -| policy_gradient_loss | -0.00201 | -| std | 0.00863 | -| value_loss | 4.15e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16201 | -| time_elapsed | 86886 | -| total_timesteps | 2073728 | -| train/ | | -| approx_kl | 0.020748135 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.00109 | -| n_updates | 162000 | -| policy_gradient_loss | 0.0344 | -| std | 0.00863 | -| value_loss | 2.62e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16202 | -| time_elapsed | 86889 | -| total_timesteps | 2073856 | -| train/ | | -| approx_kl | 0.0029411674 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 162010 | -| policy_gradient_loss | 0.0565 | -| std | 0.00863 | -| value_loss | 1.99e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 16203 | -| time_elapsed | 86896 | -| total_timesteps | 2073984 | -| train/ | | -| approx_kl | 0.056952424 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.0671 | -| n_updates | 162020 | -| policy_gradient_loss | 0.108 | -| std | 0.00863 | -| value_loss | 1.66e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16204 | -| time_elapsed | 86901 | -| total_timesteps | 2074112 | -| train/ | | -| approx_kl | 0.044263236 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 162030 | -| policy_gradient_loss | 0.0283 | -| std | 0.00863 | -| value_loss | 8.95e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16205 | -| time_elapsed | 86913 | -| total_timesteps | 2074240 | -| train/ | | -| approx_kl | 0.32935473 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -6.79 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 162040 | -| policy_gradient_loss | 0.0161 | -| std | 0.00863 | -| value_loss | 0.00313 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16206 | -| time_elapsed | 86918 | -| total_timesteps | 2074368 | -| train/ | | -| approx_kl | 0.15501294 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 162050 | -| policy_gradient_loss | 0.0205 | -| std | 0.00866 | -| value_loss | 6.65e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16207 | -| time_elapsed | 86924 | -| total_timesteps | 2074496 | -| train/ | | -| approx_kl | 0.015588341 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.625 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 162060 | -| policy_gradient_loss | -0.00435 | -| std | 0.00867 | -| value_loss | 4.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16208 | -| time_elapsed | 86929 | -| total_timesteps | 2074624 | -| train/ | | -| approx_kl | 0.027797777 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | 0.00313 | -| n_updates | 162070 | -| policy_gradient_loss | 0.000438 | -| std | 0.00868 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16209 | -| time_elapsed | 86933 | -| total_timesteps | 2074752 | -| train/ | | -| approx_kl | 0.028544443 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00619 | -| learning_rate | 0.0003 | -| loss | 0.00504 | -| n_updates | 162080 | -| policy_gradient_loss | 0.00253 | -| std | 0.00868 | -| value_loss | 1.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16210 | -| time_elapsed | 86939 | -| total_timesteps | 2074880 | -| train/ | | -| approx_kl | 0.004608384 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 162090 | -| policy_gradient_loss | 0.00144 | -| std | 0.00868 | -| value_loss | 9.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16211 | -| time_elapsed | 86945 | -| total_timesteps | 2075008 | -| train/ | | -| approx_kl | 0.021068767 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.00933 | -| n_updates | 162100 | -| policy_gradient_loss | 0.107 | -| std | 0.00868 | -| value_loss | 4.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16212 | -| time_elapsed | 86958 | -| total_timesteps | 2075136 | -| train/ | | -| approx_kl | 0.002967217 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0238 | -| n_updates | 162110 | -| policy_gradient_loss | -0.0152 | -| std | 0.00868 | -| value_loss | 1.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16213 | -| time_elapsed | 86962 | -| total_timesteps | 2075264 | -| train/ | | -| approx_kl | 0.02428055 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.537 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 162120 | -| policy_gradient_loss | -0.00242 | -| std | 0.00868 | -| value_loss | 4.95e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16214 | -| time_elapsed | 86967 | -| total_timesteps | 2075392 | -| train/ | | -| approx_kl | 0.0018742178 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.00561 | -| n_updates | 162130 | -| policy_gradient_loss | 0.0111 | -| std | 0.00868 | -| value_loss | 5.29e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16215 | -| time_elapsed | 86972 | -| total_timesteps | 2075520 | -| train/ | | -| approx_kl | 0.08943617 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00642 | -| learning_rate | 0.0003 | -| loss | 0.0418 | -| n_updates | 162140 | -| policy_gradient_loss | 0.0103 | -| std | 0.00868 | -| value_loss | 1.5e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16216 | -| time_elapsed | 86975 | -| total_timesteps | 2075648 | -| train/ | | -| approx_kl | 0.008268448 | -| clip_fraction | 0.0477 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | -0.000605 | -| n_updates | 162150 | -| policy_gradient_loss | -0.000488 | -| std | 0.00868 | -| value_loss | 9.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16217 | -| time_elapsed | 86979 | -| total_timesteps | 2075776 | -| train/ | | -| approx_kl | 0.013147252 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | -0.00999 | -| n_updates | 162160 | -| policy_gradient_loss | 0.00961 | -| std | 0.00868 | -| value_loss | 7.32e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16218 | -| time_elapsed | 86985 | -| total_timesteps | 2075904 | -| train/ | | -| approx_kl | 0.1605116 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 162170 | -| policy_gradient_loss | 0.0993 | -| std | 0.00868 | -| value_loss | 5.46e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16219 | -| time_elapsed | 86990 | -| total_timesteps | 2076032 | -| train/ | | -| approx_kl | 0.036465496 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 162180 | -| policy_gradient_loss | 0.0177 | -| std | 0.00868 | -| value_loss | 3.04e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16220 | -| time_elapsed | 86998 | -| total_timesteps | 2076160 | -| train/ | | -| approx_kl | 0.0041706385 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 162190 | -| policy_gradient_loss | -0.00559 | -| std | 0.00867 | -| value_loss | 0.0017 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16221 | -| time_elapsed | 87004 | -| total_timesteps | 2076288 | -| train/ | | -| approx_kl | 0.0004335367 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 162200 | -| policy_gradient_loss | 0.0179 | -| std | 0.00867 | -| value_loss | 2.43e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16222 | -| time_elapsed | 87009 | -| total_timesteps | 2076416 | -| train/ | | -| approx_kl | 0.050280333 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 162210 | -| policy_gradient_loss | 0.0197 | -| std | 0.00867 | -| value_loss | 5.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16223 | -| time_elapsed | 87013 | -| total_timesteps | 2076544 | -| train/ | | -| approx_kl | 0.06491692 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0993 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 162220 | -| policy_gradient_loss | -0.00413 | -| std | 0.00867 | -| value_loss | 2.18e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16224 | -| time_elapsed | 87017 | -| total_timesteps | 2076672 | -| train/ | | -| approx_kl | 0.20832652 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 162230 | -| policy_gradient_loss | 0.0969 | -| std | 0.00867 | -| value_loss | 1.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16225 | -| time_elapsed | 87021 | -| total_timesteps | 2076800 | -| train/ | | -| approx_kl | 0.034854524 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 162240 | -| policy_gradient_loss | 0.0142 | -| std | 0.00867 | -| value_loss | 1.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16226 | -| time_elapsed | 87026 | -| total_timesteps | 2076928 | -| train/ | | -| approx_kl | 0.07785311 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 162250 | -| policy_gradient_loss | 0.0109 | -| std | 0.00867 | -| value_loss | 7.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16227 | -| time_elapsed | 87031 | -| total_timesteps | 2077056 | -| train/ | | -| approx_kl | 0.006375619 | -| clip_fraction | 0.0445 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.00028 | -| n_updates | 162260 | -| policy_gradient_loss | 7.12e-05 | -| std | 0.00867 | -| value_loss | 5.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16228 | -| time_elapsed | 87039 | -| total_timesteps | 2077184 | -| train/ | | -| approx_kl | 0.015067337 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 162270 | -| policy_gradient_loss | 0.00132 | -| std | 0.00866 | -| value_loss | 0.00011 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16229 | -| time_elapsed | 87044 | -| total_timesteps | 2077312 | -| train/ | | -| approx_kl | 0.06446706 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.035 | -| n_updates | 162280 | -| policy_gradient_loss | 0.0178 | -| std | 0.00866 | -| value_loss | 2.86e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16230 | -| time_elapsed | 87049 | -| total_timesteps | 2077440 | -| train/ | | -| approx_kl | 0.014395235 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00565 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 162290 | -| policy_gradient_loss | -0.00221 | -| std | 0.00867 | -| value_loss | 1.26e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16231 | -| time_elapsed | 87054 | -| total_timesteps | 2077568 | -| train/ | | -| approx_kl | 0.0019140253 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 162300 | -| policy_gradient_loss | 0.0191 | -| std | 0.00867 | -| value_loss | 2.63e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16232 | -| time_elapsed | 87058 | -| total_timesteps | 2077696 | -| train/ | | -| approx_kl | 0.25253952 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00233 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 162310 | -| policy_gradient_loss | 0.0433 | -| std | 0.00867 | -| value_loss | 7.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16233 | -| time_elapsed | 87064 | -| total_timesteps | 2077824 | -| train/ | | -| approx_kl | 0.003534358 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | -0.000602 | -| n_updates | 162320 | -| policy_gradient_loss | 0.00322 | -| std | 0.00867 | -| value_loss | 4.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16234 | -| time_elapsed | 87069 | -| total_timesteps | 2077952 | -| train/ | | -| approx_kl | 0.051433574 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 162330 | -| policy_gradient_loss | 0.00734 | -| std | 0.00866 | -| value_loss | 9.13e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16235 | -| time_elapsed | 87073 | -| total_timesteps | 2078080 | -| train/ | | -| approx_kl | 0.06317104 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 162340 | -| policy_gradient_loss | 0.00711 | -| std | 0.00866 | -| value_loss | 3.07e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16236 | -| time_elapsed | 87084 | -| total_timesteps | 2078208 | -| train/ | | -| approx_kl | 0.0319499 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 162350 | -| policy_gradient_loss | -0.0136 | -| std | 0.00865 | -| value_loss | 1.76e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16237 | -| time_elapsed | 87089 | -| total_timesteps | 2078336 | -| train/ | | -| approx_kl | 0.024296312 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00247 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 162360 | -| policy_gradient_loss | -0.000269 | -| std | 0.00865 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16238 | -| time_elapsed | 87093 | -| total_timesteps | 2078464 | -| train/ | | -| approx_kl | 0.0041432395 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.000885 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 162370 | -| policy_gradient_loss | 0.00202 | -| std | 0.00865 | -| value_loss | 3.71e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16239 | -| time_elapsed | 87097 | -| total_timesteps | 2078592 | -| train/ | | -| approx_kl | 0.014867578 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 162380 | -| policy_gradient_loss | 0.0643 | -| std | 0.00863 | -| value_loss | 4.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16240 | -| time_elapsed | 87102 | -| total_timesteps | 2078720 | -| train/ | | -| approx_kl | 0.005826721 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00865 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 162390 | -| policy_gradient_loss | 0.0136 | -| std | 0.00863 | -| value_loss | 4.73e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16241 | -| time_elapsed | 87106 | -| total_timesteps | 2078848 | -| train/ | | -| approx_kl | 0.13047078 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 162400 | -| policy_gradient_loss | 0.0392 | -| std | 0.00862 | -| value_loss | 3.57e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16242 | -| time_elapsed | 87110 | -| total_timesteps | 2078976 | -| train/ | | -| approx_kl | 0.03004355 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 162410 | -| policy_gradient_loss | 0.0285 | -| std | 0.00863 | -| value_loss | 1.59e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16243 | -| time_elapsed | 87115 | -| total_timesteps | 2079104 | -| train/ | | -| approx_kl | 0.47602051 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.201 | -| n_updates | 162420 | -| policy_gradient_loss | 0.115 | -| std | 0.00863 | -| value_loss | 4.84e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16244 | -| time_elapsed | 87125 | -| total_timesteps | 2079232 | -| train/ | | -| approx_kl | 0.11427201 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 162430 | -| policy_gradient_loss | -0.00468 | -| std | 0.00863 | -| value_loss | 8.07e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16245 | -| time_elapsed | 87131 | -| total_timesteps | 2079360 | -| train/ | | -| approx_kl | 0.008796526 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00662 | -| learning_rate | 0.0003 | -| loss | 0.00714 | -| n_updates | 162440 | -| policy_gradient_loss | 0.0152 | -| std | 0.00863 | -| value_loss | 2.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16246 | -| time_elapsed | 87136 | -| total_timesteps | 2079488 | -| train/ | | -| approx_kl | 0.26393124 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0773 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 162450 | -| policy_gradient_loss | 0.0989 | -| std | 0.00863 | -| value_loss | 5.54e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16247 | -| time_elapsed | 87141 | -| total_timesteps | 2079616 | -| train/ | | -| approx_kl | 0.038767274 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 162460 | -| policy_gradient_loss | 0.0148 | -| std | 0.00862 | -| value_loss | 8.59e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16248 | -| time_elapsed | 87145 | -| total_timesteps | 2079744 | -| train/ | | -| approx_kl | 0.0019983305 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0741 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 162470 | -| policy_gradient_loss | 0.00338 | -| std | 0.00862 | -| value_loss | 3.05e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16249 | -| time_elapsed | 87150 | -| total_timesteps | 2079872 | -| train/ | | -| approx_kl | 0.03244462 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.00839 | -| n_updates | 162480 | -| policy_gradient_loss | 0.0119 | -| std | 0.00861 | -| value_loss | 1.01e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16250 | -| time_elapsed | 87155 | -| total_timesteps | 2080000 | -| train/ | | -| approx_kl | 0.02247516 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 162490 | -| policy_gradient_loss | 9.71e-05 | -| std | 0.00861 | -| value_loss | 5.53e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16251 | -| time_elapsed | 87160 | -| total_timesteps | 2080128 | -| train/ | | -| approx_kl | 0.001635693 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00466 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 162500 | -| policy_gradient_loss | 0.0123 | -| std | 0.0086 | -| value_loss | 2.26e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16252 | -| time_elapsed | 87172 | -| total_timesteps | 2080256 | -| train/ | | -| approx_kl | 0.30182916 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 162510 | -| policy_gradient_loss | -0.00136 | -| std | 0.0086 | -| value_loss | 5.36e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16253 | -| time_elapsed | 87176 | -| total_timesteps | 2080384 | -| train/ | | -| approx_kl | 0.025887718 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 162520 | -| policy_gradient_loss | 0.0154 | -| std | 0.0086 | -| value_loss | 1.27e-09 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16254 | -| time_elapsed | 87182 | -| total_timesteps | 2080512 | -| train/ | | -| approx_kl | 0.400731 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.991 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 162530 | -| policy_gradient_loss | 0.0269 | -| std | 0.0086 | -| value_loss | 1.33e-10 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16255 | -| time_elapsed | 87187 | -| total_timesteps | 2080640 | -| train/ | | -| approx_kl | 0.02944895 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.599 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 162540 | -| policy_gradient_loss | -0.00219 | -| std | 0.00859 | -| value_loss | 4.01e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16256 | -| time_elapsed | 87192 | -| total_timesteps | 2080768 | -| train/ | | -| approx_kl | 0.024280012 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.00189 | -| n_updates | 162550 | -| policy_gradient_loss | 0.000477 | -| std | 0.00859 | -| value_loss | 2.38e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 16257 | -| time_elapsed | 87196 | -| total_timesteps | 2080896 | -| train/ | | -| approx_kl | 0.022559678 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 162560 | -| policy_gradient_loss | -0.00652 | -| std | 0.00859 | -| value_loss | 1.61e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16258 | -| time_elapsed | 87201 | -| total_timesteps | 2081024 | -| train/ | | -| approx_kl | 6.811926e-05 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 162570 | -| policy_gradient_loss | -0.000858 | -| std | 0.00859 | -| value_loss | 1.16e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16259 | -| time_elapsed | 87212 | -| total_timesteps | 2081152 | -| train/ | | -| approx_kl | 0.09196836 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 162580 | -| policy_gradient_loss | -0.00909 | -| std | 0.00859 | -| value_loss | 0.000257 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16260 | -| time_elapsed | 87217 | -| total_timesteps | 2081280 | -| train/ | | -| approx_kl | 0.08864835 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.0829 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 162590 | -| policy_gradient_loss | 0.0341 | -| std | 0.00859 | -| value_loss | 2.94e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16261 | -| time_elapsed | 87221 | -| total_timesteps | 2081408 | -| train/ | | -| approx_kl | 0.2212665 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 162600 | -| policy_gradient_loss | 0.122 | -| std | 0.00859 | -| value_loss | 1.8e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16262 | -| time_elapsed | 87226 | -| total_timesteps | 2081536 | -| train/ | | -| approx_kl | 0.13179101 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | 0.0796 | -| n_updates | 162610 | -| policy_gradient_loss | 0.0683 | -| std | 0.0086 | -| value_loss | 1.46e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16263 | -| time_elapsed | 87229 | -| total_timesteps | 2081664 | -| train/ | | -| approx_kl | 0.08748207 | -| clip_fraction | 0.607 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0566 | -| n_updates | 162620 | -| policy_gradient_loss | 0.0729 | -| std | 0.0086 | -| value_loss | 1.01e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16264 | -| time_elapsed | 87233 | -| total_timesteps | 2081792 | -| train/ | | -| approx_kl | 0.021980034 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 162630 | -| policy_gradient_loss | 0.0126 | -| std | 0.0086 | -| value_loss | 4.74e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 16265 | -| time_elapsed | 87237 | -| total_timesteps | 2081920 | -| train/ | | -| approx_kl | 0.3580755 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 162640 | -| policy_gradient_loss | 0.0542 | -| std | 0.0086 | -| value_loss | 3.59e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16266 | -| time_elapsed | 87241 | -| total_timesteps | 2082048 | -| train/ | | -| approx_kl | 0.023675349 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 162650 | -| policy_gradient_loss | 0.00935 | -| std | 0.00859 | -| value_loss | 2.53e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16267 | -| time_elapsed | 87251 | -| total_timesteps | 2082176 | -| train/ | | -| approx_kl | 0.0134852985 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.113 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 162660 | -| policy_gradient_loss | -0.018 | -| std | 0.00858 | -| value_loss | 0.00133 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16268 | -| time_elapsed | 87257 | -| total_timesteps | 2082304 | -| train/ | | -| approx_kl | 0.01809268 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.000256 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 162670 | -| policy_gradient_loss | 0.0736 | -| std | 0.00858 | -| value_loss | 5.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16269 | -| time_elapsed | 87262 | -| total_timesteps | 2082432 | -| train/ | | -| approx_kl | 0.011633374 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | 0.00237 | -| n_updates | 162680 | -| policy_gradient_loss | 0.0256 | -| std | 0.00857 | -| value_loss | 1.93e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16270 | -| time_elapsed | 87267 | -| total_timesteps | 2082560 | -| train/ | | -| approx_kl | 0.19430178 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 162690 | -| policy_gradient_loss | 0.00855 | -| std | 0.00857 | -| value_loss | 1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16271 | -| time_elapsed | 87271 | -| total_timesteps | 2082688 | -| train/ | | -| approx_kl | 0.008627441 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 162700 | -| policy_gradient_loss | 0.0406 | -| std | 0.00858 | -| value_loss | 4.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16272 | -| time_elapsed | 87277 | -| total_timesteps | 2082816 | -| train/ | | -| approx_kl | 0.17772512 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 162710 | -| policy_gradient_loss | 0.0156 | -| std | 0.00859 | -| value_loss | 2.1e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16273 | -| time_elapsed | 87281 | -| total_timesteps | 2082944 | -| train/ | | -| approx_kl | 0.00017105648 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0561 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 162720 | -| policy_gradient_loss | 0.00294 | -| std | 0.00859 | -| value_loss | 1.27e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16274 | -| time_elapsed | 87286 | -| total_timesteps | 2083072 | -| train/ | | -| approx_kl | 4.3927692e-05 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.000489 | -| n_updates | 162730 | -| policy_gradient_loss | -0.000172 | -| std | 0.00859 | -| value_loss | 5.77e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16275 | -| time_elapsed | 87293 | -| total_timesteps | 2083200 | -| train/ | | -| approx_kl | 0.0038088504 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 162740 | -| policy_gradient_loss | -0.00789 | -| std | 0.0086 | -| value_loss | 0.000129 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16276 | -| time_elapsed | 87298 | -| total_timesteps | 2083328 | -| train/ | | -| approx_kl | 0.15476689 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 162750 | -| policy_gradient_loss | 0.101 | -| std | 0.0086 | -| value_loss | 8.92e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16277 | -| time_elapsed | 87302 | -| total_timesteps | 2083456 | -| train/ | | -| approx_kl | 0.099087894 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.0627 | -| n_updates | 162760 | -| policy_gradient_loss | 0.0846 | -| std | 0.0086 | -| value_loss | 7.3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16278 | -| time_elapsed | 87307 | -| total_timesteps | 2083584 | -| train/ | | -| approx_kl | 0.016427355 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | 0.00786 | -| n_updates | 162770 | -| policy_gradient_loss | 0.0128 | -| std | 0.0086 | -| value_loss | 4.19e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16279 | -| time_elapsed | 87312 | -| total_timesteps | 2083712 | -| train/ | | -| approx_kl | 0.08329061 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.0419 | -| n_updates | 162780 | -| policy_gradient_loss | 0.0102 | -| std | 0.0086 | -| value_loss | 1.24e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16280 | -| time_elapsed | 87316 | -| total_timesteps | 2083840 | -| train/ | | -| approx_kl | 0.01318168 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.000374 | -| n_updates | 162790 | -| policy_gradient_loss | 0.0177 | -| std | 0.0086 | -| value_loss | 5.81e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16281 | -| time_elapsed | 87321 | -| total_timesteps | 2083968 | -| train/ | | -| approx_kl | 0.061749723 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 162800 | -| policy_gradient_loss | 0.0162 | -| std | 0.0086 | -| value_loss | 4.97e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16282 | -| time_elapsed | 87325 | -| total_timesteps | 2084096 | -| train/ | | -| approx_kl | 0.3154665 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | 0.0739 | -| n_updates | 162810 | -| policy_gradient_loss | 0.021 | -| std | 0.0086 | -| value_loss | 3.4e-10 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16283 | -| time_elapsed | 87335 | -| total_timesteps | 2084224 | -| train/ | | -| approx_kl | 0.0014269813 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 162820 | -| policy_gradient_loss | -0.0132 | -| std | 0.0086 | -| value_loss | 0.000263 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16284 | -| time_elapsed | 87340 | -| total_timesteps | 2084352 | -| train/ | | -| approx_kl | 0.0020913822 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 162830 | -| policy_gradient_loss | 0.00624 | -| std | 0.0086 | -| value_loss | 1.04e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16285 | -| time_elapsed | 87344 | -| total_timesteps | 2084480 | -| train/ | | -| approx_kl | 0.0072012786 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | 0.00493 | -| n_updates | 162840 | -| policy_gradient_loss | 0.0132 | -| std | 0.00859 | -| value_loss | 3.94e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16286 | -| time_elapsed | 87348 | -| total_timesteps | 2084608 | -| train/ | | -| approx_kl | 0.23631032 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.238 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 162850 | -| policy_gradient_loss | 0.0985 | -| std | 0.00859 | -| value_loss | 2.56e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16287 | -| time_elapsed | 87352 | -| total_timesteps | 2084736 | -| train/ | | -| approx_kl | 0.12326681 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 162860 | -| policy_gradient_loss | 0.0941 | -| std | 0.00859 | -| value_loss | 1.84e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16288 | -| time_elapsed | 87356 | -| total_timesteps | 2084864 | -| train/ | | -| approx_kl | 0.093766704 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.058 | -| n_updates | 162870 | -| policy_gradient_loss | 0.0891 | -| std | 0.00859 | -| value_loss | 1.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16289 | -| time_elapsed | 87360 | -| total_timesteps | 2084992 | -| train/ | | -| approx_kl | 0.017697234 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.00605 | -| n_updates | 162880 | -| policy_gradient_loss | 0.013 | -| std | 0.00859 | -| value_loss | 9.69e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16290 | -| time_elapsed | 87365 | -| total_timesteps | 2085120 | -| train/ | | -| approx_kl | 0.08753952 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0606 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 162890 | -| policy_gradient_loss | 0.00793 | -| std | 0.00859 | -| value_loss | 4.11e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16291 | -| time_elapsed | 87375 | -| total_timesteps | 2085248 | -| train/ | | -| approx_kl | 0.0005123266 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 162900 | -| policy_gradient_loss | -0.00465 | -| std | 0.00859 | -| value_loss | 0.00016 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16292 | -| time_elapsed | 87380 | -| total_timesteps | 2085376 | -| train/ | | -| approx_kl | 0.02400208 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.00677 | -| n_updates | 162910 | -| policy_gradient_loss | 0.0332 | -| std | 0.00859 | -| value_loss | 1.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16293 | -| time_elapsed | 87384 | -| total_timesteps | 2085504 | -| train/ | | -| approx_kl | 0.09759496 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.0024 | -| learning_rate | 0.0003 | -| loss | 0.0548 | -| n_updates | 162920 | -| policy_gradient_loss | 0.0264 | -| std | 0.0086 | -| value_loss | 9.6e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16294 | -| time_elapsed | 87389 | -| total_timesteps | 2085632 | -| train/ | | -| approx_kl | 0.0017243247 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 162930 | -| policy_gradient_loss | 0.0035 | -| std | 0.00861 | -| value_loss | 1.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16295 | -| time_elapsed | 87393 | -| total_timesteps | 2085760 | -| train/ | | -| approx_kl | 0.052375518 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.00791 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 162940 | -| policy_gradient_loss | 0.0523 | -| std | 0.00862 | -| value_loss | 3.4e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16296 | -| time_elapsed | 87398 | -| total_timesteps | 2085888 | -| train/ | | -| approx_kl | 0.14120178 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.0762 | -| n_updates | 162950 | -| policy_gradient_loss | 0.0318 | -| std | 0.00862 | -| value_loss | 2.82e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16297 | -| time_elapsed | 87401 | -| total_timesteps | 2086016 | -| train/ | | -| approx_kl | 0.0010084696 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 162960 | -| policy_gradient_loss | 0.0104 | -| std | 0.00862 | -| value_loss | 1.74e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16298 | -| time_elapsed | 87409 | -| total_timesteps | 2086144 | -| train/ | | -| approx_kl | 0.017500866 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 162970 | -| policy_gradient_loss | -0.00211 | -| std | 0.00862 | -| value_loss | 0.00414 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16299 | -| time_elapsed | 87414 | -| total_timesteps | 2086272 | -| train/ | | -| approx_kl | 0.09159997 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | 0.00964 | -| n_updates | 162980 | -| policy_gradient_loss | 0.00344 | -| std | 0.00862 | -| value_loss | 9.27e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16300 | -| time_elapsed | 87419 | -| total_timesteps | 2086400 | -| train/ | | -| approx_kl | 0.07449118 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00324 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 162990 | -| policy_gradient_loss | 0.00722 | -| std | 0.00863 | -| value_loss | 8.58e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16301 | -| time_elapsed | 87425 | -| total_timesteps | 2086528 | -| train/ | | -| approx_kl | 0.29276097 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.0958 | -| n_updates | 163000 | -| policy_gradient_loss | 0.0236 | -| std | 0.00863 | -| value_loss | 5.78e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16302 | -| time_elapsed | 87429 | -| total_timesteps | 2086656 | -| train/ | | -| approx_kl | 0.0150556415 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 163010 | -| policy_gradient_loss | 0.0029 | -| std | 0.00863 | -| value_loss | 3.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16303 | -| time_elapsed | 87435 | -| total_timesteps | 2086784 | -| train/ | | -| approx_kl | 0.03434579 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.00656 | -| n_updates | 163020 | -| policy_gradient_loss | 0.00212 | -| std | 0.00862 | -| value_loss | 2.52e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16304 | -| time_elapsed | 87441 | -| total_timesteps | 2086912 | -| train/ | | -| approx_kl | 0.0041627632 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.00702 | -| n_updates | 163030 | -| policy_gradient_loss | 0.00065 | -| std | 0.00862 | -| value_loss | 1.6e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16305 | -| time_elapsed | 87446 | -| total_timesteps | 2087040 | -| train/ | | -| approx_kl | 0.056171466 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 163040 | -| policy_gradient_loss | 0.00519 | -| std | 0.00862 | -| value_loss | 1.08e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16306 | -| time_elapsed | 87458 | -| total_timesteps | 2087168 | -| train/ | | -| approx_kl | 0.0051593785 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.934 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 163050 | -| policy_gradient_loss | -0.0132 | -| std | 0.00862 | -| value_loss | 0.000692 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16307 | -| time_elapsed | 87463 | -| total_timesteps | 2087296 | -| train/ | | -| approx_kl | 0.027616864 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00124 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 163060 | -| policy_gradient_loss | 0.0828 | -| std | 0.00861 | -| value_loss | 1.07e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16308 | -| time_elapsed | 87469 | -| total_timesteps | 2087424 | -| train/ | | -| approx_kl | 0.09035151 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.811 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 163070 | -| policy_gradient_loss | -0.0079 | -| std | 0.00861 | -| value_loss | 8.65e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16309 | -| time_elapsed | 87474 | -| total_timesteps | 2087552 | -| train/ | | -| approx_kl | 0.08062285 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | 0.0738 | -| n_updates | 163080 | -| policy_gradient_loss | 0.0131 | -| std | 0.00861 | -| value_loss | 4.95e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16310 | -| time_elapsed | 87479 | -| total_timesteps | 2087680 | -| train/ | | -| approx_kl | 0.3936484 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0749 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 163090 | -| policy_gradient_loss | 0.0489 | -| std | 0.00861 | -| value_loss | 2.42e-08 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16311 | -| time_elapsed | 87482 | -| total_timesteps | 2087808 | -| train/ | | -| approx_kl | 0.00059441663 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 163100 | -| policy_gradient_loss | -0.0021 | -| std | 0.0086 | -| value_loss | 3.12e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 16312 | -| time_elapsed | 87487 | -| total_timesteps | 2087936 | -| train/ | | -| approx_kl | 0.0051549687 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 163110 | -| policy_gradient_loss | 0.0026 | -| std | 0.00861 | -| value_loss | 1.72e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16313 | -| time_elapsed | 87491 | -| total_timesteps | 2088064 | -| train/ | | -| approx_kl | 0.047336362 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 163120 | -| policy_gradient_loss | 0.0105 | -| std | 0.00861 | -| value_loss | 2.63e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16314 | -| time_elapsed | 87500 | -| total_timesteps | 2088192 | -| train/ | | -| approx_kl | 0.06619743 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.516 | -| learning_rate | 0.0003 | -| loss | -0.00858 | -| n_updates | 163130 | -| policy_gradient_loss | -0.00839 | -| std | 0.00861 | -| value_loss | 0.00102 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16315 | -| time_elapsed | 87504 | -| total_timesteps | 2088320 | -| train/ | | -| approx_kl | 0.0072767762 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 163140 | -| policy_gradient_loss | 0.0066 | -| std | 0.00865 | -| value_loss | 6.57e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16316 | -| time_elapsed | 87508 | -| total_timesteps | 2088448 | -| train/ | | -| approx_kl | 0.06757349 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | -0.000118 | -| n_updates | 163150 | -| policy_gradient_loss | -0.0107 | -| std | 0.00868 | -| value_loss | 5.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16317 | -| time_elapsed | 87512 | -| total_timesteps | 2088576 | -| train/ | | -| approx_kl | 0.010140936 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00655 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 163160 | -| policy_gradient_loss | 0.00253 | -| std | 0.00868 | -| value_loss | 4.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16318 | -| time_elapsed | 87517 | -| total_timesteps | 2088704 | -| train/ | | -| approx_kl | 0.027542526 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 163170 | -| policy_gradient_loss | -0.0038 | -| std | 0.00869 | -| value_loss | 2.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16319 | -| time_elapsed | 87522 | -| total_timesteps | 2088832 | -| train/ | | -| approx_kl | 0.005587524 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 163180 | -| policy_gradient_loss | 0.00208 | -| std | 0.00869 | -| value_loss | 1.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 16320 | -| time_elapsed | 87527 | -| total_timesteps | 2088960 | -| train/ | | -| approx_kl | 0.030670032 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 163190 | -| policy_gradient_loss | 0.00107 | -| std | 0.00869 | -| value_loss | 8.91e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16321 | -| time_elapsed | 87531 | -| total_timesteps | 2089088 | -| train/ | | -| approx_kl | 0.0064205085 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.000662 | -| n_updates | 163200 | -| policy_gradient_loss | 0.00203 | -| std | 0.0087 | -| value_loss | 6.13e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16322 | -| time_elapsed | 87538 | -| total_timesteps | 2089216 | -| train/ | | -| approx_kl | 0.025440611 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 163210 | -| policy_gradient_loss | -0.0129 | -| std | 0.0087 | -| value_loss | 0.000563 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16323 | -| time_elapsed | 87542 | -| total_timesteps | 2089344 | -| train/ | | -| approx_kl | 0.11487056 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.0703 | -| n_updates | 163220 | -| policy_gradient_loss | 0.0376 | -| std | 0.0087 | -| value_loss | 1.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16324 | -| time_elapsed | 87545 | -| total_timesteps | 2089472 | -| train/ | | -| approx_kl | 0.02172019 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.427 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 163230 | -| policy_gradient_loss | 0.0138 | -| std | 0.0087 | -| value_loss | 4.4e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16325 | -| time_elapsed | 87549 | -| total_timesteps | 2089600 | -| train/ | | -| approx_kl | 0.06419644 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 163240 | -| policy_gradient_loss | 0.016 | -| std | 0.00871 | -| value_loss | 2.73e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16326 | -| time_elapsed | 87553 | -| total_timesteps | 2089728 | -| train/ | | -| approx_kl | 0.0029733563 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 163250 | -| policy_gradient_loss | 0.00648 | -| std | 0.00871 | -| value_loss | 1.67e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16327 | -| time_elapsed | 87557 | -| total_timesteps | 2089856 | -| train/ | | -| approx_kl | 0.0183097 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.000617 | -| n_updates | 163260 | -| policy_gradient_loss | 0.026 | -| std | 0.00871 | -| value_loss | 1.27e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 16328 | -| time_elapsed | 87563 | -| total_timesteps | 2089984 | -| train/ | | -| approx_kl | 0.08155423 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.0772 | -| n_updates | 163270 | -| policy_gradient_loss | 0.0411 | -| std | 0.00871 | -| value_loss | 8.33e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16329 | -| time_elapsed | 87568 | -| total_timesteps | 2090112 | -| train/ | | -| approx_kl | 0.02265096 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 163280 | -| policy_gradient_loss | 0.0277 | -| std | 0.00871 | -| value_loss | 5.98e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16330 | -| time_elapsed | 87580 | -| total_timesteps | 2090240 | -| train/ | | -| approx_kl | 0.6737431 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.0733 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 163290 | -| policy_gradient_loss | 0.0164 | -| std | 0.00871 | -| value_loss | 0.00133 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16331 | -| time_elapsed | 87585 | -| total_timesteps | 2090368 | -| train/ | | -| approx_kl | 0.0032024859 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00105 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 163300 | -| policy_gradient_loss | 0.0236 | -| std | 0.00871 | -| value_loss | 1.1e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16332 | -| time_elapsed | 87591 | -| total_timesteps | 2090496 | -| train/ | | -| approx_kl | 0.026495706 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 163310 | -| policy_gradient_loss | 0.00213 | -| std | 0.0087 | -| value_loss | 5.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16333 | -| time_elapsed | 87595 | -| total_timesteps | 2090624 | -| train/ | | -| approx_kl | 0.030839624 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 163320 | -| policy_gradient_loss | -0.00313 | -| std | 0.00871 | -| value_loss | 6.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16334 | -| time_elapsed | 87600 | -| total_timesteps | 2090752 | -| train/ | | -| approx_kl | 0.098747276 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 163330 | -| policy_gradient_loss | 0.0151 | -| std | 0.00871 | -| value_loss | 4.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 16335 | -| time_elapsed | 87605 | -| total_timesteps | 2090880 | -| train/ | | -| approx_kl | 0.03581165 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00433 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 163340 | -| policy_gradient_loss | 0.0153 | -| std | 0.00871 | -| value_loss | 1.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16336 | -| time_elapsed | 87609 | -| total_timesteps | 2091008 | -| train/ | | -| approx_kl | 0.16469142 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0981 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 163350 | -| policy_gradient_loss | 0.0115 | -| std | 0.00871 | -| value_loss | 2.16e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16337 | -| time_elapsed | 87620 | -| total_timesteps | 2091136 | -| train/ | | -| approx_kl | 0.05764354 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 163360 | -| policy_gradient_loss | -0.0169 | -| std | 0.00871 | -| value_loss | 0.00139 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16338 | -| time_elapsed | 87625 | -| total_timesteps | 2091264 | -| train/ | | -| approx_kl | 0.016665358 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.554 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 163370 | -| policy_gradient_loss | 0.0226 | -| std | 0.00871 | -| value_loss | 2.77e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16339 | -| time_elapsed | 87629 | -| total_timesteps | 2091392 | -| train/ | | -| approx_kl | 0.17800039 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -34.4 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 163380 | -| policy_gradient_loss | 0.0118 | -| std | 0.00871 | -| value_loss | 5.9e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16340 | -| time_elapsed | 87634 | -| total_timesteps | 2091520 | -| train/ | | -| approx_kl | 0.02865302 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -3.76 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 163390 | -| policy_gradient_loss | 0.023 | -| std | 0.00871 | -| value_loss | 9.38e-09 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16341 | -| time_elapsed | 87638 | -| total_timesteps | 2091648 | -| train/ | | -| approx_kl | 0.129484 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.454 | -| learning_rate | 0.0003 | -| loss | 0.0661 | -| n_updates | 163400 | -| policy_gradient_loss | 0.0228 | -| std | 0.00871 | -| value_loss | 3.82e-09 | --------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16342 | -| time_elapsed | 87642 | -| total_timesteps | 2091776 | -| train/ | | -| approx_kl | 0.0254607 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.00259 | -| n_updates | 163410 | -| policy_gradient_loss | 0.0354 | -| std | 0.00872 | -| value_loss | 2.86e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 16343 | -| time_elapsed | 87645 | -| total_timesteps | 2091904 | -| train/ | | -| approx_kl | 0.16513519 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00798 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 163420 | -| policy_gradient_loss | 0.0346 | -| std | 0.00871 | -| value_loss | 1.66e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16344 | -| time_elapsed | 87650 | -| total_timesteps | 2092032 | -| train/ | | -| approx_kl | 0.035495896 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.00857 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 163430 | -| policy_gradient_loss | 0.0462 | -| std | 0.00871 | -| value_loss | 9.47e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16345 | -| time_elapsed | 87658 | -| total_timesteps | 2092160 | -| train/ | | -| approx_kl | 0.15243825 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -3.7 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 163440 | -| policy_gradient_loss | -0.0168 | -| std | 0.00871 | -| value_loss | 0.00198 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16346 | -| time_elapsed | 87663 | -| total_timesteps | 2092288 | -| train/ | | -| approx_kl | 0.0032165023 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -40.1 | -| learning_rate | 0.0003 | -| loss | -0.000717 | -| n_updates | 163450 | -| policy_gradient_loss | 0.00531 | -| std | 0.0087 | -| value_loss | 0.000118 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16347 | -| time_elapsed | 87667 | -| total_timesteps | 2092416 | -| train/ | | -| approx_kl | 0.039404478 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00595 | -| learning_rate | 0.0003 | -| loss | 0.007 | -| n_updates | 163460 | -| policy_gradient_loss | 0.00969 | -| std | 0.00869 | -| value_loss | 8.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16348 | -| time_elapsed | 87672 | -| total_timesteps | 2092544 | -| train/ | | -| approx_kl | 0.07663558 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.00856 | -| n_updates | 163470 | -| policy_gradient_loss | 0.00481 | -| std | 0.00869 | -| value_loss | 5.03e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16349 | -| time_elapsed | 87677 | -| total_timesteps | 2092672 | -| train/ | | -| approx_kl | 0.00054150866 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00082 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 163480 | -| policy_gradient_loss | 0.0179 | -| std | 0.00869 | -| value_loss | 1.2e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16350 | -| time_elapsed | 87683 | -| total_timesteps | 2092800 | -| train/ | | -| approx_kl | 0.0006840923 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 9.54e-05 | -| n_updates | 163490 | -| policy_gradient_loss | 0.0153 | -| std | 0.00869 | -| value_loss | 2.94e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16351 | -| time_elapsed | 87689 | -| total_timesteps | 2092928 | -| train/ | | -| approx_kl | 0.016256921 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 163500 | -| policy_gradient_loss | -0.00551 | -| std | 0.00869 | -| value_loss | 4.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16352 | -| time_elapsed | 87695 | -| total_timesteps | 2093056 | -| train/ | | -| approx_kl | 0.051105108 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00293 | -| learning_rate | 0.0003 | -| loss | 0.0532 | -| n_updates | 163510 | -| policy_gradient_loss | 0.08 | -| std | 0.0087 | -| value_loss | 3.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16353 | -| time_elapsed | 87704 | -| total_timesteps | 2093184 | -| train/ | | -| approx_kl | 0.09984653 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 163520 | -| policy_gradient_loss | 0.0234 | -| std | 0.0087 | -| value_loss | 0.00348 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16354 | -| time_elapsed | 87709 | -| total_timesteps | 2093312 | -| train/ | | -| approx_kl | 0.09295433 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 163530 | -| policy_gradient_loss | 0.0682 | -| std | 0.0087 | -| value_loss | 1.05e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16355 | -| time_elapsed | 87714 | -| total_timesteps | 2093440 | -| train/ | | -| approx_kl | 0.016872209 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.521 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 163540 | -| policy_gradient_loss | 0.00913 | -| std | 0.0087 | -| value_loss | 8.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16356 | -| time_elapsed | 87719 | -| total_timesteps | 2093568 | -| train/ | | -| approx_kl | 0.08498144 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00785 | -| learning_rate | 0.0003 | -| loss | 0.0515 | -| n_updates | 163550 | -| policy_gradient_loss | 0.0114 | -| std | 0.0087 | -| value_loss | 7.06e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16357 | -| time_elapsed | 87723 | -| total_timesteps | 2093696 | -| train/ | | -| approx_kl | 0.008113608 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 163560 | -| policy_gradient_loss | -0.00164 | -| std | 0.0087 | -| value_loss | 4.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16358 | -| time_elapsed | 87727 | -| total_timesteps | 2093824 | -| train/ | | -| approx_kl | 0.015098279 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 163570 | -| policy_gradient_loss | 0.00671 | -| std | 0.0087 | -| value_loss | 4.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16359 | -| time_elapsed | 87731 | -| total_timesteps | 2093952 | -| train/ | | -| approx_kl | 0.053200155 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00898 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 163580 | -| policy_gradient_loss | 0.014 | -| std | 0.0087 | -| value_loss | 2.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16360 | -| time_elapsed | 87735 | -| total_timesteps | 2094080 | -| train/ | | -| approx_kl | 0.17543575 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 163590 | -| policy_gradient_loss | 0.0135 | -| std | 0.00869 | -| value_loss | 1.41e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16361 | -| time_elapsed | 87741 | -| total_timesteps | 2094208 | -| train/ | | -| approx_kl | 0.047397263 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.7 | -| learning_rate | 0.0003 | -| loss | 0.000223 | -| n_updates | 163600 | -| policy_gradient_loss | 0.00359 | -| std | 0.00869 | -| value_loss | 0.00545 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16362 | -| time_elapsed | 87745 | -| total_timesteps | 2094336 | -| train/ | | -| approx_kl | 0.2297679 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00884 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 163610 | -| policy_gradient_loss | 0.116 | -| std | 0.00869 | -| value_loss | 1.19e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16363 | -| time_elapsed | 87750 | -| total_timesteps | 2094464 | -| train/ | | -| approx_kl | 0.02847266 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00633 | -| learning_rate | 0.0003 | -| loss | 0.000244 | -| n_updates | 163620 | -| policy_gradient_loss | 0.0103 | -| std | 0.00869 | -| value_loss | 3.09e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16364 | -| time_elapsed | 87755 | -| total_timesteps | 2094592 | -| train/ | | -| approx_kl | 0.34229472 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00727 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 163630 | -| policy_gradient_loss | 0.0463 | -| std | 0.00869 | -| value_loss | 1.13e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16365 | -| time_elapsed | 87760 | -| total_timesteps | 2094720 | -| train/ | | -| approx_kl | 0.0214834 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.00472 | -| n_updates | 163640 | -| policy_gradient_loss | 0.00299 | -| std | 0.00869 | -| value_loss | 7.68e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16366 | -| time_elapsed | 87766 | -| total_timesteps | 2094848 | -| train/ | | -| approx_kl | 1.8337276e-05 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.000317 | -| n_updates | 163650 | -| policy_gradient_loss | 0.0025 | -| std | 0.00868 | -| value_loss | 5.22e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 16367 | -| time_elapsed | 87770 | -| total_timesteps | 2094976 | -| train/ | | -| approx_kl | 0.030018376 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 163660 | -| policy_gradient_loss | 0.00445 | -| std | 0.00868 | -| value_loss | 2.83e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16368 | -| time_elapsed | 87773 | -| total_timesteps | 2095104 | -| train/ | | -| approx_kl | 9.831088e-05 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.000755 | -| n_updates | 163670 | -| policy_gradient_loss | 0.00205 | -| std | 0.00867 | -| value_loss | 1.95e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16369 | -| time_elapsed | 87784 | -| total_timesteps | 2095232 | -| train/ | | -| approx_kl | 0.08677172 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.71 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 163680 | -| policy_gradient_loss | -0.00356 | -| std | 0.00867 | -| value_loss | 0.00517 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16370 | -| time_elapsed | 87788 | -| total_timesteps | 2095360 | -| train/ | | -| approx_kl | 9.774836e-05 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.0025 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 163690 | -| policy_gradient_loss | 0.0421 | -| std | 0.00866 | -| value_loss | 6.48e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16371 | -| time_elapsed | 87793 | -| total_timesteps | 2095488 | -| train/ | | -| approx_kl | 0.051780514 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 163700 | -| policy_gradient_loss | 0.00243 | -| std | 0.00866 | -| value_loss | 2.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16372 | -| time_elapsed | 87798 | -| total_timesteps | 2095616 | -| train/ | | -| approx_kl | 0.09378683 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 163710 | -| policy_gradient_loss | 0.00404 | -| std | 0.00866 | -| value_loss | 1.32e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16373 | -| time_elapsed | 87802 | -| total_timesteps | 2095744 | -| train/ | | -| approx_kl | 0.009301033 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.00256 | -| n_updates | 163720 | -| policy_gradient_loss | 0.00433 | -| std | 0.00866 | -| value_loss | 7.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16374 | -| time_elapsed | 87808 | -| total_timesteps | 2095872 | -| train/ | | -| approx_kl | 0.029605027 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 163730 | -| policy_gradient_loss | 0.00629 | -| std | 0.00866 | -| value_loss | 4.88e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16375 | -| time_elapsed | 87813 | -| total_timesteps | 2096000 | -| train/ | | -| approx_kl | 0.0049335384 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 163740 | -| policy_gradient_loss | 0.001 | -| std | 0.00866 | -| value_loss | 2.97e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16376 | -| time_elapsed | 87818 | -| total_timesteps | 2096128 | -| train/ | | -| approx_kl | 0.052831788 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00215 | -| learning_rate | 0.0003 | -| loss | -0.000159 | -| n_updates | 163750 | -| policy_gradient_loss | -0.00413 | -| std | 0.00866 | -| value_loss | 5.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16377 | -| time_elapsed | 87827 | -| total_timesteps | 2096256 | -| train/ | | -| approx_kl | 0.03154093 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.763 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 163760 | -| policy_gradient_loss | -0.0142 | -| std | 0.00866 | -| value_loss | 0.00366 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16378 | -| time_elapsed | 87833 | -| total_timesteps | 2096384 | -| train/ | | -| approx_kl | 0.14396101 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00412 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 163770 | -| policy_gradient_loss | 0.0101 | -| std | 0.00866 | -| value_loss | 3.43e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16379 | -| time_elapsed | 87837 | -| total_timesteps | 2096512 | -| train/ | | -| approx_kl | 0.0052319136 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0964 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 163780 | -| policy_gradient_loss | 0.0141 | -| std | 0.00865 | -| value_loss | 1.01e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16380 | -| time_elapsed | 87841 | -| total_timesteps | 2096640 | -| train/ | | -| approx_kl | 0.033050325 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 163790 | -| policy_gradient_loss | 0.00598 | -| std | 0.00864 | -| value_loss | 1.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16381 | -| time_elapsed | 87845 | -| total_timesteps | 2096768 | -| train/ | | -| approx_kl | 0.13735871 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 163800 | -| policy_gradient_loss | 0.0181 | -| std | 0.00863 | -| value_loss | 5.12e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16382 | -| time_elapsed | 87849 | -| total_timesteps | 2096896 | -| train/ | | -| approx_kl | 0.00037202425 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 163810 | -| policy_gradient_loss | -0.00381 | -| std | 0.00863 | -| value_loss | 4.17e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16383 | -| time_elapsed | 87854 | -| total_timesteps | 2097024 | -| train/ | | -| approx_kl | 0.039256968 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 163820 | -| policy_gradient_loss | 0.0347 | -| std | 0.00863 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16384 | -| time_elapsed | 87865 | -| total_timesteps | 2097152 | -| train/ | | -| approx_kl | 0.018732918 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 163830 | -| policy_gradient_loss | -0.00613 | -| std | 0.00863 | -| value_loss | 1.8e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16385 | -| time_elapsed | 87870 | -| total_timesteps | 2097280 | -| train/ | | -| approx_kl | 0.110600196 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.0406 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 163840 | -| policy_gradient_loss | 0.0131 | -| std | 0.00863 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16386 | -| time_elapsed | 87875 | -| total_timesteps | 2097408 | -| train/ | | -| approx_kl | 0.010089636 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 163850 | -| policy_gradient_loss | -0.00409 | -| std | 0.00863 | -| value_loss | 3.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16387 | -| time_elapsed | 87880 | -| total_timesteps | 2097536 | -| train/ | | -| approx_kl | 0.010786146 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.00797 | -| n_updates | 163860 | -| policy_gradient_loss | 0.0108 | -| std | 0.00863 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16388 | -| time_elapsed | 87885 | -| total_timesteps | 2097664 | -| train/ | | -| approx_kl | 0.050701257 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 163870 | -| policy_gradient_loss | 0.0137 | -| std | 0.00862 | -| value_loss | 1.68e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16389 | -| time_elapsed | 87890 | -| total_timesteps | 2097792 | -| train/ | | -| approx_kl | 9.382283e-05 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | -0.00014 | -| n_updates | 163880 | -| policy_gradient_loss | 0.0143 | -| std | 0.00862 | -| value_loss | 7.78e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16390 | -| time_elapsed | 87894 | -| total_timesteps | 2097920 | -| train/ | | -| approx_kl | 0.37149113 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 163890 | -| policy_gradient_loss | 0.0428 | -| std | 0.00861 | -| value_loss | 7.98e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16391 | -| time_elapsed | 87898 | -| total_timesteps | 2098048 | -| train/ | | -| approx_kl | 0.005988335 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 163900 | -| policy_gradient_loss | -0.000894 | -| std | 0.00861 | -| value_loss | 3.65e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16392 | -| time_elapsed | 87908 | -| total_timesteps | 2098176 | -| train/ | | -| approx_kl | 0.0019695908 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 163910 | -| policy_gradient_loss | -0.00857 | -| std | 0.00862 | -| value_loss | 0.00033 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16393 | -| time_elapsed | 87911 | -| total_timesteps | 2098304 | -| train/ | | -| approx_kl | 0.029697977 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 163920 | -| policy_gradient_loss | 0.0275 | -| std | 0.00863 | -| value_loss | 8.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16394 | -| time_elapsed | 87915 | -| total_timesteps | 2098432 | -| train/ | | -| approx_kl | 0.47012103 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.94 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 163930 | -| policy_gradient_loss | 0.0861 | -| std | 0.00863 | -| value_loss | 1.98e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16395 | -| time_elapsed | 87921 | -| total_timesteps | 2098560 | -| train/ | | -| approx_kl | 0.14498402 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | 0.0448 | -| n_updates | 163940 | -| policy_gradient_loss | 0.0173 | -| std | 0.00864 | -| value_loss | 3.17e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16396 | -| time_elapsed | 87926 | -| total_timesteps | 2098688 | -| train/ | | -| approx_kl | 0.053562786 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00434 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 163950 | -| policy_gradient_loss | 0.0409 | -| std | 0.00863 | -| value_loss | 1.22e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16397 | -| time_elapsed | 87932 | -| total_timesteps | 2098816 | -| train/ | | -| approx_kl | 0.09148962 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00889 | -| learning_rate | 0.0003 | -| loss | 0.0572 | -| n_updates | 163960 | -| policy_gradient_loss | 0.0246 | -| std | 0.00862 | -| value_loss | 5.74e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 16398 | -| time_elapsed | 87936 | -| total_timesteps | 2098944 | -| train/ | | -| approx_kl | 0.18413697 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00439 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 163970 | -| policy_gradient_loss | 0.000469 | -| std | 0.00862 | -| value_loss | 1.02e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16399 | -| time_elapsed | 87941 | -| total_timesteps | 2099072 | -| train/ | | -| approx_kl | 0.03568767 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.000365 | -| n_updates | 163980 | -| policy_gradient_loss | 0.00735 | -| std | 0.00861 | -| value_loss | 7.56e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16400 | -| time_elapsed | 87949 | -| total_timesteps | 2099200 | -| train/ | | -| approx_kl | 0.015148023 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.312 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 163990 | -| policy_gradient_loss | -0.0107 | -| std | 0.00861 | -| value_loss | 0.000961 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16401 | -| time_elapsed | 87954 | -| total_timesteps | 2099328 | -| train/ | | -| approx_kl | 0.18074203 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00481 | -| learning_rate | 0.0003 | -| loss | 0.0984 | -| n_updates | 164000 | -| policy_gradient_loss | 0.0793 | -| std | 0.00861 | -| value_loss | 7.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16402 | -| time_elapsed | 87958 | -| total_timesteps | 2099456 | -| train/ | | -| approx_kl | 0.10888128 | -| clip_fraction | 0.66 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 164010 | -| policy_gradient_loss | 0.0922 | -| std | 0.00862 | -| value_loss | 2.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16403 | -| time_elapsed | 87961 | -| total_timesteps | 2099584 | -| train/ | | -| approx_kl | 0.021489069 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 164020 | -| policy_gradient_loss | 0.0237 | -| std | 0.00861 | -| value_loss | 2.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16404 | -| time_elapsed | 87966 | -| total_timesteps | 2099712 | -| train/ | | -| approx_kl | 0.091211215 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 164030 | -| policy_gradient_loss | 0.0118 | -| std | 0.00861 | -| value_loss | 5.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16405 | -| time_elapsed | 87969 | -| total_timesteps | 2099840 | -| train/ | | -| approx_kl | 0.10873008 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 164040 | -| policy_gradient_loss | 0.0114 | -| std | 0.00861 | -| value_loss | 8.93e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16406 | -| time_elapsed | 87973 | -| total_timesteps | 2099968 | -| train/ | | -| approx_kl | 0.06484153 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 164050 | -| policy_gradient_loss | 0.0192 | -| std | 0.00862 | -| value_loss | 8.24e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16407 | -| time_elapsed | 87979 | -| total_timesteps | 2100096 | -| train/ | | -| approx_kl | 0.20398311 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 164060 | -| policy_gradient_loss | 0.0758 | -| std | 0.00862 | -| value_loss | 5.19e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16408 | -| time_elapsed | 87987 | -| total_timesteps | 2100224 | -| train/ | | -| approx_kl | 0.06404474 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 164070 | -| policy_gradient_loss | -0.013 | -| std | 0.00862 | -| value_loss | 0.000887 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16409 | -| time_elapsed | 87992 | -| total_timesteps | 2100352 | -| train/ | | -| approx_kl | 0.18768814 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 164080 | -| policy_gradient_loss | 0.0131 | -| std | 0.00863 | -| value_loss | 1.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16410 | -| time_elapsed | 87996 | -| total_timesteps | 2100480 | -| train/ | | -| approx_kl | 0.010409653 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 164090 | -| policy_gradient_loss | 0.00834 | -| std | 0.00861 | -| value_loss | 2.92e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16411 | -| time_elapsed | 88000 | -| total_timesteps | 2100608 | -| train/ | | -| approx_kl | 0.042373918 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00395 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 164100 | -| policy_gradient_loss | 0.0205 | -| std | 0.00859 | -| value_loss | 2.1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16412 | -| time_elapsed | 88005 | -| total_timesteps | 2100736 | -| train/ | | -| approx_kl | 0.0015651844 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00442 | -| learning_rate | 0.0003 | -| loss | 0.00524 | -| n_updates | 164110 | -| policy_gradient_loss | 0.00151 | -| std | 0.00859 | -| value_loss | 2.76e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16413 | -| time_elapsed | 88010 | -| total_timesteps | 2100864 | -| train/ | | -| approx_kl | 0.10562827 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 164120 | -| policy_gradient_loss | 0.0879 | -| std | 0.00858 | -| value_loss | 2.71e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 16414 | -| time_elapsed | 88014 | -| total_timesteps | 2100992 | -| train/ | | -| approx_kl | 0.024870435 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.00961 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 164130 | -| policy_gradient_loss | 0.0195 | -| std | 0.00859 | -| value_loss | 1.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16415 | -| time_elapsed | 88018 | -| total_timesteps | 2101120 | -| train/ | | -| approx_kl | 0.11151314 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | 0.0539 | -| n_updates | 164140 | -| policy_gradient_loss | 0.0132 | -| std | 0.00859 | -| value_loss | 9.87e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16416 | -| time_elapsed | 88032 | -| total_timesteps | 2101248 | -| train/ | | -| approx_kl | 0.018591046 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.826 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 164150 | -| policy_gradient_loss | -0.0187 | -| std | 0.0086 | -| value_loss | 0.0023 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16417 | -| time_elapsed | 88037 | -| total_timesteps | 2101376 | -| train/ | | -| approx_kl | 0.16003412 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 164160 | -| policy_gradient_loss | -0.0023 | -| std | 0.00861 | -| value_loss | 4.85e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16418 | -| time_elapsed | 88041 | -| total_timesteps | 2101504 | -| train/ | | -| approx_kl | 0.015544612 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.291 | -| learning_rate | 0.0003 | -| loss | 0.00474 | -| n_updates | 164170 | -| policy_gradient_loss | 0.0168 | -| std | 0.00863 | -| value_loss | 6.45e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16419 | -| time_elapsed | 88045 | -| total_timesteps | 2101632 | -| train/ | | -| approx_kl | 0.06746248 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.28 | -| learning_rate | 0.0003 | -| loss | 0.000924 | -| n_updates | 164180 | -| policy_gradient_loss | 0.0151 | -| std | 0.00864 | -| value_loss | 3.66e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16420 | -| time_elapsed | 88051 | -| total_timesteps | 2101760 | -| train/ | | -| approx_kl | 0.14314885 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 0.0652 | -| n_updates | 164190 | -| policy_gradient_loss | 0.0308 | -| std | 0.00865 | -| value_loss | 1.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 16421 | -| time_elapsed | 88055 | -| total_timesteps | 2101888 | -| train/ | | -| approx_kl | 0.0011357139 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | -0.00244 | -| n_updates | 164200 | -| policy_gradient_loss | 0.0063 | -| std | 0.00865 | -| value_loss | 1.21e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16422 | -| time_elapsed | 88060 | -| total_timesteps | 2102016 | -| train/ | | -| approx_kl | 0.04213565 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0557 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 164210 | -| policy_gradient_loss | 0.0445 | -| std | 0.00866 | -| value_loss | 6.91e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16423 | -| time_elapsed | 88071 | -| total_timesteps | 2102144 | -| train/ | | -| approx_kl | 0.03148961 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.697 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 164220 | -| policy_gradient_loss | -0.0183 | -| std | 0.00865 | -| value_loss | 0.00207 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16424 | -| time_elapsed | 88076 | -| total_timesteps | 2102272 | -| train/ | | -| approx_kl | 0.035566002 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.316 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 164230 | -| policy_gradient_loss | 0.0455 | -| std | 0.00865 | -| value_loss | 7.33e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16425 | -| time_elapsed | 88080 | -| total_timesteps | 2102400 | -| train/ | | -| approx_kl | 0.1104797 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0467 | -| n_updates | 164240 | -| policy_gradient_loss | 0.0179 | -| std | 0.00866 | -| value_loss | 8.17e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16426 | -| time_elapsed | 88085 | -| total_timesteps | 2102528 | -| train/ | | -| approx_kl | 0.0013841754 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.00846 | -| n_updates | 164250 | -| policy_gradient_loss | -0.00806 | -| std | 0.00866 | -| value_loss | 9.93e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16427 | -| time_elapsed | 88091 | -| total_timesteps | 2102656 | -| train/ | | -| approx_kl | 7.6321885e-07 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.000173 | -| n_updates | 164260 | -| policy_gradient_loss | -0.00097 | -| std | 0.00866 | -| value_loss | 3.43e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16428 | -| time_elapsed | 88097 | -| total_timesteps | 2102784 | -| train/ | | -| approx_kl | 0.0317204 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 164270 | -| policy_gradient_loss | 0.0295 | -| std | 0.00866 | -| value_loss | 2.37e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16429 | -| time_elapsed | 88101 | -| total_timesteps | 2102912 | -| train/ | | -| approx_kl | 0.008426452 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 164280 | -| policy_gradient_loss | 0.01 | -| std | 0.00866 | -| value_loss | 1.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16430 | -| time_elapsed | 88106 | -| total_timesteps | 2103040 | -| train/ | | -| approx_kl | 0.09595874 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 164290 | -| policy_gradient_loss | 0.00705 | -| std | 0.00866 | -| value_loss | 1.08e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16431 | -| time_elapsed | 88114 | -| total_timesteps | 2103168 | -| train/ | | -| approx_kl | 0.0012061656 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.826 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 164300 | -| policy_gradient_loss | -0.00742 | -| std | 0.00866 | -| value_loss | 0.00325 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16432 | -| time_elapsed | 88119 | -| total_timesteps | 2103296 | -| train/ | | -| approx_kl | 0.02128639 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 164310 | -| policy_gradient_loss | -0.00634 | -| std | 0.00865 | -| value_loss | 7.63e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16433 | -| time_elapsed | 88124 | -| total_timesteps | 2103424 | -| train/ | | -| approx_kl | 0.019214243 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.348 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 164320 | -| policy_gradient_loss | 0.0132 | -| std | 0.00865 | -| value_loss | 4.73e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16434 | -| time_elapsed | 88129 | -| total_timesteps | 2103552 | -| train/ | | -| approx_kl | 0.1733017 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 164330 | -| policy_gradient_loss | 0.109 | -| std | 0.00863 | -| value_loss | 5.88e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16435 | -| time_elapsed | 88134 | -| total_timesteps | 2103680 | -| train/ | | -| approx_kl | 0.107042424 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -8.36 | -| learning_rate | 0.0003 | -| loss | 0.0905 | -| n_updates | 164340 | -| policy_gradient_loss | 0.041 | -| std | 0.00863 | -| value_loss | 2.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16436 | -| time_elapsed | 88139 | -| total_timesteps | 2103808 | -| train/ | | -| approx_kl | 0.090508014 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -5.08 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 164350 | -| policy_gradient_loss | 0.0289 | -| std | 0.00863 | -| value_loss | 1.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16437 | -| time_elapsed | 88144 | -| total_timesteps | 2103936 | -| train/ | | -| approx_kl | 0.014439629 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 164360 | -| policy_gradient_loss | 0.00991 | -| std | 0.00863 | -| value_loss | 4.72e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16438 | -| time_elapsed | 88148 | -| total_timesteps | 2104064 | -| train/ | | -| approx_kl | 0.018958252 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0813 | -| learning_rate | 0.0003 | -| loss | -0.00969 | -| n_updates | 164370 | -| policy_gradient_loss | 0.0079 | -| std | 0.00862 | -| value_loss | 2.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16439 | -| time_elapsed | 88156 | -| total_timesteps | 2104192 | -| train/ | | -| approx_kl | 0.029349819 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.823 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 164380 | -| policy_gradient_loss | -0.00735 | -| std | 0.00861 | -| value_loss | 0.00372 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16440 | -| time_elapsed | 88161 | -| total_timesteps | 2104320 | -| train/ | | -| approx_kl | 0.044011634 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.000967 | -| n_updates | 164390 | -| policy_gradient_loss | -0.000367 | -| std | 0.0086 | -| value_loss | 1.01e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16441 | -| time_elapsed | 88166 | -| total_timesteps | 2104448 | -| train/ | | -| approx_kl | 0.3739994 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 164400 | -| policy_gradient_loss | 0.0627 | -| std | 0.00865 | -| value_loss | 0.000132 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16442 | -| time_elapsed | 88170 | -| total_timesteps | 2104576 | -| train/ | | -| approx_kl | 0.011598282 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 164410 | -| policy_gradient_loss | -0.00522 | -| std | 0.00868 | -| value_loss | 0.000439 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16443 | -| time_elapsed | 88174 | -| total_timesteps | 2104704 | -| train/ | | -| approx_kl | 0.006932199 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00187 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 164420 | -| policy_gradient_loss | 0.0464 | -| std | 0.00868 | -| value_loss | 0.000681 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16444 | -| time_elapsed | 88178 | -| total_timesteps | 2104832 | -| train/ | | -| approx_kl | 0.19908302 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -3.46 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 164430 | -| policy_gradient_loss | 0.0152 | -| std | 0.00868 | -| value_loss | 1.92e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16445 | -| time_elapsed | 88183 | -| total_timesteps | 2104960 | -| train/ | | -| approx_kl | 0.04494383 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0782 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 164440 | -| policy_gradient_loss | 0.0599 | -| std | 0.00868 | -| value_loss | 6.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16446 | -| time_elapsed | 88187 | -| total_timesteps | 2105088 | -| train/ | | -| approx_kl | 0.14002956 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0742 | -| n_updates | 164450 | -| policy_gradient_loss | 0.0247 | -| std | 0.00868 | -| value_loss | 4.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16447 | -| time_elapsed | 88196 | -| total_timesteps | 2105216 | -| train/ | | -| approx_kl | 0.05390593 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 164460 | -| policy_gradient_loss | -0.0168 | -| std | 0.00868 | -| value_loss | 1.73e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16448 | -| time_elapsed | 88201 | -| total_timesteps | 2105344 | -| train/ | | -| approx_kl | 0.014093114 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 164470 | -| policy_gradient_loss | 0.0525 | -| std | 0.00868 | -| value_loss | 3.37e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16449 | -| time_elapsed | 88204 | -| total_timesteps | 2105472 | -| train/ | | -| approx_kl | 0.0070463778 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.296 | -| learning_rate | 0.0003 | -| loss | -0.00969 | -| n_updates | 164480 | -| policy_gradient_loss | 0.00479 | -| std | 0.00868 | -| value_loss | 3.21e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16450 | -| time_elapsed | 88209 | -| total_timesteps | 2105600 | -| train/ | | -| approx_kl | 0.18283473 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 164490 | -| policy_gradient_loss | 0.0528 | -| std | 0.00868 | -| value_loss | 2.77e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16451 | -| time_elapsed | 88214 | -| total_timesteps | 2105728 | -| train/ | | -| approx_kl | 0.025755038 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 164500 | -| policy_gradient_loss | 0.0387 | -| std | 0.00869 | -| value_loss | 1.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16452 | -| time_elapsed | 88219 | -| total_timesteps | 2105856 | -| train/ | | -| approx_kl | 0.013148066 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 164510 | -| policy_gradient_loss | -0.00173 | -| std | 0.00869 | -| value_loss | 1.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16453 | -| time_elapsed | 88225 | -| total_timesteps | 2105984 | -| train/ | | -| approx_kl | 0.10370383 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 164520 | -| policy_gradient_loss | 0.00286 | -| std | 0.00869 | -| value_loss | 8.99e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16454 | -| time_elapsed | 88230 | -| total_timesteps | 2106112 | -| train/ | | -| approx_kl | 0.0031586709 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | 0.00504 | -| n_updates | 164530 | -| policy_gradient_loss | 0.0137 | -| std | 0.00869 | -| value_loss | 4.12e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16455 | -| time_elapsed | 88243 | -| total_timesteps | 2106240 | -| train/ | | -| approx_kl | 0.047577787 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 164540 | -| policy_gradient_loss | -0.0137 | -| std | 0.00869 | -| value_loss | 0.00195 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16456 | -| time_elapsed | 88248 | -| total_timesteps | 2106368 | -| train/ | | -| approx_kl | 0.0016260156 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | -0.000515 | -| n_updates | 164550 | -| policy_gradient_loss | 0.0108 | -| std | 0.00868 | -| value_loss | 5.19e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16457 | -| time_elapsed | 88253 | -| total_timesteps | 2106496 | -| train/ | | -| approx_kl | 0.022492373 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.00414 | -| n_updates | 164560 | -| policy_gradient_loss | 0.0226 | -| std | 0.00868 | -| value_loss | 5.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16458 | -| time_elapsed | 88256 | -| total_timesteps | 2106624 | -| train/ | | -| approx_kl | 0.08616047 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | 0.0753 | -| n_updates | 164570 | -| policy_gradient_loss | 0.0408 | -| std | 0.00868 | -| value_loss | 3.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16459 | -| time_elapsed | 88261 | -| total_timesteps | 2106752 | -| train/ | | -| approx_kl | 0.002877599 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 164580 | -| policy_gradient_loss | 0.00719 | -| std | 0.00868 | -| value_loss | 2.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 16460 | -| time_elapsed | 88266 | -| total_timesteps | 2106880 | -| train/ | | -| approx_kl | 0.018075276 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.00739 | -| n_updates | 164590 | -| policy_gradient_loss | 0.0251 | -| std | 0.00868 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16461 | -| time_elapsed | 88271 | -| total_timesteps | 2107008 | -| train/ | | -| approx_kl | 0.091116294 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0709 | -| n_updates | 164600 | -| policy_gradient_loss | 0.0375 | -| std | 0.00868 | -| value_loss | 9.24e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16462 | -| time_elapsed | 88283 | -| total_timesteps | 2107136 | -| train/ | | -| approx_kl | 0.05813933 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 164610 | -| policy_gradient_loss | -0.00393 | -| std | 0.00867 | -| value_loss | 0.000502 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16463 | -| time_elapsed | 88286 | -| total_timesteps | 2107264 | -| train/ | | -| approx_kl | 0.0049216887 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.475 | -| learning_rate | 0.0003 | -| loss | 0.00237 | -| n_updates | 164620 | -| policy_gradient_loss | 0.000713 | -| std | 0.00867 | -| value_loss | 1.13e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16464 | -| time_elapsed | 88290 | -| total_timesteps | 2107392 | -| train/ | | -| approx_kl | 0.03477245 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.651 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 164630 | -| policy_gradient_loss | 0.0357 | -| std | 0.00867 | -| value_loss | 3.57e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16465 | -| time_elapsed | 88296 | -| total_timesteps | 2107520 | -| train/ | | -| approx_kl | 0.013323327 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -40.4 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 164640 | -| policy_gradient_loss | 0.00461 | -| std | 0.00867 | -| value_loss | 4.83e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16466 | -| time_elapsed | 88299 | -| total_timesteps | 2107648 | -| train/ | | -| approx_kl | 0.20829129 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 164650 | -| policy_gradient_loss | 0.0381 | -| std | 0.00867 | -| value_loss | 2.74e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16467 | -| time_elapsed | 88304 | -| total_timesteps | 2107776 | -| train/ | | -| approx_kl | 0.0005857507 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -14.2 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 164660 | -| policy_gradient_loss | 0.00223 | -| std | 0.00867 | -| value_loss | 6.58e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 16468 | -| time_elapsed | 88309 | -| total_timesteps | 2107904 | -| train/ | | -| approx_kl | 0.04646217 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -47.5 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 164670 | -| policy_gradient_loss | 0.0089 | -| std | 0.00867 | -| value_loss | 8.95e-12 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16469 | -| time_elapsed | 88314 | -| total_timesteps | 2108032 | -| train/ | | -| approx_kl | 0.1670958 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | 0.0573 | -| n_updates | 164680 | -| policy_gradient_loss | 0.0305 | -| std | 0.00868 | -| value_loss | 2.28e-12 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16470 | -| time_elapsed | 88324 | -| total_timesteps | 2108160 | -| train/ | | -| approx_kl | 0.14577127 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 164690 | -| policy_gradient_loss | 0.0161 | -| std | 0.00867 | -| value_loss | 0.00159 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16471 | -| time_elapsed | 88327 | -| total_timesteps | 2108288 | -| train/ | | -| approx_kl | 0.02934196 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.00937 | -| n_updates | 164700 | -| policy_gradient_loss | 0.00295 | -| std | 0.00867 | -| value_loss | 9.28e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16472 | -| time_elapsed | 88330 | -| total_timesteps | 2108416 | -| train/ | | -| approx_kl | 0.0057488675 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.003 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 164710 | -| policy_gradient_loss | -0.000672 | -| std | 0.00867 | -| value_loss | 1.33e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16473 | -| time_elapsed | 88335 | -| total_timesteps | 2108544 | -| train/ | | -| approx_kl | 0.050702807 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 164720 | -| policy_gradient_loss | 0.00528 | -| std | 0.00867 | -| value_loss | 8.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16474 | -| time_elapsed | 88341 | -| total_timesteps | 2108672 | -| train/ | | -| approx_kl | 0.061762735 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.00959 | -| n_updates | 164730 | -| policy_gradient_loss | -0.0128 | -| std | 0.00867 | -| value_loss | 6.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16475 | -| time_elapsed | 88345 | -| total_timesteps | 2108800 | -| train/ | | -| approx_kl | 0.020448744 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 3.32e-05 | -| n_updates | 164740 | -| policy_gradient_loss | 0.00167 | -| std | 0.00867 | -| value_loss | 4.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16476 | -| time_elapsed | 88351 | -| total_timesteps | 2108928 | -| train/ | | -| approx_kl | 0.031960074 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 164750 | -| policy_gradient_loss | 0.00834 | -| std | 0.00867 | -| value_loss | 2.63e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16477 | -| time_elapsed | 88356 | -| total_timesteps | 2109056 | -| train/ | | -| approx_kl | 0.00022087805 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 164760 | -| policy_gradient_loss | -0.000623 | -| std | 0.00867 | -| value_loss | 1.91e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16478 | -| time_elapsed | 88364 | -| total_timesteps | 2109184 | -| train/ | | -| approx_kl | 0.13668384 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | 0.00647 | -| n_updates | 164770 | -| policy_gradient_loss | -0.0111 | -| std | 0.00867 | -| value_loss | 0.000233 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16479 | -| time_elapsed | 88369 | -| total_timesteps | 2109312 | -| train/ | | -| approx_kl | 0.10327251 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.972 | -| learning_rate | 0.0003 | -| loss | -0.00968 | -| n_updates | 164780 | -| policy_gradient_loss | -0.0041 | -| std | 0.00868 | -| value_loss | 3.43e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16480 | -| time_elapsed | 88374 | -| total_timesteps | 2109440 | -| train/ | | -| approx_kl | 0.05749789 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -4 | -| learning_rate | 0.0003 | -| loss | 0.0332 | -| n_updates | 164790 | -| policy_gradient_loss | 0.0243 | -| std | 0.00868 | -| value_loss | 8.7e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16481 | -| time_elapsed | 88378 | -| total_timesteps | 2109568 | -| train/ | | -| approx_kl | 0.25057113 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 164800 | -| policy_gradient_loss | 0.111 | -| std | 0.00868 | -| value_loss | 3.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16482 | -| time_elapsed | 88383 | -| total_timesteps | 2109696 | -| train/ | | -| approx_kl | 0.117655724 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 164810 | -| policy_gradient_loss | 0.103 | -| std | 0.00869 | -| value_loss | 8.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16483 | -| time_elapsed | 88388 | -| total_timesteps | 2109824 | -| train/ | | -| approx_kl | 0.07484697 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0494 | -| n_updates | 164820 | -| policy_gradient_loss | 0.07 | -| std | 0.00869 | -| value_loss | 4.24e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 16484 | -| time_elapsed | 88391 | -| total_timesteps | 2109952 | -| train/ | | -| approx_kl | 0.09616921 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0765 | -| n_updates | 164830 | -| policy_gradient_loss | 0.102 | -| std | 0.00869 | -| value_loss | 3.24e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16485 | -| time_elapsed | 88394 | -| total_timesteps | 2110080 | -| train/ | | -| approx_kl | 0.014029715 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00838 | -| n_updates | 164840 | -| policy_gradient_loss | 0.0118 | -| std | 0.00869 | -| value_loss | 2.64e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16486 | -| time_elapsed | 88404 | -| total_timesteps | 2110208 | -| train/ | | -| approx_kl | 0.076550394 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.9 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 164850 | -| policy_gradient_loss | -0.00079 | -| std | 0.00869 | -| value_loss | 0.00164 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16487 | -| time_elapsed | 88408 | -| total_timesteps | 2110336 | -| train/ | | -| approx_kl | 0.18725446 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0723 | -| n_updates | 164860 | -| policy_gradient_loss | 0.01 | -| std | 0.00869 | -| value_loss | 2.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16488 | -| time_elapsed | 88413 | -| total_timesteps | 2110464 | -| train/ | | -| approx_kl | 0.021153335 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 164870 | -| policy_gradient_loss | 0.00349 | -| std | 0.00868 | -| value_loss | 5.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16489 | -| time_elapsed | 88417 | -| total_timesteps | 2110592 | -| train/ | | -| approx_kl | 0.0121259615 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00698 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 164880 | -| policy_gradient_loss | 0.0146 | -| std | 0.00868 | -| value_loss | 2.34e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16490 | -| time_elapsed | 88422 | -| total_timesteps | 2110720 | -| train/ | | -| approx_kl | 0.19404237 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00554 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 164890 | -| policy_gradient_loss | 0.125 | -| std | 0.00867 | -| value_loss | 1.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16491 | -| time_elapsed | 88428 | -| total_timesteps | 2110848 | -| train/ | | -| approx_kl | 0.101407394 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0757 | -| n_updates | 164900 | -| policy_gradient_loss | 0.095 | -| std | 0.00867 | -| value_loss | 8.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16492 | -| time_elapsed | 88433 | -| total_timesteps | 2110976 | -| train/ | | -| approx_kl | 0.10421963 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | 0.094 | -| n_updates | 164910 | -| policy_gradient_loss | 0.0834 | -| std | 0.00867 | -| value_loss | 7.11e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16493 | -| time_elapsed | 88437 | -| total_timesteps | 2111104 | -| train/ | | -| approx_kl | 0.1029534 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0752 | -| n_updates | 164920 | -| policy_gradient_loss | 0.0914 | -| std | 0.00868 | -| value_loss | 4.28e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16494 | -| time_elapsed | 88447 | -| total_timesteps | 2111232 | -| train/ | | -| approx_kl | 0.36582652 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 164930 | -| policy_gradient_loss | -0.00436 | -| std | 0.00868 | -| value_loss | 0.000221 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16495 | -| time_elapsed | 88451 | -| total_timesteps | 2111360 | -| train/ | | -| approx_kl | 0.016213253 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00901 | -| learning_rate | 0.0003 | -| loss | -0.00656 | -| n_updates | 164940 | -| policy_gradient_loss | -0.00554 | -| std | 0.00868 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16496 | -| time_elapsed | 88456 | -| total_timesteps | 2111488 | -| train/ | | -| approx_kl | 0.010301966 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.009 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 164950 | -| policy_gradient_loss | 0.0165 | -| std | 0.00868 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16497 | -| time_elapsed | 88459 | -| total_timesteps | 2111616 | -| train/ | | -| approx_kl | 0.055274975 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.0093 | -| n_updates | 164960 | -| policy_gradient_loss | 0.00925 | -| std | 0.00868 | -| value_loss | 8.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16498 | -| time_elapsed | 88464 | -| total_timesteps | 2111744 | -| train/ | | -| approx_kl | 0.014137179 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0348 | -| n_updates | 164970 | -| policy_gradient_loss | -0.00807 | -| std | 0.00868 | -| value_loss | 5.9e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 16499 | -| time_elapsed | 88471 | -| total_timesteps | 2111872 | -| train/ | | -| approx_kl | 0.13237041 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 164980 | -| policy_gradient_loss | 0.00742 | -| std | 0.00868 | -| value_loss | 3.66e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16500 | -| time_elapsed | 88476 | -| total_timesteps | 2112000 | -| train/ | | -| approx_kl | 0.1174953 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 164990 | -| policy_gradient_loss | 0.0145 | -| std | 0.00868 | -| value_loss | 2.65e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16501 | -| time_elapsed | 88482 | -| total_timesteps | 2112128 | -| train/ | | -| approx_kl | 0.039765313 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00324 | -| learning_rate | 0.0003 | -| loss | 0.00883 | -| n_updates | 165000 | -| policy_gradient_loss | 0.0147 | -| std | 0.00868 | -| value_loss | 1.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16502 | -| time_elapsed | 88492 | -| total_timesteps | 2112256 | -| train/ | | -| approx_kl | 0.032221243 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 165010 | -| policy_gradient_loss | -0.0149 | -| std | 0.00868 | -| value_loss | 1.43e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16503 | -| time_elapsed | 88498 | -| total_timesteps | 2112384 | -| train/ | | -| approx_kl | 0.05968522 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 165020 | -| policy_gradient_loss | 0.0171 | -| std | 0.00868 | -| value_loss | 1.24e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16504 | -| time_elapsed | 88502 | -| total_timesteps | 2112512 | -| train/ | | -| approx_kl | 0.0032836823 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00348 | -| learning_rate | 0.0003 | -| loss | 0.00789 | -| n_updates | 165030 | -| policy_gradient_loss | 0.00396 | -| std | 0.00868 | -| value_loss | 5.78e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16505 | -| time_elapsed | 88507 | -| total_timesteps | 2112640 | -| train/ | | -| approx_kl | 0.02668469 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.00783 | -| n_updates | 165040 | -| policy_gradient_loss | 0.00916 | -| std | 0.00868 | -| value_loss | 4.86e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16506 | -| time_elapsed | 88512 | -| total_timesteps | 2112768 | -| train/ | | -| approx_kl | 0.08399542 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 165050 | -| policy_gradient_loss | 0.0101 | -| std | 0.00868 | -| value_loss | 2.32e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 16507 | -| time_elapsed | 88517 | -| total_timesteps | 2112896 | -| train/ | | -| approx_kl | 0.017060103 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 165060 | -| policy_gradient_loss | 0.0261 | -| std | 0.00868 | -| value_loss | 1.49e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16508 | -| time_elapsed | 88522 | -| total_timesteps | 2113024 | -| train/ | | -| approx_kl | 0.16177142 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0881 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 165070 | -| policy_gradient_loss | 0.0915 | -| std | 0.00868 | -| value_loss | 6.91e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16509 | -| time_elapsed | 88532 | -| total_timesteps | 2113152 | -| train/ | | -| approx_kl | 0.0010918793 | -| clip_fraction | 0.0195 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 165080 | -| policy_gradient_loss | -0.0133 | -| std | 0.00868 | -| value_loss | 0.000211 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16510 | -| time_elapsed | 88537 | -| total_timesteps | 2113280 | -| train/ | | -| approx_kl | 0.029239085 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -20.1 | -| learning_rate | 0.0003 | -| loss | -0.00617 | -| n_updates | 165090 | -| policy_gradient_loss | 0.00374 | -| std | 0.00868 | -| value_loss | 1.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16511 | -| time_elapsed | 88542 | -| total_timesteps | 2113408 | -| train/ | | -| approx_kl | 0.087025225 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.798 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 165100 | -| policy_gradient_loss | 0.0153 | -| std | 0.00868 | -| value_loss | 3.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16512 | -| time_elapsed | 88547 | -| total_timesteps | 2113536 | -| train/ | | -| approx_kl | 0.33504114 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00701 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 165110 | -| policy_gradient_loss | 0.0369 | -| std | 0.00868 | -| value_loss | 9.52e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16513 | -| time_elapsed | 88552 | -| total_timesteps | 2113664 | -| train/ | | -| approx_kl | 0.008603799 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00412 | -| learning_rate | 0.0003 | -| loss | -0.00226 | -| n_updates | 165120 | -| policy_gradient_loss | 0.00187 | -| std | 0.00868 | -| value_loss | 5.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16514 | -| time_elapsed | 88556 | -| total_timesteps | 2113792 | -| train/ | | -| approx_kl | 0.027749814 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.00357 | -| n_updates | 165130 | -| policy_gradient_loss | -4.71e-05 | -| std | 0.00868 | -| value_loss | 4.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 16515 | -| time_elapsed | 88560 | -| total_timesteps | 2113920 | -| train/ | | -| approx_kl | 0.024657754 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 165140 | -| policy_gradient_loss | -0.00415 | -| std | 0.00868 | -| value_loss | 3.03e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16516 | -| time_elapsed | 88564 | -| total_timesteps | 2114048 | -| train/ | | -| approx_kl | 0.0034277518 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 165150 | -| policy_gradient_loss | 0.00164 | -| std | 0.00868 | -| value_loss | 2.1e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16517 | -| time_elapsed | 88572 | -| total_timesteps | 2114176 | -| train/ | | -| approx_kl | 0.00350116 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 165160 | -| policy_gradient_loss | -0.00766 | -| std | 0.00868 | -| value_loss | 0.00159 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16518 | -| time_elapsed | 88576 | -| total_timesteps | 2114304 | -| train/ | | -| approx_kl | 0.005867588 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.003 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 165170 | -| policy_gradient_loss | 0.00775 | -| std | 0.00868 | -| value_loss | 1.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16519 | -| time_elapsed | 88581 | -| total_timesteps | 2114432 | -| train/ | | -| approx_kl | 0.037070185 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 165180 | -| policy_gradient_loss | 0.00836 | -| std | 0.00868 | -| value_loss | 3.71e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16520 | -| time_elapsed | 88586 | -| total_timesteps | 2114560 | -| train/ | | -| approx_kl | 0.46558577 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 165190 | -| policy_gradient_loss | 0.0476 | -| std | 0.00868 | -| value_loss | 8.18e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16521 | -| time_elapsed | 88590 | -| total_timesteps | 2114688 | -| train/ | | -| approx_kl | 0.00024531502 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 165200 | -| policy_gradient_loss | -0.0147 | -| std | 0.00868 | -| value_loss | 5.76e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16522 | -| time_elapsed | 88595 | -| total_timesteps | 2114816 | -| train/ | | -| approx_kl | 0.0721713 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 165210 | -| policy_gradient_loss | 0.00801 | -| std | 0.00868 | -| value_loss | 8.85e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16523 | -| time_elapsed | 88600 | -| total_timesteps | 2114944 | -| train/ | | -| approx_kl | 0.011302226 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 165220 | -| policy_gradient_loss | 0.0194 | -| std | 0.00868 | -| value_loss | 2.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16524 | -| time_elapsed | 88604 | -| total_timesteps | 2115072 | -| train/ | | -| approx_kl | 0.022488277 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 165230 | -| policy_gradient_loss | 0.0733 | -| std | 0.00868 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16525 | -| time_elapsed | 88616 | -| total_timesteps | 2115200 | -| train/ | | -| approx_kl | 0.010590542 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 165240 | -| policy_gradient_loss | -0.0147 | -| std | 0.00868 | -| value_loss | 0.000776 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16526 | -| time_elapsed | 88622 | -| total_timesteps | 2115328 | -| train/ | | -| approx_kl | 0.0014593559 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0794 | -| learning_rate | 0.0003 | -| loss | 0.000279 | -| n_updates | 165250 | -| policy_gradient_loss | 0.00446 | -| std | 0.00868 | -| value_loss | 2.23e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16527 | -| time_elapsed | 88626 | -| total_timesteps | 2115456 | -| train/ | | -| approx_kl | 0.0023282352 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | 0.000118 | -| n_updates | 165260 | -| policy_gradient_loss | 0.00311 | -| std | 0.00867 | -| value_loss | 5.33e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16528 | -| time_elapsed | 88631 | -| total_timesteps | 2115584 | -| train/ | | -| approx_kl | 0.04310032 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.572 | -| learning_rate | 0.0003 | -| loss | -0.00949 | -| n_updates | 165270 | -| policy_gradient_loss | 0.00799 | -| std | 0.00867 | -| value_loss | 1.41e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16529 | -| time_elapsed | 88637 | -| total_timesteps | 2115712 | -| train/ | | -| approx_kl | 0.6205701 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.325 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 165280 | -| policy_gradient_loss | 0.146 | -| std | 0.00867 | -| value_loss | 6.36e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16530 | -| time_elapsed | 88642 | -| total_timesteps | 2115840 | -| train/ | | -| approx_kl | 0.004238426 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 165290 | -| policy_gradient_loss | 0.00845 | -| std | 0.00867 | -| value_loss | 3.75e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 16531 | -| time_elapsed | 88647 | -| total_timesteps | 2115968 | -| train/ | | -| approx_kl | 0.38083977 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 165300 | -| policy_gradient_loss | 0.0376 | -| std | 0.00867 | -| value_loss | 2.88e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16532 | -| time_elapsed | 88651 | -| total_timesteps | 2116096 | -| train/ | | -| approx_kl | 0.0007596025 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 165310 | -| policy_gradient_loss | -0.00126 | -| std | 0.00867 | -| value_loss | 1.93e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16533 | -| time_elapsed | 88663 | -| total_timesteps | 2116224 | -| train/ | | -| approx_kl | 0.018881693 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 165320 | -| policy_gradient_loss | -0.012 | -| std | 0.00867 | -| value_loss | 0.002 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16534 | -| time_elapsed | 88668 | -| total_timesteps | 2116352 | -| train/ | | -| approx_kl | 0.086245924 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00722 | -| learning_rate | 0.0003 | -| loss | 0.065 | -| n_updates | 165330 | -| policy_gradient_loss | 0.0307 | -| std | 0.00867 | -| value_loss | 5.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16535 | -| time_elapsed | 88673 | -| total_timesteps | 2116480 | -| train/ | | -| approx_kl | 0.06059783 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 165340 | -| policy_gradient_loss | 0.00175 | -| std | 0.00867 | -| value_loss | 2.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16536 | -| time_elapsed | 88678 | -| total_timesteps | 2116608 | -| train/ | | -| approx_kl | 0.026840745 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 165350 | -| policy_gradient_loss | -0.000931 | -| std | 0.00868 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16537 | -| time_elapsed | 88683 | -| total_timesteps | 2116736 | -| train/ | | -| approx_kl | 0.035920724 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 165360 | -| policy_gradient_loss | 0.0108 | -| std | 0.00868 | -| value_loss | 9.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16538 | -| time_elapsed | 88687 | -| total_timesteps | 2116864 | -| train/ | | -| approx_kl | 0.006144119 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 165370 | -| policy_gradient_loss | 0.00537 | -| std | 0.00867 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16539 | -| time_elapsed | 88693 | -| total_timesteps | 2116992 | -| train/ | | -| approx_kl | 0.0005274429 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.00271 | -| n_updates | 165380 | -| policy_gradient_loss | 0.00408 | -| std | 0.00867 | -| value_loss | 5.44e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16540 | -| time_elapsed | 88698 | -| total_timesteps | 2117120 | -| train/ | | -| approx_kl | 0.03328706 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0815 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 165390 | -| policy_gradient_loss | 0.00871 | -| std | 0.00867 | -| value_loss | 6.34e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16541 | -| time_elapsed | 88711 | -| total_timesteps | 2117248 | -| train/ | | -| approx_kl | 0.16602685 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -2.65 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 165400 | -| policy_gradient_loss | -0.0116 | -| std | 0.00868 | -| value_loss | 0.0031 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16542 | -| time_elapsed | 88715 | -| total_timesteps | 2117376 | -| train/ | | -| approx_kl | 0.006745804 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00319 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 165410 | -| policy_gradient_loss | 0.0124 | -| std | 0.00868 | -| value_loss | 9.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16543 | -| time_elapsed | 88718 | -| total_timesteps | 2117504 | -| train/ | | -| approx_kl | 0.009229576 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 165420 | -| policy_gradient_loss | 0.0345 | -| std | 0.00868 | -| value_loss | 9.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16544 | -| time_elapsed | 88723 | -| total_timesteps | 2117632 | -| train/ | | -| approx_kl | 0.008671443 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | -0.00798 | -| n_updates | 165430 | -| policy_gradient_loss | 0.00905 | -| std | 0.00868 | -| value_loss | 1.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16545 | -| time_elapsed | 88728 | -| total_timesteps | 2117760 | -| train/ | | -| approx_kl | 0.027917057 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0827 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 165440 | -| policy_gradient_loss | 0.0813 | -| std | 0.00867 | -| value_loss | 9.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16546 | -| time_elapsed | 88733 | -| total_timesteps | 2117888 | -| train/ | | -| approx_kl | 0.002638576 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 165450 | -| policy_gradient_loss | 0.0484 | -| std | 0.00867 | -| value_loss | 8.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16547 | -| time_elapsed | 88739 | -| total_timesteps | 2118016 | -| train/ | | -| approx_kl | 0.017030347 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.00907 | -| n_updates | 165460 | -| policy_gradient_loss | 0.0178 | -| std | 0.00867 | -| value_loss | 1.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16548 | -| time_elapsed | 88752 | -| total_timesteps | 2118144 | -| train/ | | -| approx_kl | 0.10500156 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 165470 | -| policy_gradient_loss | 0.0448 | -| std | 0.00867 | -| value_loss | 0.00148 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16549 | -| time_elapsed | 88757 | -| total_timesteps | 2118272 | -| train/ | | -| approx_kl | 0.04514403 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.00632 | -| n_updates | 165480 | -| policy_gradient_loss | 0.0083 | -| std | 0.00867 | -| value_loss | 2.21e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16550 | -| time_elapsed | 88763 | -| total_timesteps | 2118400 | -| train/ | | -| approx_kl | 0.09534431 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00428 | -| learning_rate | 0.0003 | -| loss | 0.0551 | -| n_updates | 165490 | -| policy_gradient_loss | 0.0145 | -| std | 0.00867 | -| value_loss | 6.16e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16551 | -| time_elapsed | 88767 | -| total_timesteps | 2118528 | -| train/ | | -| approx_kl | 0.016168993 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 165500 | -| policy_gradient_loss | 0.0201 | -| std | 0.00867 | -| value_loss | 3.53e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16552 | -| time_elapsed | 88773 | -| total_timesteps | 2118656 | -| train/ | | -| approx_kl | 0.1402239 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 165510 | -| policy_gradient_loss | 0.095 | -| std | 0.00867 | -| value_loss | 2.95e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16553 | -| time_elapsed | 88777 | -| total_timesteps | 2118784 | -| train/ | | -| approx_kl | 0.09190895 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0562 | -| n_updates | 165520 | -| policy_gradient_loss | 0.0708 | -| std | 0.00867 | -| value_loss | 1.07e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16554 | -| time_elapsed | 88783 | -| total_timesteps | 2118912 | -| train/ | | -| approx_kl | 0.01940917 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | 0.000456 | -| n_updates | 165530 | -| policy_gradient_loss | 0.0112 | -| std | 0.00867 | -| value_loss | 5.48e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16555 | -| time_elapsed | 88787 | -| total_timesteps | 2119040 | -| train/ | | -| approx_kl | 0.11015609 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | 0.0496 | -| n_updates | 165540 | -| policy_gradient_loss | 0.0129 | -| std | 0.00867 | -| value_loss | 2.29e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16556 | -| time_elapsed | 88798 | -| total_timesteps | 2119168 | -| train/ | | -| approx_kl | 0.03448444 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 165550 | -| policy_gradient_loss | 0.00182 | -| std | 0.00867 | -| value_loss | 0.000617 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16557 | -| time_elapsed | 88802 | -| total_timesteps | 2119296 | -| train/ | | -| approx_kl | 0.28558236 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 165560 | -| policy_gradient_loss | 0.111 | -| std | 0.00867 | -| value_loss | 2.8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16558 | -| time_elapsed | 88808 | -| total_timesteps | 2119424 | -| train/ | | -| approx_kl | 0.03664768 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00691 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 165570 | -| policy_gradient_loss | 0.00963 | -| std | 0.00867 | -| value_loss | 5.53e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16559 | -| time_elapsed | 88813 | -| total_timesteps | 2119552 | -| train/ | | -| approx_kl | 0.09425074 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 165580 | -| policy_gradient_loss | 0.0113 | -| std | 0.00867 | -| value_loss | 2.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16560 | -| time_elapsed | 88819 | -| total_timesteps | 2119680 | -| train/ | | -| approx_kl | 0.009216632 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | -0.000929 | -| n_updates | 165590 | -| policy_gradient_loss | -0.000614 | -| std | 0.00868 | -| value_loss | 1.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16561 | -| time_elapsed | 88825 | -| total_timesteps | 2119808 | -| train/ | | -| approx_kl | 0.008096993 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | -0.00207 | -| n_updates | 165600 | -| policy_gradient_loss | -0.00111 | -| std | 0.00868 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16562 | -| time_elapsed | 88829 | -| total_timesteps | 2119936 | -| train/ | | -| approx_kl | 0.013926595 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 165610 | -| policy_gradient_loss | 0.0103 | -| std | 0.00868 | -| value_loss | 5.02e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16563 | -| time_elapsed | 88836 | -| total_timesteps | 2120064 | -| train/ | | -| approx_kl | 0.18766022 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 165620 | -| policy_gradient_loss | 0.0999 | -| std | 0.00868 | -| value_loss | 3.06e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16564 | -| time_elapsed | 88845 | -| total_timesteps | 2120192 | -| train/ | | -| approx_kl | 0.026414393 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.693 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 165630 | -| policy_gradient_loss | -0.00205 | -| std | 0.00868 | -| value_loss | 0.00216 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16565 | -| time_elapsed | 88850 | -| total_timesteps | 2120320 | -| train/ | | -| approx_kl | 0.005250887 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 165640 | -| policy_gradient_loss | 0.0154 | -| std | 0.00868 | -| value_loss | 4.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16566 | -| time_elapsed | 88855 | -| total_timesteps | 2120448 | -| train/ | | -| approx_kl | 0.13854654 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -3.87 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 165650 | -| policy_gradient_loss | 0.0134 | -| std | 0.00867 | -| value_loss | 3.44e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16567 | -| time_elapsed | 88860 | -| total_timesteps | 2120576 | -| train/ | | -| approx_kl | 0.028253363 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | 0.00692 | -| n_updates | 165660 | -| policy_gradient_loss | 0.0366 | -| std | 0.00866 | -| value_loss | 8.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16568 | -| time_elapsed | 88865 | -| total_timesteps | 2120704 | -| train/ | | -| approx_kl | 0.069520906 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -27.9 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 165670 | -| policy_gradient_loss | -0.00306 | -| std | 0.00867 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16569 | -| time_elapsed | 88869 | -| total_timesteps | 2120832 | -| train/ | | -| approx_kl | 0.0056361826 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.283 | -| learning_rate | 0.0003 | -| loss | -0.000931 | -| n_updates | 165680 | -| policy_gradient_loss | 0.0463 | -| std | 0.00867 | -| value_loss | 2.16e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16570 | -| time_elapsed | 88874 | -| total_timesteps | 2120960 | -| train/ | | -| approx_kl | 0.0066830306 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00864 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 165690 | -| policy_gradient_loss | 0.0108 | -| std | 0.00867 | -| value_loss | 3.05e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16571 | -| time_elapsed | 88879 | -| total_timesteps | 2121088 | -| train/ | | -| approx_kl | 0.024849229 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.00329 | -| n_updates | 165700 | -| policy_gradient_loss | 0.0329 | -| std | 0.00867 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16572 | -| time_elapsed | 88889 | -| total_timesteps | 2121216 | -| train/ | | -| approx_kl | 0.061534505 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.441 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 165710 | -| policy_gradient_loss | -0.01 | -| std | 0.00867 | -| value_loss | 0.00119 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16573 | -| time_elapsed | 88894 | -| total_timesteps | 2121344 | -| train/ | | -| approx_kl | 0.013124606 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 165720 | -| policy_gradient_loss | 0.0606 | -| std | 0.00867 | -| value_loss | 2.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16574 | -| time_elapsed | 88898 | -| total_timesteps | 2121472 | -| train/ | | -| approx_kl | 0.007146486 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.479 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 165730 | -| policy_gradient_loss | 0.0109 | -| std | 0.00867 | -| value_loss | 1.93e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16575 | -| time_elapsed | 88903 | -| total_timesteps | 2121600 | -| train/ | | -| approx_kl | 0.17725146 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 165740 | -| policy_gradient_loss | 0.0353 | -| std | 0.00867 | -| value_loss | 1.02e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16576 | -| time_elapsed | 88908 | -| total_timesteps | 2121728 | -| train/ | | -| approx_kl | 0.03341498 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 165750 | -| policy_gradient_loss | 0.0332 | -| std | 0.00868 | -| value_loss | 8.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16577 | -| time_elapsed | 88913 | -| total_timesteps | 2121856 | -| train/ | | -| approx_kl | 0.013802176 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | 0.000941 | -| n_updates | 165760 | -| policy_gradient_loss | 0.00995 | -| std | 0.00868 | -| value_loss | 1.03e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16578 | -| time_elapsed | 88919 | -| total_timesteps | 2121984 | -| train/ | | -| approx_kl | 0.2322396 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0478 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 165770 | -| policy_gradient_loss | 0.0194 | -| std | 0.00869 | -| value_loss | 2.6e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16579 | -| time_elapsed | 88925 | -| total_timesteps | 2122112 | -| train/ | | -| approx_kl | 0.043491952 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 165780 | -| policy_gradient_loss | 0.00567 | -| std | 0.00869 | -| value_loss | 1e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16580 | -| time_elapsed | 88940 | -| total_timesteps | 2122240 | -| train/ | | -| approx_kl | 0.0279879 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 165790 | -| policy_gradient_loss | 0.00802 | -| std | 0.00869 | -| value_loss | 0.00331 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16581 | -| time_elapsed | 88946 | -| total_timesteps | 2122368 | -| train/ | | -| approx_kl | 0.007638578 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 165800 | -| policy_gradient_loss | 0.024 | -| std | 0.00869 | -| value_loss | 6.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16582 | -| time_elapsed | 88952 | -| total_timesteps | 2122496 | -| train/ | | -| approx_kl | 0.34979272 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00211 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 165810 | -| policy_gradient_loss | 0.0393 | -| std | 0.00869 | -| value_loss | 5.17e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16583 | -| time_elapsed | 88957 | -| total_timesteps | 2122624 | -| train/ | | -| approx_kl | 0.0068269195 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 165820 | -| policy_gradient_loss | 0.00534 | -| std | 0.00869 | -| value_loss | 2.69e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16584 | -| time_elapsed | 88963 | -| total_timesteps | 2122752 | -| train/ | | -| approx_kl | 0.056283325 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 165830 | -| policy_gradient_loss | 0.0166 | -| std | 0.00869 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 16585 | -| time_elapsed | 88968 | -| total_timesteps | 2122880 | -| train/ | | -| approx_kl | 0.028645895 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 165840 | -| policy_gradient_loss | 0.00699 | -| std | 0.00869 | -| value_loss | 1.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16586 | -| time_elapsed | 88973 | -| total_timesteps | 2123008 | -| train/ | | -| approx_kl | 0.031890925 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.00838 | -| n_updates | 165850 | -| policy_gradient_loss | 0.00367 | -| std | 0.00869 | -| value_loss | 7.78e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16587 | -| time_elapsed | 88986 | -| total_timesteps | 2123136 | -| train/ | | -| approx_kl | 0.03852905 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 165860 | -| policy_gradient_loss | -0.0142 | -| std | 0.00869 | -| value_loss | 0.00055 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16588 | -| time_elapsed | 88991 | -| total_timesteps | 2123264 | -| train/ | | -| approx_kl | 0.11258492 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.606 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 165870 | -| policy_gradient_loss | 0.00837 | -| std | 0.00869 | -| value_loss | 9.63e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16589 | -| time_elapsed | 88997 | -| total_timesteps | 2123392 | -| train/ | | -| approx_kl | 0.02360743 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 165880 | -| policy_gradient_loss | 0.00163 | -| std | 0.00869 | -| value_loss | 2.72e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16590 | -| time_elapsed | 89001 | -| total_timesteps | 2123520 | -| train/ | | -| approx_kl | 0.014371661 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 165890 | -| policy_gradient_loss | 0.00284 | -| std | 0.00869 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16591 | -| time_elapsed | 89007 | -| total_timesteps | 2123648 | -| train/ | | -| approx_kl | 0.0060913903 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.00694 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 165900 | -| policy_gradient_loss | 0.0228 | -| std | 0.00869 | -| value_loss | 1.72e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16592 | -| time_elapsed | 89013 | -| total_timesteps | 2123776 | -| train/ | | -| approx_kl | 0.13699493 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | 0.0994 | -| n_updates | 165910 | -| policy_gradient_loss | 0.0522 | -| std | 0.00869 | -| value_loss | 2.15e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 16593 | -| time_elapsed | 89020 | -| total_timesteps | 2123904 | -| train/ | | -| approx_kl | 0.052409735 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 165920 | -| policy_gradient_loss | 0.00473 | -| std | 0.00869 | -| value_loss | 4.91e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16594 | -| time_elapsed | 89026 | -| total_timesteps | 2124032 | -| train/ | | -| approx_kl | 0.008526085 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 165930 | -| policy_gradient_loss | -0.000262 | -| std | 0.00869 | -| value_loss | 3.51e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16595 | -| time_elapsed | 89040 | -| total_timesteps | 2124160 | -| train/ | | -| approx_kl | 0.10414592 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -4.99 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 165940 | -| policy_gradient_loss | -0.0179 | -| std | 0.00869 | -| value_loss | 0.00314 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16596 | -| time_elapsed | 89045 | -| total_timesteps | 2124288 | -| train/ | | -| approx_kl | 0.030745767 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 165950 | -| policy_gradient_loss | 0.00834 | -| std | 0.0087 | -| value_loss | 3.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16597 | -| time_elapsed | 89050 | -| total_timesteps | 2124416 | -| train/ | | -| approx_kl | 0.01600679 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -1.09 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 165960 | -| policy_gradient_loss | 0.0344 | -| std | 0.0087 | -| value_loss | 1.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16598 | -| time_elapsed | 89055 | -| total_timesteps | 2124544 | -| train/ | | -| approx_kl | 0.17071587 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | 0.0792 | -| n_updates | 165970 | -| policy_gradient_loss | 0.0266 | -| std | 0.0087 | -| value_loss | 4.26e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16599 | -| time_elapsed | 89061 | -| total_timesteps | 2124672 | -| train/ | | -| approx_kl | 0.0004957658 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0634 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 165980 | -| policy_gradient_loss | 0.00253 | -| std | 0.0087 | -| value_loss | 3.26e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16600 | -| time_elapsed | 89066 | -| total_timesteps | 2124800 | -| train/ | | -| approx_kl | 0.0648456 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.0423 | -| n_updates | 165990 | -| policy_gradient_loss | 0.0105 | -| std | 0.00873 | -| value_loss | 4.31e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 16601 | -| time_elapsed | 89072 | -| total_timesteps | 2124928 | -| train/ | | -| approx_kl | 0.07805405 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 166000 | -| policy_gradient_loss | 0.00938 | -| std | 0.00874 | -| value_loss | 5.64e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16602 | -| time_elapsed | 89076 | -| total_timesteps | 2125056 | -| train/ | | -| approx_kl | 0.09291828 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00901 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 166010 | -| policy_gradient_loss | 0.0265 | -| std | 0.00875 | -| value_loss | 5.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16603 | -| time_elapsed | 89086 | -| total_timesteps | 2125184 | -| train/ | | -| approx_kl | 0.014675675 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.771 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 166020 | -| policy_gradient_loss | -0.00224 | -| std | 0.00875 | -| value_loss | 0.00515 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16604 | -| time_elapsed | 89091 | -| total_timesteps | 2125312 | -| train/ | | -| approx_kl | 0.069979414 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 166030 | -| policy_gradient_loss | 0.0506 | -| std | 0.00875 | -| value_loss | 2.84e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16605 | -| time_elapsed | 89096 | -| total_timesteps | 2125440 | -| train/ | | -| approx_kl | 0.05975219 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0087 | -| learning_rate | 0.0003 | -| loss | 0.0326 | -| n_updates | 166040 | -| policy_gradient_loss | 0.0291 | -| std | 0.00875 | -| value_loss | 6.18e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16606 | -| time_elapsed | 89101 | -| total_timesteps | 2125568 | -| train/ | | -| approx_kl | 0.18781848 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 166050 | -| policy_gradient_loss | 0.0649 | -| std | 0.00874 | -| value_loss | 7.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16607 | -| time_elapsed | 89106 | -| total_timesteps | 2125696 | -| train/ | | -| approx_kl | 0.32624397 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0958 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 166060 | -| policy_gradient_loss | 0.0401 | -| std | 0.00874 | -| value_loss | 2.22e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16608 | -| time_elapsed | 89111 | -| total_timesteps | 2125824 | -| train/ | | -| approx_kl | 0.2055234 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 166070 | -| policy_gradient_loss | 0.0665 | -| std | 0.00874 | -| value_loss | 1.11e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 16609 | -| time_elapsed | 89116 | -| total_timesteps | 2125952 | -| train/ | | -| approx_kl | 0.0022333069 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 166080 | -| policy_gradient_loss | 0.0726 | -| std | 0.00874 | -| value_loss | 8.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16610 | -| time_elapsed | 89121 | -| total_timesteps | 2126080 | -| train/ | | -| approx_kl | 0.007479314 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.00599 | -| n_updates | 166090 | -| policy_gradient_loss | 0.0235 | -| std | 0.00874 | -| value_loss | 5.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16611 | -| time_elapsed | 89131 | -| total_timesteps | 2126208 | -| train/ | | -| approx_kl | 0.043954294 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 166100 | -| policy_gradient_loss | 0.00314 | -| std | 0.00874 | -| value_loss | 0.00392 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16612 | -| time_elapsed | 89137 | -| total_timesteps | 2126336 | -| train/ | | -| approx_kl | 0.06423819 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | 0.00541 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 166110 | -| policy_gradient_loss | 0.0123 | -| std | 0.00873 | -| value_loss | 2.67e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16613 | -| time_elapsed | 89143 | -| total_timesteps | 2126464 | -| train/ | | -| approx_kl | 0.018284865 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 166120 | -| policy_gradient_loss | -0.00553 | -| std | 0.00873 | -| value_loss | 1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16614 | -| time_elapsed | 89148 | -| total_timesteps | 2126592 | -| train/ | | -| approx_kl | 0.015930437 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.32 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | 0.00746 | -| n_updates | 166130 | -| policy_gradient_loss | 0.00488 | -| std | 0.0087 | -| value_loss | 3.23e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16615 | -| time_elapsed | 89153 | -| total_timesteps | 2126720 | -| train/ | | -| approx_kl | 0.036012687 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00884 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 166140 | -| policy_gradient_loss | 0.00916 | -| std | 0.00869 | -| value_loss | 2.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16616 | -| time_elapsed | 89158 | -| total_timesteps | 2126848 | -| train/ | | -| approx_kl | 0.007006649 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00028 | -| n_updates | 166150 | -| policy_gradient_loss | 0.00638 | -| std | 0.00869 | -| value_loss | 0.000166 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 16617 | -| time_elapsed | 89164 | -| total_timesteps | 2126976 | -| train/ | | -| approx_kl | 0.04137312 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.526 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 166160 | -| policy_gradient_loss | -0.0116 | -| std | 0.00869 | -| value_loss | 9.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16618 | -| time_elapsed | 89170 | -| total_timesteps | 2127104 | -| train/ | | -| approx_kl | 0.03148229 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -1.4e-05 | -| n_updates | 166170 | -| policy_gradient_loss | 0.000877 | -| std | 0.00869 | -| value_loss | 6.29e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16619 | -| time_elapsed | 89184 | -| total_timesteps | 2127232 | -| train/ | | -| approx_kl | 0.0036897254 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.00622 | -| n_updates | 166180 | -| policy_gradient_loss | -0.00721 | -| std | 0.00869 | -| value_loss | 0.00318 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16620 | -| time_elapsed | 89189 | -| total_timesteps | 2127360 | -| train/ | | -| approx_kl | 0.035085414 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.9 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 166190 | -| policy_gradient_loss | 0.0282 | -| std | 0.00869 | -| value_loss | 3.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16621 | -| time_elapsed | 89195 | -| total_timesteps | 2127488 | -| train/ | | -| approx_kl | 0.09166932 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.0758 | -| n_updates | 166200 | -| policy_gradient_loss | 0.0383 | -| std | 0.00868 | -| value_loss | 2.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16622 | -| time_elapsed | 89202 | -| total_timesteps | 2127616 | -| train/ | | -| approx_kl | 0.15284595 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0819 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 166210 | -| policy_gradient_loss | 0.0226 | -| std | 0.00868 | -| value_loss | 1.89e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16623 | -| time_elapsed | 89206 | -| total_timesteps | 2127744 | -| train/ | | -| approx_kl | 0.00079709664 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.00743 | -| n_updates | 166220 | -| policy_gradient_loss | -3.39e-05 | -| std | 0.00869 | -| value_loss | 1.13e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 16624 | -| time_elapsed | 89211 | -| total_timesteps | 2127872 | -| train/ | | -| approx_kl | 0.12167608 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | 0.0902 | -| n_updates | 166230 | -| policy_gradient_loss | 0.0915 | -| std | 0.00869 | -| value_loss | 6.47e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16625 | -| time_elapsed | 89217 | -| total_timesteps | 2128000 | -| train/ | | -| approx_kl | 0.022037383 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.00011 | -| n_updates | 166240 | -| policy_gradient_loss | 0.0176 | -| std | 0.00869 | -| value_loss | 5.08e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16626 | -| time_elapsed | 89224 | -| total_timesteps | 2128128 | -| train/ | | -| approx_kl | 0.12442978 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00307 | -| learning_rate | 0.0003 | -| loss | 0.0629 | -| n_updates | 166250 | -| policy_gradient_loss | 0.015 | -| std | 0.00869 | -| value_loss | 2.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16627 | -| time_elapsed | 89238 | -| total_timesteps | 2128256 | -| train/ | | -| approx_kl | 0.23763089 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.00623 | -| learning_rate | 0.0003 | -| loss | 0.00233 | -| n_updates | 166260 | -| policy_gradient_loss | -0.00381 | -| std | 0.00869 | -| value_loss | 0.00174 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16628 | -| time_elapsed | 89241 | -| total_timesteps | 2128384 | -| train/ | | -| approx_kl | 0.01781478 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0965 | -| learning_rate | 0.0003 | -| loss | 0.00117 | -| n_updates | 166270 | -| policy_gradient_loss | 0.0173 | -| std | 0.00869 | -| value_loss | 1.19e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16629 | -| time_elapsed | 89245 | -| total_timesteps | 2128512 | -| train/ | | -| approx_kl | 0.12578815 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0656 | -| learning_rate | 0.0003 | -| loss | 0.0869 | -| n_updates | 166280 | -| policy_gradient_loss | 0.0539 | -| std | 0.00869 | -| value_loss | 9.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16630 | -| time_elapsed | 89249 | -| total_timesteps | 2128640 | -| train/ | | -| approx_kl | 0.06129288 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.00414 | -| n_updates | 166290 | -| policy_gradient_loss | -0.0036 | -| std | 0.00869 | -| value_loss | 6.6e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16631 | -| time_elapsed | 89254 | -| total_timesteps | 2128768 | -| train/ | | -| approx_kl | 0.010090627 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 166300 | -| policy_gradient_loss | 0.0031 | -| std | 0.00869 | -| value_loss | 4.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 16632 | -| time_elapsed | 89261 | -| total_timesteps | 2128896 | -| train/ | | -| approx_kl | 0.056769155 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.000251 | -| n_updates | 166310 | -| policy_gradient_loss | 0.0121 | -| std | 0.00869 | -| value_loss | 2.82e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16633 | -| time_elapsed | 89266 | -| total_timesteps | 2129024 | -| train/ | | -| approx_kl | 0.7497942 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.38 | -| n_updates | 166320 | -| policy_gradient_loss | 0.14 | -| std | 0.00869 | -| value_loss | 1.75e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16634 | -| time_elapsed | 89278 | -| total_timesteps | 2129152 | -| train/ | | -| approx_kl | 0.18782052 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -9.5 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 166330 | -| policy_gradient_loss | -0.0118 | -| std | 0.00869 | -| value_loss | 0.00393 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16635 | -| time_elapsed | 89284 | -| total_timesteps | 2129280 | -| train/ | | -| approx_kl | 0.0040527154 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | -0.00645 | -| n_updates | 166340 | -| policy_gradient_loss | 0.00611 | -| std | 0.00869 | -| value_loss | 3.46e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16636 | -| time_elapsed | 89291 | -| total_timesteps | 2129408 | -| train/ | | -| approx_kl | 0.18060145 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -39.9 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 166350 | -| policy_gradient_loss | -0.00331 | -| std | 0.00867 | -| value_loss | 0.000423 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16637 | -| time_elapsed | 89296 | -| total_timesteps | 2129536 | -| train/ | | -| approx_kl | 0.007975863 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.00843 | -| n_updates | 166360 | -| policy_gradient_loss | 0.011 | -| std | 0.00866 | -| value_loss | 2.82e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16638 | -| time_elapsed | 89302 | -| total_timesteps | 2129664 | -| train/ | | -| approx_kl | 0.20926568 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 166370 | -| policy_gradient_loss | 0.101 | -| std | 0.00866 | -| value_loss | 6.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16639 | -| time_elapsed | 89309 | -| total_timesteps | 2129792 | -| train/ | | -| approx_kl | 0.13344072 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.0055 | -| learning_rate | 0.0003 | -| loss | 0.0862 | -| n_updates | 166380 | -| policy_gradient_loss | 0.119 | -| std | 0.00866 | -| value_loss | 1.09e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 16640 | -| time_elapsed | 89314 | -| total_timesteps | 2129920 | -| train/ | | -| approx_kl | 0.11807876 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.0956 | -| n_updates | 166390 | -| policy_gradient_loss | 0.0866 | -| std | 0.00866 | -| value_loss | 7.68e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16641 | -| time_elapsed | 89319 | -| total_timesteps | 2130048 | -| train/ | | -| approx_kl | 0.09322375 | -| clip_fraction | 0.671 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 166400 | -| policy_gradient_loss | 0.0872 | -| std | 0.00866 | -| value_loss | 6.16e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16642 | -| time_elapsed | 89330 | -| total_timesteps | 2130176 | -| train/ | | -| approx_kl | 0.360674 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 166410 | -| policy_gradient_loss | 0.0206 | -| std | 0.00866 | -| value_loss | 0.000559 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16643 | -| time_elapsed | 89335 | -| total_timesteps | 2130304 | -| train/ | | -| approx_kl | 0.18476093 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0051 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 166420 | -| policy_gradient_loss | 0.0509 | -| std | 0.00866 | -| value_loss | 5.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16644 | -| time_elapsed | 89341 | -| total_timesteps | 2130432 | -| train/ | | -| approx_kl | 0.042494398 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0826 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 166430 | -| policy_gradient_loss | 0.0509 | -| std | 0.00866 | -| value_loss | 1.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16645 | -| time_elapsed | 89348 | -| total_timesteps | 2130560 | -| train/ | | -| approx_kl | 0.015492795 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0576 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 166440 | -| policy_gradient_loss | 0.0148 | -| std | 0.00866 | -| value_loss | 1.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16646 | -| time_elapsed | 89354 | -| total_timesteps | 2130688 | -| train/ | | -| approx_kl | 0.017747639 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 166450 | -| policy_gradient_loss | 0.024 | -| std | 0.00866 | -| value_loss | 7.61e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16647 | -| time_elapsed | 89361 | -| total_timesteps | 2130816 | -| train/ | | -| approx_kl | 0.0032355385 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 166460 | -| policy_gradient_loss | 0.057 | -| std | 0.00866 | -| value_loss | 5.96e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16648 | -| time_elapsed | 89366 | -| total_timesteps | 2130944 | -| train/ | | -| approx_kl | 0.07327296 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0565 | -| n_updates | 166470 | -| policy_gradient_loss | 0.177 | -| std | 0.00866 | -| value_loss | 3.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16649 | -| time_elapsed | 89372 | -| total_timesteps | 2131072 | -| train/ | | -| approx_kl | 0.06574655 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.0086 | -| n_updates | 166480 | -| policy_gradient_loss | 0.0147 | -| std | 0.00866 | -| value_loss | 2.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16650 | -| time_elapsed | 89383 | -| total_timesteps | 2131200 | -| train/ | | -| approx_kl | 0.035116803 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -10.9 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 166490 | -| policy_gradient_loss | -0.0122 | -| std | 0.00866 | -| value_loss | 0.00382 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16651 | -| time_elapsed | 89388 | -| total_timesteps | 2131328 | -| train/ | | -| approx_kl | 0.1252237 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0792 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 166500 | -| policy_gradient_loss | 0.0465 | -| std | 0.00866 | -| value_loss | 4.75e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16652 | -| time_elapsed | 89394 | -| total_timesteps | 2131456 | -| train/ | | -| approx_kl | 0.030659653 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 166510 | -| policy_gradient_loss | 0.0126 | -| std | 0.00866 | -| value_loss | 6.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16653 | -| time_elapsed | 89399 | -| total_timesteps | 2131584 | -| train/ | | -| approx_kl | 0.08123608 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.0688 | -| n_updates | 166520 | -| policy_gradient_loss | 0.0458 | -| std | 0.00866 | -| value_loss | 3.45e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16654 | -| time_elapsed | 89404 | -| total_timesteps | 2131712 | -| train/ | | -| approx_kl | 0.0025288016 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.00395 | -| n_updates | 166530 | -| policy_gradient_loss | 0.00286 | -| std | 0.00866 | -| value_loss | 2.26e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16655 | -| time_elapsed | 89409 | -| total_timesteps | 2131840 | -| train/ | | -| approx_kl | 0.119653754 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0878 | -| n_updates | 166540 | -| policy_gradient_loss | 0.0164 | -| std | 0.00866 | -| value_loss | 1.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 16656 | -| time_elapsed | 89414 | -| total_timesteps | 2131968 | -| train/ | | -| approx_kl | 0.12095407 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0538 | -| n_updates | 166550 | -| policy_gradient_loss | 0.017 | -| std | 0.00866 | -| value_loss | 9.53e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16657 | -| time_elapsed | 89418 | -| total_timesteps | 2132096 | -| train/ | | -| approx_kl | 0.009601828 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.00172 | -| n_updates | 166560 | -| policy_gradient_loss | 0.000612 | -| std | 0.00865 | -| value_loss | 6.37e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16658 | -| time_elapsed | 89429 | -| total_timesteps | 2132224 | -| train/ | | -| approx_kl | 0.4281134 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 166570 | -| policy_gradient_loss | -0.0108 | -| std | 0.00865 | -| value_loss | 0.00236 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16659 | -| time_elapsed | 89434 | -| total_timesteps | 2132352 | -| train/ | | -| approx_kl | 0.029250147 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 166580 | -| policy_gradient_loss | 0.0458 | -| std | 0.00865 | -| value_loss | 2.63e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16660 | -| time_elapsed | 89440 | -| total_timesteps | 2132480 | -| train/ | | -| approx_kl | 0.16116509 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0579 | -| n_updates | 166590 | -| policy_gradient_loss | 0.0221 | -| std | 0.00865 | -| value_loss | 3.28e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16661 | -| time_elapsed | 89446 | -| total_timesteps | 2132608 | -| train/ | | -| approx_kl | 2.6136171e-05 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.33 | -| explained_variance | -0.0766 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 166600 | -| policy_gradient_loss | 0.00794 | -| std | 0.00861 | -| value_loss | 5.08e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16662 | -| time_elapsed | 89453 | -| total_timesteps | 2132736 | -| train/ | | -| approx_kl | 0.00057704886 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00904 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 166610 | -| policy_gradient_loss | 0.00274 | -| std | 0.00858 | -| value_loss | 3.64e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16663 | -| time_elapsed | 89458 | -| total_timesteps | 2132864 | -| train/ | | -| approx_kl | 2.0170119e-05 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.58 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 166620 | -| policy_gradient_loss | -0.00848 | -| std | 0.00857 | -| value_loss | 1.17e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 16664 | -| time_elapsed | 89464 | -| total_timesteps | 2132992 | -| train/ | | -| approx_kl | 0.048067216 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 166630 | -| policy_gradient_loss | 0.0399 | -| std | 0.00857 | -| value_loss | 5.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16665 | -| time_elapsed | 89469 | -| total_timesteps | 2133120 | -| train/ | | -| approx_kl | 1.95615e-05 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.00014 | -| n_updates | 166640 | -| policy_gradient_loss | 0.0643 | -| std | 0.00857 | -| value_loss | 3.34e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16666 | -| time_elapsed | 89484 | -| total_timesteps | 2133248 | -| train/ | | -| approx_kl | 0.3135581 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.746 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 166650 | -| policy_gradient_loss | 0.0163 | -| std | 0.00857 | -| value_loss | 0.000706 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16667 | -| time_elapsed | 89491 | -| total_timesteps | 2133376 | -| train/ | | -| approx_kl | 0.011233088 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00363 | -| learning_rate | 0.0003 | -| loss | 0.00355 | -| n_updates | 166660 | -| policy_gradient_loss | 0.00132 | -| std | 0.00856 | -| value_loss | 2.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16668 | -| time_elapsed | 89496 | -| total_timesteps | 2133504 | -| train/ | | -| approx_kl | 0.009067776 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 166670 | -| policy_gradient_loss | -0.00861 | -| std | 0.00856 | -| value_loss | 1.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16669 | -| time_elapsed | 89502 | -| total_timesteps | 2133632 | -| train/ | | -| approx_kl | 0.017911639 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 166680 | -| policy_gradient_loss | 0.0153 | -| std | 0.00856 | -| value_loss | 5.08e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16670 | -| time_elapsed | 89507 | -| total_timesteps | 2133760 | -| train/ | | -| approx_kl | 0.17150947 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 166690 | -| policy_gradient_loss | 0.0779 | -| std | 0.00856 | -| value_loss | 3.18e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 16671 | -| time_elapsed | 89514 | -| total_timesteps | 2133888 | -| train/ | | -| approx_kl | 0.02499436 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.00963 | -| n_updates | 166700 | -| policy_gradient_loss | 0.0103 | -| std | 0.00856 | -| value_loss | 5.89e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16672 | -| time_elapsed | 89519 | -| total_timesteps | 2134016 | -| train/ | | -| approx_kl | 0.4175543 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 166710 | -| policy_gradient_loss | 0.0457 | -| std | 0.00857 | -| value_loss | 1.23e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16673 | -| time_elapsed | 89537 | -| total_timesteps | 2134144 | -| train/ | | -| approx_kl | 0.038987346 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.833 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 166720 | -| policy_gradient_loss | -0.0109 | -| std | 0.00857 | -| value_loss | 0.00052 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16674 | -| time_elapsed | 89543 | -| total_timesteps | 2134272 | -| train/ | | -| approx_kl | 0.35850698 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 166730 | -| policy_gradient_loss | 0.0948 | -| std | 0.00857 | -| value_loss | 3.43e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16675 | -| time_elapsed | 89548 | -| total_timesteps | 2134400 | -| train/ | | -| approx_kl | 0.013164554 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.964 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 166740 | -| policy_gradient_loss | -0.00423 | -| std | 0.00857 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16676 | -| time_elapsed | 89555 | -| total_timesteps | 2134528 | -| train/ | | -| approx_kl | 0.010106197 | -| clip_fraction | 0.0719 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00318 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 166750 | -| policy_gradient_loss | -0.00638 | -| std | 0.00857 | -| value_loss | 3.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16677 | -| time_elapsed | 89560 | -| total_timesteps | 2134656 | -| train/ | | -| approx_kl | 0.0091171395 | -| clip_fraction | 0.0625 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.000851 | -| n_updates | 166760 | -| policy_gradient_loss | -0.000531 | -| std | 0.00857 | -| value_loss | 1.95e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16678 | -| time_elapsed | 89565 | -| total_timesteps | 2134784 | -| train/ | | -| approx_kl | 0.016231358 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 166770 | -| policy_gradient_loss | 0.0147 | -| std | 0.00857 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 16679 | -| time_elapsed | 89569 | -| total_timesteps | 2134912 | -| train/ | | -| approx_kl | 0.07854995 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.0619 | -| n_updates | 166780 | -| policy_gradient_loss | 0.0285 | -| std | 0.00857 | -| value_loss | 8.49e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16680 | -| time_elapsed | 89573 | -| total_timesteps | 2135040 | -| train/ | | -| approx_kl | 0.41559142 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 166790 | -| policy_gradient_loss | 0.0333 | -| std | 0.00857 | -| value_loss | 8.4e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16681 | -| time_elapsed | 89583 | -| total_timesteps | 2135168 | -| train/ | | -| approx_kl | 0.038379803 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.833 | -| learning_rate | 0.0003 | -| loss | 0.000897 | -| n_updates | 166800 | -| policy_gradient_loss | 0.00129 | -| std | 0.00857 | -| value_loss | 0.00276 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16682 | -| time_elapsed | 89588 | -| total_timesteps | 2135296 | -| train/ | | -| approx_kl | 0.1793286 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0597 | -| learning_rate | 0.0003 | -| loss | 0.0959 | -| n_updates | 166810 | -| policy_gradient_loss | 0.0366 | -| std | 0.00856 | -| value_loss | 4.84e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16683 | -| time_elapsed | 89593 | -| total_timesteps | 2135424 | -| train/ | | -| approx_kl | 0.04185396 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.0292 | -| n_updates | 166820 | -| policy_gradient_loss | 0.0451 | -| std | 0.00856 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16684 | -| time_elapsed | 89598 | -| total_timesteps | 2135552 | -| train/ | | -| approx_kl | 0.014505452 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | -0.0086 | -| n_updates | 166830 | -| policy_gradient_loss | 0.00825 | -| std | 0.00856 | -| value_loss | 7.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16685 | -| time_elapsed | 89604 | -| total_timesteps | 2135680 | -| train/ | | -| approx_kl | 0.10809697 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0532 | -| n_updates | 166840 | -| policy_gradient_loss | 0.00693 | -| std | 0.00856 | -| value_loss | 4.52e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16686 | -| time_elapsed | 89611 | -| total_timesteps | 2135808 | -| train/ | | -| approx_kl | 0.0787126 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 166850 | -| policy_gradient_loss | 0.00912 | -| std | 0.00856 | -| value_loss | 3.14e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16687 | -| time_elapsed | 89616 | -| total_timesteps | 2135936 | -| train/ | | -| approx_kl | 0.0171603 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 166860 | -| policy_gradient_loss | 0.0122 | -| std | 0.00857 | -| value_loss | 2.06e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16688 | -| time_elapsed | 89620 | -| total_timesteps | 2136064 | -| train/ | | -| approx_kl | 0.055856843 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 166870 | -| policy_gradient_loss | 0.0115 | -| std | 0.00857 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16689 | -| time_elapsed | 89630 | -| total_timesteps | 2136192 | -| train/ | | -| approx_kl | 0.036716703 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -6.53 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 166880 | -| policy_gradient_loss | -0.0114 | -| std | 0.00857 | -| value_loss | 0.00316 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16690 | -| time_elapsed | 89636 | -| total_timesteps | 2136320 | -| train/ | | -| approx_kl | 0.098621845 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 166890 | -| policy_gradient_loss | 0.0296 | -| std | 0.00857 | -| value_loss | 1.69e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16691 | -| time_elapsed | 89642 | -| total_timesteps | 2136448 | -| train/ | | -| approx_kl | 0.24770927 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 166900 | -| policy_gradient_loss | 0.0879 | -| std | 0.00857 | -| value_loss | 4.19e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16692 | -| time_elapsed | 89650 | -| total_timesteps | 2136576 | -| train/ | | -| approx_kl | 0.13454153 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.0749 | -| n_updates | 166910 | -| policy_gradient_loss | 0.0733 | -| std | 0.00857 | -| value_loss | 2.2e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16693 | -| time_elapsed | 89655 | -| total_timesteps | 2136704 | -| train/ | | -| approx_kl | 0.11664039 | -| clip_fraction | 0.669 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0822 | -| n_updates | 166920 | -| policy_gradient_loss | 0.116 | -| std | 0.00857 | -| value_loss | 1.86e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16694 | -| time_elapsed | 89659 | -| total_timesteps | 2136832 | -| train/ | | -| approx_kl | 0.018074669 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | 0.00765 | -| n_updates | 166930 | -| policy_gradient_loss | 0.0228 | -| std | 0.00857 | -| value_loss | 6.81e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 16695 | -| time_elapsed | 89665 | -| total_timesteps | 2136960 | -| train/ | | -| approx_kl | 0.02521918 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.00683 | -| n_updates | 166940 | -| policy_gradient_loss | 0.000741 | -| std | 0.00858 | -| value_loss | 1.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16696 | -| time_elapsed | 89670 | -| total_timesteps | 2137088 | -| train/ | | -| approx_kl | 0.082820676 | -| clip_fraction | 0.611 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.074 | -| n_updates | 166950 | -| policy_gradient_loss | 0.176 | -| std | 0.00858 | -| value_loss | 1.82e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16697 | -| time_elapsed | 89683 | -| total_timesteps | 2137216 | -| train/ | | -| approx_kl | 0.33542573 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 166960 | -| policy_gradient_loss | 0.00513 | -| std | 0.00858 | -| value_loss | 0.000152 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16698 | -| time_elapsed | 89689 | -| total_timesteps | 2137344 | -| train/ | | -| approx_kl | 0.04454369 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 166970 | -| policy_gradient_loss | 0.00838 | -| std | 0.00858 | -| value_loss | 6.7e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16699 | -| time_elapsed | 89695 | -| total_timesteps | 2137472 | -| train/ | | -| approx_kl | 0.32695755 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | 0.072 | -| n_updates | 166980 | -| policy_gradient_loss | 0.0237 | -| std | 0.00858 | -| value_loss | 8.58e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16700 | -| time_elapsed | 89703 | -| total_timesteps | 2137600 | -| train/ | | -| approx_kl | 0.007915135 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.338 | -| learning_rate | 0.0003 | -| loss | -0.00476 | -| n_updates | 166990 | -| policy_gradient_loss | 0.00183 | -| std | 0.00858 | -| value_loss | 3.55e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16701 | -| time_elapsed | 89710 | -| total_timesteps | 2137728 | -| train/ | | -| approx_kl | 0.049664456 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 167000 | -| policy_gradient_loss | 0.0107 | -| std | 0.00857 | -| value_loss | 2.42e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16702 | -| time_elapsed | 89716 | -| total_timesteps | 2137856 | -| train/ | | -| approx_kl | 0.035157643 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.0076 | -| n_updates | 167010 | -| policy_gradient_loss | 0.0042 | -| std | 0.00858 | -| value_loss | 1.39e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 16703 | -| time_elapsed | 89722 | -| total_timesteps | 2137984 | -| train/ | | -| approx_kl | 0.0049846424 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | -0.000946 | -| n_updates | 167020 | -| policy_gradient_loss | 0.00255 | -| std | 0.00858 | -| value_loss | 1.37e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16704 | -| time_elapsed | 89727 | -| total_timesteps | 2138112 | -| train/ | | -| approx_kl | 0.050817594 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 167030 | -| policy_gradient_loss | 0.0121 | -| std | 0.00859 | -| value_loss | 1.55e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16705 | -| time_elapsed | 89744 | -| total_timesteps | 2138240 | -| train/ | | -| approx_kl | 0.007275612 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -3.33 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 167040 | -| policy_gradient_loss | -0.0149 | -| std | 0.00859 | -| value_loss | 0.00249 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16706 | -| time_elapsed | 89750 | -| total_timesteps | 2138368 | -| train/ | | -| approx_kl | 0.023954913 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 167050 | -| policy_gradient_loss | 0.00446 | -| std | 0.00859 | -| value_loss | 7.67e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16707 | -| time_elapsed | 89756 | -| total_timesteps | 2138496 | -| train/ | | -| approx_kl | 2.3682602e-05 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -32.4 | -| learning_rate | 0.0003 | -| loss | -0.000497 | -| n_updates | 167060 | -| policy_gradient_loss | 0.00733 | -| std | 0.00858 | -| value_loss | 6.02e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16708 | -| time_elapsed | 89761 | -| total_timesteps | 2138624 | -| train/ | | -| approx_kl | 0.031923935 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -5.5 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 167070 | -| policy_gradient_loss | 0.0116 | -| std | 0.00856 | -| value_loss | 1.17e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16709 | -| time_elapsed | 89768 | -| total_timesteps | 2138752 | -| train/ | | -| approx_kl | 0.41153038 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0665 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 167080 | -| policy_gradient_loss | 0.0527 | -| std | 0.00856 | -| value_loss | 1.64e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 16710 | -| time_elapsed | 89775 | -| total_timesteps | 2138880 | -| train/ | | -| approx_kl | 0.025215343 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.0043 | -| n_updates | 167090 | -| policy_gradient_loss | -0.000779 | -| std | 0.00856 | -| value_loss | 1.39e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16711 | -| time_elapsed | 89782 | -| total_timesteps | 2139008 | -| train/ | | -| approx_kl | 0.037056 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.00273 | -| n_updates | 167100 | -| policy_gradient_loss | 0.000125 | -| std | 0.00856 | -| value_loss | 9.49e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16712 | -| time_elapsed | 89800 | -| total_timesteps | 2139136 | -| train/ | | -| approx_kl | 0.023921631 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 167110 | -| policy_gradient_loss | -0.0193 | -| std | 0.00856 | -| value_loss | 0.00094 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16713 | -| time_elapsed | 89807 | -| total_timesteps | 2139264 | -| train/ | | -| approx_kl | 0.060871195 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.472 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 167120 | -| policy_gradient_loss | -0.012 | -| std | 0.00857 | -| value_loss | 2.07e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16714 | -| time_elapsed | 89813 | -| total_timesteps | 2139392 | -| train/ | | -| approx_kl | 0.017452186 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -3.89 | -| learning_rate | 0.0003 | -| loss | 0.0026 | -| n_updates | 167130 | -| policy_gradient_loss | 0.00406 | -| std | 0.00857 | -| value_loss | 4.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16715 | -| time_elapsed | 89823 | -| total_timesteps | 2139520 | -| train/ | | -| approx_kl | 0.006400332 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | 0.000128 | -| n_updates | 167140 | -| policy_gradient_loss | 0.00346 | -| std | 0.00857 | -| value_loss | 7.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16716 | -| time_elapsed | 89832 | -| total_timesteps | 2139648 | -| train/ | | -| approx_kl | 0.04092586 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 1.65e-05 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 167150 | -| policy_gradient_loss | 0.0252 | -| std | 0.00857 | -| value_loss | 1.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16717 | -| time_elapsed | 89838 | -| total_timesteps | 2139776 | -| train/ | | -| approx_kl | 0.61905926 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.491 | -| n_updates | 167160 | -| policy_gradient_loss | 0.186 | -| std | 0.00857 | -| value_loss | 9e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 16718 | -| time_elapsed | 89845 | -| total_timesteps | 2139904 | -| train/ | | -| approx_kl | 0.0026369104 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.00623 | -| learning_rate | 0.0003 | -| loss | -0.001 | -| n_updates | 167170 | -| policy_gradient_loss | 0.00962 | -| std | 0.00858 | -| value_loss | 1.96e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16719 | -| time_elapsed | 89851 | -| total_timesteps | 2140032 | -| train/ | | -| approx_kl | 0.0010871533 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 167180 | -| policy_gradient_loss | 0.000667 | -| std | 0.00858 | -| value_loss | 1.06e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16720 | -| time_elapsed | 89862 | -| total_timesteps | 2140160 | -| train/ | | -| approx_kl | 0.018829398 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.769 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 167190 | -| policy_gradient_loss | 0.000496 | -| std | 0.00859 | -| value_loss | 0.00488 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16721 | -| time_elapsed | 89867 | -| total_timesteps | 2140288 | -| train/ | | -| approx_kl | 0.001514161 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 167200 | -| policy_gradient_loss | 0.0193 | -| std | 0.00859 | -| value_loss | 1.65e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16722 | -| time_elapsed | 89874 | -| total_timesteps | 2140416 | -| train/ | | -| approx_kl | 0.4052216 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00786 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 167210 | -| policy_gradient_loss | 0.0317 | -| std | 0.00859 | -| value_loss | 1.71e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16723 | -| time_elapsed | 89878 | -| total_timesteps | 2140544 | -| train/ | | -| approx_kl | 0.008444352 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 167220 | -| policy_gradient_loss | 0.00214 | -| std | 0.00859 | -| value_loss | 9.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16724 | -| time_elapsed | 89882 | -| total_timesteps | 2140672 | -| train/ | | -| approx_kl | 0.020802654 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 167230 | -| policy_gradient_loss | 0.093 | -| std | 0.00858 | -| value_loss | 7.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16725 | -| time_elapsed | 89888 | -| total_timesteps | 2140800 | -| train/ | | -| approx_kl | 0.049455848 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 167240 | -| policy_gradient_loss | 0.0704 | -| std | 0.00858 | -| value_loss | 5.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 16726 | -| time_elapsed | 89895 | -| total_timesteps | 2140928 | -| train/ | | -| approx_kl | 0.068346635 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0766 | -| n_updates | 167250 | -| policy_gradient_loss | 0.0791 | -| std | 0.00858 | -| value_loss | 3.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16727 | -| time_elapsed | 89901 | -| total_timesteps | 2141056 | -| train/ | | -| approx_kl | 0.016509745 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.0092 | -| n_updates | 167260 | -| policy_gradient_loss | 0.0198 | -| std | 0.00859 | -| value_loss | 2.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16728 | -| time_elapsed | 89912 | -| total_timesteps | 2141184 | -| train/ | | -| approx_kl | 0.007005309 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 1 | -| learning_rate | 0.0003 | -| loss | -0.00536 | -| n_updates | 167270 | -| policy_gradient_loss | 0.0116 | -| std | 0.00858 | -| value_loss | 3.67e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16729 | -| time_elapsed | 89917 | -| total_timesteps | 2141312 | -| train/ | | -| approx_kl | 0.0048622447 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 167280 | -| policy_gradient_loss | 0.0221 | -| std | 0.00858 | -| value_loss | 5.37e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16730 | -| time_elapsed | 89921 | -| total_timesteps | 2141440 | -| train/ | | -| approx_kl | 0.0052726297 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 167290 | -| policy_gradient_loss | 0.0211 | -| std | 0.00857 | -| value_loss | 2.94e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16731 | -| time_elapsed | 89927 | -| total_timesteps | 2141568 | -| train/ | | -| approx_kl | 0.0010287217 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -0.000872 | -| n_updates | 167300 | -| policy_gradient_loss | 0.0224 | -| std | 0.00858 | -| value_loss | 5.69e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16732 | -| time_elapsed | 89932 | -| total_timesteps | 2141696 | -| train/ | | -| approx_kl | 0.006557395 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.00736 | -| n_updates | 167310 | -| policy_gradient_loss | 0.0189 | -| std | 0.00859 | -| value_loss | 7.32e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16733 | -| time_elapsed | 89941 | -| total_timesteps | 2141824 | -| train/ | | -| approx_kl | 0.07227141 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.916 | -| learning_rate | 0.0003 | -| loss | 0.00582 | -| n_updates | 167320 | -| policy_gradient_loss | 0.0245 | -| std | 0.00859 | -| value_loss | 5.4e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 16734 | -| time_elapsed | 89948 | -| total_timesteps | 2141952 | -| train/ | | -| approx_kl | 0.13351436 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 167330 | -| policy_gradient_loss | 0.0268 | -| std | 0.00859 | -| value_loss | 3.07e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16735 | -| time_elapsed | 89954 | -| total_timesteps | 2142080 | -| train/ | | -| approx_kl | 0.0011352142 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | -0.00044 | -| n_updates | 167340 | -| policy_gradient_loss | 0.00791 | -| std | 0.00855 | -| value_loss | 2e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16736 | -| time_elapsed | 89964 | -| total_timesteps | 2142208 | -| train/ | | -| approx_kl | 0.014412124 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 167350 | -| policy_gradient_loss | 0.0195 | -| std | 0.00852 | -| value_loss | 0.0016 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16737 | -| time_elapsed | 89969 | -| total_timesteps | 2142336 | -| train/ | | -| approx_kl | 0.17988256 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 167360 | -| policy_gradient_loss | 0.123 | -| std | 0.00851 | -| value_loss | 5.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16738 | -| time_elapsed | 89974 | -| total_timesteps | 2142464 | -| train/ | | -| approx_kl | 0.025632558 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00456 | -| learning_rate | 0.0003 | -| loss | 0.00969 | -| n_updates | 167370 | -| policy_gradient_loss | 0.0202 | -| std | 0.0085 | -| value_loss | 6.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16739 | -| time_elapsed | 89980 | -| total_timesteps | 2142592 | -| train/ | | -| approx_kl | 0.26125866 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 167380 | -| policy_gradient_loss | 0.124 | -| std | 0.0085 | -| value_loss | 4.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16740 | -| time_elapsed | 89986 | -| total_timesteps | 2142720 | -| train/ | | -| approx_kl | 0.09814306 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0712 | -| n_updates | 167390 | -| policy_gradient_loss | 0.073 | -| std | 0.0085 | -| value_loss | 2.61e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16741 | -| time_elapsed | 89992 | -| total_timesteps | 2142848 | -| train/ | | -| approx_kl | 0.02075333 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 167400 | -| policy_gradient_loss | 0.0128 | -| std | 0.0085 | -| value_loss | 2.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16742 | -| time_elapsed | 89999 | -| total_timesteps | 2142976 | -| train/ | | -| approx_kl | 0.08557849 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 167410 | -| policy_gradient_loss | 0.00336 | -| std | 0.00849 | -| value_loss | 6.47e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16743 | -| time_elapsed | 90005 | -| total_timesteps | 2143104 | -| train/ | | -| approx_kl | 0.0035385387 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 167420 | -| policy_gradient_loss | 0.0148 | -| std | 0.00848 | -| value_loss | 8.73e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16744 | -| time_elapsed | 90023 | -| total_timesteps | 2143232 | -| train/ | | -| approx_kl | 0.027051333 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.00526 | -| n_updates | 167430 | -| policy_gradient_loss | -0.00425 | -| std | 0.00848 | -| value_loss | 0.00135 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16745 | -| time_elapsed | 90029 | -| total_timesteps | 2143360 | -| train/ | | -| approx_kl | 0.08326525 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00803 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 167440 | -| policy_gradient_loss | -0.0167 | -| std | 0.00848 | -| value_loss | 2.06e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16746 | -| time_elapsed | 90036 | -| total_timesteps | 2143488 | -| train/ | | -| approx_kl | 0.029957723 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 167450 | -| policy_gradient_loss | 0.00962 | -| std | 0.00848 | -| value_loss | 4.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16747 | -| time_elapsed | 90042 | -| total_timesteps | 2143616 | -| train/ | | -| approx_kl | 0.019327983 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00513 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 167460 | -| policy_gradient_loss | 0.06 | -| std | 0.00848 | -| value_loss | 3.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16748 | -| time_elapsed | 90049 | -| total_timesteps | 2143744 | -| train/ | | -| approx_kl | 0.010373829 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.38 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 167470 | -| policy_gradient_loss | 0.000807 | -| std | 0.00847 | -| value_loss | 4.16e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 16749 | -| time_elapsed | 90056 | -| total_timesteps | 2143872 | -| train/ | | -| approx_kl | 0.06435213 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00258 | -| learning_rate | 0.0003 | -| loss | 0.00768 | -| n_updates | 167480 | -| policy_gradient_loss | 0.012 | -| std | 0.00847 | -| value_loss | 2.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16750 | -| time_elapsed | 90062 | -| total_timesteps | 2144000 | -| train/ | | -| approx_kl | 0.24777094 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00761 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 167490 | -| policy_gradient_loss | 0.11 | -| std | 0.00847 | -| value_loss | 2.35e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16751 | -| time_elapsed | 90068 | -| total_timesteps | 2144128 | -| train/ | | -| approx_kl | 0.14960495 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00239 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 167500 | -| policy_gradient_loss | 0.105 | -| std | 0.00848 | -| value_loss | 1.19e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16752 | -| time_elapsed | 90083 | -| total_timesteps | 2144256 | -| train/ | | -| approx_kl | 0.22455019 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 167510 | -| policy_gradient_loss | 0.00942 | -| std | 0.00848 | -| value_loss | 0.000111 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16753 | -| time_elapsed | 90089 | -| total_timesteps | 2144384 | -| train/ | | -| approx_kl | 0.028226119 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0665 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 167520 | -| policy_gradient_loss | 0.0287 | -| std | 0.00848 | -| value_loss | 2.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16754 | -| time_elapsed | 90096 | -| total_timesteps | 2144512 | -| train/ | | -| approx_kl | 0.022560656 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | 0.0436 | -| n_updates | 167530 | -| policy_gradient_loss | 0.000151 | -| std | 0.00848 | -| value_loss | 1.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16755 | -| time_elapsed | 90101 | -| total_timesteps | 2144640 | -| train/ | | -| approx_kl | 0.07087902 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 167540 | -| policy_gradient_loss | 0.027 | -| std | 0.00848 | -| value_loss | 1.17e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16756 | -| time_elapsed | 90108 | -| total_timesteps | 2144768 | -| train/ | | -| approx_kl | 0.22173011 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 167550 | -| policy_gradient_loss | 0.114 | -| std | 0.00847 | -| value_loss | 6.8e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 16757 | -| time_elapsed | 90115 | -| total_timesteps | 2144896 | -| train/ | | -| approx_kl | 0.114836596 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.0793 | -| n_updates | 167560 | -| policy_gradient_loss | 0.0861 | -| std | 0.00847 | -| value_loss | 2.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16758 | -| time_elapsed | 90121 | -| total_timesteps | 2145024 | -| train/ | | -| approx_kl | 0.022191742 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | 0.00719 | -| n_updates | 167570 | -| policy_gradient_loss | 0.0104 | -| std | 0.00847 | -| value_loss | 2.82e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16759 | -| time_elapsed | 90133 | -| total_timesteps | 2145152 | -| train/ | | -| approx_kl | 0.008107241 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 167580 | -| policy_gradient_loss | -0.0116 | -| std | 0.00847 | -| value_loss | 4.66e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16760 | -| time_elapsed | 90139 | -| total_timesteps | 2145280 | -| train/ | | -| approx_kl | 0.021998767 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.29 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 167590 | -| policy_gradient_loss | 0.000328 | -| std | 0.00846 | -| value_loss | 0.00186 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16761 | -| time_elapsed | 90143 | -| total_timesteps | 2145408 | -| train/ | | -| approx_kl | 0.041815326 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0955 | -| learning_rate | 0.0003 | -| loss | 0.00316 | -| n_updates | 167600 | -| policy_gradient_loss | 0.000378 | -| std | 0.00846 | -| value_loss | 4.22e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16762 | -| time_elapsed | 90150 | -| total_timesteps | 2145536 | -| train/ | | -| approx_kl | 0.006299767 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -8.77e-05 | -| n_updates | 167610 | -| policy_gradient_loss | 0.00259 | -| std | 0.00846 | -| value_loss | 4.28e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16763 | -| time_elapsed | 90156 | -| total_timesteps | 2145664 | -| train/ | | -| approx_kl | 0.051301908 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.00687 | -| n_updates | 167620 | -| policy_gradient_loss | -0.000267 | -| std | 0.00847 | -| value_loss | 5.53e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16764 | -| time_elapsed | 90162 | -| total_timesteps | 2145792 | -| train/ | | -| approx_kl | 0.006786306 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.0012 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 167630 | -| policy_gradient_loss | -0.00111 | -| std | 0.00847 | -| value_loss | 1.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 16765 | -| time_elapsed | 90168 | -| total_timesteps | 2145920 | -| train/ | | -| approx_kl | 0.028484859 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 167640 | -| policy_gradient_loss | -0.00118 | -| std | 0.00847 | -| value_loss | 1.61e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16766 | -| time_elapsed | 90173 | -| total_timesteps | 2146048 | -| train/ | | -| approx_kl | 0.053478755 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 167650 | -| policy_gradient_loss | 0.0843 | -| std | 0.00847 | -| value_loss | 5.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16767 | -| time_elapsed | 90184 | -| total_timesteps | 2146176 | -| train/ | | -| approx_kl | 0.058575433 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 167660 | -| policy_gradient_loss | -0.00792 | -| std | 0.00847 | -| value_loss | 0.0024 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16768 | -| time_elapsed | 90190 | -| total_timesteps | 2146304 | -| train/ | | -| approx_kl | 0.037520472 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 167670 | -| policy_gradient_loss | 0.0516 | -| std | 0.00847 | -| value_loss | 4.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16769 | -| time_elapsed | 90197 | -| total_timesteps | 2146432 | -| train/ | | -| approx_kl | 0.016266786 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.00706 | -| n_updates | 167680 | -| policy_gradient_loss | 0.0289 | -| std | 0.00847 | -| value_loss | 2.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16770 | -| time_elapsed | 90204 | -| total_timesteps | 2146560 | -| train/ | | -| approx_kl | 0.07972731 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | 0.0654 | -| n_updates | 167690 | -| policy_gradient_loss | 0.0308 | -| std | 0.00847 | -| value_loss | 1.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16771 | -| time_elapsed | 90211 | -| total_timesteps | 2146688 | -| train/ | | -| approx_kl | 0.004078053 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.00364 | -| n_updates | 167700 | -| policy_gradient_loss | 0.00705 | -| std | 0.00847 | -| value_loss | 8.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16772 | -| time_elapsed | 90215 | -| total_timesteps | 2146816 | -| train/ | | -| approx_kl | 0.025454298 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 167710 | -| policy_gradient_loss | 0.0197 | -| std | 0.00847 | -| value_loss | 7.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 16773 | -| time_elapsed | 90226 | -| total_timesteps | 2146944 | -| train/ | | -| approx_kl | 0.07597582 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 167720 | -| policy_gradient_loss | 0.0346 | -| std | 0.00847 | -| value_loss | 3.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16774 | -| time_elapsed | 90231 | -| total_timesteps | 2147072 | -| train/ | | -| approx_kl | 0.07118966 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 167730 | -| policy_gradient_loss | 0.00336 | -| std | 0.00847 | -| value_loss | 2.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16775 | -| time_elapsed | 90242 | -| total_timesteps | 2147200 | -| train/ | | -| approx_kl | 0.022744427 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 167740 | -| policy_gradient_loss | -0.00874 | -| std | 0.00847 | -| value_loss | 0.00163 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16776 | -| time_elapsed | 90247 | -| total_timesteps | 2147328 | -| train/ | | -| approx_kl | 0.20797831 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00553 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 167750 | -| policy_gradient_loss | 0.0562 | -| std | 0.00847 | -| value_loss | 1.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16777 | -| time_elapsed | 90253 | -| total_timesteps | 2147456 | -| train/ | | -| approx_kl | 0.00432421 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | -0.008 | -| n_updates | 167760 | -| policy_gradient_loss | 0.00397 | -| std | 0.00847 | -| value_loss | 3.75e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16778 | -| time_elapsed | 90259 | -| total_timesteps | 2147584 | -| train/ | | -| approx_kl | 0.05551541 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | 0.0413 | -| n_updates | 167770 | -| policy_gradient_loss | 0.0606 | -| std | 0.00847 | -| value_loss | 2.63e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16779 | -| time_elapsed | 90265 | -| total_timesteps | 2147712 | -| train/ | | -| approx_kl | 0.16566485 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 167780 | -| policy_gradient_loss | 0.0263 | -| std | 0.00847 | -| value_loss | 1.48e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16780 | -| time_elapsed | 90274 | -| total_timesteps | 2147840 | -| train/ | | -| approx_kl | 0.0011029877 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 167790 | -| policy_gradient_loss | 0.00143 | -| std | 0.00847 | -| value_loss | 9.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 16781 | -| time_elapsed | 90281 | -| total_timesteps | 2147968 | -| train/ | | -| approx_kl | 0.058646195 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 167800 | -| policy_gradient_loss | 0.0441 | -| std | 0.00848 | -| value_loss | 6.74e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16782 | -| time_elapsed | 90289 | -| total_timesteps | 2148096 | -| train/ | | -| approx_kl | 0.030928774 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 167810 | -| policy_gradient_loss | 0.018 | -| std | 0.00848 | -| value_loss | 7.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16783 | -| time_elapsed | 90303 | -| total_timesteps | 2148224 | -| train/ | | -| approx_kl | 0.005811657 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 167820 | -| policy_gradient_loss | 0.0108 | -| std | 0.00848 | -| value_loss | 0.000117 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16784 | -| time_elapsed | 90310 | -| total_timesteps | 2148352 | -| train/ | | -| approx_kl | 0.1816183 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.466 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 167830 | -| policy_gradient_loss | 0.0557 | -| std | 0.00848 | -| value_loss | 2.59e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16785 | -| time_elapsed | 90318 | -| total_timesteps | 2148480 | -| train/ | | -| approx_kl | 0.034239568 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00271 | -| learning_rate | 0.0003 | -| loss | 0.00502 | -| n_updates | 167840 | -| policy_gradient_loss | 0.0452 | -| std | 0.00848 | -| value_loss | 2.32e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16786 | -| time_elapsed | 90323 | -| total_timesteps | 2148608 | -| train/ | | -| approx_kl | 0.0349877 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00879 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 167850 | -| policy_gradient_loss | 0.0226 | -| std | 0.00848 | -| value_loss | 1.14e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16787 | -| time_elapsed | 90329 | -| total_timesteps | 2148736 | -| train/ | | -| approx_kl | 0.118013754 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 167860 | -| policy_gradient_loss | 0.0229 | -| std | 0.00848 | -| value_loss | 6.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16788 | -| time_elapsed | 90335 | -| total_timesteps | 2148864 | -| train/ | | -| approx_kl | 0.038282897 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 167870 | -| policy_gradient_loss | 0.0546 | -| std | 0.00848 | -| value_loss | 4.2e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 16789 | -| time_elapsed | 90342 | -| total_timesteps | 2148992 | -| train/ | | -| approx_kl | 0.00029753242 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -7.3e-05 | -| n_updates | 167880 | -| policy_gradient_loss | 0.0652 | -| std | 0.00847 | -| value_loss | 3.54e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16790 | -| time_elapsed | 90348 | -| total_timesteps | 2149120 | -| train/ | | -| approx_kl | 0.013506016 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 167890 | -| policy_gradient_loss | 0.0257 | -| std | 0.00846 | -| value_loss | 3.63e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16791 | -| time_elapsed | 90366 | -| total_timesteps | 2149248 | -| train/ | | -| approx_kl | 0.0075584976 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -6.41 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 167900 | -| policy_gradient_loss | -0.00684 | -| std | 0.00846 | -| value_loss | 0.00323 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16792 | -| time_elapsed | 90372 | -| total_timesteps | 2149376 | -| train/ | | -| approx_kl | 0.00023105368 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -5.82 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 167910 | -| policy_gradient_loss | 0.00918 | -| std | 0.00846 | -| value_loss | 1.19e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16793 | -| time_elapsed | 90378 | -| total_timesteps | 2149504 | -| train/ | | -| approx_kl | 0.24703528 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -5.3 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 167920 | -| policy_gradient_loss | 0.0602 | -| std | 0.00845 | -| value_loss | 2.83e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16794 | -| time_elapsed | 90383 | -| total_timesteps | 2149632 | -| train/ | | -| approx_kl | 0.13435422 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -49.3 | -| learning_rate | 0.0003 | -| loss | 0.057 | -| n_updates | 167930 | -| policy_gradient_loss | 0.0319 | -| std | 0.00845 | -| value_loss | 5.07e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16795 | -| time_elapsed | 90390 | -| total_timesteps | 2149760 | -| train/ | | -| approx_kl | 0.029403413 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -5.84 | -| learning_rate | 0.0003 | -| loss | 0.00278 | -| n_updates | 167940 | -| policy_gradient_loss | 0.0059 | -| std | 0.00845 | -| value_loss | 1.54e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 16796 | -| time_elapsed | 90397 | -| total_timesteps | 2149888 | -| train/ | | -| approx_kl | 0.30938447 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -5.66 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 167950 | -| policy_gradient_loss | 0.0146 | -| std | 0.00845 | -| value_loss | 1.82e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16797 | -| time_elapsed | 90403 | -| total_timesteps | 2150016 | -| train/ | | -| approx_kl | 0.032780338 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.457 | -| learning_rate | 0.0003 | -| loss | 0.00136 | -| n_updates | 167960 | -| policy_gradient_loss | 0.00207 | -| std | 0.00845 | -| value_loss | 2.14e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16798 | -| time_elapsed | 90417 | -| total_timesteps | 2150144 | -| train/ | | -| approx_kl | 0.032294005 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 167970 | -| policy_gradient_loss | 0.00791 | -| std | 0.00845 | -| value_loss | 3.56e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16799 | -| time_elapsed | 90422 | -| total_timesteps | 2150272 | -| train/ | | -| approx_kl | 0.0031415634 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.0526 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 167980 | -| policy_gradient_loss | 0.00362 | -| std | 0.00845 | -| value_loss | 2.16e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16800 | -| time_elapsed | 90430 | -| total_timesteps | 2150400 | -| train/ | | -| approx_kl | 0.052196726 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00641 | -| learning_rate | 0.0003 | -| loss | 0.00848 | -| n_updates | 167990 | -| policy_gradient_loss | 0.00139 | -| std | 0.00845 | -| value_loss | 2.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16801 | -| time_elapsed | 90440 | -| total_timesteps | 2150528 | -| train/ | | -| approx_kl | 0.14938036 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 168000 | -| policy_gradient_loss | 0.0245 | -| std | 0.00846 | -| value_loss | 1.14e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16802 | -| time_elapsed | 90447 | -| total_timesteps | 2150656 | -| train/ | | -| approx_kl | 0.27138922 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.0879 | -| n_updates | 168010 | -| policy_gradient_loss | 0.0284 | -| std | 0.00846 | -| value_loss | 8.58e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16803 | -| time_elapsed | 90451 | -| total_timesteps | 2150784 | -| train/ | | -| approx_kl | 0.028667368 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 168020 | -| policy_gradient_loss | 0.00866 | -| std | 0.00846 | -| value_loss | 4.93e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 16804 | -| time_elapsed | 90459 | -| total_timesteps | 2150912 | -| train/ | | -| approx_kl | 2.9086135e-05 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.000644 | -| n_updates | 168030 | -| policy_gradient_loss | 0.00173 | -| std | 0.00846 | -| value_loss | 5.78e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16805 | -| time_elapsed | 90468 | -| total_timesteps | 2151040 | -| train/ | | -| approx_kl | 0.004943534 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | -0.00947 | -| n_updates | 168040 | -| policy_gradient_loss | 0.00184 | -| std | 0.00846 | -| value_loss | 2.46e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16806 | -| time_elapsed | 90482 | -| total_timesteps | 2151168 | -| train/ | | -| approx_kl | 0.11370695 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.79 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 168050 | -| policy_gradient_loss | 0.00996 | -| std | 0.00846 | -| value_loss | 0.00416 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16807 | -| time_elapsed | 90488 | -| total_timesteps | 2151296 | -| train/ | | -| approx_kl | 0.13874127 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.0915 | -| n_updates | 168060 | -| policy_gradient_loss | 0.0866 | -| std | 0.00846 | -| value_loss | 7.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16808 | -| time_elapsed | 90497 | -| total_timesteps | 2151424 | -| train/ | | -| approx_kl | 0.029236307 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00329 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 168070 | -| policy_gradient_loss | 0.0215 | -| std | 0.00846 | -| value_loss | 9.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16809 | -| time_elapsed | 90501 | -| total_timesteps | 2151552 | -| train/ | | -| approx_kl | 0.42694348 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 168080 | -| policy_gradient_loss | 0.0422 | -| std | 0.00846 | -| value_loss | 3.13e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16810 | -| time_elapsed | 90506 | -| total_timesteps | 2151680 | -| train/ | | -| approx_kl | 0.027064642 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 168090 | -| policy_gradient_loss | -0.00201 | -| std | 0.00846 | -| value_loss | 2.41e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16811 | -| time_elapsed | 90511 | -| total_timesteps | 2151808 | -| train/ | | -| approx_kl | 0.0054919403 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 168100 | -| policy_gradient_loss | 0.00272 | -| std | 0.00846 | -| value_loss | 1.59e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 16812 | -| time_elapsed | 90517 | -| total_timesteps | 2151936 | -| train/ | | -| approx_kl | 0.02694872 | -| clip_fraction | 0.581 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 168110 | -| policy_gradient_loss | 0.105 | -| std | 0.00846 | -| value_loss | 6.94e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16813 | -| time_elapsed | 90524 | -| total_timesteps | 2152064 | -| train/ | | -| approx_kl | 0.045676876 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00645 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 168120 | -| policy_gradient_loss | 0.0728 | -| std | 0.00846 | -| value_loss | 1.78e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16814 | -| time_elapsed | 90535 | -| total_timesteps | 2152192 | -| train/ | | -| approx_kl | 0.0066007455 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.0488 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 168130 | -| policy_gradient_loss | -0.00992 | -| std | 0.00846 | -| value_loss | 0.00142 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16815 | -| time_elapsed | 90542 | -| total_timesteps | 2152320 | -| train/ | | -| approx_kl | 0.24848802 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 168140 | -| policy_gradient_loss | 0.09 | -| std | 0.00846 | -| value_loss | 3.77e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16816 | -| time_elapsed | 90549 | -| total_timesteps | 2152448 | -| train/ | | -| approx_kl | 0.009732297 | -| clip_fraction | 0.0563 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | 0.000781 | -| n_updates | 168150 | -| policy_gradient_loss | 0.000303 | -| std | 0.00846 | -| value_loss | 2.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16817 | -| time_elapsed | 90558 | -| total_timesteps | 2152576 | -| train/ | | -| approx_kl | 0.016398916 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 168160 | -| policy_gradient_loss | 0.0142 | -| std | 0.00846 | -| value_loss | 4.74e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16818 | -| time_elapsed | 90565 | -| total_timesteps | 2152704 | -| train/ | | -| approx_kl | 0.080093235 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.043 | -| n_updates | 168170 | -| policy_gradient_loss | 0.0223 | -| std | 0.00846 | -| value_loss | 8.95e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16819 | -| time_elapsed | 90572 | -| total_timesteps | 2152832 | -| train/ | | -| approx_kl | 0.00013501197 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | -0.000959 | -| n_updates | 168180 | -| policy_gradient_loss | 0.0188 | -| std | 0.00845 | -| value_loss | 6.12e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 16820 | -| time_elapsed | 90577 | -| total_timesteps | 2152960 | -| train/ | | -| approx_kl | 0.10623316 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 168190 | -| policy_gradient_loss | 0.0124 | -| std | 0.00845 | -| value_loss | 4.26e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16821 | -| time_elapsed | 90584 | -| total_timesteps | 2153088 | -| train/ | | -| approx_kl | 0.011527198 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.00672 | -| n_updates | 168200 | -| policy_gradient_loss | 0.0211 | -| std | 0.00845 | -| value_loss | 4.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16822 | -| time_elapsed | 90595 | -| total_timesteps | 2153216 | -| train/ | | -| approx_kl | 0.052520033 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 168210 | -| policy_gradient_loss | 0.01 | -| std | 0.00845 | -| value_loss | 0.000237 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16823 | -| time_elapsed | 90602 | -| total_timesteps | 2153344 | -| train/ | | -| approx_kl | 1.36923045e-05 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.000176 | -| n_updates | 168220 | -| policy_gradient_loss | 0.0183 | -| std | 0.00845 | -| value_loss | 3e-06 | --------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16824 | -| time_elapsed | 90608 | -| total_timesteps | 2153472 | -| train/ | | -| approx_kl | 0.4213499 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00827 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 168230 | -| policy_gradient_loss | 0.0504 | -| std | 0.00845 | -| value_loss | 5.5e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16825 | -| time_elapsed | 90616 | -| total_timesteps | 2153600 | -| train/ | | -| approx_kl | 0.025486508 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 168240 | -| policy_gradient_loss | -0.00299 | -| std | 0.00845 | -| value_loss | 6.19e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16826 | -| time_elapsed | 90622 | -| total_timesteps | 2153728 | -| train/ | | -| approx_kl | 0.03415589 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 168250 | -| policy_gradient_loss | 0.00102 | -| std | 0.00846 | -| value_loss | 4.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16827 | -| time_elapsed | 90628 | -| total_timesteps | 2153856 | -| train/ | | -| approx_kl | 0.005820349 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 168260 | -| policy_gradient_loss | 0.00188 | -| std | 0.00845 | -| value_loss | 2.88e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 16828 | -| time_elapsed | 90634 | -| total_timesteps | 2153984 | -| train/ | | -| approx_kl | 0.02083813 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 168270 | -| policy_gradient_loss | 0.119 | -| std | 0.00845 | -| value_loss | 1.72e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16829 | -| time_elapsed | 90642 | -| total_timesteps | 2154112 | -| train/ | | -| approx_kl | 0.00628224 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 168280 | -| policy_gradient_loss | 0.0183 | -| std | 0.00845 | -| value_loss | 1.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16830 | -| time_elapsed | 90660 | -| total_timesteps | 2154240 | -| train/ | | -| approx_kl | 0.012921797 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 168290 | -| policy_gradient_loss | -0.00929 | -| std | 0.00845 | -| value_loss | 0.000746 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16831 | -| time_elapsed | 90666 | -| total_timesteps | 2154368 | -| train/ | | -| approx_kl | 0.05419583 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 168300 | -| policy_gradient_loss | 0.0131 | -| std | 0.00845 | -| value_loss | 8.62e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16832 | -| time_elapsed | 90675 | -| total_timesteps | 2154496 | -| train/ | | -| approx_kl | 0.50243306 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.743 | -| learning_rate | 0.0003 | -| loss | 0.226 | -| n_updates | 168310 | -| policy_gradient_loss | 0.0567 | -| std | 0.00845 | -| value_loss | 3.1e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16833 | -| time_elapsed | 90682 | -| total_timesteps | 2154624 | -| train/ | | -| approx_kl | 0.010608549 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | -0.00527 | -| n_updates | 168320 | -| policy_gradient_loss | 0.00304 | -| std | 0.00845 | -| value_loss | 1.94e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16834 | -| time_elapsed | 90689 | -| total_timesteps | 2154752 | -| train/ | | -| approx_kl | 0.04321793 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0855 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 168330 | -| policy_gradient_loss | 0.00635 | -| std | 0.00845 | -| value_loss | 1.21e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 16835 | -| time_elapsed | 90696 | -| total_timesteps | 2154880 | -| train/ | | -| approx_kl | 0.005979581 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | -0.00716 | -| n_updates | 168340 | -| policy_gradient_loss | -0.000281 | -| std | 0.00846 | -| value_loss | 7.38e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16836 | -| time_elapsed | 90703 | -| total_timesteps | 2155008 | -| train/ | | -| approx_kl | 0.0045983647 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00212 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 168350 | -| policy_gradient_loss | -0.000926 | -| std | 0.00848 | -| value_loss | 1.74e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16837 | -| time_elapsed | 90719 | -| total_timesteps | 2155136 | -| train/ | | -| approx_kl | 0.13571863 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 168360 | -| policy_gradient_loss | -0.0164 | -| std | 0.00849 | -| value_loss | 0.000204 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16838 | -| time_elapsed | 90726 | -| total_timesteps | 2155264 | -| train/ | | -| approx_kl | 0.017080098 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.507 | -| learning_rate | 0.0003 | -| loss | -0.000587 | -| n_updates | 168370 | -| policy_gradient_loss | 0.013 | -| std | 0.00849 | -| value_loss | 5.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16839 | -| time_elapsed | 90733 | -| total_timesteps | 2155392 | -| train/ | | -| approx_kl | 0.06341367 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 168380 | -| policy_gradient_loss | 0.00916 | -| std | 0.0085 | -| value_loss | 1.44e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16840 | -| time_elapsed | 90738 | -| total_timesteps | 2155520 | -| train/ | | -| approx_kl | 8.5339416e-05 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | -0.00058 | -| n_updates | 168390 | -| policy_gradient_loss | 0.0139 | -| std | 0.0085 | -| value_loss | 5.39e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16841 | -| time_elapsed | 90745 | -| total_timesteps | 2155648 | -| train/ | | -| approx_kl | 0.0004119831 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0561 | -| learning_rate | 0.0003 | -| loss | 0.00444 | -| n_updates | 168400 | -| policy_gradient_loss | 0.000257 | -| std | 0.0085 | -| value_loss | 3.96e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16842 | -| time_elapsed | 90752 | -| total_timesteps | 2155776 | -| train/ | | -| approx_kl | 0.02710717 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 168410 | -| policy_gradient_loss | 0.00807 | -| std | 0.00849 | -| value_loss | 2.19e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 16843 | -| time_elapsed | 90758 | -| total_timesteps | 2155904 | -| train/ | | -| approx_kl | 0.0003641569 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 168420 | -| policy_gradient_loss | 0.0194 | -| std | 0.0085 | -| value_loss | 1.65e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16844 | -| time_elapsed | 90763 | -| total_timesteps | 2156032 | -| train/ | | -| approx_kl | 0.3391146 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.0864 | -| n_updates | 168430 | -| policy_gradient_loss | 0.0278 | -| std | 0.0085 | -| value_loss | 1.02e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16845 | -| time_elapsed | 90780 | -| total_timesteps | 2156160 | -| train/ | | -| approx_kl | 0.06991916 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 168440 | -| policy_gradient_loss | -0.0142 | -| std | 0.0085 | -| value_loss | 0.00144 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16846 | -| time_elapsed | 90787 | -| total_timesteps | 2156288 | -| train/ | | -| approx_kl | 0.65381855 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.0294 | -| learning_rate | 0.0003 | -| loss | 0.19 | -| n_updates | 168450 | -| policy_gradient_loss | 0.132 | -| std | 0.0085 | -| value_loss | 2.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16847 | -| time_elapsed | 90793 | -| total_timesteps | 2156416 | -| train/ | | -| approx_kl | 0.033527087 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.337 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 168460 | -| policy_gradient_loss | 0.00296 | -| std | 0.00851 | -| value_loss | 1.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16848 | -| time_elapsed | 90798 | -| total_timesteps | 2156544 | -| train/ | | -| approx_kl | 0.013040068 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.467 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 168470 | -| policy_gradient_loss | -0.0105 | -| std | 0.00853 | -| value_loss | 3.8e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16849 | -| time_elapsed | 90802 | -| total_timesteps | 2156672 | -| train/ | | -| approx_kl | 0.0060169925 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 168480 | -| policy_gradient_loss | -0.00204 | -| std | 0.00856 | -| value_loss | 8.9e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16850 | -| time_elapsed | 90807 | -| total_timesteps | 2156800 | -| train/ | | -| approx_kl | 0.015610049 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00909 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 168490 | -| policy_gradient_loss | 0.0187 | -| std | 0.00857 | -| value_loss | 8.88e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 16851 | -| time_elapsed | 90813 | -| total_timesteps | 2156928 | -| train/ | | -| approx_kl | 0.06340426 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.364 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 168500 | -| policy_gradient_loss | 0.0153 | -| std | 0.00857 | -| value_loss | 4.95e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16852 | -| time_elapsed | 90819 | -| total_timesteps | 2157056 | -| train/ | | -| approx_kl | 0.0001204405 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | -6.17e-05 | -| n_updates | 168510 | -| policy_gradient_loss | 0.0173 | -| std | 0.00857 | -| value_loss | 2.91e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16853 | -| time_elapsed | 90829 | -| total_timesteps | 2157184 | -| train/ | | -| approx_kl | 0.014664562 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 168520 | -| policy_gradient_loss | -0.0103 | -| std | 0.00858 | -| value_loss | 0.00404 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16854 | -| time_elapsed | 90833 | -| total_timesteps | 2157312 | -| train/ | | -| approx_kl | 0.003146002 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00767 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 168530 | -| policy_gradient_loss | 0.019 | -| std | 0.00858 | -| value_loss | 2.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16855 | -| time_elapsed | 90838 | -| total_timesteps | 2157440 | -| train/ | | -| approx_kl | 0.23609716 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 168540 | -| policy_gradient_loss | 0.0305 | -| std | 0.00858 | -| value_loss | 3.13e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16856 | -| time_elapsed | 90843 | -| total_timesteps | 2157568 | -| train/ | | -| approx_kl | 1.968816e-05 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | 0.000884 | -| n_updates | 168550 | -| policy_gradient_loss | -0.00121 | -| std | 0.00859 | -| value_loss | 4.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16857 | -| time_elapsed | 90849 | -| total_timesteps | 2157696 | -| train/ | | -| approx_kl | 0.004385442 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 168560 | -| policy_gradient_loss | 0.00215 | -| std | 0.00859 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16858 | -| time_elapsed | 90854 | -| total_timesteps | 2157824 | -| train/ | | -| approx_kl | 0.026135333 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 168570 | -| policy_gradient_loss | 0.00134 | -| std | 0.00859 | -| value_loss | 4.95e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 16859 | -| time_elapsed | 90860 | -| total_timesteps | 2157952 | -| train/ | | -| approx_kl | 0.0035558026 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.000486 | -| learning_rate | 0.0003 | -| loss | -0.00477 | -| n_updates | 168580 | -| policy_gradient_loss | 0.0114 | -| std | 0.00859 | -| value_loss | 9.05e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16860 | -| time_elapsed | 90866 | -| total_timesteps | 2158080 | -| train/ | | -| approx_kl | 0.42733386 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.289 | -| n_updates | 168590 | -| policy_gradient_loss | 0.136 | -| std | 0.00859 | -| value_loss | 6.83e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16861 | -| time_elapsed | 90879 | -| total_timesteps | 2158208 | -| train/ | | -| approx_kl | 0.32255822 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.326 | -| learning_rate | 0.0003 | -| loss | 0.00718 | -| n_updates | 168600 | -| policy_gradient_loss | -0.0089 | -| std | 0.00859 | -| value_loss | 0.00157 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16862 | -| time_elapsed | 90888 | -| total_timesteps | 2158336 | -| train/ | | -| approx_kl | 0.02631127 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0696 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 168610 | -| policy_gradient_loss | 0.00793 | -| std | 0.00859 | -| value_loss | 2.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16863 | -| time_elapsed | 90896 | -| total_timesteps | 2158464 | -| train/ | | -| approx_kl | 0.030444093 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 168620 | -| policy_gradient_loss | 0.00528 | -| std | 0.00859 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16864 | -| time_elapsed | 90903 | -| total_timesteps | 2158592 | -| train/ | | -| approx_kl | 0.005224144 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0916 | -| learning_rate | 0.0003 | -| loss | -0.00739 | -| n_updates | 168630 | -| policy_gradient_loss | 0.00132 | -| std | 0.00859 | -| value_loss | 7.45e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16865 | -| time_elapsed | 90907 | -| total_timesteps | 2158720 | -| train/ | | -| approx_kl | 0.02197948 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 168640 | -| policy_gradient_loss | 0.00775 | -| std | 0.00858 | -| value_loss | 3.84e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16866 | -| time_elapsed | 90911 | -| total_timesteps | 2158848 | -| train/ | | -| approx_kl | 0.0050184727 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 168650 | -| policy_gradient_loss | 0.0187 | -| std | 0.00859 | -| value_loss | 2.73e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16867 | -| time_elapsed | 90917 | -| total_timesteps | 2158976 | -| train/ | | -| approx_kl | 0.12397751 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.0646 | -| n_updates | 168660 | -| policy_gradient_loss | 0.0265 | -| std | 0.00859 | -| value_loss | 1.65e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16868 | -| time_elapsed | 90924 | -| total_timesteps | 2159104 | -| train/ | | -| approx_kl | 0.042886205 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 168670 | -| policy_gradient_loss | 0.00146 | -| std | 0.00859 | -| value_loss | 1.06e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16869 | -| time_elapsed | 90939 | -| total_timesteps | 2159232 | -| train/ | | -| approx_kl | 0.07132426 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.833 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 168680 | -| policy_gradient_loss | -0.00584 | -| std | 0.00859 | -| value_loss | 0.00254 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16870 | -| time_elapsed | 90944 | -| total_timesteps | 2159360 | -| train/ | | -| approx_kl | 0.007591506 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.00953 | -| n_updates | 168690 | -| policy_gradient_loss | 0.0229 | -| std | 0.00859 | -| value_loss | 6.99e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16871 | -| time_elapsed | 90949 | -| total_timesteps | 2159488 | -| train/ | | -| approx_kl | 0.43757832 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.00132 | -| learning_rate | 0.0003 | -| loss | 0.232 | -| n_updates | 168700 | -| policy_gradient_loss | 0.132 | -| std | 0.00859 | -| value_loss | 5.89e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16872 | -| time_elapsed | 90953 | -| total_timesteps | 2159616 | -| train/ | | -| approx_kl | 0.00967906 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 168710 | -| policy_gradient_loss | 0.012 | -| std | 0.00859 | -| value_loss | 4.07e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16873 | -| time_elapsed | 90958 | -| total_timesteps | 2159744 | -| train/ | | -| approx_kl | 0.18978609 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 168720 | -| policy_gradient_loss | 0.104 | -| std | 0.00859 | -| value_loss | 3.26e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 16874 | -| time_elapsed | 90963 | -| total_timesteps | 2159872 | -| train/ | | -| approx_kl | 0.103861004 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 168730 | -| policy_gradient_loss | 0.0932 | -| std | 0.00859 | -| value_loss | 2.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16875 | -| time_elapsed | 90969 | -| total_timesteps | 2160000 | -| train/ | | -| approx_kl | 0.09758722 | -| clip_fraction | 0.65 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 168740 | -| policy_gradient_loss | 0.0986 | -| std | 0.00859 | -| value_loss | 1.46e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16876 | -| time_elapsed | 90975 | -| total_timesteps | 2160128 | -| train/ | | -| approx_kl | 0.014946605 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00257 | -| learning_rate | 0.0003 | -| loss | -0.00615 | -| n_updates | 168750 | -| policy_gradient_loss | 0.0118 | -| std | 0.00859 | -| value_loss | 8.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16877 | -| time_elapsed | 90988 | -| total_timesteps | 2160256 | -| train/ | | -| approx_kl | 0.031108752 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.861 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 168760 | -| policy_gradient_loss | -0.00778 | -| std | 0.0086 | -| value_loss | 0.000401 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16878 | -| time_elapsed | 90994 | -| total_timesteps | 2160384 | -| train/ | | -| approx_kl | 0.02367217 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 168770 | -| policy_gradient_loss | 0.00408 | -| std | 0.0086 | -| value_loss | 6.88e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16879 | -| time_elapsed | 91000 | -| total_timesteps | 2160512 | -| train/ | | -| approx_kl | 0.08643594 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -299 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 168780 | -| policy_gradient_loss | 0.00821 | -| std | 0.00859 | -| value_loss | 1.11e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16880 | -| time_elapsed | 91008 | -| total_timesteps | 2160640 | -| train/ | | -| approx_kl | 0.037918717 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -19.4 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 168790 | -| policy_gradient_loss | 0.00647 | -| std | 0.00858 | -| value_loss | 8.86e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16881 | -| time_elapsed | 91015 | -| total_timesteps | 2160768 | -| train/ | | -| approx_kl | 0.021563197 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -3.58 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 168800 | -| policy_gradient_loss | -0.00394 | -| std | 0.00858 | -| value_loss | 1.34e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16882 | -| time_elapsed | 91021 | -| total_timesteps | 2160896 | -| train/ | | -| approx_kl | 0.08522998 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.57 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 168810 | -| policy_gradient_loss | 0.0285 | -| std | 0.00858 | -| value_loss | 3.81e-12 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16883 | -| time_elapsed | 91027 | -| total_timesteps | 2161024 | -| train/ | | -| approx_kl | 0.2507443 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 168820 | -| policy_gradient_loss | 0.111 | -| std | 0.00858 | -| value_loss | 1.57e-12 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16884 | -| time_elapsed | 91044 | -| total_timesteps | 2161152 | -| train/ | | -| approx_kl | 0.055791683 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 1 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 168830 | -| policy_gradient_loss | 0.032 | -| std | 0.00858 | -| value_loss | 1.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16885 | -| time_elapsed | 91050 | -| total_timesteps | 2161280 | -| train/ | | -| approx_kl | 0.097534835 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | 0.0953 | -| n_updates | 168840 | -| policy_gradient_loss | 0.0619 | -| std | 0.00858 | -| value_loss | 5.02e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16886 | -| time_elapsed | 91055 | -| total_timesteps | 2161408 | -| train/ | | -| approx_kl | 0.08557973 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0512 | -| n_updates | 168850 | -| policy_gradient_loss | 0.106 | -| std | 0.00858 | -| value_loss | 1.5e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16887 | -| time_elapsed | 91061 | -| total_timesteps | 2161536 | -| train/ | | -| approx_kl | 0.013249595 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.000158 | -| n_updates | 168860 | -| policy_gradient_loss | 0.0118 | -| std | 0.00859 | -| value_loss | 1.87e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16888 | -| time_elapsed | 91065 | -| total_timesteps | 2161664 | -| train/ | | -| approx_kl | 0.29759207 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 168870 | -| policy_gradient_loss | 0.0344 | -| std | 0.00859 | -| value_loss | 1.02e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16889 | -| time_elapsed | 91070 | -| total_timesteps | 2161792 | -| train/ | | -| approx_kl | 0.023193253 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.00554 | -| n_updates | 168880 | -| policy_gradient_loss | 0.00318 | -| std | 0.00859 | -| value_loss | 7.22e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 16890 | -| time_elapsed | 91074 | -| total_timesteps | 2161920 | -| train/ | | -| approx_kl | 0.031324208 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.00701 | -| n_updates | 168890 | -| policy_gradient_loss | 0.00303 | -| std | 0.00859 | -| value_loss | 4.7e-11 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16891 | -| time_elapsed | 91079 | -| total_timesteps | 2162048 | -| train/ | | -| approx_kl | 0.00013494352 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 168900 | -| policy_gradient_loss | 0.00133 | -| std | 0.00859 | -| value_loss | 3.39e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16892 | -| time_elapsed | 91090 | -| total_timesteps | 2162176 | -| train/ | | -| approx_kl | 0.039766043 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 168910 | -| policy_gradient_loss | -0.0114 | -| std | 0.0086 | -| value_loss | 4.63e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16893 | -| time_elapsed | 91096 | -| total_timesteps | 2162304 | -| train/ | | -| approx_kl | 0.0037380415 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 168920 | -| policy_gradient_loss | 0.0115 | -| std | 0.0086 | -| value_loss | 1.61e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16894 | -| time_elapsed | 91100 | -| total_timesteps | 2162432 | -| train/ | | -| approx_kl | 0.026805643 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00842 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 168930 | -| policy_gradient_loss | 0.0444 | -| std | 0.0086 | -| value_loss | 6.08e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16895 | -| time_elapsed | 91106 | -| total_timesteps | 2162560 | -| train/ | | -| approx_kl | 0.0016370215 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | -4.47e-05 | -| n_updates | 168940 | -| policy_gradient_loss | 0.042 | -| std | 0.0086 | -| value_loss | 3.01e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16896 | -| time_elapsed | 91112 | -| total_timesteps | 2162688 | -| train/ | | -| approx_kl | 0.16601746 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.0725 | -| n_updates | 168950 | -| policy_gradient_loss | 0.0211 | -| std | 0.00859 | -| value_loss | 1.66e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16897 | -| time_elapsed | 91118 | -| total_timesteps | 2162816 | -| train/ | | -| approx_kl | 0.0004236563 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00146 | -| learning_rate | 0.0003 | -| loss | -0.000131 | -| n_updates | 168960 | -| policy_gradient_loss | 0.00387 | -| std | 0.00857 | -| value_loss | 2.14e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16898 | -| time_elapsed | 91124 | -| total_timesteps | 2162944 | -| train/ | | -| approx_kl | 0.035872284 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00729 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 168970 | -| policy_gradient_loss | 0.0308 | -| std | 0.00855 | -| value_loss | 4.44e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16899 | -| time_elapsed | 91130 | -| total_timesteps | 2163072 | -| train/ | | -| approx_kl | 0.6658113 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.276 | -| n_updates | 168980 | -| policy_gradient_loss | 0.146 | -| std | 0.00855 | -| value_loss | 1.9e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16900 | -| time_elapsed | 91141 | -| total_timesteps | 2163200 | -| train/ | | -| approx_kl | 0.00157747 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 168990 | -| policy_gradient_loss | -0.00364 | -| std | 0.00854 | -| value_loss | 0.00112 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16901 | -| time_elapsed | 91148 | -| total_timesteps | 2163328 | -| train/ | | -| approx_kl | 0.023372374 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.00576 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 169000 | -| policy_gradient_loss | 0.00733 | -| std | 0.00852 | -| value_loss | 8.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16902 | -| time_elapsed | 91153 | -| total_timesteps | 2163456 | -| train/ | | -| approx_kl | 0.002763595 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 169010 | -| policy_gradient_loss | 0.00456 | -| std | 0.00851 | -| value_loss | 2.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16903 | -| time_elapsed | 91159 | -| total_timesteps | 2163584 | -| train/ | | -| approx_kl | 0.022337584 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 169020 | -| policy_gradient_loss | 0.0739 | -| std | 0.0085 | -| value_loss | 3.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16904 | -| time_elapsed | 91165 | -| total_timesteps | 2163712 | -| train/ | | -| approx_kl | 0.051865138 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00123 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 169030 | -| policy_gradient_loss | 0.075 | -| std | 0.0085 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16905 | -| time_elapsed | 91172 | -| total_timesteps | 2163840 | -| train/ | | -| approx_kl | 0.074113846 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0893 | -| learning_rate | 0.0003 | -| loss | 0.0585 | -| n_updates | 169040 | -| policy_gradient_loss | 0.0975 | -| std | 0.0085 | -| value_loss | 2.83e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16906 | -| time_elapsed | 91179 | -| total_timesteps | 2163968 | -| train/ | | -| approx_kl | 0.07262426 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0542 | -| n_updates | 169050 | -| policy_gradient_loss | 0.093 | -| std | 0.0085 | -| value_loss | 8.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16907 | -| time_elapsed | 91186 | -| total_timesteps | 2164096 | -| train/ | | -| approx_kl | 0.016351061 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00444 | -| n_updates | 169060 | -| policy_gradient_loss | 0.0167 | -| std | 0.0085 | -| value_loss | 4.53e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16908 | -| time_elapsed | 91205 | -| total_timesteps | 2164224 | -| train/ | | -| approx_kl | 0.0035546524 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 169070 | -| policy_gradient_loss | 0.00545 | -| std | 0.0085 | -| value_loss | 0.00018 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16909 | -| time_elapsed | 91212 | -| total_timesteps | 2164352 | -| train/ | | -| approx_kl | 0.14920487 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00559 | -| learning_rate | 0.0003 | -| loss | 0.0877 | -| n_updates | 169080 | -| policy_gradient_loss | 0.0302 | -| std | 0.00849 | -| value_loss | 5.37e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16910 | -| time_elapsed | 91219 | -| total_timesteps | 2164480 | -| train/ | | -| approx_kl | 0.17562394 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -19.1 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 169090 | -| policy_gradient_loss | 0.00687 | -| std | 0.00852 | -| value_loss | 2.77e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16911 | -| time_elapsed | 91227 | -| total_timesteps | 2164608 | -| train/ | | -| approx_kl | 0.038471717 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0887 | -| learning_rate | 0.0003 | -| loss | 0.0359 | -| n_updates | 169100 | -| policy_gradient_loss | 0.077 | -| std | 0.00853 | -| value_loss | 5.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16912 | -| time_elapsed | 91235 | -| total_timesteps | 2164736 | -| train/ | | -| approx_kl | 0.014356804 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 169110 | -| policy_gradient_loss | 0.00165 | -| std | 0.00854 | -| value_loss | 5.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16913 | -| time_elapsed | 91242 | -| total_timesteps | 2164864 | -| train/ | | -| approx_kl | 0.019344818 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.00246 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 169120 | -| policy_gradient_loss | 0.0227 | -| std | 0.00854 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 16914 | -| time_elapsed | 91247 | -| total_timesteps | 2164992 | -| train/ | | -| approx_kl | 0.0033238865 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 169130 | -| policy_gradient_loss | 0.0648 | -| std | 0.00854 | -| value_loss | 9.75e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16915 | -| time_elapsed | 91254 | -| total_timesteps | 2165120 | -| train/ | | -| approx_kl | 0.07568998 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0587 | -| n_updates | 169140 | -| policy_gradient_loss | 0.0988 | -| std | 0.00855 | -| value_loss | 6.61e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16916 | -| time_elapsed | 91275 | -| total_timesteps | 2165248 | -| train/ | | -| approx_kl | 0.06876043 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 169150 | -| policy_gradient_loss | -0.00478 | -| std | 0.00855 | -| value_loss | 0.000395 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16917 | -| time_elapsed | 91282 | -| total_timesteps | 2165376 | -| train/ | | -| approx_kl | 0.1281328 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -293 | -| learning_rate | 0.0003 | -| loss | 0.0064 | -| n_updates | 169160 | -| policy_gradient_loss | 0.0176 | -| std | 0.00855 | -| value_loss | 5.27e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16918 | -| time_elapsed | 91287 | -| total_timesteps | 2165504 | -| train/ | | -| approx_kl | 0.028115641 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -4.1 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 169170 | -| policy_gradient_loss | -0.00304 | -| std | 0.00855 | -| value_loss | 1.3e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16919 | -| time_elapsed | 91293 | -| total_timesteps | 2165632 | -| train/ | | -| approx_kl | 0.22181559 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 169180 | -| policy_gradient_loss | 0.0159 | -| std | 0.00855 | -| value_loss | 7.59e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16920 | -| time_elapsed | 91298 | -| total_timesteps | 2165760 | -| train/ | | -| approx_kl | 0.040954486 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.321 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 169190 | -| policy_gradient_loss | 0.00741 | -| std | 0.00855 | -| value_loss | 2.67e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.827 | -| time/ | | -| fps | 23 | -| iterations | 16921 | -| time_elapsed | 91305 | -| total_timesteps | 2165888 | -| train/ | | -| approx_kl | 0.010078029 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 169200 | -| policy_gradient_loss | 0.0467 | -| std | 0.00855 | -| value_loss | 1.47e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16922 | -| time_elapsed | 91311 | -| total_timesteps | 2166016 | -| train/ | | -| approx_kl | 0.0056061307 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 169210 | -| policy_gradient_loss | 0.012 | -| std | 0.00855 | -| value_loss | 7.9e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16923 | -| time_elapsed | 91330 | -| total_timesteps | 2166144 | -| train/ | | -| approx_kl | 0.043673016 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -9.09 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 169220 | -| policy_gradient_loss | -0.0104 | -| std | 0.00855 | -| value_loss | 0.00342 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16924 | -| time_elapsed | 91336 | -| total_timesteps | 2166272 | -| train/ | | -| approx_kl | 0.0011758641 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.0182 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 169230 | -| policy_gradient_loss | 0.0049 | -| std | 0.00854 | -| value_loss | 3.36e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16925 | -| time_elapsed | 91345 | -| total_timesteps | 2166400 | -| train/ | | -| approx_kl | 0.035838634 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -5.9 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 169240 | -| policy_gradient_loss | 0.00404 | -| std | 0.00854 | -| value_loss | 2.11e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16926 | -| time_elapsed | 91353 | -| total_timesteps | 2166528 | -| train/ | | -| approx_kl | 0.00025498634 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -195 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 169250 | -| policy_gradient_loss | 0.00658 | -| std | 0.00854 | -| value_loss | 5.18e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16927 | -| time_elapsed | 91361 | -| total_timesteps | 2166656 | -| train/ | | -| approx_kl | 6.756047e-05 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.84 | -| learning_rate | 0.0003 | -| loss | 0.000452 | -| n_updates | 169260 | -| policy_gradient_loss | 0.0141 | -| std | 0.00854 | -| value_loss | 4.59e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16928 | -| time_elapsed | 91365 | -| total_timesteps | 2166784 | -| train/ | | -| approx_kl | 0.12133725 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 169270 | -| policy_gradient_loss | 0.0109 | -| std | 0.00854 | -| value_loss | 3.32e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 16929 | -| time_elapsed | 91370 | -| total_timesteps | 2166912 | -| train/ | | -| approx_kl | 0.010887592 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.271 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 169280 | -| policy_gradient_loss | 0.0105 | -| std | 0.00854 | -| value_loss | 6.45e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16930 | -| time_elapsed | 91376 | -| total_timesteps | 2167040 | -| train/ | | -| approx_kl | 0.17447448 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 169290 | -| policy_gradient_loss | 0.0978 | -| std | 0.00854 | -| value_loss | 7.93e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16931 | -| time_elapsed | 91386 | -| total_timesteps | 2167168 | -| train/ | | -| approx_kl | 0.015141973 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.0251 | -| n_updates | 169300 | -| policy_gradient_loss | -0.0157 | -| std | 0.00854 | -| value_loss | 0.000111 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16932 | -| time_elapsed | 91391 | -| total_timesteps | 2167296 | -| train/ | | -| approx_kl | 0.040842984 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 169310 | -| policy_gradient_loss | 0.0865 | -| std | 0.00854 | -| value_loss | 1.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16933 | -| time_elapsed | 91396 | -| total_timesteps | 2167424 | -| train/ | | -| approx_kl | 0.008608606 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00377 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 169320 | -| policy_gradient_loss | 0.0139 | -| std | 0.00854 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16934 | -| time_elapsed | 91400 | -| total_timesteps | 2167552 | -| train/ | | -| approx_kl | 0.35666054 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 169330 | -| policy_gradient_loss | 0.0452 | -| std | 0.00854 | -| value_loss | 6.75e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16935 | -| time_elapsed | 91406 | -| total_timesteps | 2167680 | -| train/ | | -| approx_kl | 0.02798577 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.00668 | -| n_updates | 169340 | -| policy_gradient_loss | 0.00331 | -| std | 0.00854 | -| value_loss | 4.39e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16936 | -| time_elapsed | 91412 | -| total_timesteps | 2167808 | -| train/ | | -| approx_kl | 0.04167311 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 169350 | -| policy_gradient_loss | 0.0163 | -| std | 0.00854 | -| value_loss | 2.83e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.823 | -| time/ | | -| fps | 23 | -| iterations | 16937 | -| time_elapsed | 91418 | -| total_timesteps | 2167936 | -| train/ | | -| approx_kl | 0.029193357 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 169360 | -| policy_gradient_loss | 0.00867 | -| std | 0.00854 | -| value_loss | 1.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16938 | -| time_elapsed | 91424 | -| total_timesteps | 2168064 | -| train/ | | -| approx_kl | 0.030816438 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 169370 | -| policy_gradient_loss | 0.00481 | -| std | 0.00854 | -| value_loss | 2.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16939 | -| time_elapsed | 91437 | -| total_timesteps | 2168192 | -| train/ | | -| approx_kl | 0.011201179 | -| clip_fraction | 0.0773 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -6.07 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 169380 | -| policy_gradient_loss | -0.0153 | -| std | 0.00854 | -| value_loss | 0.00288 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16940 | -| time_elapsed | 91441 | -| total_timesteps | 2168320 | -| train/ | | -| approx_kl | 0.05274531 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -4.93 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 169390 | -| policy_gradient_loss | -0.00391 | -| std | 0.00853 | -| value_loss | 1.65e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16941 | -| time_elapsed | 91448 | -| total_timesteps | 2168448 | -| train/ | | -| approx_kl | 0.2283374 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -3.2 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 169400 | -| policy_gradient_loss | 0.0616 | -| std | 0.00853 | -| value_loss | 1.13e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16942 | -| time_elapsed | 91453 | -| total_timesteps | 2168576 | -| train/ | | -| approx_kl | 0.10196763 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.0782 | -| n_updates | 169410 | -| policy_gradient_loss | 0.0647 | -| std | 0.00853 | -| value_loss | 1.98e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16943 | -| time_elapsed | 91458 | -| total_timesteps | 2168704 | -| train/ | | -| approx_kl | 0.10610445 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.349 | -| learning_rate | 0.0003 | -| loss | 0.0896 | -| n_updates | 169420 | -| policy_gradient_loss | 0.14 | -| std | 0.00853 | -| value_loss | 1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16944 | -| time_elapsed | 91465 | -| total_timesteps | 2168832 | -| train/ | | -| approx_kl | 0.092655115 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0995 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 169430 | -| policy_gradient_loss | 0.109 | -| std | 0.00853 | -| value_loss | 9.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16945 | -| time_elapsed | 91470 | -| total_timesteps | 2168960 | -| train/ | | -| approx_kl | 0.017836416 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.00943 | -| n_updates | 169440 | -| policy_gradient_loss | 0.0146 | -| std | 0.00853 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16946 | -| time_elapsed | 91476 | -| total_timesteps | 2169088 | -| train/ | | -| approx_kl | 0.109520614 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 169450 | -| policy_gradient_loss | 0.0102 | -| std | 0.00853 | -| value_loss | 1.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16947 | -| time_elapsed | 91489 | -| total_timesteps | 2169216 | -| train/ | | -| approx_kl | 0.021088889 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.792 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 169460 | -| policy_gradient_loss | -0.0111 | -| std | 0.00853 | -| value_loss | 0.00215 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16948 | -| time_elapsed | 91498 | -| total_timesteps | 2169344 | -| train/ | | -| approx_kl | 0.16259116 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0857 | -| n_updates | 169470 | -| policy_gradient_loss | 0.026 | -| std | 0.00853 | -| value_loss | 1.94e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16949 | -| time_elapsed | 91505 | -| total_timesteps | 2169472 | -| train/ | | -| approx_kl | 0.03695291 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00576 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 169480 | -| policy_gradient_loss | 0.0488 | -| std | 0.00853 | -| value_loss | 2.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16950 | -| time_elapsed | 91511 | -| total_timesteps | 2169600 | -| train/ | | -| approx_kl | 0.011886217 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00307 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 169490 | -| policy_gradient_loss | 0.00761 | -| std | 0.00853 | -| value_loss | 1.49e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16951 | -| time_elapsed | 91520 | -| total_timesteps | 2169728 | -| train/ | | -| approx_kl | 0.11627636 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 169500 | -| policy_gradient_loss | 0.0411 | -| std | 0.00852 | -| value_loss | 6.45e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16952 | -| time_elapsed | 91527 | -| total_timesteps | 2169856 | -| train/ | | -| approx_kl | 0.0006092563 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 169510 | -| policy_gradient_loss | 0.000214 | -| std | 0.00852 | -| value_loss | 5.03e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 16953 | -| time_elapsed | 91534 | -| total_timesteps | 2169984 | -| train/ | | -| approx_kl | 9.054784e-06 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 169520 | -| policy_gradient_loss | 0.00802 | -| std | 0.00852 | -| value_loss | 3.17e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16954 | -| time_elapsed | 91542 | -| total_timesteps | 2170112 | -| train/ | | -| approx_kl | 0.00013542408 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 169530 | -| policy_gradient_loss | -1.63e-05 | -| std | 0.00853 | -| value_loss | 2.62e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16955 | -| time_elapsed | 91560 | -| total_timesteps | 2170240 | -| train/ | | -| approx_kl | 0.19933192 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.933 | -| learning_rate | 0.0003 | -| loss | -0.007 | -| n_updates | 169540 | -| policy_gradient_loss | -0.0101 | -| std | 0.00853 | -| value_loss | 0.000138 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16956 | -| time_elapsed | 91566 | -| total_timesteps | 2170368 | -| train/ | | -| approx_kl | 0.037347347 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 169550 | -| policy_gradient_loss | 0.0453 | -| std | 0.00853 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16957 | -| time_elapsed | 91574 | -| total_timesteps | 2170496 | -| train/ | | -| approx_kl | 0.021833954 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 169560 | -| policy_gradient_loss | 0.0182 | -| std | 0.00853 | -| value_loss | 3.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16958 | -| time_elapsed | 91581 | -| total_timesteps | 2170624 | -| train/ | | -| approx_kl | 0.117270686 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0788 | -| n_updates | 169570 | -| policy_gradient_loss | 0.0326 | -| std | 0.00853 | -| value_loss | 1.58e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16959 | -| time_elapsed | 91586 | -| total_timesteps | 2170752 | -| train/ | | -| approx_kl | 0.0014141435 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 169580 | -| policy_gradient_loss | 0.00405 | -| std | 0.00853 | -| value_loss | 1.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 16960 | -| time_elapsed | 91591 | -| total_timesteps | 2170880 | -| train/ | | -| approx_kl | 0.047113344 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 169590 | -| policy_gradient_loss | 0.0454 | -| std | 0.00853 | -| value_loss | 7.76e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16961 | -| time_elapsed | 91597 | -| total_timesteps | 2171008 | -| train/ | | -| approx_kl | 2.2975728e-06 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | -3.22e-05 | -| n_updates | 169600 | -| policy_gradient_loss | 0.0717 | -| std | 0.00853 | -| value_loss | 5.09e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16962 | -| time_elapsed | 91617 | -| total_timesteps | 2171136 | -| train/ | | -| approx_kl | 0.06760491 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 169610 | -| policy_gradient_loss | -0.00544 | -| std | 0.00853 | -| value_loss | 0.000321 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16963 | -| time_elapsed | 91623 | -| total_timesteps | 2171264 | -| train/ | | -| approx_kl | 0.13658147 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.376 | -| learning_rate | 0.0003 | -| loss | 0.000747 | -| n_updates | 169620 | -| policy_gradient_loss | -0.0039 | -| std | 0.00853 | -| value_loss | 1.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16964 | -| time_elapsed | 91631 | -| total_timesteps | 2171392 | -| train/ | | -| approx_kl | 0.27633274 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 169630 | -| policy_gradient_loss | 0.106 | -| std | 0.00853 | -| value_loss | 3.72e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16965 | -| time_elapsed | 91636 | -| total_timesteps | 2171520 | -| train/ | | -| approx_kl | 0.11690219 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.472 | -| learning_rate | 0.0003 | -| loss | 0.0892 | -| n_updates | 169640 | -| policy_gradient_loss | 0.0891 | -| std | 0.00853 | -| value_loss | 2.12e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16966 | -| time_elapsed | 91641 | -| total_timesteps | 2171648 | -| train/ | | -| approx_kl | 0.09326148 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0799 | -| n_updates | 169650 | -| policy_gradient_loss | 0.0778 | -| std | 0.00853 | -| value_loss | 3.12e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16967 | -| time_elapsed | 91647 | -| total_timesteps | 2171776 | -| train/ | | -| approx_kl | 0.09834717 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.0969 | -| n_updates | 169660 | -| policy_gradient_loss | 0.0843 | -| std | 0.00853 | -| value_loss | 2.73e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 16968 | -| time_elapsed | 91655 | -| total_timesteps | 2171904 | -| train/ | | -| approx_kl | 0.0145073375 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 169670 | -| policy_gradient_loss | 0.0161 | -| std | 0.00853 | -| value_loss | 8.64e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16969 | -| time_elapsed | 91661 | -| total_timesteps | 2172032 | -| train/ | | -| approx_kl | 0.25551718 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 169680 | -| policy_gradient_loss | 0.0288 | -| std | 0.00853 | -| value_loss | 4.62e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16970 | -| time_elapsed | 91673 | -| total_timesteps | 2172160 | -| train/ | | -| approx_kl | 0.024049383 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | -0.0097 | -| n_updates | 169690 | -| policy_gradient_loss | -0.00975 | -| std | 0.00852 | -| value_loss | 0.00271 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16971 | -| time_elapsed | 91680 | -| total_timesteps | 2172288 | -| train/ | | -| approx_kl | 0.032175057 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.00471 | -| n_updates | 169700 | -| policy_gradient_loss | 0.019 | -| std | 0.00852 | -| value_loss | 5.56e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16972 | -| time_elapsed | 91687 | -| total_timesteps | 2172416 | -| train/ | | -| approx_kl | 0.4783648 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00693 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 169710 | -| policy_gradient_loss | 0.135 | -| std | 0.00852 | -| value_loss | 9.72e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16973 | -| time_elapsed | 91693 | -| total_timesteps | 2172544 | -| train/ | | -| approx_kl | 0.02803358 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00791 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 169720 | -| policy_gradient_loss | 0.00196 | -| std | 0.00853 | -| value_loss | 4.56e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16974 | -| time_elapsed | 91701 | -| total_timesteps | 2172672 | -| train/ | | -| approx_kl | 0.25154626 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.0935 | -| n_updates | 169730 | -| policy_gradient_loss | 0.0358 | -| std | 0.00854 | -| value_loss | 2.32e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16975 | -| time_elapsed | 91708 | -| total_timesteps | 2172800 | -| train/ | | -| approx_kl | 0.030578738 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 169740 | -| policy_gradient_loss | 0.0109 | -| std | 0.00855 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 16976 | -| time_elapsed | 91716 | -| total_timesteps | 2172928 | -| train/ | | -| approx_kl | 0.039781377 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 169750 | -| policy_gradient_loss | 0.00994 | -| std | 0.00856 | -| value_loss | 8.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16977 | -| time_elapsed | 91721 | -| total_timesteps | 2173056 | -| train/ | | -| approx_kl | 0.022457566 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 169760 | -| policy_gradient_loss | -0.00615 | -| std | 0.00856 | -| value_loss | 6.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16978 | -| time_elapsed | 91730 | -| total_timesteps | 2173184 | -| train/ | | -| approx_kl | 0.07555637 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 169770 | -| policy_gradient_loss | -0.0163 | -| std | 0.00857 | -| value_loss | 0.00145 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16979 | -| time_elapsed | 91735 | -| total_timesteps | 2173312 | -| train/ | | -| approx_kl | 0.045655206 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.34 | -| explained_variance | 0.00594 | -| learning_rate | 0.0003 | -| loss | 0.0365 | -| n_updates | 169780 | -| policy_gradient_loss | 0.0336 | -| std | 0.00854 | -| value_loss | 3.44e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16980 | -| time_elapsed | 91740 | -| total_timesteps | 2173440 | -| train/ | | -| approx_kl | 0.20529917 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 169790 | -| policy_gradient_loss | 0.115 | -| std | 0.00852 | -| value_loss | 0.000234 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16981 | -| time_elapsed | 91745 | -| total_timesteps | 2173568 | -| train/ | | -| approx_kl | 0.03263674 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 169800 | -| policy_gradient_loss | 0.0175 | -| std | 0.00851 | -| value_loss | 3.14e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16982 | -| time_elapsed | 91750 | -| total_timesteps | 2173696 | -| train/ | | -| approx_kl | 0.00045084627 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.000786 | -| n_updates | 169810 | -| policy_gradient_loss | 0.019 | -| std | 0.00851 | -| value_loss | 1.79e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16983 | -| time_elapsed | 91755 | -| total_timesteps | 2173824 | -| train/ | | -| approx_kl | 0.036527768 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 169820 | -| policy_gradient_loss | -0.00391 | -| std | 0.00851 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 16984 | -| time_elapsed | 91761 | -| total_timesteps | 2173952 | -| train/ | | -| approx_kl | 0.019066894 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 169830 | -| policy_gradient_loss | 0.00241 | -| std | 0.00851 | -| value_loss | 7.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16985 | -| time_elapsed | 91765 | -| total_timesteps | 2174080 | -| train/ | | -| approx_kl | 0.35353604 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 169840 | -| policy_gradient_loss | 0.0419 | -| std | 0.00851 | -| value_loss | 5.9e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16986 | -| time_elapsed | 91778 | -| total_timesteps | 2174208 | -| train/ | | -| approx_kl | 0.0003119968 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.718 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 169850 | -| policy_gradient_loss | -0.00943 | -| std | 0.00851 | -| value_loss | 0.00498 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16987 | -| time_elapsed | 91784 | -| total_timesteps | 2174336 | -| train/ | | -| approx_kl | 0.012294151 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 169860 | -| policy_gradient_loss | -0.00591 | -| std | 0.0085 | -| value_loss | 3.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16988 | -| time_elapsed | 91789 | -| total_timesteps | 2174464 | -| train/ | | -| approx_kl | 0.03430908 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 6.88e-05 | -| n_updates | 169870 | -| policy_gradient_loss | -0.00175 | -| std | 0.0085 | -| value_loss | 5.96e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16989 | -| time_elapsed | 91795 | -| total_timesteps | 2174592 | -| train/ | | -| approx_kl | 0.0021054433 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -5.67 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 169880 | -| policy_gradient_loss | 0.0208 | -| std | 0.0085 | -| value_loss | 1.5e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16990 | -| time_elapsed | 91800 | -| total_timesteps | 2174720 | -| train/ | | -| approx_kl | 0.008400237 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -2.84 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 169890 | -| policy_gradient_loss | 0.00115 | -| std | 0.00851 | -| value_loss | 1.02e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16991 | -| time_elapsed | 91806 | -| total_timesteps | 2174848 | -| train/ | | -| approx_kl | 0.14512838 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.0995 | -| n_updates | 169900 | -| policy_gradient_loss | 0.0264 | -| std | 0.00851 | -| value_loss | 4.52e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.852 | -| time/ | | -| fps | 23 | -| iterations | 16992 | -| time_elapsed | 91812 | -| total_timesteps | 2174976 | -| train/ | | -| approx_kl | 0.029069128 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 169910 | -| policy_gradient_loss | 0.00705 | -| std | 0.0085 | -| value_loss | 1.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16993 | -| time_elapsed | 91817 | -| total_timesteps | 2175104 | -| train/ | | -| approx_kl | 0.009323994 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | 0.00519 | -| n_updates | 169920 | -| policy_gradient_loss | 0.00992 | -| std | 0.00849 | -| value_loss | 6.62e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16994 | -| time_elapsed | 91829 | -| total_timesteps | 2175232 | -| train/ | | -| approx_kl | 0.09088113 | -| clip_fraction | 0.624 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | 0.054 | -| n_updates | 169930 | -| policy_gradient_loss | 0.0441 | -| std | 0.00848 | -| value_loss | 0.000131 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16995 | -| time_elapsed | 91835 | -| total_timesteps | 2175360 | -| train/ | | -| approx_kl | 0.045425892 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.00356 | -| n_updates | 169940 | -| policy_gradient_loss | 0.0119 | -| std | 0.00848 | -| value_loss | 2.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16996 | -| time_elapsed | 91839 | -| total_timesteps | 2175488 | -| train/ | | -| approx_kl | 0.33950856 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.0082 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 169950 | -| policy_gradient_loss | 0.0371 | -| std | 0.00848 | -| value_loss | 5.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16997 | -| time_elapsed | 91846 | -| total_timesteps | 2175616 | -| train/ | | -| approx_kl | 0.025217189 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00993 | -| learning_rate | 0.0003 | -| loss | 0.00706 | -| n_updates | 169960 | -| policy_gradient_loss | 0.00437 | -| std | 0.00848 | -| value_loss | 2.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16998 | -| time_elapsed | 91850 | -| total_timesteps | 2175744 | -| train/ | | -| approx_kl | 0.029195447 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.000638 | -| n_updates | 169970 | -| policy_gradient_loss | -0.000752 | -| std | 0.00847 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 16999 | -| time_elapsed | 91855 | -| total_timesteps | 2175872 | -| train/ | | -| approx_kl | 0.0041190526 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 169980 | -| policy_gradient_loss | 0.000895 | -| std | 0.00848 | -| value_loss | 1.06e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17000 | -| time_elapsed | 91860 | -| total_timesteps | 2176000 | -| train/ | | -| approx_kl | 0.053549856 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 169990 | -| policy_gradient_loss | 0.0111 | -| std | 0.00848 | -| value_loss | 8.05e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17001 | -| time_elapsed | 91864 | -| total_timesteps | 2176128 | -| train/ | | -| approx_kl | 0.0067903926 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00207 | -| learning_rate | 0.0003 | -| loss | 0.000146 | -| n_updates | 170000 | -| policy_gradient_loss | 0.00541 | -| std | 0.00848 | -| value_loss | 3.61e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17002 | -| time_elapsed | 91880 | -| total_timesteps | 2176256 | -| train/ | | -| approx_kl | 0.0023444397 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.746 | -| learning_rate | 0.0003 | -| loss | 0.00366 | -| n_updates | 170010 | -| policy_gradient_loss | 0.00582 | -| std | 0.00847 | -| value_loss | 0.00421 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17003 | -| time_elapsed | 91887 | -| total_timesteps | 2176384 | -| train/ | | -| approx_kl | 4.2145606e-05 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | 0.000615 | -| n_updates | 170020 | -| policy_gradient_loss | 0.00622 | -| std | 0.00847 | -| value_loss | 2.5e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17004 | -| time_elapsed | 91892 | -| total_timesteps | 2176512 | -| train/ | | -| approx_kl | 0.009602888 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.00663 | -| n_updates | 170030 | -| policy_gradient_loss | 0.00695 | -| std | 0.00847 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17005 | -| time_elapsed | 91898 | -| total_timesteps | 2176640 | -| train/ | | -| approx_kl | 0.0032568057 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00565 | -| n_updates | 170040 | -| policy_gradient_loss | 0.00576 | -| std | 0.00847 | -| value_loss | 6.72e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17006 | -| time_elapsed | 91904 | -| total_timesteps | 2176768 | -| train/ | | -| approx_kl | 0.019953415 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 170050 | -| policy_gradient_loss | 0.0151 | -| std | 0.00847 | -| value_loss | 4.95e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 17007 | -| time_elapsed | 91909 | -| total_timesteps | 2176896 | -| train/ | | -| approx_kl | 0.539766 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.238 | -| n_updates | 170060 | -| policy_gradient_loss | 0.15 | -| std | 0.00845 | -| value_loss | 2.03e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17008 | -| time_elapsed | 91916 | -| total_timesteps | 2177024 | -| train/ | | -| approx_kl | 0.40926725 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -2.84 | -| learning_rate | 0.0003 | -| loss | 0.0713 | -| n_updates | 170070 | -| policy_gradient_loss | 0.016 | -| std | 0.00845 | -| value_loss | 1.61e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17009 | -| time_elapsed | 91927 | -| total_timesteps | 2177152 | -| train/ | | -| approx_kl | 0.19312733 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.412 | -| learning_rate | 0.0003 | -| loss | -0.00875 | -| n_updates | 170080 | -| policy_gradient_loss | -0.0118 | -| std | 0.00844 | -| value_loss | 0.00126 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17010 | -| time_elapsed | 91932 | -| total_timesteps | 2177280 | -| train/ | | -| approx_kl | 0.011796109 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00856 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 170090 | -| policy_gradient_loss | 0.0416 | -| std | 0.00844 | -| value_loss | 1.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17011 | -| time_elapsed | 91937 | -| total_timesteps | 2177408 | -| train/ | | -| approx_kl | 0.13573986 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00701 | -| learning_rate | 0.0003 | -| loss | 0.0845 | -| n_updates | 170100 | -| policy_gradient_loss | 0.0282 | -| std | 0.00844 | -| value_loss | 2.71e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17012 | -| time_elapsed | 91942 | -| total_timesteps | 2177536 | -| train/ | | -| approx_kl | 0.00032464322 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.000963 | -| n_updates | 170110 | -| policy_gradient_loss | 0.00325 | -| std | 0.00844 | -| value_loss | 1.89e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17013 | -| time_elapsed | 91947 | -| total_timesteps | 2177664 | -| train/ | | -| approx_kl | 0.047565807 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.0284 | -| n_updates | 170120 | -| policy_gradient_loss | 0.0574 | -| std | 0.00845 | -| value_loss | 1.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17014 | -| time_elapsed | 91952 | -| total_timesteps | 2177792 | -| train/ | | -| approx_kl | 0.014956251 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 170130 | -| policy_gradient_loss | -0.000708 | -| std | 0.00845 | -| value_loss | 1.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17015 | -| time_elapsed | 91956 | -| total_timesteps | 2177920 | -| train/ | | -| approx_kl | 0.019978106 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 170140 | -| policy_gradient_loss | 0.0452 | -| std | 0.00845 | -| value_loss | 7.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17016 | -| time_elapsed | 91959 | -| total_timesteps | 2178048 | -| train/ | | -| approx_kl | 0.103615135 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0734 | -| n_updates | 170150 | -| policy_gradient_loss | 0.033 | -| std | 0.00844 | -| value_loss | 5.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17017 | -| time_elapsed | 91968 | -| total_timesteps | 2178176 | -| train/ | | -| approx_kl | 0.010456359 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.342 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 170160 | -| policy_gradient_loss | 0.00373 | -| std | 0.00844 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17018 | -| time_elapsed | 91974 | -| total_timesteps | 2178304 | -| train/ | | -| approx_kl | 0.004655479 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 170170 | -| policy_gradient_loss | 0.0321 | -| std | 0.00844 | -| value_loss | 9.31e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17019 | -| time_elapsed | 91978 | -| total_timesteps | 2178432 | -| train/ | | -| approx_kl | 0.26977032 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.243 | -| n_updates | 170180 | -| policy_gradient_loss | 0.155 | -| std | 0.00844 | -| value_loss | 4.39e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17020 | -| time_elapsed | 91983 | -| total_timesteps | 2178560 | -| train/ | | -| approx_kl | 0.032026347 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.000985 | -| n_updates | 170190 | -| policy_gradient_loss | 0.00859 | -| std | 0.00844 | -| value_loss | 2.89e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17021 | -| time_elapsed | 91988 | -| total_timesteps | 2178688 | -| train/ | | -| approx_kl | 0.0008667987 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.00223 | -| n_updates | 170200 | -| policy_gradient_loss | 0.0028 | -| std | 0.00844 | -| value_loss | 1.73e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17022 | -| time_elapsed | 91993 | -| total_timesteps | 2178816 | -| train/ | | -| approx_kl | 0.11641927 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 170210 | -| policy_gradient_loss | 0.0982 | -| std | 0.00844 | -| value_loss | 1.21e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 17023 | -| time_elapsed | 91999 | -| total_timesteps | 2178944 | -| train/ | | -| approx_kl | 0.020154152 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 170220 | -| policy_gradient_loss | 0.0124 | -| std | 0.00845 | -| value_loss | 8.98e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17024 | -| time_elapsed | 92004 | -| total_timesteps | 2179072 | -| train/ | | -| approx_kl | 0.09848097 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.0413 | -| n_updates | 170230 | -| policy_gradient_loss | 0.0107 | -| std | 0.00845 | -| value_loss | 6.01e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17025 | -| time_elapsed | 92013 | -| total_timesteps | 2179200 | -| train/ | | -| approx_kl | 0.033138372 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 170240 | -| policy_gradient_loss | -0.0113 | -| std | 0.00845 | -| value_loss | 0.00394 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17026 | -| time_elapsed | 92018 | -| total_timesteps | 2179328 | -| train/ | | -| approx_kl | 0.17251688 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 170250 | -| policy_gradient_loss | 0.0393 | -| std | 0.00846 | -| value_loss | 2.98e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17027 | -| time_elapsed | 92023 | -| total_timesteps | 2179456 | -| train/ | | -| approx_kl | 0.0004883809 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | -0.00044 | -| n_updates | 170260 | -| policy_gradient_loss | 0.00747 | -| std | 0.00847 | -| value_loss | 4.56e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17028 | -| time_elapsed | 92029 | -| total_timesteps | 2179584 | -| train/ | | -| approx_kl | 2.441369e-05 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | -0.000113 | -| n_updates | 170270 | -| policy_gradient_loss | 0.00846 | -| std | 0.00847 | -| value_loss | 3.15e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17029 | -| time_elapsed | 92035 | -| total_timesteps | 2179712 | -| train/ | | -| approx_kl | 0.035354156 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 170280 | -| policy_gradient_loss | 0.0383 | -| std | 0.00847 | -| value_loss | 1.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17030 | -| time_elapsed | 92040 | -| total_timesteps | 2179840 | -| train/ | | -| approx_kl | 0.06778004 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 170290 | -| policy_gradient_loss | -0.00935 | -| std | 0.00847 | -| value_loss | 1.22e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 17031 | -| time_elapsed | 92046 | -| total_timesteps | 2179968 | -| train/ | | -| approx_kl | 0.09112312 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | 0.0565 | -| n_updates | 170300 | -| policy_gradient_loss | 0.0305 | -| std | 0.00846 | -| value_loss | 8.23e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17032 | -| time_elapsed | 92051 | -| total_timesteps | 2180096 | -| train/ | | -| approx_kl | 0.020209957 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 170310 | -| policy_gradient_loss | 0.035 | -| std | 0.00846 | -| value_loss | 5.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17033 | -| time_elapsed | 92063 | -| total_timesteps | 2180224 | -| train/ | | -| approx_kl | 0.016384328 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 170320 | -| policy_gradient_loss | -0.0106 | -| std | 0.00845 | -| value_loss | 0.00484 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17034 | -| time_elapsed | 92068 | -| total_timesteps | 2180352 | -| train/ | | -| approx_kl | 0.008279229 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 170330 | -| policy_gradient_loss | 0.05 | -| std | 0.00845 | -| value_loss | 1.68e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17035 | -| time_elapsed | 92073 | -| total_timesteps | 2180480 | -| train/ | | -| approx_kl | 0.13955942 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00758 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 170340 | -| policy_gradient_loss | 0.0204 | -| std | 0.00845 | -| value_loss | 2.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17036 | -| time_elapsed | 92078 | -| total_timesteps | 2180608 | -| train/ | | -| approx_kl | 9.95025e-06 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.077 | -| learning_rate | 0.0003 | -| loss | -0.000441 | -| n_updates | 170350 | -| policy_gradient_loss | 0.0207 | -| std | 0.00843 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17037 | -| time_elapsed | 92082 | -| total_timesteps | 2180736 | -| train/ | | -| approx_kl | 0.04525349 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 170360 | -| policy_gradient_loss | 0.0256 | -| std | 0.00841 | -| value_loss | 6.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17038 | -| time_elapsed | 92086 | -| total_timesteps | 2180864 | -| train/ | | -| approx_kl | 0.07793553 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 170370 | -| policy_gradient_loss | 0.0139 | -| std | 0.0084 | -| value_loss | 2.96e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17039 | -| time_elapsed | 92091 | -| total_timesteps | 2180992 | -| train/ | | -| approx_kl | 0.0056966534 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.00553 | -| n_updates | 170380 | -| policy_gradient_loss | 0.00791 | -| std | 0.0084 | -| value_loss | 1.55e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17040 | -| time_elapsed | 92096 | -| total_timesteps | 2181120 | -| train/ | | -| approx_kl | 0.12324804 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0911 | -| n_updates | 170390 | -| policy_gradient_loss | 0.0927 | -| std | 0.0084 | -| value_loss | 8.92e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17041 | -| time_elapsed | 92109 | -| total_timesteps | 2181248 | -| train/ | | -| approx_kl | 0.049136177 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.715 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 170400 | -| policy_gradient_loss | -0.007 | -| std | 0.0084 | -| value_loss | 0.0059 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17042 | -| time_elapsed | 92115 | -| total_timesteps | 2181376 | -| train/ | | -| approx_kl | 0.007340245 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 170410 | -| policy_gradient_loss | 0.0237 | -| std | 0.0084 | -| value_loss | 1.09e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17043 | -| time_elapsed | 92120 | -| total_timesteps | 2181504 | -| train/ | | -| approx_kl | 0.13434976 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00488 | -| learning_rate | 0.0003 | -| loss | 0.0579 | -| n_updates | 170420 | -| policy_gradient_loss | 0.00974 | -| std | 0.0084 | -| value_loss | 1.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17044 | -| time_elapsed | 92125 | -| total_timesteps | 2181632 | -| train/ | | -| approx_kl | 0.018259289 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 170430 | -| policy_gradient_loss | 0.0034 | -| std | 0.00841 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17045 | -| time_elapsed | 92130 | -| total_timesteps | 2181760 | -| train/ | | -| approx_kl | 0.008798953 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 170440 | -| policy_gradient_loss | 0.00332 | -| std | 0.00841 | -| value_loss | 1.77e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17046 | -| time_elapsed | 92136 | -| total_timesteps | 2181888 | -| train/ | | -| approx_kl | 0.2020492 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00688 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 170450 | -| policy_gradient_loss | 0.116 | -| std | 0.00841 | -| value_loss | 2.08e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17047 | -| time_elapsed | 92141 | -| total_timesteps | 2182016 | -| train/ | | -| approx_kl | 0.09395164 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.268 | -| learning_rate | 0.0003 | -| loss | 0.079 | -| n_updates | 170460 | -| policy_gradient_loss | 0.0734 | -| std | 0.00842 | -| value_loss | 1.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17048 | -| time_elapsed | 92154 | -| total_timesteps | 2182144 | -| train/ | | -| approx_kl | 0.035628386 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 170470 | -| policy_gradient_loss | 0.00295 | -| std | 0.00842 | -| value_loss | 0.00434 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17049 | -| time_elapsed | 92158 | -| total_timesteps | 2182272 | -| train/ | | -| approx_kl | 0.007863173 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | 0.00461 | -| n_updates | 170480 | -| policy_gradient_loss | 0.00686 | -| std | 0.00842 | -| value_loss | 1.22e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17050 | -| time_elapsed | 92163 | -| total_timesteps | 2182400 | -| train/ | | -| approx_kl | 0.0295596 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 170490 | -| policy_gradient_loss | 0.0435 | -| std | 0.00842 | -| value_loss | 1.2e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17051 | -| time_elapsed | 92168 | -| total_timesteps | 2182528 | -| train/ | | -| approx_kl | 0.011963915 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0918 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 170500 | -| policy_gradient_loss | 0.00875 | -| std | 0.00842 | -| value_loss | 5.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17052 | -| time_elapsed | 92172 | -| total_timesteps | 2182656 | -| train/ | | -| approx_kl | 0.020341493 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 170510 | -| policy_gradient_loss | 0.0174 | -| std | 0.00842 | -| value_loss | 3.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17053 | -| time_elapsed | 92177 | -| total_timesteps | 2182784 | -| train/ | | -| approx_kl | 0.04370792 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.000626 | -| n_updates | 170520 | -| policy_gradient_loss | -0.00336 | -| std | 0.00842 | -| value_loss | 3.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17054 | -| time_elapsed | 92181 | -| total_timesteps | 2182912 | -| train/ | | -| approx_kl | 0.037821703 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0878 | -| learning_rate | 0.0003 | -| loss | 0.0399 | -| n_updates | 170530 | -| policy_gradient_loss | 0.00905 | -| std | 0.00842 | -| value_loss | 1.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17055 | -| time_elapsed | 92186 | -| total_timesteps | 2183040 | -| train/ | | -| approx_kl | 0.022869239 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 170540 | -| policy_gradient_loss | 0.0216 | -| std | 0.00842 | -| value_loss | 5.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17056 | -| time_elapsed | 92195 | -| total_timesteps | 2183168 | -| train/ | | -| approx_kl | 0.049522452 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 170550 | -| policy_gradient_loss | -0.0121 | -| std | 0.00842 | -| value_loss | 8.56e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17057 | -| time_elapsed | 92200 | -| total_timesteps | 2183296 | -| train/ | | -| approx_kl | 0.30841118 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 170560 | -| policy_gradient_loss | 0.0978 | -| std | 0.00841 | -| value_loss | 1.02e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17058 | -| time_elapsed | 92205 | -| total_timesteps | 2183424 | -| train/ | | -| approx_kl | 0.05474347 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00122 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 170570 | -| policy_gradient_loss | 0.0173 | -| std | 0.00841 | -| value_loss | 4.62e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17059 | -| time_elapsed | 92210 | -| total_timesteps | 2183552 | -| train/ | | -| approx_kl | 0.081465505 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0435 | -| n_updates | 170580 | -| policy_gradient_loss | 0.0111 | -| std | 0.0084 | -| value_loss | 6.51e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17060 | -| time_elapsed | 92215 | -| total_timesteps | 2183680 | -| train/ | | -| approx_kl | 0.018120816 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.00956 | -| n_updates | 170590 | -| policy_gradient_loss | 0.0234 | -| std | 0.00841 | -| value_loss | 5.71e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17061 | -| time_elapsed | 92221 | -| total_timesteps | 2183808 | -| train/ | | -| approx_kl | 0.06586309 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | 0.0396 | -| n_updates | 170600 | -| policy_gradient_loss | 0.0187 | -| std | 0.00841 | -| value_loss | 7.56e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17062 | -| time_elapsed | 92226 | -| total_timesteps | 2183936 | -| train/ | | -| approx_kl | 0.0037928913 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.00409 | -| n_updates | 170610 | -| policy_gradient_loss | 0.00488 | -| std | 0.00842 | -| value_loss | 3.68e-10 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17063 | -| time_elapsed | 92231 | -| total_timesteps | 2184064 | -| train/ | | -| approx_kl | 0.0381752 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | -0.00831 | -| n_updates | 170620 | -| policy_gradient_loss | 0.0103 | -| std | 0.00842 | -| value_loss | 1.12e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17064 | -| time_elapsed | 92242 | -| total_timesteps | 2184192 | -| train/ | | -| approx_kl | 0.006853469 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 170630 | -| policy_gradient_loss | -0.017 | -| std | 0.00842 | -| value_loss | 0.000645 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17065 | -| time_elapsed | 92249 | -| total_timesteps | 2184320 | -| train/ | | -| approx_kl | 0.017826602 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 170640 | -| policy_gradient_loss | 0.00714 | -| std | 0.00842 | -| value_loss | 5.59e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17066 | -| time_elapsed | 92254 | -| total_timesteps | 2184448 | -| train/ | | -| approx_kl | 0.0689494 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00245 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 170650 | -| policy_gradient_loss | 0.0142 | -| std | 0.00842 | -| value_loss | 9.99e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17067 | -| time_elapsed | 92260 | -| total_timesteps | 2184576 | -| train/ | | -| approx_kl | 0.00017294567 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.000183 | -| n_updates | 170660 | -| policy_gradient_loss | 0.0215 | -| std | 0.00843 | -| value_loss | 1.83e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17068 | -| time_elapsed | 92264 | -| total_timesteps | 2184704 | -| train/ | | -| approx_kl | 0.0007746485 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.000586 | -| n_updates | 170670 | -| policy_gradient_loss | 0.0196 | -| std | 0.00842 | -| value_loss | 1.4e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17069 | -| time_elapsed | 92267 | -| total_timesteps | 2184832 | -| train/ | | -| approx_kl | 4.214188e-05 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0712 | -| learning_rate | 0.0003 | -| loss | 0.000544 | -| n_updates | 170680 | -| policy_gradient_loss | 0.0185 | -| std | 0.00842 | -| value_loss | 3.66e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17070 | -| time_elapsed | 92271 | -| total_timesteps | 2184960 | -| train/ | | -| approx_kl | 0.1710092 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -5.27 | -| learning_rate | 0.0003 | -| loss | 0.00855 | -| n_updates | 170690 | -| policy_gradient_loss | 0.00292 | -| std | 0.00842 | -| value_loss | 2.08e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17071 | -| time_elapsed | 92275 | -| total_timesteps | 2185088 | -| train/ | | -| approx_kl | 0.0105666295 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00142 | -| learning_rate | 0.0003 | -| loss | 6.54e-05 | -| n_updates | 170700 | -| policy_gradient_loss | 0.0203 | -| std | 0.00842 | -| value_loss | 8.14e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17072 | -| time_elapsed | 92286 | -| total_timesteps | 2185216 | -| train/ | | -| approx_kl | 0.30222005 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 170710 | -| policy_gradient_loss | 0.0387 | -| std | 0.00842 | -| value_loss | 0.002 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17073 | -| time_elapsed | 92291 | -| total_timesteps | 2185344 | -| train/ | | -| approx_kl | 0.17255332 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 170720 | -| policy_gradient_loss | 0.092 | -| std | 0.00842 | -| value_loss | 3.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17074 | -| time_elapsed | 92297 | -| total_timesteps | 2185472 | -| train/ | | -| approx_kl | 0.030203752 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00784 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 170730 | -| policy_gradient_loss | 0.016 | -| std | 0.00842 | -| value_loss | 3.87e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17075 | -| time_elapsed | 92301 | -| total_timesteps | 2185600 | -| train/ | | -| approx_kl | 0.43375477 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 170740 | -| policy_gradient_loss | 0.0458 | -| std | 0.00842 | -| value_loss | 1.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17076 | -| time_elapsed | 92307 | -| total_timesteps | 2185728 | -| train/ | | -| approx_kl | 0.021659862 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 170750 | -| policy_gradient_loss | -0.00294 | -| std | 0.00842 | -| value_loss | 1.55e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17077 | -| time_elapsed | 92311 | -| total_timesteps | 2185856 | -| train/ | | -| approx_kl | 2.1282118e-05 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 170760 | -| policy_gradient_loss | -0.00414 | -| std | 0.00842 | -| value_loss | 1.11e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 17078 | -| time_elapsed | 92316 | -| total_timesteps | 2185984 | -| train/ | | -| approx_kl | 0.029140579 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 170770 | -| policy_gradient_loss | 0.00575 | -| std | 0.00842 | -| value_loss | 6.14e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17079 | -| time_elapsed | 92320 | -| total_timesteps | 2186112 | -| train/ | | -| approx_kl | 0.0057689142 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 170780 | -| policy_gradient_loss | 0.00226 | -| std | 0.00842 | -| value_loss | 4.69e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17080 | -| time_elapsed | 92333 | -| total_timesteps | 2186240 | -| train/ | | -| approx_kl | 0.004579414 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.00737 | -| n_updates | 170790 | -| policy_gradient_loss | -0.0145 | -| std | 0.00842 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17081 | -| time_elapsed | 92339 | -| total_timesteps | 2186368 | -| train/ | | -| approx_kl | 0.076645434 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 170800 | -| policy_gradient_loss | 0.0344 | -| std | 0.00842 | -| value_loss | 2.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17082 | -| time_elapsed | 92344 | -| total_timesteps | 2186496 | -| train/ | | -| approx_kl | 0.086935796 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0436 | -| n_updates | 170810 | -| policy_gradient_loss | 0.0173 | -| std | 0.00842 | -| value_loss | 5.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17083 | -| time_elapsed | 92349 | -| total_timesteps | 2186624 | -| train/ | | -| approx_kl | 0.022560205 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0653 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 170820 | -| policy_gradient_loss | -0.000419 | -| std | 0.00842 | -| value_loss | 3.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17084 | -| time_elapsed | 92354 | -| total_timesteps | 2186752 | -| train/ | | -| approx_kl | 0.13424098 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 170830 | -| policy_gradient_loss | 0.00984 | -| std | 0.00842 | -| value_loss | 2.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 17085 | -| time_elapsed | 92358 | -| total_timesteps | 2186880 | -| train/ | | -| approx_kl | 0.006614966 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 170840 | -| policy_gradient_loss | 0.000686 | -| std | 0.00842 | -| value_loss | 1.8e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17086 | -| time_elapsed | 92364 | -| total_timesteps | 2187008 | -| train/ | | -| approx_kl | 0.08248595 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 170850 | -| policy_gradient_loss | 0.0127 | -| std | 0.00841 | -| value_loss | 1.27e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17087 | -| time_elapsed | 92377 | -| total_timesteps | 2187136 | -| train/ | | -| approx_kl | 0.07084804 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.00794 | -| n_updates | 170860 | -| policy_gradient_loss | -0.00813 | -| std | 0.00841 | -| value_loss | 5.34e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17088 | -| time_elapsed | 92382 | -| total_timesteps | 2187264 | -| train/ | | -| approx_kl | 0.1040645 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.216 | -| learning_rate | 0.0003 | -| loss | 0.057 | -| n_updates | 170870 | -| policy_gradient_loss | 0.034 | -| std | 0.00841 | -| value_loss | 3.41e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17089 | -| time_elapsed | 92388 | -| total_timesteps | 2187392 | -| train/ | | -| approx_kl | 0.11552412 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 170880 | -| policy_gradient_loss | 0.0199 | -| std | 0.00841 | -| value_loss | 7.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17090 | -| time_elapsed | 92394 | -| total_timesteps | 2187520 | -| train/ | | -| approx_kl | 0.03012765 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0041 | -| n_updates | 170890 | -| policy_gradient_loss | -0.00301 | -| std | 0.00841 | -| value_loss | 4.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17091 | -| time_elapsed | 92398 | -| total_timesteps | 2187648 | -| train/ | | -| approx_kl | 0.012330591 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.00193 | -| n_updates | 170900 | -| policy_gradient_loss | -0.000497 | -| std | 0.00841 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17092 | -| time_elapsed | 92403 | -| total_timesteps | 2187776 | -| train/ | | -| approx_kl | 0.10133353 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -28.8 | -| learning_rate | 0.0003 | -| loss | 0.00636 | -| n_updates | 170910 | -| policy_gradient_loss | 0.0027 | -| std | 0.00841 | -| value_loss | 1.13e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17093 | -| time_elapsed | 92408 | -| total_timesteps | 2187904 | -| train/ | | -| approx_kl | 0.2856892 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 170920 | -| policy_gradient_loss | 0.0463 | -| std | 0.00843 | -| value_loss | 4.98e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17094 | -| time_elapsed | 92414 | -| total_timesteps | 2188032 | -| train/ | | -| approx_kl | 0.067359135 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0772 | -| learning_rate | 0.0003 | -| loss | 0.0487 | -| n_updates | 170930 | -| policy_gradient_loss | 0.0359 | -| std | 0.00842 | -| value_loss | 4.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17095 | -| time_elapsed | 92425 | -| total_timesteps | 2188160 | -| train/ | | -| approx_kl | 0.014531601 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.57 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 170940 | -| policy_gradient_loss | 0.0081 | -| std | 0.00842 | -| value_loss | 0.000819 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17096 | -| time_elapsed | 92431 | -| total_timesteps | 2188288 | -| train/ | | -| approx_kl | 0.025180174 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | 0.0329 | -| n_updates | 170950 | -| policy_gradient_loss | 0.000395 | -| std | 0.00843 | -| value_loss | 3.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17097 | -| time_elapsed | 92436 | -| total_timesteps | 2188416 | -| train/ | | -| approx_kl | 0.07797954 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 170960 | -| policy_gradient_loss | 0.0309 | -| std | 0.00843 | -| value_loss | 5.11e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17098 | -| time_elapsed | 92442 | -| total_timesteps | 2188544 | -| train/ | | -| approx_kl | 0.20325333 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 170970 | -| policy_gradient_loss | 0.0963 | -| std | 0.00844 | -| value_loss | 1.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17099 | -| time_elapsed | 92446 | -| total_timesteps | 2188672 | -| train/ | | -| approx_kl | 0.041063383 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.00301 | -| n_updates | 170980 | -| policy_gradient_loss | 0.0146 | -| std | 0.00844 | -| value_loss | 6.18e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17100 | -| time_elapsed | 92450 | -| total_timesteps | 2188800 | -| train/ | | -| approx_kl | 0.2923545 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.0971 | -| n_updates | 170990 | -| policy_gradient_loss | 0.0268 | -| std | 0.00844 | -| value_loss | 4.48e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17101 | -| time_elapsed | 92455 | -| total_timesteps | 2188928 | -| train/ | | -| approx_kl | 0.023890069 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 171000 | -| policy_gradient_loss | -0.000714 | -| std | 0.00844 | -| value_loss | 2.75e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17102 | -| time_elapsed | 92459 | -| total_timesteps | 2189056 | -| train/ | | -| approx_kl | 0.0043682368 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.00388 | -| n_updates | 171010 | -| policy_gradient_loss | 0.00336 | -| std | 0.00844 | -| value_loss | 1.8e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17103 | -| time_elapsed | 92467 | -| total_timesteps | 2189184 | -| train/ | | -| approx_kl | 0.12756607 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 171020 | -| policy_gradient_loss | -0.012 | -| std | 0.00844 | -| value_loss | 0.000128 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17104 | -| time_elapsed | 92472 | -| total_timesteps | 2189312 | -| train/ | | -| approx_kl | 0.2434186 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -1.2 | -| learning_rate | 0.0003 | -| loss | 0.0655 | -| n_updates | 171030 | -| policy_gradient_loss | 0.0229 | -| std | 0.00843 | -| value_loss | 4e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17105 | -| time_elapsed | 92476 | -| total_timesteps | 2189440 | -| train/ | | -| approx_kl | 0.049765196 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.914 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 171040 | -| policy_gradient_loss | 0.0116 | -| std | 0.00843 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17106 | -| time_elapsed | 92480 | -| total_timesteps | 2189568 | -| train/ | | -| approx_kl | 0.089154825 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 171050 | -| policy_gradient_loss | 0.0103 | -| std | 0.00843 | -| value_loss | 5.22e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17107 | -| time_elapsed | 92484 | -| total_timesteps | 2189696 | -| train/ | | -| approx_kl | 0.25619587 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 171060 | -| policy_gradient_loss | 0.103 | -| std | 0.00843 | -| value_loss | 3.58e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17108 | -| time_elapsed | 92488 | -| total_timesteps | 2189824 | -| train/ | | -| approx_kl | 0.01454416 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.000341 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 171070 | -| policy_gradient_loss | 0.0125 | -| std | 0.00844 | -| value_loss | 1.3e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17109 | -| time_elapsed | 92493 | -| total_timesteps | 2189952 | -| train/ | | -| approx_kl | 0.06645062 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 171080 | -| policy_gradient_loss | 0.0152 | -| std | 0.00846 | -| value_loss | 1.22e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17110 | -| time_elapsed | 92497 | -| total_timesteps | 2190080 | -| train/ | | -| approx_kl | 0.024113964 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00623 | -| learning_rate | 0.0003 | -| loss | -0.00863 | -| n_updates | 171090 | -| policy_gradient_loss | 0.00779 | -| std | 0.00847 | -| value_loss | 4.58e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17111 | -| time_elapsed | 92506 | -| total_timesteps | 2190208 | -| train/ | | -| approx_kl | 0.091627985 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.733 | -| learning_rate | 0.0003 | -| loss | 0.00781 | -| n_updates | 171100 | -| policy_gradient_loss | 0.00332 | -| std | 0.00847 | -| value_loss | 0.00582 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17112 | -| time_elapsed | 92511 | -| total_timesteps | 2190336 | -| train/ | | -| approx_kl | 0.23843592 | -| clip_fraction | 0.6 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 171110 | -| policy_gradient_loss | 0.0887 | -| std | 0.00847 | -| value_loss | 3.89e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17113 | -| time_elapsed | 92516 | -| total_timesteps | 2190464 | -| train/ | | -| approx_kl | 0.14203209 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00807 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 171120 | -| policy_gradient_loss | 0.109 | -| std | 0.00848 | -| value_loss | 5.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17114 | -| time_elapsed | 92521 | -| total_timesteps | 2190592 | -| train/ | | -| approx_kl | 0.022464836 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 171130 | -| policy_gradient_loss | 0.0146 | -| std | 0.00846 | -| value_loss | 2.05e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17115 | -| time_elapsed | 92526 | -| total_timesteps | 2190720 | -| train/ | | -| approx_kl | 0.3319704 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 171140 | -| policy_gradient_loss | 0.0411 | -| std | 0.00845 | -| value_loss | 5.36e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17116 | -| time_elapsed | 92530 | -| total_timesteps | 2190848 | -| train/ | | -| approx_kl | 0.0068857423 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 171150 | -| policy_gradient_loss | 0.000244 | -| std | 0.00844 | -| value_loss | 2.47e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17117 | -| time_elapsed | 92535 | -| total_timesteps | 2190976 | -| train/ | | -| approx_kl | 0.023730393 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 171160 | -| policy_gradient_loss | 0.0599 | -| std | 0.00842 | -| value_loss | 0.000107 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17118 | -| time_elapsed | 92540 | -| total_timesteps | 2191104 | -| train/ | | -| approx_kl | 0.061217006 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | 0.092 | -| n_updates | 171170 | -| policy_gradient_loss | 0.0943 | -| std | 0.00841 | -| value_loss | 4.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17119 | -| time_elapsed | 92552 | -| total_timesteps | 2191232 | -| train/ | | -| approx_kl | 0.016346859 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -8.62 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 171180 | -| policy_gradient_loss | -0.0146 | -| std | 0.0084 | -| value_loss | 0.00301 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17120 | -| time_elapsed | 92558 | -| total_timesteps | 2191360 | -| train/ | | -| approx_kl | 0.19249223 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.0688 | -| n_updates | 171190 | -| policy_gradient_loss | 0.0312 | -| std | 0.0084 | -| value_loss | 2.4e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17121 | -| time_elapsed | 92561 | -| total_timesteps | 2191488 | -| train/ | | -| approx_kl | 0.00093041593 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 171200 | -| policy_gradient_loss | -0.00012 | -| std | 0.00839 | -| value_loss | 6.82e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17122 | -| time_elapsed | 92565 | -| total_timesteps | 2191616 | -| train/ | | -| approx_kl | 4.339032e-06 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | -0.000288 | -| n_updates | 171210 | -| policy_gradient_loss | 0.000432 | -| std | 0.0084 | -| value_loss | 3.86e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17123 | -| time_elapsed | 92568 | -| total_timesteps | 2191744 | -| train/ | | -| approx_kl | 0.0001425636 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 171220 | -| policy_gradient_loss | -0.00651 | -| std | 0.0084 | -| value_loss | 2.74e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 17124 | -| time_elapsed | 92571 | -| total_timesteps | 2191872 | -| train/ | | -| approx_kl | 0.038830142 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 171230 | -| policy_gradient_loss | 0.0395 | -| std | 0.0084 | -| value_loss | 1.76e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17125 | -| time_elapsed | 92577 | -| total_timesteps | 2192000 | -| train/ | | -| approx_kl | 0.033989616 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 171240 | -| policy_gradient_loss | 0.0175 | -| std | 0.0084 | -| value_loss | 1.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17126 | -| time_elapsed | 92583 | -| total_timesteps | 2192128 | -| train/ | | -| approx_kl | 0.02422335 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00307 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 171250 | -| policy_gradient_loss | 0.0206 | -| std | 0.0084 | -| value_loss | 6.06e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17127 | -| time_elapsed | 92592 | -| total_timesteps | 2192256 | -| train/ | | -| approx_kl | 0.11588476 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.726 | -| learning_rate | 0.0003 | -| loss | -0.000166 | -| n_updates | 171260 | -| policy_gradient_loss | -0.00516 | -| std | 0.0084 | -| value_loss | 0.0049 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17128 | -| time_elapsed | 92598 | -| total_timesteps | 2192384 | -| train/ | | -| approx_kl | 5.430868e-05 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | -0.000122 | -| n_updates | 171270 | -| policy_gradient_loss | 0.0214 | -| std | 0.0084 | -| value_loss | 4.48e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17129 | -| time_elapsed | 92603 | -| total_timesteps | 2192512 | -| train/ | | -| approx_kl | 0.041914575 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0708 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 171280 | -| policy_gradient_loss | 0.0148 | -| std | 0.0084 | -| value_loss | 4.63e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17130 | -| time_elapsed | 92608 | -| total_timesteps | 2192640 | -| train/ | | -| approx_kl | 0.18345147 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.892 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 171290 | -| policy_gradient_loss | 0.125 | -| std | 0.0084 | -| value_loss | 5.1e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17131 | -| time_elapsed | 92612 | -| total_timesteps | 2192768 | -| train/ | | -| approx_kl | 0.1216778 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | 0.0813 | -| n_updates | 171300 | -| policy_gradient_loss | 0.0888 | -| std | 0.0084 | -| value_loss | 1.76e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17132 | -| time_elapsed | 92618 | -| total_timesteps | 2192896 | -| train/ | | -| approx_kl | 0.10561906 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0819 | -| n_updates | 171310 | -| policy_gradient_loss | 0.0933 | -| std | 0.0084 | -| value_loss | 1.17e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17133 | -| time_elapsed | 92624 | -| total_timesteps | 2193024 | -| train/ | | -| approx_kl | 0.096447766 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 171320 | -| policy_gradient_loss | 0.084 | -| std | 0.0084 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17134 | -| time_elapsed | 92635 | -| total_timesteps | 2193152 | -| train/ | | -| approx_kl | 0.072102204 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.743 | -| learning_rate | 0.0003 | -| loss | 0.0445 | -| n_updates | 171330 | -| policy_gradient_loss | 0.0308 | -| std | 0.0084 | -| value_loss | 0.0044 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17135 | -| time_elapsed | 92640 | -| total_timesteps | 2193280 | -| train/ | | -| approx_kl | 0.034970284 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 171340 | -| policy_gradient_loss | 0.0124 | -| std | 0.0084 | -| value_loss | 7.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17136 | -| time_elapsed | 92646 | -| total_timesteps | 2193408 | -| train/ | | -| approx_kl | 0.0027817348 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.00248 | -| n_updates | 171350 | -| policy_gradient_loss | 0.00551 | -| std | 0.0084 | -| value_loss | 1.56e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17137 | -| time_elapsed | 92651 | -| total_timesteps | 2193536 | -| train/ | | -| approx_kl | 0.028836653 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00726 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 171360 | -| policy_gradient_loss | 0.00759 | -| std | 0.0084 | -| value_loss | 2.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17138 | -| time_elapsed | 92657 | -| total_timesteps | 2193664 | -| train/ | | -| approx_kl | 0.005251487 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.00048 | -| n_updates | 171370 | -| policy_gradient_loss | 0.0209 | -| std | 0.0084 | -| value_loss | 1.86e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17139 | -| time_elapsed | 92662 | -| total_timesteps | 2193792 | -| train/ | | -| approx_kl | 0.43360564 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.229 | -| n_updates | 171380 | -| policy_gradient_loss | 0.154 | -| std | 0.00839 | -| value_loss | 0.000344 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 17140 | -| time_elapsed | 92667 | -| total_timesteps | 2193920 | -| train/ | | -| approx_kl | 0.051765263 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00238 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 171390 | -| policy_gradient_loss | 0.0179 | -| std | 0.00838 | -| value_loss | 3.09e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17141 | -| time_elapsed | 92671 | -| total_timesteps | 2194048 | -| train/ | | -| approx_kl | 0.0027742153 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00659 | -| learning_rate | 0.0003 | -| loss | 0.00876 | -| n_updates | 171400 | -| policy_gradient_loss | 0.0041 | -| std | 0.00838 | -| value_loss | 1.53e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17142 | -| time_elapsed | 92681 | -| total_timesteps | 2194176 | -| train/ | | -| approx_kl | 0.4397361 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | 0.0235 | -| n_updates | 171410 | -| policy_gradient_loss | 0.0262 | -| std | 0.00838 | -| value_loss | 0.000623 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17143 | -| time_elapsed | 92686 | -| total_timesteps | 2194304 | -| train/ | | -| approx_kl | 0.032712158 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 171420 | -| policy_gradient_loss | 0.0458 | -| std | 0.00837 | -| value_loss | 4.72e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17144 | -| time_elapsed | 92691 | -| total_timesteps | 2194432 | -| train/ | | -| approx_kl | 0.1435419 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 0.0744 | -| n_updates | 171430 | -| policy_gradient_loss | 0.0378 | -| std | 0.00837 | -| value_loss | 3.22e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17145 | -| time_elapsed | 92695 | -| total_timesteps | 2194560 | -| train/ | | -| approx_kl | 0.032500986 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 171440 | -| policy_gradient_loss | 0.055 | -| std | 0.00837 | -| value_loss | 2.7e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17146 | -| time_elapsed | 92700 | -| total_timesteps | 2194688 | -| train/ | | -| approx_kl | 0.032505 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 171450 | -| policy_gradient_loss | 0.0182 | -| std | 0.00837 | -| value_loss | 1.91e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17147 | -| time_elapsed | 92705 | -| total_timesteps | 2194816 | -| train/ | | -| approx_kl | 0.14100172 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.0808 | -| n_updates | 171460 | -| policy_gradient_loss | 0.0289 | -| std | 0.00837 | -| value_loss | 1.02e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17148 | -| time_elapsed | 92709 | -| total_timesteps | 2194944 | -| train/ | | -| approx_kl | 0.033388697 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -6.23e-05 | -| n_updates | 171470 | -| policy_gradient_loss | 0.0477 | -| std | 0.00837 | -| value_loss | 8.94e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17149 | -| time_elapsed | 92714 | -| total_timesteps | 2195072 | -| train/ | | -| approx_kl | 0.13280767 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0377 | -| n_updates | 171480 | -| policy_gradient_loss | 0.0199 | -| std | 0.00837 | -| value_loss | 7.35e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17150 | -| time_elapsed | 92723 | -| total_timesteps | 2195200 | -| train/ | | -| approx_kl | 0.0027277572 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | -0.00464 | -| n_updates | 171490 | -| policy_gradient_loss | -0.00415 | -| std | 0.00837 | -| value_loss | 0.00275 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17151 | -| time_elapsed | 92729 | -| total_timesteps | 2195328 | -| train/ | | -| approx_kl | 0.000544481 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.007 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 171500 | -| policy_gradient_loss | 0.00322 | -| std | 0.00837 | -| value_loss | 6.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17152 | -| time_elapsed | 92733 | -| total_timesteps | 2195456 | -| train/ | | -| approx_kl | 0.050513793 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 171510 | -| policy_gradient_loss | 0.0475 | -| std | 0.00837 | -| value_loss | 1.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17153 | -| time_elapsed | 92739 | -| total_timesteps | 2195584 | -| train/ | | -| approx_kl | 5.420763e-06 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | -8.19e-05 | -| n_updates | 171520 | -| policy_gradient_loss | 0.0552 | -| std | 0.00836 | -| value_loss | 3.5e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17154 | -| time_elapsed | 92745 | -| total_timesteps | 2195712 | -| train/ | | -| approx_kl | 0.07982142 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00711 | -| learning_rate | 0.0003 | -| loss | 0.0891 | -| n_updates | 171530 | -| policy_gradient_loss | 0.108 | -| std | 0.00835 | -| value_loss | 0.00029 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17155 | -| time_elapsed | 92750 | -| total_timesteps | 2195840 | -| train/ | | -| approx_kl | 0.057021268 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0423 | -| n_updates | 171540 | -| policy_gradient_loss | 0.0369 | -| std | 0.00834 | -| value_loss | 8.27e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17156 | -| time_elapsed | 92755 | -| total_timesteps | 2195968 | -| train/ | | -| approx_kl | 0.22226335 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 171550 | -| policy_gradient_loss | 0.103 | -| std | 0.00834 | -| value_loss | 5.08e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17157 | -| time_elapsed | 92759 | -| total_timesteps | 2196096 | -| train/ | | -| approx_kl | 0.039683487 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 171560 | -| policy_gradient_loss | 0.0217 | -| std | 0.00834 | -| value_loss | 3.36e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17158 | -| time_elapsed | 92769 | -| total_timesteps | 2196224 | -| train/ | | -| approx_kl | 0.12694828 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.612 | -| learning_rate | 0.0003 | -| loss | 0.00397 | -| n_updates | 171570 | -| policy_gradient_loss | 0.00306 | -| std | 0.00834 | -| value_loss | 0.000665 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17159 | -| time_elapsed | 92774 | -| total_timesteps | 2196352 | -| train/ | | -| approx_kl | 0.25289148 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 171580 | -| policy_gradient_loss | 0.0397 | -| std | 0.00834 | -| value_loss | 9.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17160 | -| time_elapsed | 92779 | -| total_timesteps | 2196480 | -| train/ | | -| approx_kl | 0.034629125 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -4.35e-05 | -| n_updates | 171590 | -| policy_gradient_loss | -0.000991 | -| std | 0.00834 | -| value_loss | 5.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17161 | -| time_elapsed | 92783 | -| total_timesteps | 2196608 | -| train/ | | -| approx_kl | 0.0056424355 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 171600 | -| policy_gradient_loss | 0.00149 | -| std | 0.00834 | -| value_loss | 3.55e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17162 | -| time_elapsed | 92789 | -| total_timesteps | 2196736 | -| train/ | | -| approx_kl | 0.04410351 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.00967 | -| n_updates | 171610 | -| policy_gradient_loss | 0.0234 | -| std | 0.00833 | -| value_loss | 2.39e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17163 | -| time_elapsed | 92794 | -| total_timesteps | 2196864 | -| train/ | | -| approx_kl | 0.66581553 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.288 | -| n_updates | 171620 | -| policy_gradient_loss | 0.127 | -| std | 0.00833 | -| value_loss | 1.44e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 17164 | -| time_elapsed | 92799 | -| total_timesteps | 2196992 | -| train/ | | -| approx_kl | 0.025250282 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.0061 | -| n_updates | 171630 | -| policy_gradient_loss | 0.000419 | -| std | 0.00834 | -| value_loss | 9.67e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17165 | -| time_elapsed | 92805 | -| total_timesteps | 2197120 | -| train/ | | -| approx_kl | 0.0104249995 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.00391 | -| n_updates | 171640 | -| policy_gradient_loss | 0.0218 | -| std | 0.00834 | -| value_loss | 1.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17166 | -| time_elapsed | 92819 | -| total_timesteps | 2197248 | -| train/ | | -| approx_kl | 0.17464046 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.688 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 171650 | -| policy_gradient_loss | -0.00768 | -| std | 0.00834 | -| value_loss | 0.00693 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17167 | -| time_elapsed | 92824 | -| total_timesteps | 2197376 | -| train/ | | -| approx_kl | 0.0019019675 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.00617 | -| n_updates | 171660 | -| policy_gradient_loss | 0.0125 | -| std | 0.00834 | -| value_loss | 1.73e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17168 | -| time_elapsed | 92829 | -| total_timesteps | 2197504 | -| train/ | | -| approx_kl | 0.00089640776 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00843 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 171670 | -| policy_gradient_loss | 0.0131 | -| std | 0.00835 | -| value_loss | 3.56e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17169 | -| time_elapsed | 92833 | -| total_timesteps | 2197632 | -| train/ | | -| approx_kl | 0.05052567 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 171680 | -| policy_gradient_loss | 0.0228 | -| std | 0.00835 | -| value_loss | 2.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17170 | -| time_elapsed | 92838 | -| total_timesteps | 2197760 | -| train/ | | -| approx_kl | 0.025885176 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0535 | -| learning_rate | 0.0003 | -| loss | 0.00264 | -| n_updates | 171690 | -| policy_gradient_loss | 0.016 | -| std | 0.00835 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17171 | -| time_elapsed | 92843 | -| total_timesteps | 2197888 | -| train/ | | -| approx_kl | 0.0022661216 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.000513 | -| n_updates | 171700 | -| policy_gradient_loss | 0.0174 | -| std | 0.00835 | -| value_loss | 6.59e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17172 | -| time_elapsed | 92847 | -| total_timesteps | 2198016 | -| train/ | | -| approx_kl | 0.05801303 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 171710 | -| policy_gradient_loss | 0.0133 | -| std | 0.00835 | -| value_loss | 3.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17173 | -| time_elapsed | 92859 | -| total_timesteps | 2198144 | -| train/ | | -| approx_kl | 0.01664019 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 171720 | -| policy_gradient_loss | 0.00237 | -| std | 0.00835 | -| value_loss | 0.000539 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17174 | -| time_elapsed | 92864 | -| total_timesteps | 2198272 | -| train/ | | -| approx_kl | 0.07927161 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00261 | -| learning_rate | 0.0003 | -| loss | 0.0938 | -| n_updates | 171730 | -| policy_gradient_loss | 0.0326 | -| std | 0.00834 | -| value_loss | 1.11e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17175 | -| time_elapsed | 92869 | -| total_timesteps | 2198400 | -| train/ | | -| approx_kl | 0.00018119626 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | 0.00407 | -| n_updates | 171740 | -| policy_gradient_loss | -0.00954 | -| std | 0.00834 | -| value_loss | 4.56e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17176 | -| time_elapsed | 92873 | -| total_timesteps | 2198528 | -| train/ | | -| approx_kl | 0.00034186663 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.000665 | -| n_updates | 171750 | -| policy_gradient_loss | 0.00928 | -| std | 0.00834 | -| value_loss | 3.02e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17177 | -| time_elapsed | 92878 | -| total_timesteps | 2198656 | -| train/ | | -| approx_kl | 0.033813886 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.00887 | -| n_updates | 171760 | -| policy_gradient_loss | 0.0346 | -| std | 0.00834 | -| value_loss | 2.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17178 | -| time_elapsed | 92882 | -| total_timesteps | 2198784 | -| train/ | | -| approx_kl | 0.08598792 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0751 | -| n_updates | 171770 | -| policy_gradient_loss | 0.0303 | -| std | 0.00835 | -| value_loss | 1.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17179 | -| time_elapsed | 92886 | -| total_timesteps | 2198912 | -| train/ | | -| approx_kl | 0.010236608 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00639 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 171780 | -| policy_gradient_loss | -0.00199 | -| std | 0.00836 | -| value_loss | 2.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17180 | -| time_elapsed | 92890 | -| total_timesteps | 2199040 | -| train/ | | -| approx_kl | 0.011812367 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00598 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 171790 | -| policy_gradient_loss | 0.0151 | -| std | 0.00836 | -| value_loss | 9.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17181 | -| time_elapsed | 92899 | -| total_timesteps | 2199168 | -| train/ | | -| approx_kl | 0.36611092 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -2.07 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 171800 | -| policy_gradient_loss | -0.00122 | -| std | 0.00837 | -| value_loss | 0.0019 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17182 | -| time_elapsed | 92904 | -| total_timesteps | 2199296 | -| train/ | | -| approx_kl | 0.025891181 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 171810 | -| policy_gradient_loss | -0.00118 | -| std | 0.00837 | -| value_loss | 3.4e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17183 | -| time_elapsed | 92908 | -| total_timesteps | 2199424 | -| train/ | | -| approx_kl | 0.2807793 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -21.4 | -| learning_rate | 0.0003 | -| loss | 0.0596 | -| n_updates | 171820 | -| policy_gradient_loss | 0.018 | -| std | 0.00834 | -| value_loss | 1.13e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17184 | -| time_elapsed | 92913 | -| total_timesteps | 2199552 | -| train/ | | -| approx_kl | 0.05372597 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -0.000163 | -| n_updates | 171830 | -| policy_gradient_loss | 0.0132 | -| std | 0.00833 | -| value_loss | 4.9e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17185 | -| time_elapsed | 92918 | -| total_timesteps | 2199680 | -| train/ | | -| approx_kl | 0.5847709 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.271 | -| n_updates | 171840 | -| policy_gradient_loss | 0.139 | -| std | 0.00833 | -| value_loss | 1.07e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17186 | -| time_elapsed | 92922 | -| total_timesteps | 2199808 | -| train/ | | -| approx_kl | 0.0037798905 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 171850 | -| policy_gradient_loss | 0.0149 | -| std | 0.00833 | -| value_loss | 4.91e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 17187 | -| time_elapsed | 92927 | -| total_timesteps | 2199936 | -| train/ | | -| approx_kl | 0.18469124 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 171860 | -| policy_gradient_loss | 0.0815 | -| std | 0.00833 | -| value_loss | 9.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17188 | -| time_elapsed | 92934 | -| total_timesteps | 2200064 | -| train/ | | -| approx_kl | 0.026259314 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00405 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 171870 | -| policy_gradient_loss | 0.00952 | -| std | 0.00834 | -| value_loss | 3.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17189 | -| time_elapsed | 92944 | -| total_timesteps | 2200192 | -| train/ | | -| approx_kl | 0.03665808 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.951 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 171880 | -| policy_gradient_loss | -0.00983 | -| std | 0.00834 | -| value_loss | 0.000353 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17190 | -| time_elapsed | 92950 | -| total_timesteps | 2200320 | -| train/ | | -| approx_kl | 0.14112504 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -43.5 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 171890 | -| policy_gradient_loss | 0.0345 | -| std | 0.00834 | -| value_loss | 1.9e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17191 | -| time_elapsed | 92955 | -| total_timesteps | 2200448 | -| train/ | | -| approx_kl | 0.029970229 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 171900 | -| policy_gradient_loss | 0.0226 | -| std | 0.00834 | -| value_loss | 1.81e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17192 | -| time_elapsed | 92961 | -| total_timesteps | 2200576 | -| train/ | | -| approx_kl | 0.44111386 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0609 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 171910 | -| policy_gradient_loss | 0.0431 | -| std | 0.00834 | -| value_loss | 1.22e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17193 | -| time_elapsed | 92966 | -| total_timesteps | 2200704 | -| train/ | | -| approx_kl | 0.006583292 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 171920 | -| policy_gradient_loss | 0.00331 | -| std | 0.00834 | -| value_loss | 8.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17194 | -| time_elapsed | 92973 | -| total_timesteps | 2200832 | -| train/ | | -| approx_kl | 0.053819265 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 171930 | -| policy_gradient_loss | 0.0269 | -| std | 0.00834 | -| value_loss | 5.94e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17195 | -| time_elapsed | 92977 | -| total_timesteps | 2200960 | -| train/ | | -| approx_kl | 0.53356504 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.239 | -| n_updates | 171940 | -| policy_gradient_loss | 0.105 | -| std | 0.00834 | -| value_loss | 4.4e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17196 | -| time_elapsed | 92983 | -| total_timesteps | 2201088 | -| train/ | | -| approx_kl | 0.029469356 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.00815 | -| n_updates | 171950 | -| policy_gradient_loss | 0.00099 | -| std | 0.00833 | -| value_loss | 2.59e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17197 | -| time_elapsed | 92996 | -| total_timesteps | 2201216 | -| train/ | | -| approx_kl | 0.061429165 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 171960 | -| policy_gradient_loss | -0.00924 | -| std | 0.00833 | -| value_loss | 0.000414 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17198 | -| time_elapsed | 93001 | -| total_timesteps | 2201344 | -| train/ | | -| approx_kl | 0.00678639 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 171970 | -| policy_gradient_loss | 0.00196 | -| std | 0.00833 | -| value_loss | 1.62e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17199 | -| time_elapsed | 93008 | -| total_timesteps | 2201472 | -| train/ | | -| approx_kl | 0.05389046 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | 0.0042 | -| n_updates | 171980 | -| policy_gradient_loss | 0.01 | -| std | 0.00833 | -| value_loss | 1.67e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17200 | -| time_elapsed | 93012 | -| total_timesteps | 2201600 | -| train/ | | -| approx_kl | 0.23800963 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 171990 | -| policy_gradient_loss | 0.116 | -| std | 0.00834 | -| value_loss | 7.8e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17201 | -| time_elapsed | 93017 | -| total_timesteps | 2201728 | -| train/ | | -| approx_kl | 0.14270386 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 172000 | -| policy_gradient_loss | 0.0761 | -| std | 0.00834 | -| value_loss | 1.64e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17202 | -| time_elapsed | 93021 | -| total_timesteps | 2201856 | -| train/ | | -| approx_kl | 0.024011718 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | -0.000645 | -| n_updates | 172010 | -| policy_gradient_loss | 0.0156 | -| std | 0.00834 | -| value_loss | 1.16e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 17203 | -| time_elapsed | 93026 | -| total_timesteps | 2201984 | -| train/ | | -| approx_kl | 0.00086046336 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.00337 | -| n_updates | 172020 | -| policy_gradient_loss | 0.00309 | -| std | 0.00834 | -| value_loss | 1.09e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17204 | -| time_elapsed | 93030 | -| total_timesteps | 2202112 | -| train/ | | -| approx_kl | 0.12159312 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 172030 | -| policy_gradient_loss | 0.0908 | -| std | 0.00834 | -| value_loss | 3.41e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17205 | -| time_elapsed | 93041 | -| total_timesteps | 2202240 | -| train/ | | -| approx_kl | 0.036108233 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 172040 | -| policy_gradient_loss | -0.00347 | -| std | 0.00834 | -| value_loss | 7.2e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17206 | -| time_elapsed | 93046 | -| total_timesteps | 2202368 | -| train/ | | -| approx_kl | 0.0060838303 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0879 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 172050 | -| policy_gradient_loss | -0.00283 | -| std | 0.00834 | -| value_loss | 1.84e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17207 | -| time_elapsed | 93048 | -| total_timesteps | 2202496 | -| train/ | | -| approx_kl | 0.0028897836 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.000124 | -| n_updates | 172060 | -| policy_gradient_loss | 0.00359 | -| std | 0.0083 | -| value_loss | 5.99e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17208 | -| time_elapsed | 93053 | -| total_timesteps | 2202624 | -| train/ | | -| approx_kl | 0.06482845 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.788 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 172070 | -| policy_gradient_loss | 0.0106 | -| std | 0.00828 | -| value_loss | 1.21e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17209 | -| time_elapsed | 93059 | -| total_timesteps | 2202752 | -| train/ | | -| approx_kl | 0.0007714466 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.36 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 172080 | -| policy_gradient_loss | -0.00695 | -| std | 0.00828 | -| value_loss | 1.45e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 17210 | -| time_elapsed | 93064 | -| total_timesteps | 2202880 | -| train/ | | -| approx_kl | 0.006916604 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.668 | -| learning_rate | 0.0003 | -| loss | -0.00483 | -| n_updates | 172090 | -| policy_gradient_loss | 0.00157 | -| std | 0.00828 | -| value_loss | 6.39e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17211 | -| time_elapsed | 93069 | -| total_timesteps | 2203008 | -| train/ | | -| approx_kl | 0.023903256 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 172100 | -| policy_gradient_loss | 0.0613 | -| std | 0.00828 | -| value_loss | 1.11e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17212 | -| time_elapsed | 93080 | -| total_timesteps | 2203136 | -| train/ | | -| approx_kl | 0.3680903 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | 0.00348 | -| n_updates | 172110 | -| policy_gradient_loss | 0.0126 | -| std | 0.00828 | -| value_loss | 0.00158 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17213 | -| time_elapsed | 93086 | -| total_timesteps | 2203264 | -| train/ | | -| approx_kl | 0.08048997 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.35 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 172120 | -| policy_gradient_loss | 0.00623 | -| std | 0.00828 | -| value_loss | 3.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17214 | -| time_elapsed | 93091 | -| total_timesteps | 2203392 | -| train/ | | -| approx_kl | 0.039061267 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00475 | -| learning_rate | 0.0003 | -| loss | -0.00069 | -| n_updates | 172130 | -| policy_gradient_loss | 0.0182 | -| std | 0.00828 | -| value_loss | 2.39e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17215 | -| time_elapsed | 93097 | -| total_timesteps | 2203520 | -| train/ | | -| approx_kl | 0.1986677 | -| clip_fraction | 0.671 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 172140 | -| policy_gradient_loss | 0.097 | -| std | 0.00828 | -| value_loss | 2.06e-07 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17216 | -| time_elapsed | 93101 | -| total_timesteps | 2203648 | -| train/ | | -| approx_kl | 0.135245 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.098 | -| n_updates | 172150 | -| policy_gradient_loss | 0.097 | -| std | 0.00828 | -| value_loss | 1.4e-07 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17217 | -| time_elapsed | 93106 | -| total_timesteps | 2203776 | -| train/ | | -| approx_kl | 0.10284757 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0902 | -| n_updates | 172160 | -| policy_gradient_loss | 0.0905 | -| std | 0.00828 | -| value_loss | 1.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17218 | -| time_elapsed | 93112 | -| total_timesteps | 2203904 | -| train/ | | -| approx_kl | 0.088648885 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 172170 | -| policy_gradient_loss | 0.0853 | -| std | 0.00828 | -| value_loss | 8.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17219 | -| time_elapsed | 93116 | -| total_timesteps | 2204032 | -| train/ | | -| approx_kl | 0.020524656 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.000263 | -| n_updates | 172180 | -| policy_gradient_loss | 0.0176 | -| std | 0.00829 | -| value_loss | 5.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17220 | -| time_elapsed | 93127 | -| total_timesteps | 2204160 | -| train/ | | -| approx_kl | 0.022831282 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 172190 | -| policy_gradient_loss | -0.0176 | -| std | 0.00829 | -| value_loss | 0.0003 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17221 | -| time_elapsed | 93132 | -| total_timesteps | 2204288 | -| train/ | | -| approx_kl | 0.0016303649 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.000127 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 172200 | -| policy_gradient_loss | 0.0185 | -| std | 0.00828 | -| value_loss | 1.59e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17222 | -| time_elapsed | 93135 | -| total_timesteps | 2204416 | -| train/ | | -| approx_kl | 0.0006068484 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00245 | -| learning_rate | 0.0003 | -| loss | 0.000171 | -| n_updates | 172210 | -| policy_gradient_loss | 0.0233 | -| std | 0.00828 | -| value_loss | 6.6e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17223 | -| time_elapsed | 93139 | -| total_timesteps | 2204544 | -| train/ | | -| approx_kl | 0.14061907 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0061 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 172220 | -| policy_gradient_loss | 0.0157 | -| std | 0.00827 | -| value_loss | 6.81e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17224 | -| time_elapsed | 93143 | -| total_timesteps | 2204672 | -| train/ | | -| approx_kl | 0.099317156 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.009 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 172230 | -| policy_gradient_loss | 0.0101 | -| std | 0.00827 | -| value_loss | 5.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17225 | -| time_elapsed | 93148 | -| total_timesteps | 2204800 | -| train/ | | -| approx_kl | 0.038476247 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 172240 | -| policy_gradient_loss | 0.0153 | -| std | 0.00827 | -| value_loss | 1.12e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17226 | -| time_elapsed | 93152 | -| total_timesteps | 2204928 | -| train/ | | -| approx_kl | 0.10346259 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 172250 | -| policy_gradient_loss | 0.0211 | -| std | 0.00827 | -| value_loss | 1.06e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17227 | -| time_elapsed | 93158 | -| total_timesteps | 2205056 | -| train/ | | -| approx_kl | 0.12342994 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 172260 | -| policy_gradient_loss | 0.0194 | -| std | 0.00827 | -| value_loss | 8.41e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17228 | -| time_elapsed | 93168 | -| total_timesteps | 2205184 | -| train/ | | -| approx_kl | 0.14753696 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.739 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 172270 | -| policy_gradient_loss | -0.0186 | -| std | 0.00828 | -| value_loss | 0.00473 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17229 | -| time_elapsed | 93173 | -| total_timesteps | 2205312 | -| train/ | | -| approx_kl | 0.09560768 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 172280 | -| policy_gradient_loss | 0.0388 | -| std | 0.00828 | -| value_loss | 3.51e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17230 | -| time_elapsed | 93179 | -| total_timesteps | 2205440 | -| train/ | | -| approx_kl | 0.10074009 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00575 | -| learning_rate | 0.0003 | -| loss | 0.0547 | -| n_updates | 172290 | -| policy_gradient_loss | 0.0222 | -| std | 0.00828 | -| value_loss | 4.12e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17231 | -| time_elapsed | 93183 | -| total_timesteps | 2205568 | -| train/ | | -| approx_kl | 0.0010181721 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.000681 | -| n_updates | 172300 | -| policy_gradient_loss | 0.0217 | -| std | 0.00828 | -| value_loss | 2.41e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17232 | -| time_elapsed | 93188 | -| total_timesteps | 2205696 | -| train/ | | -| approx_kl | 0.3835647 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 172310 | -| policy_gradient_loss | 0.0384 | -| std | 0.00828 | -| value_loss | 2.92e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17233 | -| time_elapsed | 93194 | -| total_timesteps | 2205824 | -| train/ | | -| approx_kl | 0.07897263 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.0405 | -| n_updates | 172320 | -| policy_gradient_loss | 0.0468 | -| std | 0.00829 | -| value_loss | 1.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17234 | -| time_elapsed | 93198 | -| total_timesteps | 2205952 | -| train/ | | -| approx_kl | 0.002253185 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.00935 | -| n_updates | 172330 | -| policy_gradient_loss | -0.00263 | -| std | 0.00829 | -| value_loss | 7.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17235 | -| time_elapsed | 93203 | -| total_timesteps | 2206080 | -| train/ | | -| approx_kl | 0.016440375 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.0084 | -| n_updates | 172340 | -| policy_gradient_loss | 0.0273 | -| std | 0.00829 | -| value_loss | 1.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17236 | -| time_elapsed | 93212 | -| total_timesteps | 2206208 | -| train/ | | -| approx_kl | 0.012156038 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 172350 | -| policy_gradient_loss | -0.000346 | -| std | 0.00829 | -| value_loss | 0.000241 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17237 | -| time_elapsed | 93217 | -| total_timesteps | 2206336 | -| train/ | | -| approx_kl | 0.118786395 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.000385 | -| learning_rate | 0.0003 | -| loss | 0.0584 | -| n_updates | 172360 | -| policy_gradient_loss | 0.0163 | -| std | 0.00829 | -| value_loss | 1.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17238 | -| time_elapsed | 93223 | -| total_timesteps | 2206464 | -| train/ | | -| approx_kl | 0.011452736 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0755 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 172370 | -| policy_gradient_loss | 0.00795 | -| std | 0.00829 | -| value_loss | 3.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17239 | -| time_elapsed | 93228 | -| total_timesteps | 2206592 | -| train/ | | -| approx_kl | 0.18221626 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 172380 | -| policy_gradient_loss | 0.0855 | -| std | 0.00829 | -| value_loss | 2.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17240 | -| time_elapsed | 93234 | -| total_timesteps | 2206720 | -| train/ | | -| approx_kl | 0.034393854 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 172390 | -| policy_gradient_loss | 0.0134 | -| std | 0.00829 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17241 | -| time_elapsed | 93239 | -| total_timesteps | 2206848 | -| train/ | | -| approx_kl | 0.49262825 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 172400 | -| policy_gradient_loss | 0.0585 | -| std | 0.00829 | -| value_loss | 1.13e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 17242 | -| time_elapsed | 93244 | -| total_timesteps | 2206976 | -| train/ | | -| approx_kl | 0.026963728 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 172410 | -| policy_gradient_loss | 0.00689 | -| std | 0.00829 | -| value_loss | 7.68e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17243 | -| time_elapsed | 93249 | -| total_timesteps | 2207104 | -| train/ | | -| approx_kl | 2.9431656e-05 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 172420 | -| policy_gradient_loss | -0.00303 | -| std | 0.00829 | -| value_loss | 5.29e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17244 | -| time_elapsed | 93262 | -| total_timesteps | 2207232 | -| train/ | | -| approx_kl | 0.010421734 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 172430 | -| policy_gradient_loss | -0.00669 | -| std | 0.00829 | -| value_loss | 0.00125 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17245 | -| time_elapsed | 93268 | -| total_timesteps | 2207360 | -| train/ | | -| approx_kl | 0.14951327 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.283 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 172440 | -| policy_gradient_loss | 0.118 | -| std | 0.00829 | -| value_loss | 8.72e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17246 | -| time_elapsed | 93274 | -| total_timesteps | 2207488 | -| train/ | | -| approx_kl | 0.10297451 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00431 | -| learning_rate | 0.0003 | -| loss | 0.0682 | -| n_updates | 172450 | -| policy_gradient_loss | 0.0882 | -| std | 0.00829 | -| value_loss | 2.6e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17247 | -| time_elapsed | 93279 | -| total_timesteps | 2207616 | -| train/ | | -| approx_kl | 0.22414017 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 172460 | -| policy_gradient_loss | 0.0886 | -| std | 0.0083 | -| value_loss | 1.39e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17248 | -| time_elapsed | 93283 | -| total_timesteps | 2207744 | -| train/ | | -| approx_kl | 0.044236526 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | 0.00597 | -| n_updates | 172470 | -| policy_gradient_loss | 0.0153 | -| std | 0.0083 | -| value_loss | 6.09e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17249 | -| time_elapsed | 93288 | -| total_timesteps | 2207872 | -| train/ | | -| approx_kl | 0.00011147093 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.0028 | -| learning_rate | 0.0003 | -| loss | 0.000468 | -| n_updates | 172480 | -| policy_gradient_loss | 0.017 | -| std | 0.0083 | -| value_loss | 1.48e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17250 | -| time_elapsed | 93293 | -| total_timesteps | 2208000 | -| train/ | | -| approx_kl | 0.00019500079 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 172490 | -| policy_gradient_loss | 0.00104 | -| std | 0.0083 | -| value_loss | 9.55e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17251 | -| time_elapsed | 93298 | -| total_timesteps | 2208128 | -| train/ | | -| approx_kl | 0.036220983 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.0046 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 172500 | -| policy_gradient_loss | 0.0145 | -| std | 0.0083 | -| value_loss | 3.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17252 | -| time_elapsed | 93308 | -| total_timesteps | 2208256 | -| train/ | | -| approx_kl | 0.086698145 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 172510 | -| policy_gradient_loss | 0.00226 | -| std | 0.0083 | -| value_loss | 0.000118 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17253 | -| time_elapsed | 93313 | -| total_timesteps | 2208384 | -| train/ | | -| approx_kl | 0.2120531 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00415 | -| learning_rate | 0.0003 | -| loss | 0.0895 | -| n_updates | 172520 | -| policy_gradient_loss | 0.0127 | -| std | 0.00829 | -| value_loss | 5.2e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17254 | -| time_elapsed | 93318 | -| total_timesteps | 2208512 | -| train/ | | -| approx_kl | 0.0058442485 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 172530 | -| policy_gradient_loss | 0.0183 | -| std | 0.00829 | -| value_loss | 1.68e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17255 | -| time_elapsed | 93323 | -| total_timesteps | 2208640 | -| train/ | | -| approx_kl | 0.06320726 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 172540 | -| policy_gradient_loss | 0.0197 | -| std | 0.00829 | -| value_loss | 1.12e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17256 | -| time_elapsed | 93327 | -| total_timesteps | 2208768 | -| train/ | | -| approx_kl | 0.5455383 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.201 | -| n_updates | 172550 | -| policy_gradient_loss | 0.0526 | -| std | 0.00829 | -| value_loss | 7.94e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17257 | -| time_elapsed | 93333 | -| total_timesteps | 2208896 | -| train/ | | -| approx_kl | 0.023620462 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.00402 | -| n_updates | 172560 | -| policy_gradient_loss | 0.00308 | -| std | 0.00828 | -| value_loss | 4.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17258 | -| time_elapsed | 93338 | -| total_timesteps | 2209024 | -| train/ | | -| approx_kl | 0.032756716 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.00836 | -| n_updates | 172570 | -| policy_gradient_loss | -0.00498 | -| std | 0.00828 | -| value_loss | 3.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17259 | -| time_elapsed | 93350 | -| total_timesteps | 2209152 | -| train/ | | -| approx_kl | 0.015275311 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 172580 | -| policy_gradient_loss | -0.0137 | -| std | 0.00828 | -| value_loss | 0.000351 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17260 | -| time_elapsed | 93356 | -| total_timesteps | 2209280 | -| train/ | | -| approx_kl | 0.24281593 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 172590 | -| policy_gradient_loss | 0.00579 | -| std | 0.00827 | -| value_loss | 2e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17261 | -| time_elapsed | 93361 | -| total_timesteps | 2209408 | -| train/ | | -| approx_kl | 0.0230608 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00465 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 172600 | -| policy_gradient_loss | 0.00291 | -| std | 0.00828 | -| value_loss | 8.69e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17262 | -| time_elapsed | 93366 | -| total_timesteps | 2209536 | -| train/ | | -| approx_kl | 0.014400287 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0027 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 172610 | -| policy_gradient_loss | 0.0235 | -| std | 0.00828 | -| value_loss | 3.4e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17263 | -| time_elapsed | 93371 | -| total_timesteps | 2209664 | -| train/ | | -| approx_kl | 0.2362119 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00339 | -| learning_rate | 0.0003 | -| loss | 0.182 | -| n_updates | 172620 | -| policy_gradient_loss | 0.123 | -| std | 0.00829 | -| value_loss | 2.88e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17264 | -| time_elapsed | 93376 | -| total_timesteps | 2209792 | -| train/ | | -| approx_kl | 0.15595764 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00762 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 172630 | -| policy_gradient_loss | 0.109 | -| std | 0.00829 | -| value_loss | 2.21e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 17265 | -| time_elapsed | 93381 | -| total_timesteps | 2209920 | -| train/ | | -| approx_kl | 0.10148066 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 172640 | -| policy_gradient_loss | 0.102 | -| std | 0.00829 | -| value_loss | 1.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17266 | -| time_elapsed | 93386 | -| total_timesteps | 2210048 | -| train/ | | -| approx_kl | 0.019190244 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 172650 | -| policy_gradient_loss | 0.0162 | -| std | 0.00829 | -| value_loss | 1.1e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17267 | -| time_elapsed | 93393 | -| total_timesteps | 2210176 | -| train/ | | -| approx_kl | 0.1714541 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | 0.0568 | -| n_updates | 172660 | -| policy_gradient_loss | 0.00979 | -| std | 0.00829 | -| value_loss | 0.000202 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17268 | -| time_elapsed | 93397 | -| total_timesteps | 2210304 | -| train/ | | -| approx_kl | 0.01882889 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | -0.00892 | -| n_updates | 172670 | -| policy_gradient_loss | 0.0135 | -| std | 0.00829 | -| value_loss | 3.29e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17269 | -| time_elapsed | 93403 | -| total_timesteps | 2210432 | -| train/ | | -| approx_kl | 0.22933172 | -| clip_fraction | 0.669 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00718 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 172680 | -| policy_gradient_loss | 0.116 | -| std | 0.00829 | -| value_loss | 5.86e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17270 | -| time_elapsed | 93409 | -| total_timesteps | 2210560 | -| train/ | | -| approx_kl | 0.11149169 | -| clip_fraction | 0.65 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 172690 | -| policy_gradient_loss | 0.0999 | -| std | 0.00829 | -| value_loss | 4.24e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17271 | -| time_elapsed | 93414 | -| total_timesteps | 2210688 | -| train/ | | -| approx_kl | 0.09314691 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.0646 | -| n_updates | 172700 | -| policy_gradient_loss | 0.0931 | -| std | 0.00829 | -| value_loss | 2.51e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17272 | -| time_elapsed | 93420 | -| total_timesteps | 2210816 | -| train/ | | -| approx_kl | 0.10827549 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.0813 | -| n_updates | 172710 | -| policy_gradient_loss | 0.102 | -| std | 0.00829 | -| value_loss | 1.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17273 | -| time_elapsed | 93425 | -| total_timesteps | 2210944 | -| train/ | | -| approx_kl | 0.01724204 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.00745 | -| n_updates | 172720 | -| policy_gradient_loss | 0.0143 | -| std | 0.00829 | -| value_loss | 1.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17274 | -| time_elapsed | 93430 | -| total_timesteps | 2211072 | -| train/ | | -| approx_kl | 0.12376545 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.0547 | -| n_updates | 172730 | -| policy_gradient_loss | 0.0141 | -| std | 0.00829 | -| value_loss | 9.74e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17275 | -| time_elapsed | 93438 | -| total_timesteps | 2211200 | -| train/ | | -| approx_kl | 0.018807696 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0256 | -| n_updates | 172740 | -| policy_gradient_loss | -0.0175 | -| std | 0.00829 | -| value_loss | 9.38e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17276 | -| time_elapsed | 93443 | -| total_timesteps | 2211328 | -| train/ | | -| approx_kl | 0.039934948 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 172750 | -| policy_gradient_loss | 0.012 | -| std | 0.00829 | -| value_loss | 6.11e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17277 | -| time_elapsed | 93448 | -| total_timesteps | 2211456 | -| train/ | | -| approx_kl | 0.00019566249 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 172760 | -| policy_gradient_loss | -0.000518 | -| std | 0.00829 | -| value_loss | 2.36e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17278 | -| time_elapsed | 93452 | -| total_timesteps | 2211584 | -| train/ | | -| approx_kl | 0.029465996 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 172770 | -| policy_gradient_loss | 0.000623 | -| std | 0.00828 | -| value_loss | 2.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17279 | -| time_elapsed | 93457 | -| total_timesteps | 2211712 | -| train/ | | -| approx_kl | 0.007316562 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.000594 | -| n_updates | 172780 | -| policy_gradient_loss | 0.00504 | -| std | 0.00828 | -| value_loss | 1.29e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17280 | -| time_elapsed | 93463 | -| total_timesteps | 2211840 | -| train/ | | -| approx_kl | 0.03949789 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | -0.00283 | -| n_updates | 172790 | -| policy_gradient_loss | -0.00468 | -| std | 0.00828 | -| value_loss | 8.55e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 17281 | -| time_elapsed | 93467 | -| total_timesteps | 2211968 | -| train/ | | -| approx_kl | 0.008810265 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 172800 | -| policy_gradient_loss | 0.0028 | -| std | 0.00828 | -| value_loss | 5.47e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17282 | -| time_elapsed | 93471 | -| total_timesteps | 2212096 | -| train/ | | -| approx_kl | 0.0005074013 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 172810 | -| policy_gradient_loss | 0.000533 | -| std | 0.00828 | -| value_loss | 4.01e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17283 | -| time_elapsed | 93479 | -| total_timesteps | 2212224 | -| train/ | | -| approx_kl | 0.16687723 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.749 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 172820 | -| policy_gradient_loss | 0.0168 | -| std | 0.00828 | -| value_loss | 0.00436 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17284 | -| time_elapsed | 93483 | -| total_timesteps | 2212352 | -| train/ | | -| approx_kl | 0.00573854 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.00068 | -| n_updates | 172830 | -| policy_gradient_loss | 0.00354 | -| std | 0.00827 | -| value_loss | 4.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17285 | -| time_elapsed | 93489 | -| total_timesteps | 2212480 | -| train/ | | -| approx_kl | 0.002217114 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 172840 | -| policy_gradient_loss | 0.00783 | -| std | 0.00827 | -| value_loss | 1.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17286 | -| time_elapsed | 93494 | -| total_timesteps | 2212608 | -| train/ | | -| approx_kl | 0.06428227 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.055 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 172850 | -| policy_gradient_loss | 0.0105 | -| std | 0.00826 | -| value_loss | 1.32e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17287 | -| time_elapsed | 93499 | -| total_timesteps | 2212736 | -| train/ | | -| approx_kl | 0.004394195 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0031 | -| n_updates | 172860 | -| policy_gradient_loss | 0.00823 | -| std | 0.00826 | -| value_loss | 6.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17288 | -| time_elapsed | 93503 | -| total_timesteps | 2212864 | -| train/ | | -| approx_kl | 0.021490093 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00905 | -| learning_rate | 0.0003 | -| loss | 0.00596 | -| n_updates | 172870 | -| policy_gradient_loss | 0.033 | -| std | 0.00826 | -| value_loss | 3.9e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 17289 | -| time_elapsed | 93509 | -| total_timesteps | 2212992 | -| train/ | | -| approx_kl | 0.10172023 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00736 | -| learning_rate | 0.0003 | -| loss | 0.076 | -| n_updates | 172880 | -| policy_gradient_loss | 0.0443 | -| std | 0.00827 | -| value_loss | 1.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17290 | -| time_elapsed | 93514 | -| total_timesteps | 2213120 | -| train/ | | -| approx_kl | 0.15321514 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | 0.0963 | -| n_updates | 172890 | -| policy_gradient_loss | 0.03 | -| std | 0.00827 | -| value_loss | 4.06e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17291 | -| time_elapsed | 93528 | -| total_timesteps | 2213248 | -| train/ | | -| approx_kl | 0.0054648556 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.949 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 172900 | -| policy_gradient_loss | -0.00958 | -| std | 0.00827 | -| value_loss | 0.000166 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17292 | -| time_elapsed | 93533 | -| total_timesteps | 2213376 | -| train/ | | -| approx_kl | 0.0073032333 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 172910 | -| policy_gradient_loss | 0.033 | -| std | 0.00827 | -| value_loss | 8.39e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17293 | -| time_elapsed | 93538 | -| total_timesteps | 2213504 | -| train/ | | -| approx_kl | 0.14132951 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00203 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 172920 | -| policy_gradient_loss | 0.0596 | -| std | 0.00826 | -| value_loss | 5.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17294 | -| time_elapsed | 93543 | -| total_timesteps | 2213632 | -| train/ | | -| approx_kl | 0.07725154 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00716 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 172930 | -| policy_gradient_loss | 0.000269 | -| std | 0.00826 | -| value_loss | 4.65e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17295 | -| time_elapsed | 93548 | -| total_timesteps | 2213760 | -| train/ | | -| approx_kl | 0.0110929655 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 172940 | -| policy_gradient_loss | 0.00207 | -| std | 0.00826 | -| value_loss | 2.81e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 17296 | -| time_elapsed | 93553 | -| total_timesteps | 2213888 | -| train/ | | -| approx_kl | 0.0001902678 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.000816 | -| n_updates | 172950 | -| policy_gradient_loss | 0.00452 | -| std | 0.00826 | -| value_loss | 1.79e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17297 | -| time_elapsed | 93556 | -| total_timesteps | 2214016 | -| train/ | | -| approx_kl | 0.031783663 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 172960 | -| policy_gradient_loss | -0.00037 | -| std | 0.00825 | -| value_loss | 1.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17298 | -| time_elapsed | 93566 | -| total_timesteps | 2214144 | -| train/ | | -| approx_kl | 0.06836394 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.731 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 172970 | -| policy_gradient_loss | -0.0183 | -| std | 0.00825 | -| value_loss | 0.00498 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17299 | -| time_elapsed | 93572 | -| total_timesteps | 2214272 | -| train/ | | -| approx_kl | 0.04632345 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 172980 | -| policy_gradient_loss | 0.0112 | -| std | 0.00825 | -| value_loss | 8.55e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17300 | -| time_elapsed | 93578 | -| total_timesteps | 2214400 | -| train/ | | -| approx_kl | 0.024464175 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 172990 | -| policy_gradient_loss | 0.00765 | -| std | 0.00825 | -| value_loss | 1.3e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17301 | -| time_elapsed | 93584 | -| total_timesteps | 2214528 | -| train/ | | -| approx_kl | 0.038208656 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -3.71 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 173000 | -| policy_gradient_loss | 0.011 | -| std | 0.00825 | -| value_loss | 0.000239 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17302 | -| time_elapsed | 93589 | -| total_timesteps | 2214656 | -| train/ | | -| approx_kl | 0.038768012 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 173010 | -| policy_gradient_loss | 0.00659 | -| std | 0.00825 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17303 | -| time_elapsed | 93595 | -| total_timesteps | 2214784 | -| train/ | | -| approx_kl | 0.034279156 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 173020 | -| policy_gradient_loss | 0.00822 | -| std | 0.00825 | -| value_loss | 3.15e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17304 | -| time_elapsed | 93600 | -| total_timesteps | 2214912 | -| train/ | | -| approx_kl | 0.0048628254 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00248 | -| learning_rate | 0.0003 | -| loss | -0.000881 | -| n_updates | 173030 | -| policy_gradient_loss | 0.00389 | -| std | 0.00825 | -| value_loss | 8.34e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17305 | -| time_elapsed | 93605 | -| total_timesteps | 2215040 | -| train/ | | -| approx_kl | 0.00061843405 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 173040 | -| policy_gradient_loss | 0.00468 | -| std | 0.00825 | -| value_loss | 1.38e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17306 | -| time_elapsed | 93613 | -| total_timesteps | 2215168 | -| train/ | | -| approx_kl | 0.002645154 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 173050 | -| policy_gradient_loss | -0.00534 | -| std | 0.00825 | -| value_loss | 0.00691 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17307 | -| time_elapsed | 93618 | -| total_timesteps | 2215296 | -| train/ | | -| approx_kl | 0.33028913 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 173060 | -| policy_gradient_loss | 0.0376 | -| std | 0.00825 | -| value_loss | 2.85e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17308 | -| time_elapsed | 93622 | -| total_timesteps | 2215424 | -| train/ | | -| approx_kl | 0.005512062 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00641 | -| learning_rate | 0.0003 | -| loss | -0.00378 | -| n_updates | 173070 | -| policy_gradient_loss | 0.00319 | -| std | 0.00825 | -| value_loss | 1.42e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17309 | -| time_elapsed | 93626 | -| total_timesteps | 2215552 | -| train/ | | -| approx_kl | 0.06013918 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 173080 | -| policy_gradient_loss | 0.00241 | -| std | 0.00825 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17310 | -| time_elapsed | 93630 | -| total_timesteps | 2215680 | -| train/ | | -| approx_kl | 0.0054311035 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.00675 | -| n_updates | 173090 | -| policy_gradient_loss | 0.00618 | -| std | 0.00824 | -| value_loss | 5.51e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17311 | -| time_elapsed | 93634 | -| total_timesteps | 2215808 | -| train/ | | -| approx_kl | 0.0024534143 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 173100 | -| policy_gradient_loss | -0.00418 | -| std | 0.00825 | -| value_loss | 5.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17312 | -| time_elapsed | 93637 | -| total_timesteps | 2215936 | -| train/ | | -| approx_kl | 0.020026594 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.00418 | -| n_updates | 173110 | -| policy_gradient_loss | 0.0294 | -| std | 0.00824 | -| value_loss | 3.28e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17313 | -| time_elapsed | 93644 | -| total_timesteps | 2216064 | -| train/ | | -| approx_kl | 0.70053506 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | 0.339 | -| n_updates | 173120 | -| policy_gradient_loss | 0.15 | -| std | 0.00824 | -| value_loss | 1.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17314 | -| time_elapsed | 93651 | -| total_timesteps | 2216192 | -| train/ | | -| approx_kl | 0.063511156 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.804 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 173130 | -| policy_gradient_loss | -0.00946 | -| std | 0.00824 | -| value_loss | 0.00295 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17315 | -| time_elapsed | 93656 | -| total_timesteps | 2216320 | -| train/ | | -| approx_kl | 0.034019284 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.00947 | -| n_updates | 173140 | -| policy_gradient_loss | 0.0173 | -| std | 0.00824 | -| value_loss | 1.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17316 | -| time_elapsed | 93661 | -| total_timesteps | 2216448 | -| train/ | | -| approx_kl | 0.019160535 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00541 | -| learning_rate | 0.0003 | -| loss | 0.00332 | -| n_updates | 173150 | -| policy_gradient_loss | 0.015 | -| std | 0.00824 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17317 | -| time_elapsed | 93665 | -| total_timesteps | 2216576 | -| train/ | | -| approx_kl | 0.019813204 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 173160 | -| policy_gradient_loss | 0.019 | -| std | 0.00824 | -| value_loss | 9.98e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17318 | -| time_elapsed | 93669 | -| total_timesteps | 2216704 | -| train/ | | -| approx_kl | 0.1686347 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0472 | -| n_updates | 173170 | -| policy_gradient_loss | 0.0156 | -| std | 0.00824 | -| value_loss | 6.92e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17319 | -| time_elapsed | 93674 | -| total_timesteps | 2216832 | -| train/ | | -| approx_kl | 4.5744702e-05 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.000261 | -| n_updates | 173180 | -| policy_gradient_loss | 0.00523 | -| std | 0.00824 | -| value_loss | 4.61e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17320 | -| time_elapsed | 93679 | -| total_timesteps | 2216960 | -| train/ | | -| approx_kl | 8.284161e-05 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 173190 | -| policy_gradient_loss | 0.00146 | -| std | 0.00824 | -| value_loss | 4.64e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17321 | -| time_elapsed | 93684 | -| total_timesteps | 2217088 | -| train/ | | -| approx_kl | 9.195926e-05 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 173200 | -| policy_gradient_loss | -0.00844 | -| std | 0.00824 | -| value_loss | 2.07e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17322 | -| time_elapsed | 93693 | -| total_timesteps | 2217216 | -| train/ | | -| approx_kl | 0.0015873034 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 173210 | -| policy_gradient_loss | -0.000923 | -| std | 0.00824 | -| value_loss | 0.00461 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17323 | -| time_elapsed | 93697 | -| total_timesteps | 2217344 | -| train/ | | -| approx_kl | 0.05022128 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 173220 | -| policy_gradient_loss | 0.0463 | -| std | 0.00824 | -| value_loss | 2.21e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17324 | -| time_elapsed | 93701 | -| total_timesteps | 2217472 | -| train/ | | -| approx_kl | 0.018187378 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00297 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 173230 | -| policy_gradient_loss | -0.00454 | -| std | 0.00823 | -| value_loss | 5.35e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17325 | -| time_elapsed | 93706 | -| total_timesteps | 2217600 | -| train/ | | -| approx_kl | 0.1162487 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 173240 | -| policy_gradient_loss | 0.00579 | -| std | 0.00824 | -| value_loss | 2.65e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17326 | -| time_elapsed | 93711 | -| total_timesteps | 2217728 | -| train/ | | -| approx_kl | 0.08392625 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 173250 | -| policy_gradient_loss | 0.0164 | -| std | 0.00824 | -| value_loss | 1.7e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17327 | -| time_elapsed | 93716 | -| total_timesteps | 2217856 | -| train/ | | -| approx_kl | 0.03104604 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 173260 | -| policy_gradient_loss | 0.0153 | -| std | 0.00824 | -| value_loss | 9.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 17328 | -| time_elapsed | 93722 | -| total_timesteps | 2217984 | -| train/ | | -| approx_kl | 0.023972439 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.00226 | -| n_updates | 173270 | -| policy_gradient_loss | 0.0177 | -| std | 0.00824 | -| value_loss | 6.74e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17329 | -| time_elapsed | 93727 | -| total_timesteps | 2218112 | -| train/ | | -| approx_kl | 0.0033535552 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.00076 | -| n_updates | 173280 | -| policy_gradient_loss | 0.0185 | -| std | 0.00824 | -| value_loss | 3.69e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17330 | -| time_elapsed | 93740 | -| total_timesteps | 2218240 | -| train/ | | -| approx_kl | 0.031942926 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.888 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 173290 | -| policy_gradient_loss | 0.00262 | -| std | 0.00824 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17331 | -| time_elapsed | 93744 | -| total_timesteps | 2218368 | -| train/ | | -| approx_kl | 0.021633875 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.000821 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 173300 | -| policy_gradient_loss | 0.0569 | -| std | 0.00824 | -| value_loss | 9.01e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17332 | -| time_elapsed | 93747 | -| total_timesteps | 2218496 | -| train/ | | -| approx_kl | 0.1394563 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00203 | -| learning_rate | 0.0003 | -| loss | 0.00744 | -| n_updates | 173310 | -| policy_gradient_loss | 0.0144 | -| std | 0.00823 | -| value_loss | 3.54e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17333 | -| time_elapsed | 93752 | -| total_timesteps | 2218624 | -| train/ | | -| approx_kl | 0.040245056 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -27.4 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 173320 | -| policy_gradient_loss | 0.0114 | -| std | 0.00823 | -| value_loss | 1.3e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17334 | -| time_elapsed | 93758 | -| total_timesteps | 2218752 | -| train/ | | -| approx_kl | 0.15189493 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.0593 | -| n_updates | 173330 | -| policy_gradient_loss | 0.0224 | -| std | 0.00824 | -| value_loss | 3.8e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17335 | -| time_elapsed | 93763 | -| total_timesteps | 2218880 | -| train/ | | -| approx_kl | 0.0006102226 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.71 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 173340 | -| policy_gradient_loss | -0.00763 | -| std | 0.00824 | -| value_loss | 3.53e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17336 | -| time_elapsed | 93767 | -| total_timesteps | 2219008 | -| train/ | | -| approx_kl | 1.193583e-05 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00899 | -| learning_rate | 0.0003 | -| loss | -0.000453 | -| n_updates | 173350 | -| policy_gradient_loss | 0.00403 | -| std | 0.00824 | -| value_loss | 4.76e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17337 | -| time_elapsed | 93779 | -| total_timesteps | 2219136 | -| train/ | | -| approx_kl | 0.0815722 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | -0.00912 | -| n_updates | 173360 | -| policy_gradient_loss | 0.0172 | -| std | 0.00824 | -| value_loss | 0.00642 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17338 | -| time_elapsed | 93783 | -| total_timesteps | 2219264 | -| train/ | | -| approx_kl | 0.018641062 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.282 | -| learning_rate | 0.0003 | -| loss | -0.0258 | -| n_updates | 173370 | -| policy_gradient_loss | 0.00997 | -| std | 0.00824 | -| value_loss | 1.19e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17339 | -| time_elapsed | 93787 | -| total_timesteps | 2219392 | -| train/ | | -| approx_kl | 0.15740144 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 173380 | -| policy_gradient_loss | 0.00512 | -| std | 0.00824 | -| value_loss | 5.61e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17340 | -| time_elapsed | 93791 | -| total_timesteps | 2219520 | -| train/ | | -| approx_kl | 0.01803704 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.291 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 173390 | -| policy_gradient_loss | -0.0035 | -| std | 0.00824 | -| value_loss | 2.83e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17341 | -| time_elapsed | 93796 | -| total_timesteps | 2219648 | -| train/ | | -| approx_kl | 0.015197938 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.00564 | -| n_updates | 173400 | -| policy_gradient_loss | 0.02 | -| std | 0.00823 | -| value_loss | 4.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17342 | -| time_elapsed | 93802 | -| total_timesteps | 2219776 | -| train/ | | -| approx_kl | 0.23690099 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.203 | -| n_updates | 173410 | -| policy_gradient_loss | 0.13 | -| std | 0.00823 | -| value_loss | 9.83e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17343 | -| time_elapsed | 93807 | -| total_timesteps | 2219904 | -| train/ | | -| approx_kl | 0.11925991 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.0877 | -| n_updates | 173420 | -| policy_gradient_loss | 0.107 | -| std | 0.00823 | -| value_loss | 5.08e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17344 | -| time_elapsed | 93812 | -| total_timesteps | 2220032 | -| train/ | | -| approx_kl | 0.024169402 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 173430 | -| policy_gradient_loss | 0.0201 | -| std | 0.00822 | -| value_loss | 5.66e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17345 | -| time_elapsed | 93822 | -| total_timesteps | 2220160 | -| train/ | | -| approx_kl | 0.001280196 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 173440 | -| policy_gradient_loss | -0.00925 | -| std | 0.00822 | -| value_loss | 0.000807 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17346 | -| time_elapsed | 93827 | -| total_timesteps | 2220288 | -| train/ | | -| approx_kl | 0.027485944 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 173450 | -| policy_gradient_loss | 0.0372 | -| std | 0.00821 | -| value_loss | 1.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17347 | -| time_elapsed | 93833 | -| total_timesteps | 2220416 | -| train/ | | -| approx_kl | 0.099386275 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | 0.0904 | -| n_updates | 173460 | -| policy_gradient_loss | 0.0486 | -| std | 0.00821 | -| value_loss | 4.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17348 | -| time_elapsed | 93838 | -| total_timesteps | 2220544 | -| train/ | | -| approx_kl | 0.17278191 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 173470 | -| policy_gradient_loss | 0.0316 | -| std | 0.00821 | -| value_loss | 1.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17349 | -| time_elapsed | 93843 | -| total_timesteps | 2220672 | -| train/ | | -| approx_kl | 0.09952838 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.056 | -| learning_rate | 0.0003 | -| loss | 0.052 | -| n_updates | 173480 | -| policy_gradient_loss | 0.013 | -| std | 0.00821 | -| value_loss | 7.88e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17350 | -| time_elapsed | 93846 | -| total_timesteps | 2220800 | -| train/ | | -| approx_kl | 0.13886546 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.0594 | -| n_updates | 173490 | -| policy_gradient_loss | 0.0272 | -| std | 0.00821 | -| value_loss | 8.42e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17351 | -| time_elapsed | 93851 | -| total_timesteps | 2220928 | -| train/ | | -| approx_kl | 0.07188592 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0817 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 173500 | -| policy_gradient_loss | 0.0223 | -| std | 0.00821 | -| value_loss | 2.16e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17352 | -| time_elapsed | 93856 | -| total_timesteps | 2221056 | -| train/ | | -| approx_kl | 0.24024157 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 173510 | -| policy_gradient_loss | 0.101 | -| std | 0.00822 | -| value_loss | 1.49e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17353 | -| time_elapsed | 93863 | -| total_timesteps | 2221184 | -| train/ | | -| approx_kl | 0.0315645 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -5.16 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 173520 | -| policy_gradient_loss | -0.0143 | -| std | 0.00821 | -| value_loss | 0.00285 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17354 | -| time_elapsed | 93868 | -| total_timesteps | 2221312 | -| train/ | | -| approx_kl | 0.042042613 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 173530 | -| policy_gradient_loss | 0.0914 | -| std | 0.00822 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17355 | -| time_elapsed | 93872 | -| total_timesteps | 2221440 | -| train/ | | -| approx_kl | 0.087352246 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0555 | -| n_updates | 173540 | -| policy_gradient_loss | 0.0864 | -| std | 0.00822 | -| value_loss | 1.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17356 | -| time_elapsed | 93876 | -| total_timesteps | 2221568 | -| train/ | | -| approx_kl | 0.053057604 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0726 | -| learning_rate | 0.0003 | -| loss | 0.0496 | -| n_updates | 173550 | -| policy_gradient_loss | 0.083 | -| std | 0.00822 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17357 | -| time_elapsed | 93879 | -| total_timesteps | 2221696 | -| train/ | | -| approx_kl | 0.016205845 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 173560 | -| policy_gradient_loss | 0.0161 | -| std | 0.00822 | -| value_loss | 7.89e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17358 | -| time_elapsed | 93883 | -| total_timesteps | 2221824 | -| train/ | | -| approx_kl | 0.39894173 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 173570 | -| policy_gradient_loss | 0.0489 | -| std | 0.00822 | -| value_loss | 5.73e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17359 | -| time_elapsed | 93887 | -| total_timesteps | 2221952 | -| train/ | | -| approx_kl | 0.02941614 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 173580 | -| policy_gradient_loss | -0.00224 | -| std | 0.00822 | -| value_loss | 3.77e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17360 | -| time_elapsed | 93890 | -| total_timesteps | 2222080 | -| train/ | | -| approx_kl | 0.0050206445 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 173590 | -| policy_gradient_loss | 0.00194 | -| std | 0.00822 | -| value_loss | 2.32e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17361 | -| time_elapsed | 93900 | -| total_timesteps | 2222208 | -| train/ | | -| approx_kl | 0.05362393 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -4.8 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 173600 | -| policy_gradient_loss | -0.0124 | -| std | 0.00822 | -| value_loss | 0.00261 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17362 | -| time_elapsed | 93904 | -| total_timesteps | 2222336 | -| train/ | | -| approx_kl | 0.057212297 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00505 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 173610 | -| policy_gradient_loss | 0.0625 | -| std | 0.00823 | -| value_loss | 5.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17363 | -| time_elapsed | 93909 | -| total_timesteps | 2222464 | -| train/ | | -| approx_kl | 0.018836401 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 173620 | -| policy_gradient_loss | 0.00277 | -| std | 0.00823 | -| value_loss | 2.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17364 | -| time_elapsed | 93914 | -| total_timesteps | 2222592 | -| train/ | | -| approx_kl | 0.020053105 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0054 | -| n_updates | 173630 | -| policy_gradient_loss | 0.0243 | -| std | 0.00823 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17365 | -| time_elapsed | 93919 | -| total_timesteps | 2222720 | -| train/ | | -| approx_kl | 0.0031996486 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 173640 | -| policy_gradient_loss | 0.0528 | -| std | 0.00823 | -| value_loss | 8.15e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17366 | -| time_elapsed | 93923 | -| total_timesteps | 2222848 | -| train/ | | -| approx_kl | 0.021134743 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 173650 | -| policy_gradient_loss | 0.017 | -| std | 0.00823 | -| value_loss | 6.21e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17367 | -| time_elapsed | 93927 | -| total_timesteps | 2222976 | -| train/ | | -| approx_kl | 0.02259807 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00792 | -| n_updates | 173660 | -| policy_gradient_loss | 0.00539 | -| std | 0.00824 | -| value_loss | 3e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17368 | -| time_elapsed | 93933 | -| total_timesteps | 2223104 | -| train/ | | -| approx_kl | 0.073341966 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 173670 | -| policy_gradient_loss | 0.016 | -| std | 0.00824 | -| value_loss | 2.08e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17369 | -| time_elapsed | 93943 | -| total_timesteps | 2223232 | -| train/ | | -| approx_kl | 0.1754305 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.582 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 173680 | -| policy_gradient_loss | -0.00373 | -| std | 0.00824 | -| value_loss | 0.000775 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17370 | -| time_elapsed | 93947 | -| total_timesteps | 2223360 | -| train/ | | -| approx_kl | 0.22385634 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.272 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 173690 | -| policy_gradient_loss | 0.0429 | -| std | 0.00823 | -| value_loss | 2.28e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17371 | -| time_elapsed | 93952 | -| total_timesteps | 2223488 | -| train/ | | -| approx_kl | 0.040419612 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.659 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 173700 | -| policy_gradient_loss | 0.00433 | -| std | 0.00823 | -| value_loss | 3.24e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17372 | -| time_elapsed | 93959 | -| total_timesteps | 2223616 | -| train/ | | -| approx_kl | 0.00032174028 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | -0.00163 | -| n_updates | 173710 | -| policy_gradient_loss | -0.00199 | -| std | 0.00823 | -| value_loss | 1.83e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17373 | -| time_elapsed | 93964 | -| total_timesteps | 2223744 | -| train/ | | -| approx_kl | 0.03108503 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 173720 | -| policy_gradient_loss | 0.00525 | -| std | 0.00824 | -| value_loss | 7.49e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 17374 | -| time_elapsed | 93968 | -| total_timesteps | 2223872 | -| train/ | | -| approx_kl | 0.029651495 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 173730 | -| policy_gradient_loss | -0.0034 | -| std | 0.00824 | -| value_loss | 4.87e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17375 | -| time_elapsed | 93972 | -| total_timesteps | 2224000 | -| train/ | | -| approx_kl | 0.005162144 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 173740 | -| policy_gradient_loss | 0.00235 | -| std | 0.00824 | -| value_loss | 3.23e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17376 | -| time_elapsed | 93978 | -| total_timesteps | 2224128 | -| train/ | | -| approx_kl | 0.056340322 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00454 | -| learning_rate | 0.0003 | -| loss | 0.000986 | -| n_updates | 173750 | -| policy_gradient_loss | 0.0173 | -| std | 0.00824 | -| value_loss | 1.67e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17377 | -| time_elapsed | 93988 | -| total_timesteps | 2224256 | -| train/ | | -| approx_kl | 0.3725626 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0983 | -| learning_rate | 0.0003 | -| loss | 0.00811 | -| n_updates | 173760 | -| policy_gradient_loss | -0.00429 | -| std | 0.00824 | -| value_loss | 0.00132 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17378 | -| time_elapsed | 93993 | -| total_timesteps | 2224384 | -| train/ | | -| approx_kl | 0.07945596 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | -0.0308 | -| n_updates | 173770 | -| policy_gradient_loss | -0.0133 | -| std | 0.00825 | -| value_loss | 1.46e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17379 | -| time_elapsed | 93998 | -| total_timesteps | 2224512 | -| train/ | | -| approx_kl | 0.7485353 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -11.5 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 173780 | -| policy_gradient_loss | 0.0615 | -| std | 0.00825 | -| value_loss | 1.95e-09 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17380 | -| time_elapsed | 94003 | -| total_timesteps | 2224640 | -| train/ | | -| approx_kl | 0.0032029864 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 173790 | -| policy_gradient_loss | 0.0086 | -| std | 0.00825 | -| value_loss | 7.67e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17381 | -| time_elapsed | 94009 | -| total_timesteps | 2224768 | -| train/ | | -| approx_kl | 0.41476446 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.911 | -| learning_rate | 0.0003 | -| loss | 0.052 | -| n_updates | 173800 | -| policy_gradient_loss | 0.023 | -| std | 0.00826 | -| value_loss | 2.91e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17382 | -| time_elapsed | 94014 | -| total_timesteps | 2224896 | -| train/ | | -| approx_kl | 0.02811959 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 173810 | -| policy_gradient_loss | 0.006 | -| std | 0.00827 | -| value_loss | 5.58e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17383 | -| time_elapsed | 94017 | -| total_timesteps | 2225024 | -| train/ | | -| approx_kl | 0.0047675218 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.06 | -| learning_rate | 0.0003 | -| loss | 0.000555 | -| n_updates | 173820 | -| policy_gradient_loss | 0.00358 | -| std | 0.00829 | -| value_loss | 2.72e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17384 | -| time_elapsed | 94024 | -| total_timesteps | 2225152 | -| train/ | | -| approx_kl | 0.02307696 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 173830 | -| policy_gradient_loss | 0.0139 | -| std | 0.00829 | -| value_loss | 0.000854 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17385 | -| time_elapsed | 94028 | -| total_timesteps | 2225280 | -| train/ | | -| approx_kl | 0.055620372 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0657 | -| n_updates | 173840 | -| policy_gradient_loss | 0.0406 | -| std | 0.00829 | -| value_loss | 1.4e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17386 | -| time_elapsed | 94033 | -| total_timesteps | 2225408 | -| train/ | | -| approx_kl | 0.019457668 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00797 | -| learning_rate | 0.0003 | -| loss | 0.00791 | -| n_updates | 173850 | -| policy_gradient_loss | 0.0271 | -| std | 0.00829 | -| value_loss | 1.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17387 | -| time_elapsed | 94037 | -| total_timesteps | 2225536 | -| train/ | | -| approx_kl | 0.09667932 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 173860 | -| policy_gradient_loss | 0.0453 | -| std | 0.00829 | -| value_loss | 8.75e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17388 | -| time_elapsed | 94042 | -| total_timesteps | 2225664 | -| train/ | | -| approx_kl | 0.023036018 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 173870 | -| policy_gradient_loss | 0.0144 | -| std | 0.00829 | -| value_loss | 6.55e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17389 | -| time_elapsed | 94046 | -| total_timesteps | 2225792 | -| train/ | | -| approx_kl | 0.0946559 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.0734 | -| n_updates | 173880 | -| policy_gradient_loss | 0.0413 | -| std | 0.00829 | -| value_loss | 3.05e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 17390 | -| time_elapsed | 94051 | -| total_timesteps | 2225920 | -| train/ | | -| approx_kl | 0.0037465459 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.00235 | -| n_updates | 173890 | -| policy_gradient_loss | 0.0102 | -| std | 0.0083 | -| value_loss | 1.93e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17391 | -| time_elapsed | 94056 | -| total_timesteps | 2226048 | -| train/ | | -| approx_kl | 0.0019091577 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.00694 | -| n_updates | 173900 | -| policy_gradient_loss | 0.00189 | -| std | 0.0083 | -| value_loss | 2.14e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17392 | -| time_elapsed | 94065 | -| total_timesteps | 2226176 | -| train/ | | -| approx_kl | 0.045760058 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.596 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 173910 | -| policy_gradient_loss | -0.00703 | -| std | 0.0083 | -| value_loss | 0.000704 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17393 | -| time_elapsed | 94071 | -| total_timesteps | 2226304 | -| train/ | | -| approx_kl | 0.05538693 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -6.45 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 173920 | -| policy_gradient_loss | 0.00717 | -| std | 0.0083 | -| value_loss | 2.07e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17394 | -| time_elapsed | 94075 | -| total_timesteps | 2226432 | -| train/ | | -| approx_kl | 0.0328659 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.664 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 173930 | -| policy_gradient_loss | 0.00951 | -| std | 0.0083 | -| value_loss | 1.33e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17395 | -| time_elapsed | 94079 | -| total_timesteps | 2226560 | -| train/ | | -| approx_kl | 3.399141e-05 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.000402 | -| n_updates | 173940 | -| policy_gradient_loss | 0.00235 | -| std | 0.0083 | -| value_loss | 8.25e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17396 | -| time_elapsed | 94084 | -| total_timesteps | 2226688 | -| train/ | | -| approx_kl | 0.005651276 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 173950 | -| policy_gradient_loss | 0.00131 | -| std | 0.00831 | -| value_loss | 9.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17397 | -| time_elapsed | 94088 | -| total_timesteps | 2226816 | -| train/ | | -| approx_kl | 0.024407847 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.586 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 173960 | -| policy_gradient_loss | 0.0791 | -| std | 0.00831 | -| value_loss | 2.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17398 | -| time_elapsed | 94093 | -| total_timesteps | 2226944 | -| train/ | | -| approx_kl | 0.052506298 | -| clip_fraction | 0.603 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00583 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 173970 | -| policy_gradient_loss | 0.072 | -| std | 0.00832 | -| value_loss | 8.54e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17399 | -| time_elapsed | 94097 | -| total_timesteps | 2227072 | -| train/ | | -| approx_kl | 0.07324227 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0748 | -| n_updates | 173980 | -| policy_gradient_loss | 0.0915 | -| std | 0.00832 | -| value_loss | 5.61e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17400 | -| time_elapsed | 94107 | -| total_timesteps | 2227200 | -| train/ | | -| approx_kl | 0.077904835 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 173990 | -| policy_gradient_loss | 0.0465 | -| std | 0.00831 | -| value_loss | 0.00319 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17401 | -| time_elapsed | 94111 | -| total_timesteps | 2227328 | -| train/ | | -| approx_kl | 0.14347968 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0897 | -| n_updates | 174000 | -| policy_gradient_loss | 0.1 | -| std | 0.00831 | -| value_loss | 1.58e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17402 | -| time_elapsed | 94115 | -| total_timesteps | 2227456 | -| train/ | | -| approx_kl | 0.031604886 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 174010 | -| policy_gradient_loss | 0.0147 | -| std | 0.00831 | -| value_loss | 7.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17403 | -| time_elapsed | 94119 | -| total_timesteps | 2227584 | -| train/ | | -| approx_kl | 0.12525913 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 174020 | -| policy_gradient_loss | 0.0127 | -| std | 0.00828 | -| value_loss | 9.01e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17404 | -| time_elapsed | 94124 | -| total_timesteps | 2227712 | -| train/ | | -| approx_kl | 0.07437783 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 174030 | -| policy_gradient_loss | 0.00789 | -| std | 0.00826 | -| value_loss | 1.31e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17405 | -| time_elapsed | 94128 | -| total_timesteps | 2227840 | -| train/ | | -| approx_kl | 0.06764368 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00262 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 174040 | -| policy_gradient_loss | 0.0143 | -| std | 0.00825 | -| value_loss | 1.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17406 | -| time_elapsed | 94133 | -| total_timesteps | 2227968 | -| train/ | | -| approx_kl | 0.030025784 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.000933 | -| n_updates | 174050 | -| policy_gradient_loss | 0.0094 | -| std | 0.00825 | -| value_loss | 6.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17407 | -| time_elapsed | 94137 | -| total_timesteps | 2228096 | -| train/ | | -| approx_kl | 0.021478295 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 174060 | -| policy_gradient_loss | 0.0158 | -| std | 0.00825 | -| value_loss | 4.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17408 | -| time_elapsed | 94147 | -| total_timesteps | 2228224 | -| train/ | | -| approx_kl | 0.001564086 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 174070 | -| policy_gradient_loss | -0.0115 | -| std | 0.00825 | -| value_loss | 0.000187 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17409 | -| time_elapsed | 94152 | -| total_timesteps | 2228352 | -| train/ | | -| approx_kl | 0.0508029 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -6.23 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 174080 | -| policy_gradient_loss | 0.013 | -| std | 0.00825 | -| value_loss | 3.86e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17410 | -| time_elapsed | 94157 | -| total_timesteps | 2228480 | -| train/ | | -| approx_kl | 0.49876738 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00102 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 174090 | -| policy_gradient_loss | 0.0482 | -| std | 0.00826 | -| value_loss | 1.19e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17411 | -| time_elapsed | 94161 | -| total_timesteps | 2228608 | -| train/ | | -| approx_kl | 0.00787068 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.000377 | -| learning_rate | 0.0003 | -| loss | -0.00907 | -| n_updates | 174100 | -| policy_gradient_loss | -0.000194 | -| std | 0.00826 | -| value_loss | 9.65e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17412 | -| time_elapsed | 94166 | -| total_timesteps | 2228736 | -| train/ | | -| approx_kl | 0.00043330016 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.000978 | -| n_updates | 174110 | -| policy_gradient_loss | 0.00533 | -| std | 0.00826 | -| value_loss | 1.29e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17413 | -| time_elapsed | 94169 | -| total_timesteps | 2228864 | -| train/ | | -| approx_kl | 0.03734797 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | -0.000561 | -| n_updates | 174120 | -| policy_gradient_loss | -0.00169 | -| std | 0.00826 | -| value_loss | 7.14e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 17414 | -| time_elapsed | 94175 | -| total_timesteps | 2228992 | -| train/ | | -| approx_kl | 0.0063561387 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | -0.000101 | -| n_updates | 174130 | -| policy_gradient_loss | 0.00515 | -| std | 0.00826 | -| value_loss | 2.44e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17415 | -| time_elapsed | 94178 | -| total_timesteps | 2229120 | -| train/ | | -| approx_kl | 0.04651748 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 174140 | -| policy_gradient_loss | 0.00867 | -| std | 0.00826 | -| value_loss | 1.19e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17416 | -| time_elapsed | 94188 | -| total_timesteps | 2229248 | -| train/ | | -| approx_kl | 0.014733706 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 174150 | -| policy_gradient_loss | -0.0174 | -| std | 0.00827 | -| value_loss | 0.000662 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17417 | -| time_elapsed | 94192 | -| total_timesteps | 2229376 | -| train/ | | -| approx_kl | 0.023858875 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | -0.0266 | -| n_updates | 174160 | -| policy_gradient_loss | -0.0126 | -| std | 0.00826 | -| value_loss | 2.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17418 | -| time_elapsed | 94196 | -| total_timesteps | 2229504 | -| train/ | | -| approx_kl | 0.028570652 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0862 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 174170 | -| policy_gradient_loss | 0.00473 | -| std | 0.00826 | -| value_loss | 1.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17419 | -| time_elapsed | 94201 | -| total_timesteps | 2229632 | -| train/ | | -| approx_kl | 0.030137833 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.00416 | -| n_updates | 174180 | -| policy_gradient_loss | 0.00207 | -| std | 0.00826 | -| value_loss | 9.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17420 | -| time_elapsed | 94205 | -| total_timesteps | 2229760 | -| train/ | | -| approx_kl | 0.035036217 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.0089 | -| n_updates | 174190 | -| policy_gradient_loss | 0.00416 | -| std | 0.00826 | -| value_loss | 6.08e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 17421 | -| time_elapsed | 94209 | -| total_timesteps | 2229888 | -| train/ | | -| approx_kl | 0.028018985 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 174200 | -| policy_gradient_loss | 0.00908 | -| std | 0.00826 | -| value_loss | 4.22e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17422 | -| time_elapsed | 94213 | -| total_timesteps | 2230016 | -| train/ | | -| approx_kl | 0.0332576 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 174210 | -| policy_gradient_loss | 0.00864 | -| std | 0.00826 | -| value_loss | 2.42e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17423 | -| time_elapsed | 94225 | -| total_timesteps | 2230144 | -| train/ | | -| approx_kl | 0.103663124 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.4 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 174220 | -| policy_gradient_loss | -0.0137 | -| std | 0.00826 | -| value_loss | 0.00198 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17424 | -| time_elapsed | 94229 | -| total_timesteps | 2230272 | -| train/ | | -| approx_kl | 0.00027772738 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.000587 | -| n_updates | 174230 | -| policy_gradient_loss | 0.0154 | -| std | 0.00826 | -| value_loss | 5.71e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17425 | -| time_elapsed | 94234 | -| total_timesteps | 2230400 | -| train/ | | -| approx_kl | 0.056361195 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.425 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 174240 | -| policy_gradient_loss | 0.0205 | -| std | 0.00825 | -| value_loss | 2.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17426 | -| time_elapsed | 94239 | -| total_timesteps | 2230528 | -| train/ | | -| approx_kl | 0.092550084 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 174250 | -| policy_gradient_loss | 0.0115 | -| std | 0.00825 | -| value_loss | 5.81e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17427 | -| time_elapsed | 94243 | -| total_timesteps | 2230656 | -| train/ | | -| approx_kl | 0.13754582 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 174260 | -| policy_gradient_loss | 0.0274 | -| std | 0.00825 | -| value_loss | 3.55e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17428 | -| time_elapsed | 94248 | -| total_timesteps | 2230784 | -| train/ | | -| approx_kl | 0.0010596137 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00918 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 174270 | -| policy_gradient_loss | 0.0175 | -| std | 0.00825 | -| value_loss | 3.15e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 17429 | -| time_elapsed | 94251 | -| total_timesteps | 2230912 | -| train/ | | -| approx_kl | 0.41335618 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00286 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 174280 | -| policy_gradient_loss | 0.0446 | -| std | 0.00825 | -| value_loss | 1.92e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17430 | -| time_elapsed | 94257 | -| total_timesteps | 2231040 | -| train/ | | -| approx_kl | 0.0004998166 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00851 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 174290 | -| policy_gradient_loss | 0.000657 | -| std | 0.00824 | -| value_loss | 1.43e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17431 | -| time_elapsed | 94266 | -| total_timesteps | 2231168 | -| train/ | | -| approx_kl | 0.058516063 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.777 | -| learning_rate | 0.0003 | -| loss | -0.00846 | -| n_updates | 174300 | -| policy_gradient_loss | -0.00944 | -| std | 0.00823 | -| value_loss | 0.00302 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17432 | -| time_elapsed | 94270 | -| total_timesteps | 2231296 | -| train/ | | -| approx_kl | 0.024698574 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | 0.00326 | -| n_updates | 174310 | -| policy_gradient_loss | 0.0307 | -| std | 0.00822 | -| value_loss | 0.000136 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17433 | -| time_elapsed | 94274 | -| total_timesteps | 2231424 | -| train/ | | -| approx_kl | 0.19127916 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.0769 | -| n_updates | 174320 | -| policy_gradient_loss | 0.0342 | -| std | 0.00821 | -| value_loss | 2.15e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17434 | -| time_elapsed | 94279 | -| total_timesteps | 2231552 | -| train/ | | -| approx_kl | 0.0005701785 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00183 | -| learning_rate | 0.0003 | -| loss | -0.000563 | -| n_updates | 174330 | -| policy_gradient_loss | 0.00814 | -| std | 0.00822 | -| value_loss | 2.1e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17435 | -| time_elapsed | 94283 | -| total_timesteps | 2231680 | -| train/ | | -| approx_kl | 2.6601367e-05 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | -5.04e-05 | -| n_updates | 174340 | -| policy_gradient_loss | 0.0089 | -| std | 0.00823 | -| value_loss | 1.26e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17436 | -| time_elapsed | 94287 | -| total_timesteps | 2231808 | -| train/ | | -| approx_kl | 0.00013210531 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00411 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 174350 | -| policy_gradient_loss | -0.00351 | -| std | 0.00823 | -| value_loss | 1.54e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 17437 | -| time_elapsed | 94291 | -| total_timesteps | 2231936 | -| train/ | | -| approx_kl | 0.043678816 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.0377 | -| n_updates | 174360 | -| policy_gradient_loss | 0.0686 | -| std | 0.00823 | -| value_loss | 3.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17438 | -| time_elapsed | 94295 | -| total_timesteps | 2232064 | -| train/ | | -| approx_kl | 0.17396586 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 174370 | -| policy_gradient_loss | 0.027 | -| std | 0.00823 | -| value_loss | 2.57e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17439 | -| time_elapsed | 94302 | -| total_timesteps | 2232192 | -| train/ | | -| approx_kl | 0.0008402858 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.715 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 174380 | -| policy_gradient_loss | 0.0141 | -| std | 0.00823 | -| value_loss | 0.00649 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17440 | -| time_elapsed | 94306 | -| total_timesteps | 2232320 | -| train/ | | -| approx_kl | 0.011813972 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.00687 | -| n_updates | 174390 | -| policy_gradient_loss | 0.0295 | -| std | 0.00826 | -| value_loss | 0.000257 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17441 | -| time_elapsed | 94309 | -| total_timesteps | 2232448 | -| train/ | | -| approx_kl | 0.011474337 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 174400 | -| policy_gradient_loss | 0.00837 | -| std | 0.00828 | -| value_loss | 0.000286 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17442 | -| time_elapsed | 94314 | -| total_timesteps | 2232576 | -| train/ | | -| approx_kl | 0.09988692 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00878 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 174410 | -| policy_gradient_loss | 0.0142 | -| std | 0.00829 | -| value_loss | 1.76e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17443 | -| time_elapsed | 94318 | -| total_timesteps | 2232704 | -| train/ | | -| approx_kl | 0.012567349 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.00231 | -| n_updates | 174420 | -| policy_gradient_loss | 0.0147 | -| std | 0.0083 | -| value_loss | 1.99e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17444 | -| time_elapsed | 94322 | -| total_timesteps | 2232832 | -| train/ | | -| approx_kl | 0.2068136 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 174430 | -| policy_gradient_loss | 0.141 | -| std | 0.0083 | -| value_loss | 4.29e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17445 | -| time_elapsed | 94326 | -| total_timesteps | 2232960 | -| train/ | | -| approx_kl | 0.13242796 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 174440 | -| policy_gradient_loss | 0.0814 | -| std | 0.0083 | -| value_loss | 3.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17446 | -| time_elapsed | 94332 | -| total_timesteps | 2233088 | -| train/ | | -| approx_kl | 0.025327718 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.00791 | -| n_updates | 174450 | -| policy_gradient_loss | 0.0203 | -| std | 0.0083 | -| value_loss | 2.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17447 | -| time_elapsed | 94339 | -| total_timesteps | 2233216 | -| train/ | | -| approx_kl | 0.07701137 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.432 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 174460 | -| policy_gradient_loss | -0.016 | -| std | 0.0083 | -| value_loss | 0.00097 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17448 | -| time_elapsed | 94343 | -| total_timesteps | 2233344 | -| train/ | | -| approx_kl | 0.07930465 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.0538 | -| n_updates | 174470 | -| policy_gradient_loss | 0.0366 | -| std | 0.0083 | -| value_loss | 7.96e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17449 | -| time_elapsed | 94349 | -| total_timesteps | 2233472 | -| train/ | | -| approx_kl | 0.2599063 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.075 | -| learning_rate | 0.0003 | -| loss | 0.191 | -| n_updates | 174480 | -| policy_gradient_loss | 0.172 | -| std | 0.0083 | -| value_loss | 5.02e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17450 | -| time_elapsed | 94353 | -| total_timesteps | 2233600 | -| train/ | | -| approx_kl | 0.04478783 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 174490 | -| policy_gradient_loss | 0.0154 | -| std | 0.0083 | -| value_loss | 4.05e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17451 | -| time_elapsed | 94358 | -| total_timesteps | 2233728 | -| train/ | | -| approx_kl | 0.00023316685 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | -2.18e-05 | -| n_updates | 174500 | -| policy_gradient_loss | 0.0156 | -| std | 0.0083 | -| value_loss | 8.19e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17452 | -| time_elapsed | 94363 | -| total_timesteps | 2233856 | -| train/ | | -| approx_kl | 0.3076775 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.072 | -| n_updates | 174510 | -| policy_gradient_loss | 0.0318 | -| std | 0.00832 | -| value_loss | 2.04e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17453 | -| time_elapsed | 94368 | -| total_timesteps | 2233984 | -| train/ | | -| approx_kl | 0.006944777 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00583 | -| learning_rate | 0.0003 | -| loss | 0.000871 | -| n_updates | 174520 | -| policy_gradient_loss | 0.00533 | -| std | 0.00832 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17454 | -| time_elapsed | 94374 | -| total_timesteps | 2234112 | -| train/ | | -| approx_kl | 0.03923222 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 174530 | -| policy_gradient_loss | 0.00812 | -| std | 0.00832 | -| value_loss | 4.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17455 | -| time_elapsed | 94385 | -| total_timesteps | 2234240 | -| train/ | | -| approx_kl | 0.031661116 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00918 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 174540 | -| policy_gradient_loss | -0.0134 | -| std | 0.00832 | -| value_loss | 0.00125 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17456 | -| time_elapsed | 94391 | -| total_timesteps | 2234368 | -| train/ | | -| approx_kl | 0.0217183 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | 0.00988 | -| n_updates | 174550 | -| policy_gradient_loss | 0.0301 | -| std | 0.00832 | -| value_loss | 5.98e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17457 | -| time_elapsed | 94395 | -| total_timesteps | 2234496 | -| train/ | | -| approx_kl | 0.09927685 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 174560 | -| policy_gradient_loss | 0.0481 | -| std | 0.00832 | -| value_loss | 4.17e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17458 | -| time_elapsed | 94401 | -| total_timesteps | 2234624 | -| train/ | | -| approx_kl | 0.02780442 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 174570 | -| policy_gradient_loss | 0.0356 | -| std | 0.00832 | -| value_loss | 2.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17459 | -| time_elapsed | 94405 | -| total_timesteps | 2234752 | -| train/ | | -| approx_kl | 0.06605462 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 174580 | -| policy_gradient_loss | 0.0347 | -| std | 0.00832 | -| value_loss | 1.45e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17460 | -| time_elapsed | 94410 | -| total_timesteps | 2234880 | -| train/ | | -| approx_kl | 0.0039147623 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.00521 | -| n_updates | 174590 | -| policy_gradient_loss | 0.0038 | -| std | 0.00832 | -| value_loss | 9.04e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17461 | -| time_elapsed | 94414 | -| total_timesteps | 2235008 | -| train/ | | -| approx_kl | 0.09263581 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.00842 | -| n_updates | 174600 | -| policy_gradient_loss | -0.00804 | -| std | 0.00832 | -| value_loss | 7.13e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17462 | -| time_elapsed | 94424 | -| total_timesteps | 2235136 | -| train/ | | -| approx_kl | 0.02221913 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.865 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 174610 | -| policy_gradient_loss | -0.0021 | -| std | 0.00833 | -| value_loss | 0.00151 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17463 | -| time_elapsed | 94429 | -| total_timesteps | 2235264 | -| train/ | | -| approx_kl | 0.0435082 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.274 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 174620 | -| policy_gradient_loss | 0.00785 | -| std | 0.00833 | -| value_loss | 7.31e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17464 | -| time_elapsed | 94434 | -| total_timesteps | 2235392 | -| train/ | | -| approx_kl | 0.00695739 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00238 | -| learning_rate | 0.0003 | -| loss | -0.00494 | -| n_updates | 174630 | -| policy_gradient_loss | 0.0023 | -| std | 0.00833 | -| value_loss | 6.77e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17465 | -| time_elapsed | 94439 | -| total_timesteps | 2235520 | -| train/ | | -| approx_kl | 0.04893303 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 174640 | -| policy_gradient_loss | 0.0106 | -| std | 0.00833 | -| value_loss | 4.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17466 | -| time_elapsed | 94444 | -| total_timesteps | 2235648 | -| train/ | | -| approx_kl | 0.008961471 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 174650 | -| policy_gradient_loss | 0.003 | -| std | 0.00833 | -| value_loss | 3.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17467 | -| time_elapsed | 94449 | -| total_timesteps | 2235776 | -| train/ | | -| approx_kl | 0.03407781 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 174660 | -| policy_gradient_loss | 0.00508 | -| std | 0.00833 | -| value_loss | 1.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 17468 | -| time_elapsed | 94454 | -| total_timesteps | 2235904 | -| train/ | | -| approx_kl | 0.031702254 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 174670 | -| policy_gradient_loss | 0.00771 | -| std | 0.00832 | -| value_loss | 1.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17469 | -| time_elapsed | 94458 | -| total_timesteps | 2236032 | -| train/ | | -| approx_kl | 0.004102517 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 174680 | -| policy_gradient_loss | -0.000877 | -| std | 0.00832 | -| value_loss | 8.49e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17470 | -| time_elapsed | 94467 | -| total_timesteps | 2236160 | -| train/ | | -| approx_kl | 0.39835364 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.739 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 174690 | -| policy_gradient_loss | 0.0317 | -| std | 0.00832 | -| value_loss | 0.00502 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17471 | -| time_elapsed | 94472 | -| total_timesteps | 2236288 | -| train/ | | -| approx_kl | 0.0014151358 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 174700 | -| policy_gradient_loss | 0.0276 | -| std | 0.00832 | -| value_loss | 4.41e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17472 | -| time_elapsed | 94477 | -| total_timesteps | 2236416 | -| train/ | | -| approx_kl | 0.06862507 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 174710 | -| policy_gradient_loss | 0.0291 | -| std | 0.00832 | -| value_loss | 1.2e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17473 | -| time_elapsed | 94482 | -| total_timesteps | 2236544 | -| train/ | | -| approx_kl | 0.20582283 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0943 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 174720 | -| policy_gradient_loss | 0.0802 | -| std | 0.00833 | -| value_loss | 1.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17474 | -| time_elapsed | 94484 | -| total_timesteps | 2236672 | -| train/ | | -| approx_kl | 0.13848493 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 174730 | -| policy_gradient_loss | 0.0853 | -| std | 0.00833 | -| value_loss | 9.75e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17475 | -| time_elapsed | 94487 | -| total_timesteps | 2236800 | -| train/ | | -| approx_kl | 0.030232627 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 174740 | -| policy_gradient_loss | 0.0199 | -| std | 0.00833 | -| value_loss | 6.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 17476 | -| time_elapsed | 94491 | -| total_timesteps | 2236928 | -| train/ | | -| approx_kl | 0.11978342 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0507 | -| n_updates | 174750 | -| policy_gradient_loss | 0.013 | -| std | 0.00834 | -| value_loss | 4.01e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17477 | -| time_elapsed | 94496 | -| total_timesteps | 2237056 | -| train/ | | -| approx_kl | 0.014987205 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 174760 | -| policy_gradient_loss | 0.0115 | -| std | 0.00834 | -| value_loss | 2.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17478 | -| time_elapsed | 94504 | -| total_timesteps | 2237184 | -| train/ | | -| approx_kl | 0.017717095 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.864 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 174770 | -| policy_gradient_loss | -0.0114 | -| std | 0.00834 | -| value_loss | 0.000365 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17479 | -| time_elapsed | 94509 | -| total_timesteps | 2237312 | -| train/ | | -| approx_kl | 0.41765153 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.224 | -| n_updates | 174780 | -| policy_gradient_loss | 0.135 | -| std | 0.00834 | -| value_loss | 1.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17480 | -| time_elapsed | 94514 | -| total_timesteps | 2237440 | -| train/ | | -| approx_kl | 0.009102284 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.531 | -| learning_rate | 0.0003 | -| loss | -0.00876 | -| n_updates | 174790 | -| policy_gradient_loss | 0.017 | -| std | 0.00834 | -| value_loss | 6.38e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17481 | -| time_elapsed | 94519 | -| total_timesteps | 2237568 | -| train/ | | -| approx_kl | 0.063277505 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 174800 | -| policy_gradient_loss | 0.0177 | -| std | 0.00834 | -| value_loss | 3.55e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17482 | -| time_elapsed | 94525 | -| total_timesteps | 2237696 | -| train/ | | -| approx_kl | 0.003656114 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00757 | -| learning_rate | 0.0003 | -| loss | 0.00297 | -| n_updates | 174810 | -| policy_gradient_loss | 0.00591 | -| std | 0.00834 | -| value_loss | 2.45e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17483 | -| time_elapsed | 94531 | -| total_timesteps | 2237824 | -| train/ | | -| approx_kl | 0.16095129 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 174820 | -| policy_gradient_loss | 0.119 | -| std | 0.00834 | -| value_loss | 1.91e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 17484 | -| time_elapsed | 94536 | -| total_timesteps | 2237952 | -| train/ | | -| approx_kl | 0.10910829 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.0947 | -| n_updates | 174830 | -| policy_gradient_loss | 0.128 | -| std | 0.00834 | -| value_loss | 5.4e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17485 | -| time_elapsed | 94542 | -| total_timesteps | 2238080 | -| train/ | | -| approx_kl | 0.091120355 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 174840 | -| policy_gradient_loss | 0.077 | -| std | 0.00834 | -| value_loss | 4.71e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17486 | -| time_elapsed | 94551 | -| total_timesteps | 2238208 | -| train/ | | -| approx_kl | 0.010297558 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 174850 | -| policy_gradient_loss | -0.012 | -| std | 0.00834 | -| value_loss | 0.000456 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17487 | -| time_elapsed | 94557 | -| total_timesteps | 2238336 | -| train/ | | -| approx_kl | 0.0018565217 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00689 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 174860 | -| policy_gradient_loss | 0.00965 | -| std | 0.00833 | -| value_loss | 1.09e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17488 | -| time_elapsed | 94561 | -| total_timesteps | 2238464 | -| train/ | | -| approx_kl | 0.05011885 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.409 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 174870 | -| policy_gradient_loss | 0.00507 | -| std | 0.00833 | -| value_loss | 7.14e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17489 | -| time_elapsed | 94567 | -| total_timesteps | 2238592 | -| train/ | | -| approx_kl | 0.026478648 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 174880 | -| policy_gradient_loss | 0.025 | -| std | 0.00833 | -| value_loss | 9.54e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17490 | -| time_elapsed | 94572 | -| total_timesteps | 2238720 | -| train/ | | -| approx_kl | 0.6552205 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 174890 | -| policy_gradient_loss | 0.145 | -| std | 0.00833 | -| value_loss | 3.31e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17491 | -| time_elapsed | 94577 | -| total_timesteps | 2238848 | -| train/ | | -| approx_kl | 0.14267054 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 174900 | -| policy_gradient_loss | 0.00716 | -| std | 0.00833 | -| value_loss | 2.74e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17492 | -| time_elapsed | 94583 | -| total_timesteps | 2238976 | -| train/ | | -| approx_kl | 0.053794194 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.000756 | -| n_updates | 174910 | -| policy_gradient_loss | 0.00656 | -| std | 0.00833 | -| value_loss | 1.29e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17493 | -| time_elapsed | 94588 | -| total_timesteps | 2239104 | -| train/ | | -| approx_kl | 0.10974227 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0491 | -| n_updates | 174920 | -| policy_gradient_loss | 0.0207 | -| std | 0.00834 | -| value_loss | 7.79e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17494 | -| time_elapsed | 94599 | -| total_timesteps | 2239232 | -| train/ | | -| approx_kl | 0.35083097 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 174930 | -| policy_gradient_loss | 0.0147 | -| std | 0.00833 | -| value_loss | 0.000392 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17495 | -| time_elapsed | 94604 | -| total_timesteps | 2239360 | -| train/ | | -| approx_kl | 0.023931932 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 174940 | -| policy_gradient_loss | 0.00957 | -| std | 0.00833 | -| value_loss | 1.26e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17496 | -| time_elapsed | 94610 | -| total_timesteps | 2239488 | -| train/ | | -| approx_kl | 0.030222634 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 174950 | -| policy_gradient_loss | 0.00521 | -| std | 0.00832 | -| value_loss | 4.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17497 | -| time_elapsed | 94614 | -| total_timesteps | 2239616 | -| train/ | | -| approx_kl | 0.032258354 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 174960 | -| policy_gradient_loss | 0.00778 | -| std | 0.00832 | -| value_loss | 8.1e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17498 | -| time_elapsed | 94619 | -| total_timesteps | 2239744 | -| train/ | | -| approx_kl | 0.0045490237 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.00529 | -| n_updates | 174970 | -| policy_gradient_loss | 0.0291 | -| std | 0.00832 | -| value_loss | 0.00176 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 17499 | -| time_elapsed | 94624 | -| total_timesteps | 2239872 | -| train/ | | -| approx_kl | 0.43600616 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 174980 | -| policy_gradient_loss | 0.107 | -| std | 0.00832 | -| value_loss | 0.00749 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17500 | -| time_elapsed | 94629 | -| total_timesteps | 2240000 | -| train/ | | -| approx_kl | 0.0066343206 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.005 | -| n_updates | 174990 | -| policy_gradient_loss | 0.0146 | -| std | 0.00833 | -| value_loss | 0.00173 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17501 | -| time_elapsed | 94634 | -| total_timesteps | 2240128 | -| train/ | | -| approx_kl | 0.19113243 | -| clip_fraction | 0.632 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.000941 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 175000 | -| policy_gradient_loss | 0.103 | -| std | 0.00833 | -| value_loss | 0.00473 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17502 | -| time_elapsed | 94645 | -| total_timesteps | 2240256 | -| train/ | | -| approx_kl | 0.084571734 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | 0.0713 | -| n_updates | 175010 | -| policy_gradient_loss | 0.067 | -| std | 0.00833 | -| value_loss | 0.00576 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17503 | -| time_elapsed | 94651 | -| total_timesteps | 2240384 | -| train/ | | -| approx_kl | 0.031068858 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 4.74e-05 | -| n_updates | 175020 | -| policy_gradient_loss | 0.013 | -| std | 0.00833 | -| value_loss | 0.000417 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17504 | -| time_elapsed | 94655 | -| total_timesteps | 2240512 | -| train/ | | -| approx_kl | 0.098403424 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0714 | -| n_updates | 175030 | -| policy_gradient_loss | 0.0195 | -| std | 0.00832 | -| value_loss | 0.000254 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17505 | -| time_elapsed | 94659 | -| total_timesteps | 2240640 | -| train/ | | -| approx_kl | 0.011754863 | -| clip_fraction | 0.0813 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 175040 | -| policy_gradient_loss | -0.00129 | -| std | 0.00832 | -| value_loss | 0.000163 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17506 | -| time_elapsed | 94662 | -| total_timesteps | 2240768 | -| train/ | | -| approx_kl | 0.018305296 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | -0.00703 | -| n_updates | 175050 | -| policy_gradient_loss | 0.0113 | -| std | 0.00832 | -| value_loss | 0.00013 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17507 | -| time_elapsed | 94666 | -| total_timesteps | 2240896 | -| train/ | | -| approx_kl | 0.060476907 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 175060 | -| policy_gradient_loss | 0.0105 | -| std | 0.00833 | -| value_loss | 0.000117 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17508 | -| time_elapsed | 94672 | -| total_timesteps | 2241024 | -| train/ | | -| approx_kl | 0.004825384 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.00521 | -| n_updates | 175070 | -| policy_gradient_loss | 0.00626 | -| std | 0.00833 | -| value_loss | 8.75e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17509 | -| time_elapsed | 94683 | -| total_timesteps | 2241152 | -| train/ | | -| approx_kl | 0.037872043 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | 0.000928 | -| n_updates | 175080 | -| policy_gradient_loss | 0.00817 | -| std | 0.00833 | -| value_loss | 0.00154 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17510 | -| time_elapsed | 94689 | -| total_timesteps | 2241280 | -| train/ | | -| approx_kl | 0.36759165 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 175090 | -| policy_gradient_loss | 0.0336 | -| std | 0.00833 | -| value_loss | 3.54e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17511 | -| time_elapsed | 94698 | -| total_timesteps | 2241408 | -| train/ | | -| approx_kl | 0.0005455534 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 175100 | -| policy_gradient_loss | -0.000417 | -| std | 0.00833 | -| value_loss | 3.02e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17512 | -| time_elapsed | 94704 | -| total_timesteps | 2241536 | -| train/ | | -| approx_kl | 0.028796325 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.0279 | -| n_updates | 175110 | -| policy_gradient_loss | -0.0131 | -| std | 0.00833 | -| value_loss | 2.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17513 | -| time_elapsed | 94708 | -| total_timesteps | 2241664 | -| train/ | | -| approx_kl | 0.067279406 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 175120 | -| policy_gradient_loss | 0.00389 | -| std | 0.00833 | -| value_loss | 1.84e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17514 | -| time_elapsed | 94712 | -| total_timesteps | 2241792 | -| train/ | | -| approx_kl | 0.06972193 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.096 | -| n_updates | 175130 | -| policy_gradient_loss | 0.0356 | -| std | 0.00833 | -| value_loss | 1.63e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17515 | -| time_elapsed | 94717 | -| total_timesteps | 2241920 | -| train/ | | -| approx_kl | 0.02037267 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 175140 | -| policy_gradient_loss | 0.0278 | -| std | 0.00833 | -| value_loss | 8.53e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17516 | -| time_elapsed | 94721 | -| total_timesteps | 2242048 | -| train/ | | -| approx_kl | 0.5324442 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.266 | -| n_updates | 175150 | -| policy_gradient_loss | 0.131 | -| std | 0.00834 | -| value_loss | 7.78e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17517 | -| time_elapsed | 94731 | -| total_timesteps | 2242176 | -| train/ | | -| approx_kl | 0.027708953 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 175160 | -| policy_gradient_loss | -0.00766 | -| std | 0.00833 | -| value_loss | 0.00142 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17518 | -| time_elapsed | 94736 | -| total_timesteps | 2242304 | -| train/ | | -| approx_kl | 0.087823756 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 175170 | -| policy_gradient_loss | 0.00945 | -| std | 0.00833 | -| value_loss | 3.67e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17519 | -| time_elapsed | 94742 | -| total_timesteps | 2242432 | -| train/ | | -| approx_kl | 0.035098456 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.000646 | -| n_updates | 175180 | -| policy_gradient_loss | 0.0119 | -| std | 0.00833 | -| value_loss | 6.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17520 | -| time_elapsed | 94747 | -| total_timesteps | 2242560 | -| train/ | | -| approx_kl | 0.020529395 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 175190 | -| policy_gradient_loss | 0.0108 | -| std | 0.00833 | -| value_loss | 5.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17521 | -| time_elapsed | 94753 | -| total_timesteps | 2242688 | -| train/ | | -| approx_kl | 0.10295822 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 175200 | -| policy_gradient_loss | 0.00717 | -| std | 0.00833 | -| value_loss | 4.86e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17522 | -| time_elapsed | 94759 | -| total_timesteps | 2242816 | -| train/ | | -| approx_kl | 0.21857788 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 175210 | -| policy_gradient_loss | 0.104 | -| std | 0.00833 | -| value_loss | 3.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 17523 | -| time_elapsed | 94763 | -| total_timesteps | 2242944 | -| train/ | | -| approx_kl | 0.030524602 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 175220 | -| policy_gradient_loss | 0.0115 | -| std | 0.00838 | -| value_loss | 1.23e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17524 | -| time_elapsed | 94766 | -| total_timesteps | 2243072 | -| train/ | | -| approx_kl | 0.0009172023 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | 0.00507 | -| n_updates | 175230 | -| policy_gradient_loss | 0.00175 | -| std | 0.0084 | -| value_loss | 7.53e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17525 | -| time_elapsed | 94776 | -| total_timesteps | 2243200 | -| train/ | | -| approx_kl | 0.04541282 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 175240 | -| policy_gradient_loss | -0.00747 | -| std | 0.0084 | -| value_loss | 0.000122 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17526 | -| time_elapsed | 94781 | -| total_timesteps | 2243328 | -| train/ | | -| approx_kl | 0.048861757 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.593 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 175250 | -| policy_gradient_loss | -0.00933 | -| std | 0.00841 | -| value_loss | 1.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17527 | -| time_elapsed | 94786 | -| total_timesteps | 2243456 | -| train/ | | -| approx_kl | 0.02441979 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -6.63 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 175260 | -| policy_gradient_loss | -0.00495 | -| std | 0.00841 | -| value_loss | 2.45e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17528 | -| time_elapsed | 94791 | -| total_timesteps | 2243584 | -| train/ | | -| approx_kl | 0.0050469013 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00131 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 175270 | -| policy_gradient_loss | 0.00575 | -| std | 0.0084 | -| value_loss | 5.97e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17529 | -| time_elapsed | 94796 | -| total_timesteps | 2243712 | -| train/ | | -| approx_kl | 0.040161565 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 175280 | -| policy_gradient_loss | -0.00128 | -| std | 0.0084 | -| value_loss | 1.17e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17530 | -| time_elapsed | 94800 | -| total_timesteps | 2243840 | -| train/ | | -| approx_kl | 0.031319533 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00198 | -| learning_rate | 0.0003 | -| loss | -0.0041 | -| n_updates | 175290 | -| policy_gradient_loss | -0.00115 | -| std | 0.00841 | -| value_loss | 6.33e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17531 | -| time_elapsed | 94806 | -| total_timesteps | 2243968 | -| train/ | | -| approx_kl | 0.004993972 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 175300 | -| policy_gradient_loss | 0.000894 | -| std | 0.00841 | -| value_loss | 4e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17532 | -| time_elapsed | 94809 | -| total_timesteps | 2244096 | -| train/ | | -| approx_kl | 0.00013726112 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.000411 | -| n_updates | 175310 | -| policy_gradient_loss | 0.02 | -| std | 0.00842 | -| value_loss | 1.73e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17533 | -| time_elapsed | 94818 | -| total_timesteps | 2244224 | -| train/ | | -| approx_kl | 0.004232712 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.797 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 175320 | -| policy_gradient_loss | 0.017 | -| std | 0.00843 | -| value_loss | 0.00286 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17534 | -| time_elapsed | 94822 | -| total_timesteps | 2244352 | -| train/ | | -| approx_kl | 0.047121335 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0983 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 175330 | -| policy_gradient_loss | 0.0138 | -| std | 0.00843 | -| value_loss | 3.82e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17535 | -| time_elapsed | 94826 | -| total_timesteps | 2244480 | -| train/ | | -| approx_kl | 0.32399812 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00481 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 175340 | -| policy_gradient_loss | 0.0311 | -| std | 0.00843 | -| value_loss | 6.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17536 | -| time_elapsed | 94831 | -| total_timesteps | 2244608 | -| train/ | | -| approx_kl | 0.022784272 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00954 | -| learning_rate | 0.0003 | -| loss | 0.00833 | -| n_updates | 175350 | -| policy_gradient_loss | 0.00497 | -| std | 0.00843 | -| value_loss | 2.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17537 | -| time_elapsed | 94835 | -| total_timesteps | 2244736 | -| train/ | | -| approx_kl | 0.034446027 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.00509 | -| n_updates | 175360 | -| policy_gradient_loss | 0.00186 | -| std | 0.00843 | -| value_loss | 1.75e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17538 | -| time_elapsed | 94839 | -| total_timesteps | 2244864 | -| train/ | | -| approx_kl | 0.0062420284 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 175370 | -| policy_gradient_loss | 0.00129 | -| std | 0.00843 | -| value_loss | 1.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 17539 | -| time_elapsed | 94844 | -| total_timesteps | 2244992 | -| train/ | | -| approx_kl | 0.038364936 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 175380 | -| policy_gradient_loss | 0.0419 | -| std | 0.00844 | -| value_loss | 6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17540 | -| time_elapsed | 94850 | -| total_timesteps | 2245120 | -| train/ | | -| approx_kl | 0.05634913 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.499 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 175390 | -| policy_gradient_loss | 0.00219 | -| std | 0.00845 | -| value_loss | 1.51e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17541 | -| time_elapsed | 94860 | -| total_timesteps | 2245248 | -| train/ | | -| approx_kl | 0.02561252 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | 0.000996 | -| n_updates | 175400 | -| policy_gradient_loss | -0.00431 | -| std | 0.00845 | -| value_loss | 0.00418 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17542 | -| time_elapsed | 94865 | -| total_timesteps | 2245376 | -| train/ | | -| approx_kl | 0.065420486 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0897 | -| learning_rate | 0.0003 | -| loss | -0.00894 | -| n_updates | 175410 | -| policy_gradient_loss | 0.0375 | -| std | 0.00844 | -| value_loss | 6.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17543 | -| time_elapsed | 94871 | -| total_timesteps | 2245504 | -| train/ | | -| approx_kl | 0.027759928 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00306 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 175420 | -| policy_gradient_loss | 0.0254 | -| std | 0.00844 | -| value_loss | 1.76e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17544 | -| time_elapsed | 94876 | -| total_timesteps | 2245632 | -| train/ | | -| approx_kl | 0.017972616 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00295 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 175430 | -| policy_gradient_loss | 0.0147 | -| std | 0.00844 | -| value_loss | 8.45e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17545 | -| time_elapsed | 94881 | -| total_timesteps | 2245760 | -| train/ | | -| approx_kl | 0.07867792 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 175440 | -| policy_gradient_loss | 0.022 | -| std | 0.00842 | -| value_loss | 1.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 17546 | -| time_elapsed | 94886 | -| total_timesteps | 2245888 | -| train/ | | -| approx_kl | 0.023853831 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0973 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 175450 | -| policy_gradient_loss | 0.0244 | -| std | 0.00845 | -| value_loss | 0.000168 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17547 | -| time_elapsed | 94891 | -| total_timesteps | 2246016 | -| train/ | | -| approx_kl | 0.08175141 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 175460 | -| policy_gradient_loss | 0.0124 | -| std | 0.00846 | -| value_loss | 1.66e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17548 | -| time_elapsed | 94902 | -| total_timesteps | 2246144 | -| train/ | | -| approx_kl | 0.08232346 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.804 | -| learning_rate | 0.0003 | -| loss | -0.00871 | -| n_updates | 175470 | -| policy_gradient_loss | -0.00882 | -| std | 0.00846 | -| value_loss | 0.00046 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17549 | -| time_elapsed | 94908 | -| total_timesteps | 2246272 | -| train/ | | -| approx_kl | 0.11746803 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0928 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 175480 | -| policy_gradient_loss | 0.0248 | -| std | 0.00846 | -| value_loss | 9.27e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17550 | -| time_elapsed | 94912 | -| total_timesteps | 2246400 | -| train/ | | -| approx_kl | 0.0026015262 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 175490 | -| policy_gradient_loss | -0.00564 | -| std | 0.00846 | -| value_loss | 6.09e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17551 | -| time_elapsed | 94916 | -| total_timesteps | 2246528 | -| train/ | | -| approx_kl | 2.7235597e-05 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00521 | -| learning_rate | 0.0003 | -| loss | 0.00144 | -| n_updates | 175500 | -| policy_gradient_loss | -0.0047 | -| std | 0.00846 | -| value_loss | 1.84e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17552 | -| time_elapsed | 94921 | -| total_timesteps | 2246656 | -| train/ | | -| approx_kl | 0.00021903496 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00471 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 175510 | -| policy_gradient_loss | -0.00231 | -| std | 0.00846 | -| value_loss | 1.25e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17553 | -| time_elapsed | 94925 | -| total_timesteps | 2246784 | -| train/ | | -| approx_kl | 6.912509e-05 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00346 | -| learning_rate | 0.0003 | -| loss | -0.000673 | -| n_updates | 175520 | -| policy_gradient_loss | 0.00444 | -| std | 0.00846 | -| value_loss | 8.69e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 17554 | -| time_elapsed | 94930 | -| total_timesteps | 2246912 | -| train/ | | -| approx_kl | 0.03928074 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | 0.00309 | -| n_updates | 175530 | -| policy_gradient_loss | 0.0358 | -| std | 0.00846 | -| value_loss | 6.67e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17555 | -| time_elapsed | 94935 | -| total_timesteps | 2247040 | -| train/ | | -| approx_kl | 0.0017270995 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 175540 | -| policy_gradient_loss | 0.0508 | -| std | 0.00844 | -| value_loss | 4.95e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17556 | -| time_elapsed | 94944 | -| total_timesteps | 2247168 | -| train/ | | -| approx_kl | 0.0155739 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 175550 | -| policy_gradient_loss | 0.000711 | -| std | 0.00842 | -| value_loss | 0.0043 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17557 | -| time_elapsed | 94948 | -| total_timesteps | 2247296 | -| train/ | | -| approx_kl | 0.0643999 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 175560 | -| policy_gradient_loss | 0.0802 | -| std | 0.00841 | -| value_loss | 2.52e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17558 | -| time_elapsed | 94952 | -| total_timesteps | 2247424 | -| train/ | | -| approx_kl | 0.07228171 | -| clip_fraction | 0.587 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00321 | -| learning_rate | 0.0003 | -| loss | 0.0541 | -| n_updates | 175570 | -| policy_gradient_loss | 0.0828 | -| std | 0.00841 | -| value_loss | 7.17e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17559 | -| time_elapsed | 94957 | -| total_timesteps | 2247552 | -| train/ | | -| approx_kl | 0.07282813 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0006 | -| learning_rate | 0.0003 | -| loss | 0.0842 | -| n_updates | 175580 | -| policy_gradient_loss | 0.0763 | -| std | 0.00841 | -| value_loss | 4.47e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17560 | -| time_elapsed | 94962 | -| total_timesteps | 2247680 | -| train/ | | -| approx_kl | 0.07722864 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00605 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 175590 | -| policy_gradient_loss | 0.0838 | -| std | 0.00841 | -| value_loss | 3.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17561 | -| time_elapsed | 94967 | -| total_timesteps | 2247808 | -| train/ | | -| approx_kl | 0.01526751 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00962 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 175600 | -| policy_gradient_loss | 0.0123 | -| std | 0.00841 | -| value_loss | 2.47e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 17562 | -| time_elapsed | 94973 | -| total_timesteps | 2247936 | -| train/ | | -| approx_kl | 0.10668796 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 175610 | -| policy_gradient_loss | 0.0114 | -| std | 0.00841 | -| value_loss | 1.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17563 | -| time_elapsed | 94979 | -| total_timesteps | 2248064 | -| train/ | | -| approx_kl | 0.009741392 | -| clip_fraction | 0.057 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 175620 | -| policy_gradient_loss | -0.00139 | -| std | 0.00841 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17564 | -| time_elapsed | 94987 | -| total_timesteps | 2248192 | -| train/ | | -| approx_kl | 0.034060605 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.666 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 175630 | -| policy_gradient_loss | 0.00109 | -| std | 0.00841 | -| value_loss | 0.00838 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17565 | -| time_elapsed | 94991 | -| total_timesteps | 2248320 | -| train/ | | -| approx_kl | 0.078279205 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00187 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 175640 | -| policy_gradient_loss | 0.00741 | -| std | 0.00841 | -| value_loss | 2.34e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17566 | -| time_elapsed | 94997 | -| total_timesteps | 2248448 | -| train/ | | -| approx_kl | 0.029197505 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00752 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 175650 | -| policy_gradient_loss | -0.00273 | -| std | 0.00841 | -| value_loss | 5.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17567 | -| time_elapsed | 95002 | -| total_timesteps | 2248576 | -| train/ | | -| approx_kl | 0.010278109 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -0.00825 | -| n_updates | 175660 | -| policy_gradient_loss | 0.0166 | -| std | 0.00841 | -| value_loss | 3.58e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17568 | -| time_elapsed | 95006 | -| total_timesteps | 2248704 | -| train/ | | -| approx_kl | 0.18785858 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 175670 | -| policy_gradient_loss | 0.112 | -| std | 0.00841 | -| value_loss | 3.11e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17569 | -| time_elapsed | 95010 | -| total_timesteps | 2248832 | -| train/ | | -| approx_kl | 0.10770358 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 175680 | -| policy_gradient_loss | 0.0793 | -| std | 0.00841 | -| value_loss | 2.85e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 17570 | -| time_elapsed | 95015 | -| total_timesteps | 2248960 | -| train/ | | -| approx_kl | 0.10575432 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0774 | -| n_updates | 175690 | -| policy_gradient_loss | 0.0995 | -| std | 0.00841 | -| value_loss | 1.31e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17571 | -| time_elapsed | 95019 | -| total_timesteps | 2249088 | -| train/ | | -| approx_kl | 0.018156989 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00927 | -| n_updates | 175700 | -| policy_gradient_loss | 0.0145 | -| std | 0.00841 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17572 | -| time_elapsed | 95031 | -| total_timesteps | 2249216 | -| train/ | | -| approx_kl | 0.010162568 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 175710 | -| policy_gradient_loss | -0.00534 | -| std | 0.00841 | -| value_loss | 0.000415 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17573 | -| time_elapsed | 95037 | -| total_timesteps | 2249344 | -| train/ | | -| approx_kl | 0.034532726 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00351 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 175720 | -| policy_gradient_loss | -0.00366 | -| std | 0.00841 | -| value_loss | 1.6e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17574 | -| time_elapsed | 95042 | -| total_timesteps | 2249472 | -| train/ | | -| approx_kl | 0.006875062 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00948 | -| learning_rate | 0.0003 | -| loss | -0.00637 | -| n_updates | 175730 | -| policy_gradient_loss | 0.00186 | -| std | 0.00841 | -| value_loss | 5.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17575 | -| time_elapsed | 95046 | -| total_timesteps | 2249600 | -| train/ | | -| approx_kl | 0.0018342873 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00719 | -| learning_rate | 0.0003 | -| loss | -0.000152 | -| n_updates | 175740 | -| policy_gradient_loss | 0.00583 | -| std | 0.00841 | -| value_loss | 1.79e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17576 | -| time_elapsed | 95051 | -| total_timesteps | 2249728 | -| train/ | | -| approx_kl | 0.03796922 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.0192 | -| n_updates | 175750 | -| policy_gradient_loss | 0.029 | -| std | 0.0084 | -| value_loss | 1.3e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17577 | -| time_elapsed | 95055 | -| total_timesteps | 2249856 | -| train/ | | -| approx_kl | 0.0830169 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0738 | -| n_updates | 175760 | -| policy_gradient_loss | 0.0444 | -| std | 0.0084 | -| value_loss | 8.93e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 17578 | -| time_elapsed | 95060 | -| total_timesteps | 2249984 | -| train/ | | -| approx_kl | 0.018816965 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 175770 | -| policy_gradient_loss | 0.0187 | -| std | 0.0084 | -| value_loss | 7.57e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17579 | -| time_elapsed | 95067 | -| total_timesteps | 2250112 | -| train/ | | -| approx_kl | 0.4656564 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 175780 | -| policy_gradient_loss | 0.121 | -| std | 0.0084 | -| value_loss | 6.31e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17580 | -| time_elapsed | 95079 | -| total_timesteps | 2250240 | -| train/ | | -| approx_kl | 0.11515629 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 175790 | -| policy_gradient_loss | -0.0133 | -| std | 0.0084 | -| value_loss | 0.00123 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17581 | -| time_elapsed | 95084 | -| total_timesteps | 2250368 | -| train/ | | -| approx_kl | 0.10108182 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | 0.000616 | -| n_updates | 175800 | -| policy_gradient_loss | 0.00224 | -| std | 0.0084 | -| value_loss | 2.35e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17582 | -| time_elapsed | 95089 | -| total_timesteps | 2250496 | -| train/ | | -| approx_kl | 0.06720096 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 175810 | -| policy_gradient_loss | 0.0223 | -| std | 0.0084 | -| value_loss | 9.37e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17583 | -| time_elapsed | 95094 | -| total_timesteps | 2250624 | -| train/ | | -| approx_kl | 0.2891289 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 175820 | -| policy_gradient_loss | 0.0894 | -| std | 0.0084 | -| value_loss | 2.98e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17584 | -| time_elapsed | 95098 | -| total_timesteps | 2250752 | -| train/ | | -| approx_kl | 0.03522819 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 175830 | -| policy_gradient_loss | 0.0113 | -| std | 0.00841 | -| value_loss | 1.36e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 17585 | -| time_elapsed | 95105 | -| total_timesteps | 2250880 | -| train/ | | -| approx_kl | 0.09776712 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 175840 | -| policy_gradient_loss | 0.0129 | -| std | 0.00841 | -| value_loss | 1.01e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17586 | -| time_elapsed | 95111 | -| total_timesteps | 2251008 | -| train/ | | -| approx_kl | 0.118849464 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 175850 | -| policy_gradient_loss | 0.0116 | -| std | 0.00841 | -| value_loss | 4.63e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17587 | -| time_elapsed | 95123 | -| total_timesteps | 2251136 | -| train/ | | -| approx_kl | 0.06467097 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 175860 | -| policy_gradient_loss | 0.00285 | -| std | 0.00841 | -| value_loss | 0.00412 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17588 | -| time_elapsed | 95129 | -| total_timesteps | 2251264 | -| train/ | | -| approx_kl | 0.0008621644 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.0529 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 175870 | -| policy_gradient_loss | 0.0155 | -| std | 0.00841 | -| value_loss | 0.000236 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17589 | -| time_elapsed | 95134 | -| total_timesteps | 2251392 | -| train/ | | -| approx_kl | 0.055503234 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00946 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 175880 | -| policy_gradient_loss | 0.0363 | -| std | 0.0084 | -| value_loss | 5.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17590 | -| time_elapsed | 95138 | -| total_timesteps | 2251520 | -| train/ | | -| approx_kl | 0.08942878 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00338 | -| learning_rate | 0.0003 | -| loss | 0.0708 | -| n_updates | 175890 | -| policy_gradient_loss | 0.0297 | -| std | 0.0084 | -| value_loss | 1.09e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17591 | -| time_elapsed | 95143 | -| total_timesteps | 2251648 | -| train/ | | -| approx_kl | 0.02117475 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 175900 | -| policy_gradient_loss | -0.00342 | -| std | 0.0084 | -| value_loss | 1.41e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17592 | -| time_elapsed | 95148 | -| total_timesteps | 2251776 | -| train/ | | -| approx_kl | 0.34381402 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 175910 | -| policy_gradient_loss | 0.047 | -| std | 0.0084 | -| value_loss | 4.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 17593 | -| time_elapsed | 95153 | -| total_timesteps | 2251904 | -| train/ | | -| approx_kl | 0.035083912 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.00448 | -| n_updates | 175920 | -| policy_gradient_loss | -0.00322 | -| std | 0.0084 | -| value_loss | 4.62e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17594 | -| time_elapsed | 95157 | -| total_timesteps | 2252032 | -| train/ | | -| approx_kl | 0.0059807976 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00945 | -| n_updates | 175930 | -| policy_gradient_loss | 0.00245 | -| std | 0.0084 | -| value_loss | 4e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17595 | -| time_elapsed | 95167 | -| total_timesteps | 2252160 | -| train/ | | -| approx_kl | 0.009230174 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 175940 | -| policy_gradient_loss | -0.0107 | -| std | 0.0084 | -| value_loss | 0.00215 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17596 | -| time_elapsed | 95171 | -| total_timesteps | 2252288 | -| train/ | | -| approx_kl | 0.055455424 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00738 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 175950 | -| policy_gradient_loss | 0.0487 | -| std | 0.0084 | -| value_loss | 1.62e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17597 | -| time_elapsed | 95176 | -| total_timesteps | 2252416 | -| train/ | | -| approx_kl | 0.01773664 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0056 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 175960 | -| policy_gradient_loss | 0.00866 | -| std | 0.0084 | -| value_loss | 5.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17598 | -| time_elapsed | 95180 | -| total_timesteps | 2252544 | -| train/ | | -| approx_kl | 0.024600666 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.00589 | -| n_updates | 175970 | -| policy_gradient_loss | 0.0544 | -| std | 0.0084 | -| value_loss | 2.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17599 | -| time_elapsed | 95185 | -| total_timesteps | 2252672 | -| train/ | | -| approx_kl | 0.0039588474 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 175980 | -| policy_gradient_loss | 0.0552 | -| std | 0.0084 | -| value_loss | 1.87e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17600 | -| time_elapsed | 95190 | -| total_timesteps | 2252800 | -| train/ | | -| approx_kl | 0.24698363 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 175990 | -| policy_gradient_loss | 0.0352 | -| std | 0.0084 | -| value_loss | 1.44e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17601 | -| time_elapsed | 95194 | -| total_timesteps | 2252928 | -| train/ | | -| approx_kl | 0.00016788812 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 176000 | -| policy_gradient_loss | 0.00175 | -| std | 0.00839 | -| value_loss | 1.2e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17602 | -| time_elapsed | 95199 | -| total_timesteps | 2253056 | -| train/ | | -| approx_kl | 5.4674223e-05 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -0.000988 | -| n_updates | 176010 | -| policy_gradient_loss | 0.0027 | -| std | 0.00839 | -| value_loss | 9.46e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17603 | -| time_elapsed | 95207 | -| total_timesteps | 2253184 | -| train/ | | -| approx_kl | 0.06610043 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -5.12 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 176020 | -| policy_gradient_loss | -0.0154 | -| std | 0.00839 | -| value_loss | 0.00244 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17604 | -| time_elapsed | 95212 | -| total_timesteps | 2253312 | -| train/ | | -| approx_kl | 0.16426775 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -43.9 | -| learning_rate | 0.0003 | -| loss | 0.0005 | -| n_updates | 176030 | -| policy_gradient_loss | -0.000945 | -| std | 0.00839 | -| value_loss | 4.77e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17605 | -| time_elapsed | 95217 | -| total_timesteps | 2253440 | -| train/ | | -| approx_kl | 0.06407203 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.0428 | -| n_updates | 176040 | -| policy_gradient_loss | 0.0341 | -| std | 0.00839 | -| value_loss | 6.1e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17606 | -| time_elapsed | 95220 | -| total_timesteps | 2253568 | -| train/ | | -| approx_kl | 0.2376907 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 176050 | -| policy_gradient_loss | 0.11 | -| std | 0.00839 | -| value_loss | 2.01e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17607 | -| time_elapsed | 95225 | -| total_timesteps | 2253696 | -| train/ | | -| approx_kl | 0.03996203 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.00509 | -| n_updates | 176060 | -| policy_gradient_loss | 0.0124 | -| std | 0.00839 | -| value_loss | 1.88e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17608 | -| time_elapsed | 95229 | -| total_timesteps | 2253824 | -| train/ | | -| approx_kl | 0.09187749 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 176070 | -| policy_gradient_loss | 0.0125 | -| std | 0.0084 | -| value_loss | 1.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17609 | -| time_elapsed | 95234 | -| total_timesteps | 2253952 | -| train/ | | -| approx_kl | 0.017537927 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00653 | -| n_updates | 176080 | -| policy_gradient_loss | 0.0173 | -| std | 0.0084 | -| value_loss | 7.2e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17610 | -| time_elapsed | 95240 | -| total_timesteps | 2254080 | -| train/ | | -| approx_kl | 0.0722661 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 176090 | -| policy_gradient_loss | 0.00507 | -| std | 0.0084 | -| value_loss | 7.38e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17611 | -| time_elapsed | 95249 | -| total_timesteps | 2254208 | -| train/ | | -| approx_kl | 0.046706725 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.689 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 176100 | -| policy_gradient_loss | 0.00484 | -| std | 0.0084 | -| value_loss | 0.00738 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17612 | -| time_elapsed | 95253 | -| total_timesteps | 2254336 | -| train/ | | -| approx_kl | 0.030436609 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 176110 | -| policy_gradient_loss | 0.0452 | -| std | 0.0084 | -| value_loss | 2.62e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17613 | -| time_elapsed | 95258 | -| total_timesteps | 2254464 | -| train/ | | -| approx_kl | 0.012494521 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00562 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 176120 | -| policy_gradient_loss | 0.0133 | -| std | 0.0084 | -| value_loss | 6.6e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17614 | -| time_elapsed | 95263 | -| total_timesteps | 2254592 | -| train/ | | -| approx_kl | 0.019817503 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00971 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 176130 | -| policy_gradient_loss | 0.0317 | -| std | 0.0084 | -| value_loss | 2.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17615 | -| time_elapsed | 95268 | -| total_timesteps | 2254720 | -| train/ | | -| approx_kl | 0.068963744 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.0405 | -| n_updates | 176140 | -| policy_gradient_loss | 0.0255 | -| std | 0.00841 | -| value_loss | 6.57e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17616 | -| time_elapsed | 95273 | -| total_timesteps | 2254848 | -| train/ | | -| approx_kl | 0.0713792 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00306 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 176150 | -| policy_gradient_loss | -0.00312 | -| std | 0.00842 | -| value_loss | 0.000709 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 17617 | -| time_elapsed | 95277 | -| total_timesteps | 2254976 | -| train/ | | -| approx_kl | 0.06944482 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 176160 | -| policy_gradient_loss | 0.0128 | -| std | 0.00842 | -| value_loss | 0.000103 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17618 | -| time_elapsed | 95283 | -| total_timesteps | 2255104 | -| train/ | | -| approx_kl | 0.088879414 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 3.29e-05 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 176170 | -| policy_gradient_loss | 0.0172 | -| std | 0.00843 | -| value_loss | 3.33e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17619 | -| time_elapsed | 95294 | -| total_timesteps | 2255232 | -| train/ | | -| approx_kl | 0.13783695 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | -0.00883 | -| n_updates | 176180 | -| policy_gradient_loss | -0.00626 | -| std | 0.00843 | -| value_loss | 0.000244 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17620 | -| time_elapsed | 95299 | -| total_timesteps | 2255360 | -| train/ | | -| approx_kl | 0.044719853 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.00697 | -| n_updates | 176190 | -| policy_gradient_loss | 0.00899 | -| std | 0.00843 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17621 | -| time_elapsed | 95304 | -| total_timesteps | 2255488 | -| train/ | | -| approx_kl | 0.027080242 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.000908 | -| n_updates | 176200 | -| policy_gradient_loss | 0.0181 | -| std | 0.00843 | -| value_loss | 1.48e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17622 | -| time_elapsed | 95308 | -| total_timesteps | 2255616 | -| train/ | | -| approx_kl | 0.013386754 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | 0.00353 | -| n_updates | 176210 | -| policy_gradient_loss | 0.0135 | -| std | 0.00842 | -| value_loss | 0.000229 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17623 | -| time_elapsed | 95312 | -| total_timesteps | 2255744 | -| train/ | | -| approx_kl | 0.09894787 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -4.58 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 176220 | -| policy_gradient_loss | 0.0101 | -| std | 0.00842 | -| value_loss | 1.8e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 17624 | -| time_elapsed | 95316 | -| total_timesteps | 2255872 | -| train/ | | -| approx_kl | 0.09078942 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00203 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 176230 | -| policy_gradient_loss | 0.0191 | -| std | 0.00843 | -| value_loss | 6.65e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17625 | -| time_elapsed | 95321 | -| total_timesteps | 2256000 | -| train/ | | -| approx_kl | 0.07661174 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 176240 | -| policy_gradient_loss | 0.0135 | -| std | 0.00842 | -| value_loss | 1.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17626 | -| time_elapsed | 95327 | -| total_timesteps | 2256128 | -| train/ | | -| approx_kl | 0.024807787 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00803 | -| learning_rate | 0.0003 | -| loss | 0.00649 | -| n_updates | 176250 | -| policy_gradient_loss | 0.022 | -| std | 0.00842 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17627 | -| time_elapsed | 95337 | -| total_timesteps | 2256256 | -| train/ | | -| approx_kl | 0.060310423 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 176260 | -| policy_gradient_loss | -0.00466 | -| std | 0.00842 | -| value_loss | 0.00245 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17628 | -| time_elapsed | 95342 | -| total_timesteps | 2256384 | -| train/ | | -| approx_kl | 0.058710743 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 176270 | -| policy_gradient_loss | 0.00824 | -| std | 0.00842 | -| value_loss | 1.08e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17629 | -| time_elapsed | 95348 | -| total_timesteps | 2256512 | -| train/ | | -| approx_kl | 0.0043947413 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0904 | -| learning_rate | 0.0003 | -| loss | 0.00578 | -| n_updates | 176280 | -| policy_gradient_loss | 0.0033 | -| std | 0.00843 | -| value_loss | 9.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17630 | -| time_elapsed | 95353 | -| total_timesteps | 2256640 | -| train/ | | -| approx_kl | 0.019689253 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.934 | -| learning_rate | 0.0003 | -| loss | 0.00278 | -| n_updates | 176290 | -| policy_gradient_loss | 0.0197 | -| std | 0.00843 | -| value_loss | 6.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17631 | -| time_elapsed | 95358 | -| total_timesteps | 2256768 | -| train/ | | -| approx_kl | 0.54886925 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.000605 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 176300 | -| policy_gradient_loss | 0.123 | -| std | 0.00843 | -| value_loss | 2.34e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 17632 | -| time_elapsed | 95363 | -| total_timesteps | 2256896 | -| train/ | | -| approx_kl | 0.022560814 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.00598 | -| n_updates | 176310 | -| policy_gradient_loss | -0.00078 | -| std | 0.00843 | -| value_loss | 1.56e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17633 | -| time_elapsed | 95367 | -| total_timesteps | 2257024 | -| train/ | | -| approx_kl | 0.012450788 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 176320 | -| policy_gradient_loss | -0.00278 | -| std | 0.00843 | -| value_loss | 8.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17634 | -| time_elapsed | 95377 | -| total_timesteps | 2257152 | -| train/ | | -| approx_kl | 0.010264961 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.791 | -| learning_rate | 0.0003 | -| loss | -0.007 | -| n_updates | 176330 | -| policy_gradient_loss | -0.0114 | -| std | 0.00843 | -| value_loss | 0.00351 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17635 | -| time_elapsed | 95381 | -| total_timesteps | 2257280 | -| train/ | | -| approx_kl | 0.0015033889 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0017 | -| n_updates | 176340 | -| policy_gradient_loss | 0.00329 | -| std | 0.00842 | -| value_loss | 6.46e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17636 | -| time_elapsed | 95386 | -| total_timesteps | 2257408 | -| train/ | | -| approx_kl | 0.0007257913 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00679 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 176350 | -| policy_gradient_loss | 0.00991 | -| std | 0.00842 | -| value_loss | 1.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17637 | -| time_elapsed | 95392 | -| total_timesteps | 2257536 | -| train/ | | -| approx_kl | 0.043398608 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.00915 | -| n_updates | 176360 | -| policy_gradient_loss | 0.037 | -| std | 0.00842 | -| value_loss | 5.34e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17638 | -| time_elapsed | 95398 | -| total_timesteps | 2257664 | -| train/ | | -| approx_kl | 0.1560773 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.009 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 176370 | -| policy_gradient_loss | 0.0265 | -| std | 0.00842 | -| value_loss | 1.76e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17639 | -| time_elapsed | 95404 | -| total_timesteps | 2257792 | -| train/ | | -| approx_kl | 0.0012508859 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00736 | -| learning_rate | 0.0003 | -| loss | -0.00791 | -| n_updates | 176380 | -| policy_gradient_loss | -0.00471 | -| std | 0.00842 | -| value_loss | 1.11e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 17640 | -| time_elapsed | 95410 | -| total_timesteps | 2257920 | -| train/ | | -| approx_kl | 0.028482758 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 176390 | -| policy_gradient_loss | 0.0362 | -| std | 0.00845 | -| value_loss | 8.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17641 | -| time_elapsed | 95414 | -| total_timesteps | 2258048 | -| train/ | | -| approx_kl | 0.050545614 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00525 | -| learning_rate | 0.0003 | -| loss | 0.0618 | -| n_updates | 176400 | -| policy_gradient_loss | 0.0123 | -| std | 0.00847 | -| value_loss | 2.52e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17642 | -| time_elapsed | 95422 | -| total_timesteps | 2258176 | -| train/ | | -| approx_kl | 0.04948044 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | 0.00771 | -| n_updates | 176410 | -| policy_gradient_loss | 0.00617 | -| std | 0.00847 | -| value_loss | 0.000855 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17643 | -| time_elapsed | 95426 | -| total_timesteps | 2258304 | -| train/ | | -| approx_kl | 0.018601794 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.000217 | -| n_updates | 176420 | -| policy_gradient_loss | 0.0562 | -| std | 0.00847 | -| value_loss | 4.72e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17644 | -| time_elapsed | 95429 | -| total_timesteps | 2258432 | -| train/ | | -| approx_kl | 0.06713489 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.0473 | -| n_updates | 176430 | -| policy_gradient_loss | 0.0236 | -| std | 0.00849 | -| value_loss | 3.66e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17645 | -| time_elapsed | 95435 | -| total_timesteps | 2258560 | -| train/ | | -| approx_kl | 0.10926056 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00562 | -| learning_rate | 0.0003 | -| loss | 0.0493 | -| n_updates | 176440 | -| policy_gradient_loss | 0.0324 | -| std | 0.00849 | -| value_loss | 0.00016 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17646 | -| time_elapsed | 95439 | -| total_timesteps | 2258688 | -| train/ | | -| approx_kl | 0.09165788 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00386 | -| learning_rate | 0.0003 | -| loss | 0.0428 | -| n_updates | 176450 | -| policy_gradient_loss | 0.0168 | -| std | 0.00849 | -| value_loss | 3.46e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17647 | -| time_elapsed | 95444 | -| total_timesteps | 2258816 | -| train/ | | -| approx_kl | 0.001108577 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00375 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 176460 | -| policy_gradient_loss | 0.0158 | -| std | 0.00849 | -| value_loss | 1.58e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 17648 | -| time_elapsed | 95450 | -| total_timesteps | 2258944 | -| train/ | | -| approx_kl | 0.3836388 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 176470 | -| policy_gradient_loss | 0.0463 | -| std | 0.00849 | -| value_loss | 7.53e-06 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17649 | -| time_elapsed | 95454 | -| total_timesteps | 2259072 | -| train/ | | -| approx_kl | 0.00040476816 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | -0.00204 | -| n_updates | 176480 | -| policy_gradient_loss | 0.000526 | -| std | 0.00849 | -| value_loss | 6.35e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17650 | -| time_elapsed | 95464 | -| total_timesteps | 2259200 | -| train/ | | -| approx_kl | 0.018211603 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | -0.00527 | -| n_updates | 176490 | -| policy_gradient_loss | -0.0014 | -| std | 0.00849 | -| value_loss | 0.00216 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17651 | -| time_elapsed | 95469 | -| total_timesteps | 2259328 | -| train/ | | -| approx_kl | 0.05300285 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 176500 | -| policy_gradient_loss | 0.0433 | -| std | 0.00849 | -| value_loss | 9.44e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17652 | -| time_elapsed | 95475 | -| total_timesteps | 2259456 | -| train/ | | -| approx_kl | 0.14963518 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.0599 | -| n_updates | 176510 | -| policy_gradient_loss | 0.0334 | -| std | 0.00848 | -| value_loss | 3.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17653 | -| time_elapsed | 95479 | -| total_timesteps | 2259584 | -| train/ | | -| approx_kl | 0.03428922 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 176520 | -| policy_gradient_loss | 0.0568 | -| std | 0.00848 | -| value_loss | 1.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17654 | -| time_elapsed | 95483 | -| total_timesteps | 2259712 | -| train/ | | -| approx_kl | 0.011365168 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 176530 | -| policy_gradient_loss | 0.0134 | -| std | 0.00848 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17655 | -| time_elapsed | 95489 | -| total_timesteps | 2259840 | -| train/ | | -| approx_kl | 0.018404903 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 176540 | -| policy_gradient_loss | 0.0234 | -| std | 0.00848 | -| value_loss | 9.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 17656 | -| time_elapsed | 95492 | -| total_timesteps | 2259968 | -| train/ | | -| approx_kl | 0.025170255 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.0473 | -| n_updates | 176550 | -| policy_gradient_loss | -0.00375 | -| std | 0.00848 | -| value_loss | 7.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17657 | -| time_elapsed | 95497 | -| total_timesteps | 2260096 | -| train/ | | -| approx_kl | 0.081523836 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 176560 | -| policy_gradient_loss | 0.0289 | -| std | 0.00848 | -| value_loss | 5.39e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17658 | -| time_elapsed | 95507 | -| total_timesteps | 2260224 | -| train/ | | -| approx_kl | 0.3176861 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | 0.0688 | -| n_updates | 176570 | -| policy_gradient_loss | 0.0515 | -| std | 0.00848 | -| value_loss | 0.00659 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17659 | -| time_elapsed | 95513 | -| total_timesteps | 2260352 | -| train/ | | -| approx_kl | 0.16241477 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00887 | -| learning_rate | 0.0003 | -| loss | 0.214 | -| n_updates | 176580 | -| policy_gradient_loss | 0.112 | -| std | 0.00848 | -| value_loss | 1.9e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17660 | -| time_elapsed | 95517 | -| total_timesteps | 2260480 | -| train/ | | -| approx_kl | 0.10045771 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00813 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 176590 | -| policy_gradient_loss | 0.0831 | -| std | 0.00848 | -| value_loss | 6.98e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17661 | -| time_elapsed | 95521 | -| total_timesteps | 2260608 | -| train/ | | -| approx_kl | 0.10497611 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0036 | -| learning_rate | 0.0003 | -| loss | 0.0664 | -| n_updates | 176600 | -| policy_gradient_loss | 0.128 | -| std | 0.00847 | -| value_loss | 9.28e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17662 | -| time_elapsed | 95525 | -| total_timesteps | 2260736 | -| train/ | | -| approx_kl | 0.14304408 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -26.2 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 176610 | -| policy_gradient_loss | -0.0148 | -| std | 0.00846 | -| value_loss | 6.67e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17663 | -| time_elapsed | 95527 | -| total_timesteps | 2260864 | -| train/ | | -| approx_kl | 0.09089955 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.00693 | -| n_updates | 176620 | -| policy_gradient_loss | -0.00705 | -| std | 0.00846 | -| value_loss | 1.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 17664 | -| time_elapsed | 95532 | -| total_timesteps | 2260992 | -| train/ | | -| approx_kl | 0.015657507 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.00578 | -| n_updates | 176630 | -| policy_gradient_loss | 0.00498 | -| std | 0.00846 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17665 | -| time_elapsed | 95537 | -| total_timesteps | 2261120 | -| train/ | | -| approx_kl | 3.747875e-05 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.00115 | -| n_updates | 176640 | -| policy_gradient_loss | -0.00119 | -| std | 0.00846 | -| value_loss | 7.03e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17666 | -| time_elapsed | 95552 | -| total_timesteps | 2261248 | -| train/ | | -| approx_kl | 0.0014468282 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.009 | -| n_updates | 176650 | -| policy_gradient_loss | -0.00524 | -| std | 0.00846 | -| value_loss | 0.00551 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17667 | -| time_elapsed | 95557 | -| total_timesteps | 2261376 | -| train/ | | -| approx_kl | 0.028577298 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 176660 | -| policy_gradient_loss | 0.0343 | -| std | 0.00846 | -| value_loss | 1.88e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17668 | -| time_elapsed | 95561 | -| total_timesteps | 2261504 | -| train/ | | -| approx_kl | 0.5807655 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.325 | -| n_updates | 176670 | -| policy_gradient_loss | 0.143 | -| std | 0.00846 | -| value_loss | 1.86e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17669 | -| time_elapsed | 95566 | -| total_timesteps | 2261632 | -| train/ | | -| approx_kl | 0.005727426 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 176680 | -| policy_gradient_loss | 0.0122 | -| std | 0.00846 | -| value_loss | 1.83e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17670 | -| time_elapsed | 95571 | -| total_timesteps | 2261760 | -| train/ | | -| approx_kl | 0.34692264 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 176690 | -| policy_gradient_loss | 0.0312 | -| std | 0.00846 | -| value_loss | 1.42e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17671 | -| time_elapsed | 95576 | -| total_timesteps | 2261888 | -| train/ | | -| approx_kl | 0.028232468 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 176700 | -| policy_gradient_loss | 0.00994 | -| std | 0.00846 | -| value_loss | 9.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17672 | -| time_elapsed | 95582 | -| total_timesteps | 2262016 | -| train/ | | -| approx_kl | 0.032927126 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.00839 | -| n_updates | 176710 | -| policy_gradient_loss | 0.00328 | -| std | 0.00845 | -| value_loss | 3.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17673 | -| time_elapsed | 95593 | -| total_timesteps | 2262144 | -| train/ | | -| approx_kl | 0.017195085 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 176720 | -| policy_gradient_loss | -0.0148 | -| std | 0.00845 | -| value_loss | 0.000187 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17674 | -| time_elapsed | 95598 | -| total_timesteps | 2262272 | -| train/ | | -| approx_kl | 0.065443814 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.177 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 176730 | -| policy_gradient_loss | 0.0783 | -| std | 0.00844 | -| value_loss | 4.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17675 | -| time_elapsed | 95602 | -| total_timesteps | 2262400 | -| train/ | | -| approx_kl | 0.011384517 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -11 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 176740 | -| policy_gradient_loss | 0.00295 | -| std | 0.00845 | -| value_loss | 1.02e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17676 | -| time_elapsed | 95606 | -| total_timesteps | 2262528 | -| train/ | | -| approx_kl | 0.0309335 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.836 | -| learning_rate | 0.0003 | -| loss | 0.0532 | -| n_updates | 176750 | -| policy_gradient_loss | -0.000973 | -| std | 0.00845 | -| value_loss | 1.39e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17677 | -| time_elapsed | 95611 | -| total_timesteps | 2262656 | -| train/ | | -| approx_kl | 0.038373355 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 176760 | -| policy_gradient_loss | -0.00845 | -| std | 0.00844 | -| value_loss | 1.5e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17678 | -| time_elapsed | 95616 | -| total_timesteps | 2262784 | -| train/ | | -| approx_kl | 0.009047532 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 176770 | -| policy_gradient_loss | 0.01 | -| std | 0.00844 | -| value_loss | 4.25e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17679 | -| time_elapsed | 95620 | -| total_timesteps | 2262912 | -| train/ | | -| approx_kl | 0.071699895 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 176780 | -| policy_gradient_loss | 0.0222 | -| std | 0.00844 | -| value_loss | 2e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17680 | -| time_elapsed | 95624 | -| total_timesteps | 2263040 | -| train/ | | -| approx_kl | 0.43160212 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 176790 | -| policy_gradient_loss | 0.0415 | -| std | 0.00844 | -| value_loss | 1.59e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17681 | -| time_elapsed | 95634 | -| total_timesteps | 2263168 | -| train/ | | -| approx_kl | 0.0017204704 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 176800 | -| policy_gradient_loss | -0.00944 | -| std | 0.00843 | -| value_loss | 0.00684 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17682 | -| time_elapsed | 95639 | -| total_timesteps | 2263296 | -| train/ | | -| approx_kl | 0.00021872018 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0981 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 176810 | -| policy_gradient_loss | 0.0148 | -| std | 0.00843 | -| value_loss | 2.64e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17683 | -| time_elapsed | 95643 | -| total_timesteps | 2263424 | -| train/ | | -| approx_kl | 0.43475288 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00374 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 176820 | -| policy_gradient_loss | 0.0477 | -| std | 0.00843 | -| value_loss | 1.39e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17684 | -| time_elapsed | 95648 | -| total_timesteps | 2263552 | -| train/ | | -| approx_kl | 0.024126403 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.00915 | -| n_updates | 176830 | -| policy_gradient_loss | 0.00506 | -| std | 0.00843 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17685 | -| time_elapsed | 95653 | -| total_timesteps | 2263680 | -| train/ | | -| approx_kl | 0.0048726005 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 176840 | -| policy_gradient_loss | 0.00365 | -| std | 0.00843 | -| value_loss | 6.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17686 | -| time_elapsed | 95658 | -| total_timesteps | 2263808 | -| train/ | | -| approx_kl | 0.043470047 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 176850 | -| policy_gradient_loss | 0.0104 | -| std | 0.00843 | -| value_loss | 4.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 17687 | -| time_elapsed | 95662 | -| total_timesteps | 2263936 | -| train/ | | -| approx_kl | 0.009508314 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 176860 | -| policy_gradient_loss | 0.00275 | -| std | 0.00843 | -| value_loss | 3.36e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17688 | -| time_elapsed | 95665 | -| total_timesteps | 2264064 | -| train/ | | -| approx_kl | 0.00048025232 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 176870 | -| policy_gradient_loss | 0.00657 | -| std | 0.00843 | -| value_loss | 2.34e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17689 | -| time_elapsed | 95673 | -| total_timesteps | 2264192 | -| train/ | | -| approx_kl | 0.05535704 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.244 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 176880 | -| policy_gradient_loss | -0.0114 | -| std | 0.00843 | -| value_loss | 0.00125 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17690 | -| time_elapsed | 95678 | -| total_timesteps | 2264320 | -| train/ | | -| approx_kl | 0.077543795 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -3.47 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 176890 | -| policy_gradient_loss | 0.00639 | -| std | 0.00843 | -| value_loss | 7.59e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17691 | -| time_elapsed | 95684 | -| total_timesteps | 2264448 | -| train/ | | -| approx_kl | 0.1775435 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0917 | -| n_updates | 176900 | -| policy_gradient_loss | 0.0346 | -| std | 0.00843 | -| value_loss | 6.68e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17692 | -| time_elapsed | 95688 | -| total_timesteps | 2264576 | -| train/ | | -| approx_kl | 0.032315098 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | -0.00521 | -| n_updates | 176910 | -| policy_gradient_loss | 0.0357 | -| std | 0.00844 | -| value_loss | 4.25e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17693 | -| time_elapsed | 95693 | -| total_timesteps | 2264704 | -| train/ | | -| approx_kl | 0.15717094 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 176920 | -| policy_gradient_loss | 0.0273 | -| std | 0.00844 | -| value_loss | 2.22e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17694 | -| time_elapsed | 95698 | -| total_timesteps | 2264832 | -| train/ | | -| approx_kl | 0.032315623 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 176930 | -| policy_gradient_loss | 0.0338 | -| std | 0.00844 | -| value_loss | 1.31e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 17695 | -| time_elapsed | 95703 | -| total_timesteps | 2264960 | -| train/ | | -| approx_kl | 0.13675383 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.0633 | -| n_updates | 176940 | -| policy_gradient_loss | 0.0221 | -| std | 0.00844 | -| value_loss | 1.03e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17696 | -| time_elapsed | 95707 | -| total_timesteps | 2265088 | -| train/ | | -| approx_kl | 0.034499492 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.00854 | -| n_updates | 176950 | -| policy_gradient_loss | 0.0457 | -| std | 0.00844 | -| value_loss | 8.1e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17697 | -| time_elapsed | 95718 | -| total_timesteps | 2265216 | -| train/ | | -| approx_kl | 0.003018653 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.925 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 176960 | -| policy_gradient_loss | -0.00968 | -| std | 0.00843 | -| value_loss | 0.000795 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17698 | -| time_elapsed | 95722 | -| total_timesteps | 2265344 | -| train/ | | -| approx_kl | 0.11739489 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.0678 | -| n_updates | 176970 | -| policy_gradient_loss | 0.0179 | -| std | 0.00842 | -| value_loss | 0.000168 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17699 | -| time_elapsed | 95726 | -| total_timesteps | 2265472 | -| train/ | | -| approx_kl | 0.012824874 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.831 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 176980 | -| policy_gradient_loss | 0.0116 | -| std | 0.00841 | -| value_loss | 7.66e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17700 | -| time_elapsed | 95731 | -| total_timesteps | 2265600 | -| train/ | | -| approx_kl | 0.15198296 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.0122 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 176990 | -| policy_gradient_loss | 0.129 | -| std | 0.00841 | -| value_loss | 2.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17701 | -| time_elapsed | 95734 | -| total_timesteps | 2265728 | -| train/ | | -| approx_kl | 0.124601215 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00747 | -| learning_rate | 0.0003 | -| loss | 0.194 | -| n_updates | 177000 | -| policy_gradient_loss | 0.133 | -| std | 0.00841 | -| value_loss | 1.98e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17702 | -| time_elapsed | 95738 | -| total_timesteps | 2265856 | -| train/ | | -| approx_kl | 0.086371325 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | 0.0849 | -| n_updates | 177010 | -| policy_gradient_loss | 0.0683 | -| std | 0.00841 | -| value_loss | 1.57e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17703 | -| time_elapsed | 95742 | -| total_timesteps | 2265984 | -| train/ | | -| approx_kl | 0.08094619 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 177020 | -| policy_gradient_loss | 0.0513 | -| std | 0.00842 | -| value_loss | 4.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17704 | -| time_elapsed | 95746 | -| total_timesteps | 2266112 | -| train/ | | -| approx_kl | 0.08301024 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | 0.0785 | -| n_updates | 177030 | -| policy_gradient_loss | 0.0651 | -| std | 0.00842 | -| value_loss | 1.99e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17705 | -| time_elapsed | 95758 | -| total_timesteps | 2266240 | -| train/ | | -| approx_kl | 0.3193814 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.298 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 177040 | -| policy_gradient_loss | 0.022 | -| std | 0.00842 | -| value_loss | 0.00127 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17706 | -| time_elapsed | 95761 | -| total_timesteps | 2266368 | -| train/ | | -| approx_kl | 0.020066714 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00632 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 177050 | -| policy_gradient_loss | 0.0431 | -| std | 0.00843 | -| value_loss | 1.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17707 | -| time_elapsed | 95765 | -| total_timesteps | 2266496 | -| train/ | | -| approx_kl | 0.055164818 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00778 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 177060 | -| policy_gradient_loss | -0.00469 | -| std | 0.00843 | -| value_loss | 3.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17708 | -| time_elapsed | 95770 | -| total_timesteps | 2266624 | -| train/ | | -| approx_kl | 0.10936926 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 177070 | -| policy_gradient_loss | 0.0381 | -| std | 0.00843 | -| value_loss | 1.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17709 | -| time_elapsed | 95775 | -| total_timesteps | 2266752 | -| train/ | | -| approx_kl | 0.023976875 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0697 | -| learning_rate | 0.0003 | -| loss | -0.00913 | -| n_updates | 177080 | -| policy_gradient_loss | 0.0441 | -| std | 0.00843 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 17710 | -| time_elapsed | 95780 | -| total_timesteps | 2266880 | -| train/ | | -| approx_kl | 0.010576392 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.000501 | -| n_updates | 177090 | -| policy_gradient_loss | 0.0228 | -| std | 0.00843 | -| value_loss | 8.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17711 | -| time_elapsed | 95784 | -| total_timesteps | 2267008 | -| train/ | | -| approx_kl | 0.01936146 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.00341 | -| n_updates | 177100 | -| policy_gradient_loss | 0.0525 | -| std | 0.00842 | -| value_loss | 6.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17712 | -| time_elapsed | 95796 | -| total_timesteps | 2267136 | -| train/ | | -| approx_kl | 0.04697133 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -2.93 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 177110 | -| policy_gradient_loss | -0.00322 | -| std | 0.00843 | -| value_loss | 0.00262 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17713 | -| time_elapsed | 95802 | -| total_timesteps | 2267264 | -| train/ | | -| approx_kl | 0.08886321 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.611 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 177120 | -| policy_gradient_loss | 0.0449 | -| std | 0.00843 | -| value_loss | 0.000147 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17714 | -| time_elapsed | 95806 | -| total_timesteps | 2267392 | -| train/ | | -| approx_kl | 0.0647509 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 177130 | -| policy_gradient_loss | 0.0103 | -| std | 0.00843 | -| value_loss | 0.0118 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17715 | -| time_elapsed | 95812 | -| total_timesteps | 2267520 | -| train/ | | -| approx_kl | 0.23896012 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0898 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 177140 | -| policy_gradient_loss | 0.0897 | -| std | 0.00843 | -| value_loss | 0.00113 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17716 | -| time_elapsed | 95817 | -| total_timesteps | 2267648 | -| train/ | | -| approx_kl | 0.041347336 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00271 | -| learning_rate | 0.0003 | -| loss | 0.00999 | -| n_updates | 177150 | -| policy_gradient_loss | 0.0116 | -| std | 0.00843 | -| value_loss | 0.000564 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17717 | -| time_elapsed | 95823 | -| total_timesteps | 2267776 | -| train/ | | -| approx_kl | 0.098907165 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0622 | -| n_updates | 177160 | -| policy_gradient_loss | 0.0173 | -| std | 0.00844 | -| value_loss | 0.000287 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 17718 | -| time_elapsed | 95827 | -| total_timesteps | 2267904 | -| train/ | | -| approx_kl | 0.010899112 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.000362 | -| n_updates | 177170 | -| policy_gradient_loss | 1.13e-07 | -| std | 0.00843 | -| value_loss | 0.000186 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17719 | -| time_elapsed | 95831 | -| total_timesteps | 2268032 | -| train/ | | -| approx_kl | 0.016306486 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | -0.00646 | -| n_updates | 177180 | -| policy_gradient_loss | 0.0116 | -| std | 0.00843 | -| value_loss | 0.000152 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17720 | -| time_elapsed | 95841 | -| total_timesteps | 2268160 | -| train/ | | -| approx_kl | 0.40730906 | -| clip_fraction | 0.61 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.74 | -| learning_rate | 0.0003 | -| loss | 0.0917 | -| n_updates | 177190 | -| policy_gradient_loss | 0.0555 | -| std | 0.00843 | -| value_loss | 0.0078 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17721 | -| time_elapsed | 95847 | -| total_timesteps | 2268288 | -| train/ | | -| approx_kl | 0.044419672 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 177200 | -| policy_gradient_loss | 0.0331 | -| std | 0.00843 | -| value_loss | 5.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17722 | -| time_elapsed | 95851 | -| total_timesteps | 2268416 | -| train/ | | -| approx_kl | 0.023201002 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 177210 | -| policy_gradient_loss | 0.00672 | -| std | 0.00844 | -| value_loss | 4.79e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17723 | -| time_elapsed | 95856 | -| total_timesteps | 2268544 | -| train/ | | -| approx_kl | 0.21388769 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 177220 | -| policy_gradient_loss | 0.0366 | -| std | 0.00844 | -| value_loss | 3.85e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17724 | -| time_elapsed | 95861 | -| total_timesteps | 2268672 | -| train/ | | -| approx_kl | 0.036852688 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 177230 | -| policy_gradient_loss | 0.00671 | -| std | 0.00844 | -| value_loss | 2.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17725 | -| time_elapsed | 95866 | -| total_timesteps | 2268800 | -| train/ | | -| approx_kl | 0.05387735 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.0941 | -| n_updates | 177240 | -| policy_gradient_loss | 0.00172 | -| std | 0.00844 | -| value_loss | 1.94e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17726 | -| time_elapsed | 95871 | -| total_timesteps | 2268928 | -| train/ | | -| approx_kl | 0.027142849 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.00799 | -| n_updates | 177250 | -| policy_gradient_loss | 0.0181 | -| std | 0.00844 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17727 | -| time_elapsed | 95876 | -| total_timesteps | 2269056 | -| train/ | | -| approx_kl | 0.19219421 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.0381 | -| n_updates | 177260 | -| policy_gradient_loss | 0.012 | -| std | 0.00844 | -| value_loss | 1.21e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17728 | -| time_elapsed | 95887 | -| total_timesteps | 2269184 | -| train/ | | -| approx_kl | 0.055754893 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -3.22 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 177270 | -| policy_gradient_loss | -0.00621 | -| std | 0.00845 | -| value_loss | 0.00255 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17729 | -| time_elapsed | 95893 | -| total_timesteps | 2269312 | -| train/ | | -| approx_kl | 0.13110383 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0486 | -| n_updates | 177280 | -| policy_gradient_loss | 0.0244 | -| std | 0.00845 | -| value_loss | 5.99e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17730 | -| time_elapsed | 95898 | -| total_timesteps | 2269440 | -| train/ | | -| approx_kl | 0.036153458 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 177290 | -| policy_gradient_loss | 0.0582 | -| std | 0.00845 | -| value_loss | 3.92e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17731 | -| time_elapsed | 95905 | -| total_timesteps | 2269568 | -| train/ | | -| approx_kl | 0.11322557 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 177300 | -| policy_gradient_loss | 0.0101 | -| std | 0.00845 | -| value_loss | 3.89e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17732 | -| time_elapsed | 95910 | -| total_timesteps | 2269696 | -| train/ | | -| approx_kl | 0.22246547 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.0952 | -| n_updates | 177310 | -| policy_gradient_loss | 0.0624 | -| std | 0.00845 | -| value_loss | 1.98e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17733 | -| time_elapsed | 95914 | -| total_timesteps | 2269824 | -| train/ | | -| approx_kl | 0.13601632 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 177320 | -| policy_gradient_loss | 0.119 | -| std | 0.00846 | -| value_loss | 1.49e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17734 | -| time_elapsed | 95919 | -| total_timesteps | 2269952 | -| train/ | | -| approx_kl | 0.023986287 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.00934 | -| n_updates | 177330 | -| policy_gradient_loss | 0.0163 | -| std | 0.00846 | -| value_loss | 1.3e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17735 | -| time_elapsed | 95924 | -| total_timesteps | 2270080 | -| train/ | | -| approx_kl | 0.00072472915 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00328 | -| n_updates | 177340 | -| policy_gradient_loss | 0.00327 | -| std | 0.00846 | -| value_loss | 1.03e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17736 | -| time_elapsed | 95933 | -| total_timesteps | 2270208 | -| train/ | | -| approx_kl | 0.2463745 | -| clip_fraction | 0.646 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | 0.0493 | -| n_updates | 177350 | -| policy_gradient_loss | 0.0306 | -| std | 0.00846 | -| value_loss | 0.00244 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17737 | -| time_elapsed | 95938 | -| total_timesteps | 2270336 | -| train/ | | -| approx_kl | 0.0011804448 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 177360 | -| policy_gradient_loss | -0.000819 | -| std | 0.00846 | -| value_loss | 1.65e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17738 | -| time_elapsed | 95943 | -| total_timesteps | 2270464 | -| train/ | | -| approx_kl | 0.007688535 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.65 | -| learning_rate | 0.0003 | -| loss | 0.00291 | -| n_updates | 177370 | -| policy_gradient_loss | 0.0172 | -| std | 0.00846 | -| value_loss | 3.58e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17739 | -| time_elapsed | 95948 | -| total_timesteps | 2270592 | -| train/ | | -| approx_kl | 0.2837962 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 177380 | -| policy_gradient_loss | 0.12 | -| std | 0.00846 | -| value_loss | 7.49e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17740 | -| time_elapsed | 95953 | -| total_timesteps | 2270720 | -| train/ | | -| approx_kl | 0.04225239 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 177390 | -| policy_gradient_loss | 0.0136 | -| std | 0.00846 | -| value_loss | 5.77e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17741 | -| time_elapsed | 95958 | -| total_timesteps | 2270848 | -| train/ | | -| approx_kl | 0.34645024 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 177400 | -| policy_gradient_loss | 0.0391 | -| std | 0.00846 | -| value_loss | 5.36e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17742 | -| time_elapsed | 95962 | -| total_timesteps | 2270976 | -| train/ | | -| approx_kl | 0.00815892 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 177410 | -| policy_gradient_loss | -1.46e-05 | -| std | 0.00846 | -| value_loss | 4.77e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17743 | -| time_elapsed | 95965 | -| total_timesteps | 2271104 | -| train/ | | -| approx_kl | 0.0015587197 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.000187 | -| n_updates | 177420 | -| policy_gradient_loss | 0.00286 | -| std | 0.00846 | -| value_loss | 4.49e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17744 | -| time_elapsed | 95975 | -| total_timesteps | 2271232 | -| train/ | | -| approx_kl | 0.03718515 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.704 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 177430 | -| policy_gradient_loss | 0.0313 | -| std | 0.00847 | -| value_loss | 0.00762 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17745 | -| time_elapsed | 95979 | -| total_timesteps | 2271360 | -| train/ | | -| approx_kl | 0.15511371 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 177440 | -| policy_gradient_loss | 0.0995 | -| std | 0.00847 | -| value_loss | 8.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17746 | -| time_elapsed | 95982 | -| total_timesteps | 2271488 | -| train/ | | -| approx_kl | 0.10888918 | -| clip_fraction | 0.66 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.000432 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 177450 | -| policy_gradient_loss | 0.0927 | -| std | 0.00847 | -| value_loss | 2.61e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17747 | -| time_elapsed | 95987 | -| total_timesteps | 2271616 | -| train/ | | -| approx_kl | 0.08887327 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00285 | -| learning_rate | 0.0003 | -| loss | 0.0929 | -| n_updates | 177460 | -| policy_gradient_loss | 0.072 | -| std | 0.00847 | -| value_loss | 1.47e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17748 | -| time_elapsed | 95992 | -| total_timesteps | 2271744 | -| train/ | | -| approx_kl | 0.09014043 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00648 | -| learning_rate | 0.0003 | -| loss | 0.0769 | -| n_updates | 177470 | -| policy_gradient_loss | 0.119 | -| std | 0.00847 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17749 | -| time_elapsed | 95997 | -| total_timesteps | 2271872 | -| train/ | | -| approx_kl | 0.10293108 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00864 | -| learning_rate | 0.0003 | -| loss | 0.0724 | -| n_updates | 177480 | -| policy_gradient_loss | 0.096 | -| std | 0.00847 | -| value_loss | 8.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17750 | -| time_elapsed | 96001 | -| total_timesteps | 2272000 | -| train/ | | -| approx_kl | 0.016023377 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 177490 | -| policy_gradient_loss | 0.0136 | -| std | 0.00847 | -| value_loss | 7.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17751 | -| time_elapsed | 96007 | -| total_timesteps | 2272128 | -| train/ | | -| approx_kl | 0.38797197 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00178 | -| learning_rate | 0.0003 | -| loss | 0.0984 | -| n_updates | 177500 | -| policy_gradient_loss | 0.0319 | -| std | 0.00847 | -| value_loss | 3.31e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17752 | -| time_elapsed | 96019 | -| total_timesteps | 2272256 | -| train/ | | -| approx_kl | 0.11249158 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.852 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 177510 | -| policy_gradient_loss | -0.0162 | -| std | 0.00847 | -| value_loss | 0.00205 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17753 | -| time_elapsed | 96024 | -| total_timesteps | 2272384 | -| train/ | | -| approx_kl | 0.0020353342 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00581 | -| learning_rate | 0.0003 | -| loss | -0.00585 | -| n_updates | 177520 | -| policy_gradient_loss | 0.0108 | -| std | 0.00847 | -| value_loss | 5.59e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17754 | -| time_elapsed | 96028 | -| total_timesteps | 2272512 | -| train/ | | -| approx_kl | 0.00033460231 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00584 | -| learning_rate | 0.0003 | -| loss | 0.000232 | -| n_updates | 177530 | -| policy_gradient_loss | 0.0197 | -| std | 0.00847 | -| value_loss | 8.48e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17755 | -| time_elapsed | 96033 | -| total_timesteps | 2272640 | -| train/ | | -| approx_kl | 0.37780502 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.0976 | -| n_updates | 177540 | -| policy_gradient_loss | 0.0392 | -| std | 0.00847 | -| value_loss | 7.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17756 | -| time_elapsed | 96038 | -| total_timesteps | 2272768 | -| train/ | | -| approx_kl | 0.025120733 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 3.27e-05 | -| n_updates | 177550 | -| policy_gradient_loss | 0.000304 | -| std | 0.00847 | -| value_loss | 5.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17757 | -| time_elapsed | 96042 | -| total_timesteps | 2272896 | -| train/ | | -| approx_kl | 0.006308003 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 177560 | -| policy_gradient_loss | 0.00371 | -| std | 0.00847 | -| value_loss | 3.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17758 | -| time_elapsed | 96046 | -| total_timesteps | 2273024 | -| train/ | | -| approx_kl | 0.034401186 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 177570 | -| policy_gradient_loss | 0.00505 | -| std | 0.00847 | -| value_loss | 2.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17759 | -| time_elapsed | 96056 | -| total_timesteps | 2273152 | -| train/ | | -| approx_kl | 0.04515783 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.0271 | -| n_updates | 177580 | -| policy_gradient_loss | -0.0216 | -| std | 0.00847 | -| value_loss | 0.00368 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17760 | -| time_elapsed | 96060 | -| total_timesteps | 2273280 | -| train/ | | -| approx_kl | 0.010770805 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 177590 | -| policy_gradient_loss | 0.015 | -| std | 0.00848 | -| value_loss | 2.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17761 | -| time_elapsed | 96064 | -| total_timesteps | 2273408 | -| train/ | | -| approx_kl | 0.30478048 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00616 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 177600 | -| policy_gradient_loss | 0.0346 | -| std | 0.00847 | -| value_loss | 4.07e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17762 | -| time_elapsed | 96069 | -| total_timesteps | 2273536 | -| train/ | | -| approx_kl | 0.0071956813 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 177610 | -| policy_gradient_loss | 0.00551 | -| std | 0.00847 | -| value_loss | 2.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17763 | -| time_elapsed | 96075 | -| total_timesteps | 2273664 | -| train/ | | -| approx_kl | 0.054240353 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 177620 | -| policy_gradient_loss | 0.00386 | -| std | 0.00846 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17764 | -| time_elapsed | 96080 | -| total_timesteps | 2273792 | -| train/ | | -| approx_kl | 0.06613918 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00985 | -| learning_rate | 0.0003 | -| loss | 0.0777 | -| n_updates | 177630 | -| policy_gradient_loss | 0.0109 | -| std | 0.00844 | -| value_loss | 4.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17765 | -| time_elapsed | 96085 | -| total_timesteps | 2273920 | -| train/ | | -| approx_kl | 0.34660098 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00389 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 177640 | -| policy_gradient_loss | 0.0417 | -| std | 0.00843 | -| value_loss | 1.44e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17766 | -| time_elapsed | 96090 | -| total_timesteps | 2274048 | -| train/ | | -| approx_kl | 0.02132348 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.000505 | -| n_updates | 177650 | -| policy_gradient_loss | 0.00152 | -| std | 0.00843 | -| value_loss | 9.1e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17767 | -| time_elapsed | 96100 | -| total_timesteps | 2274176 | -| train/ | | -| approx_kl | 0.00018654205 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | 0.00916 | -| n_updates | 177660 | -| policy_gradient_loss | 0.0105 | -| std | 0.00843 | -| value_loss | 0.000719 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17768 | -| time_elapsed | 96105 | -| total_timesteps | 2274304 | -| train/ | | -| approx_kl | 0.014600068 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00467 | -| learning_rate | 0.0003 | -| loss | -0.00898 | -| n_updates | 177670 | -| policy_gradient_loss | 0.00496 | -| std | 0.00843 | -| value_loss | 3.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17769 | -| time_elapsed | 96110 | -| total_timesteps | 2274432 | -| train/ | | -| approx_kl | 0.0025285957 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00209 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 177680 | -| policy_gradient_loss | 0.0154 | -| std | 0.00843 | -| value_loss | 1.02e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17770 | -| time_elapsed | 96114 | -| total_timesteps | 2274560 | -| train/ | | -| approx_kl | 0.123704344 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 177690 | -| policy_gradient_loss | 0.0407 | -| std | 0.00843 | -| value_loss | 8.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17771 | -| time_elapsed | 96120 | -| total_timesteps | 2274688 | -| train/ | | -| approx_kl | 0.0039948444 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.000598 | -| n_updates | 177700 | -| policy_gradient_loss | 0.00526 | -| std | 0.00843 | -| value_loss | 4.88e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17772 | -| time_elapsed | 96127 | -| total_timesteps | 2274816 | -| train/ | | -| approx_kl | 0.04614387 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 177710 | -| policy_gradient_loss | 0.00315 | -| std | 0.00846 | -| value_loss | 7.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17773 | -| time_elapsed | 96133 | -| total_timesteps | 2274944 | -| train/ | | -| approx_kl | 0.007472393 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0082 | -| learning_rate | 0.0003 | -| loss | -0.00855 | -| n_updates | 177720 | -| policy_gradient_loss | 0.00129 | -| std | 0.00846 | -| value_loss | 4.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17774 | -| time_elapsed | 96138 | -| total_timesteps | 2275072 | -| train/ | | -| approx_kl | 0.03510853 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 177730 | -| policy_gradient_loss | -0.000463 | -| std | 0.00846 | -| value_loss | 2.16e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17775 | -| time_elapsed | 96145 | -| total_timesteps | 2275200 | -| train/ | | -| approx_kl | 0.023744587 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.706 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 177740 | -| policy_gradient_loss | -0.00175 | -| std | 0.00846 | -| value_loss | 0.000766 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17776 | -| time_elapsed | 96151 | -| total_timesteps | 2275328 | -| train/ | | -| approx_kl | 0.20204096 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00945 | -| learning_rate | 0.0003 | -| loss | 0.0901 | -| n_updates | 177750 | -| policy_gradient_loss | 0.0153 | -| std | 0.00846 | -| value_loss | 6.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17777 | -| time_elapsed | 96157 | -| total_timesteps | 2275456 | -| train/ | | -| approx_kl | 0.007997887 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | 0.00793 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 177760 | -| policy_gradient_loss | 0.0121 | -| std | 0.00845 | -| value_loss | 3.4e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17778 | -| time_elapsed | 96163 | -| total_timesteps | 2275584 | -| train/ | | -| approx_kl | 0.15062779 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.00727 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 177770 | -| policy_gradient_loss | 0.0887 | -| std | 0.00845 | -| value_loss | 2.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17779 | -| time_elapsed | 96168 | -| total_timesteps | 2275712 | -| train/ | | -| approx_kl | 0.027683292 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 177780 | -| policy_gradient_loss | 0.0143 | -| std | 0.00845 | -| value_loss | 1.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17780 | -| time_elapsed | 96172 | -| total_timesteps | 2275840 | -| train/ | | -| approx_kl | 0.34122518 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.35 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 177790 | -| policy_gradient_loss | 0.0351 | -| std | 0.00845 | -| value_loss | 1.26e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 17781 | -| time_elapsed | 96177 | -| total_timesteps | 2275968 | -| train/ | | -| approx_kl | 0.0100053605 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 177800 | -| policy_gradient_loss | 0.00359 | -| std | 0.00844 | -| value_loss | 8e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17782 | -| time_elapsed | 96183 | -| total_timesteps | 2276096 | -| train/ | | -| approx_kl | 0.0429719 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 177810 | -| policy_gradient_loss | 0.0121 | -| std | 0.00844 | -| value_loss | 5.86e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17783 | -| time_elapsed | 96191 | -| total_timesteps | 2276224 | -| train/ | | -| approx_kl | 0.018413948 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.793 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 177820 | -| policy_gradient_loss | 0.00203 | -| std | 0.00844 | -| value_loss | 0.00188 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17784 | -| time_elapsed | 96197 | -| total_timesteps | 2276352 | -| train/ | | -| approx_kl | 0.029967614 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.533 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 177830 | -| policy_gradient_loss | 0.00459 | -| std | 0.00845 | -| value_loss | 1.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17785 | -| time_elapsed | 96201 | -| total_timesteps | 2276480 | -| train/ | | -| approx_kl | 0.18064182 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 177840 | -| policy_gradient_loss | 0.0365 | -| std | 0.00844 | -| value_loss | 6.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17786 | -| time_elapsed | 96206 | -| total_timesteps | 2276608 | -| train/ | | -| approx_kl | 0.040403314 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 177850 | -| policy_gradient_loss | 0.0747 | -| std | 0.00844 | -| value_loss | 6.63e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17787 | -| time_elapsed | 96211 | -| total_timesteps | 2276736 | -| train/ | | -| approx_kl | 0.18499488 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 177860 | -| policy_gradient_loss | 0.04 | -| std | 0.00843 | -| value_loss | 6.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17788 | -| time_elapsed | 96215 | -| total_timesteps | 2276864 | -| train/ | | -| approx_kl | 0.035071515 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 177870 | -| policy_gradient_loss | 0.046 | -| std | 0.00843 | -| value_loss | 3.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17789 | -| time_elapsed | 96218 | -| total_timesteps | 2276992 | -| train/ | | -| approx_kl | 0.015529711 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0094 | -| learning_rate | 0.0003 | -| loss | 0.000216 | -| n_updates | 177880 | -| policy_gradient_loss | 0.0161 | -| std | 0.00843 | -| value_loss | 2.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17790 | -| time_elapsed | 96222 | -| total_timesteps | 2277120 | -| train/ | | -| approx_kl | 0.10167737 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 177890 | -| policy_gradient_loss | 0.0221 | -| std | 0.00844 | -| value_loss | 1.49e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17791 | -| time_elapsed | 96232 | -| total_timesteps | 2277248 | -| train/ | | -| approx_kl | 0.07291513 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 177900 | -| policy_gradient_loss | 0.0118 | -| std | 0.00844 | -| value_loss | 0.00146 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17792 | -| time_elapsed | 96237 | -| total_timesteps | 2277376 | -| train/ | | -| approx_kl | 0.0041589336 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 177910 | -| policy_gradient_loss | 0.0694 | -| std | 0.00844 | -| value_loss | 3.86e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17793 | -| time_elapsed | 96242 | -| total_timesteps | 2277504 | -| train/ | | -| approx_kl | 0.017988384 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.000798 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 177920 | -| policy_gradient_loss | 0.0192 | -| std | 0.00843 | -| value_loss | 4.6e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17794 | -| time_elapsed | 96247 | -| total_timesteps | 2277632 | -| train/ | | -| approx_kl | 0.0003991779 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.00218 | -| learning_rate | 0.0003 | -| loss | 0.00177 | -| n_updates | 177930 | -| policy_gradient_loss | 0.0147 | -| std | 0.00843 | -| value_loss | 2.63e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17795 | -| time_elapsed | 96252 | -| total_timesteps | 2277760 | -| train/ | | -| approx_kl | 0.07226783 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 177940 | -| policy_gradient_loss | 0.013 | -| std | 0.00842 | -| value_loss | 2.14e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 17796 | -| time_elapsed | 96258 | -| total_timesteps | 2277888 | -| train/ | | -| approx_kl | 0.17197154 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0684 | -| n_updates | 177950 | -| policy_gradient_loss | 0.0297 | -| std | 0.00842 | -| value_loss | 1.7e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17797 | -| time_elapsed | 96264 | -| total_timesteps | 2278016 | -| train/ | | -| approx_kl | 0.0010678652 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.000841 | -| n_updates | 177960 | -| policy_gradient_loss | 0.00867 | -| std | 0.00842 | -| value_loss | 9.24e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17798 | -| time_elapsed | 96274 | -| total_timesteps | 2278144 | -| train/ | | -| approx_kl | 0.033045705 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.771 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 177970 | -| policy_gradient_loss | 0.0153 | -| std | 0.00841 | -| value_loss | 0.00477 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17799 | -| time_elapsed | 96280 | -| total_timesteps | 2278272 | -| train/ | | -| approx_kl | 0.0068107955 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 177980 | -| policy_gradient_loss | 0.0134 | -| std | 0.00841 | -| value_loss | 5.88e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17800 | -| time_elapsed | 96286 | -| total_timesteps | 2278400 | -| train/ | | -| approx_kl | 0.10987944 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00575 | -| learning_rate | 0.0003 | -| loss | 0.0517 | -| n_updates | 177990 | -| policy_gradient_loss | 0.00698 | -| std | 0.00839 | -| value_loss | 6.47e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17801 | -| time_elapsed | 96290 | -| total_timesteps | 2278528 | -| train/ | | -| approx_kl | 0.033552717 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 178000 | -| policy_gradient_loss | 0.00974 | -| std | 0.00838 | -| value_loss | 8.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17802 | -| time_elapsed | 96294 | -| total_timesteps | 2278656 | -| train/ | | -| approx_kl | 0.22592036 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 178010 | -| policy_gradient_loss | 0.0754 | -| std | 0.00838 | -| value_loss | 1.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17803 | -| time_elapsed | 96298 | -| total_timesteps | 2278784 | -| train/ | | -| approx_kl | 0.11050676 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.078 | -| n_updates | 178020 | -| policy_gradient_loss | 0.0908 | -| std | 0.00838 | -| value_loss | 3.84e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 17804 | -| time_elapsed | 96301 | -| total_timesteps | 2278912 | -| train/ | | -| approx_kl | 0.119570106 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.089 | -| n_updates | 178030 | -| policy_gradient_loss | 0.127 | -| std | 0.00837 | -| value_loss | 3.16e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17805 | -| time_elapsed | 96306 | -| total_timesteps | 2279040 | -| train/ | | -| approx_kl | 0.10662959 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0762 | -| n_updates | 178040 | -| policy_gradient_loss | 0.11 | -| std | 0.00837 | -| value_loss | 1.94e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17806 | -| time_elapsed | 96318 | -| total_timesteps | 2279168 | -| train/ | | -| approx_kl | 0.021284522 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 178050 | -| policy_gradient_loss | -0.0154 | -| std | 0.00837 | -| value_loss | 0.00033 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17807 | -| time_elapsed | 96322 | -| total_timesteps | 2279296 | -| train/ | | -| approx_kl | 0.029953536 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -6.36 | -| learning_rate | 0.0003 | -| loss | 0.00987 | -| n_updates | 178060 | -| policy_gradient_loss | 0.00558 | -| std | 0.00838 | -| value_loss | 6.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17808 | -| time_elapsed | 96327 | -| total_timesteps | 2279424 | -| train/ | | -| approx_kl | 0.032745313 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -2.61 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 178070 | -| policy_gradient_loss | 0.00767 | -| std | 0.00839 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17809 | -| time_elapsed | 96332 | -| total_timesteps | 2279552 | -| train/ | | -| approx_kl | 0.018588621 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 178080 | -| policy_gradient_loss | 0.000458 | -| std | 0.00839 | -| value_loss | 1.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17810 | -| time_elapsed | 96335 | -| total_timesteps | 2279680 | -| train/ | | -| approx_kl | 0.04220918 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -1.84 | -| learning_rate | 0.0003 | -| loss | 0.00391 | -| n_updates | 178090 | -| policy_gradient_loss | 0.00132 | -| std | 0.00839 | -| value_loss | 2.2e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17811 | -| time_elapsed | 96339 | -| total_timesteps | 2279808 | -| train/ | | -| approx_kl | 0.0054292656 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.000732 | -| n_updates | 178100 | -| policy_gradient_loss | 0.00328 | -| std | 0.00839 | -| value_loss | 1.14e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 17812 | -| time_elapsed | 96344 | -| total_timesteps | 2279936 | -| train/ | | -| approx_kl | 0.0426409 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 178110 | -| policy_gradient_loss | 0.00794 | -| std | 0.00839 | -| value_loss | 9.61e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17813 | -| time_elapsed | 96349 | -| total_timesteps | 2280064 | -| train/ | | -| approx_kl | 0.008023247 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 178120 | -| policy_gradient_loss | 0.000756 | -| std | 0.00839 | -| value_loss | 5.98e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17814 | -| time_elapsed | 96358 | -| total_timesteps | 2280192 | -| train/ | | -| approx_kl | 0.052509338 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 178130 | -| policy_gradient_loss | 0.0211 | -| std | 0.0084 | -| value_loss | 0.00424 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17815 | -| time_elapsed | 96363 | -| total_timesteps | 2280320 | -| train/ | | -| approx_kl | 0.048635103 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 178140 | -| policy_gradient_loss | 0.0447 | -| std | 0.0084 | -| value_loss | 1.86e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17816 | -| time_elapsed | 96368 | -| total_timesteps | 2280448 | -| train/ | | -| approx_kl | 0.00015658652 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00538 | -| learning_rate | 0.0003 | -| loss | -0.000984 | -| n_updates | 178150 | -| policy_gradient_loss | 0.00684 | -| std | 0.0084 | -| value_loss | 3.21e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17817 | -| time_elapsed | 96372 | -| total_timesteps | 2280576 | -| train/ | | -| approx_kl | 0.0047609285 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 178160 | -| policy_gradient_loss | -0.00297 | -| std | 0.0084 | -| value_loss | 1.41e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17818 | -| time_elapsed | 96376 | -| total_timesteps | 2280704 | -| train/ | | -| approx_kl | 0.019922387 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -0.00168 | -| n_updates | 178170 | -| policy_gradient_loss | 0.0211 | -| std | 0.00839 | -| value_loss | 8.19e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17819 | -| time_elapsed | 96380 | -| total_timesteps | 2280832 | -| train/ | | -| approx_kl | 0.12085361 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 178180 | -| policy_gradient_loss | 0.0468 | -| std | 0.00839 | -| value_loss | 7.22e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 17820 | -| time_elapsed | 96384 | -| total_timesteps | 2280960 | -| train/ | | -| approx_kl | 0.13599534 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.0961 | -| n_updates | 178190 | -| policy_gradient_loss | 0.0268 | -| std | 0.00839 | -| value_loss | 5.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17821 | -| time_elapsed | 96390 | -| total_timesteps | 2281088 | -| train/ | | -| approx_kl | 0.109559454 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0735 | -| n_updates | 178200 | -| policy_gradient_loss | 0.0175 | -| std | 0.00839 | -| value_loss | 3.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17822 | -| time_elapsed | 96400 | -| total_timesteps | 2281216 | -| train/ | | -| approx_kl | 0.010307054 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 178210 | -| policy_gradient_loss | -0.0091 | -| std | 0.0084 | -| value_loss | 0.00503 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17823 | -| time_elapsed | 96405 | -| total_timesteps | 2281344 | -| train/ | | -| approx_kl | 0.0066373865 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 178220 | -| policy_gradient_loss | 0.0161 | -| std | 0.0084 | -| value_loss | 3.27e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17824 | -| time_elapsed | 96410 | -| total_timesteps | 2281472 | -| train/ | | -| approx_kl | 0.07006095 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00612 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 178230 | -| policy_gradient_loss | 0.0204 | -| std | 0.0084 | -| value_loss | 1.93e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17825 | -| time_elapsed | 96415 | -| total_timesteps | 2281600 | -| train/ | | -| approx_kl | 6.722752e-06 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | -6.8e-05 | -| n_updates | 178240 | -| policy_gradient_loss | 0.0194 | -| std | 0.0084 | -| value_loss | 1.24e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17826 | -| time_elapsed | 96420 | -| total_timesteps | 2281728 | -| train/ | | -| approx_kl | 0.36451218 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 178250 | -| policy_gradient_loss | 0.0482 | -| std | 0.0084 | -| value_loss | 2.73e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17827 | -| time_elapsed | 96424 | -| total_timesteps | 2281856 | -| train/ | | -| approx_kl | 0.03257724 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | -0.00585 | -| n_updates | 178260 | -| policy_gradient_loss | -0.0024 | -| std | 0.0084 | -| value_loss | 8.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17828 | -| time_elapsed | 96428 | -| total_timesteps | 2281984 | -| train/ | | -| approx_kl | 0.005339101 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.00957 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 178270 | -| policy_gradient_loss | 0.00253 | -| std | 0.0084 | -| value_loss | 1.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17829 | -| time_elapsed | 96433 | -| total_timesteps | 2282112 | -| train/ | | -| approx_kl | 0.02276628 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 178280 | -| policy_gradient_loss | 0.0971 | -| std | 0.0084 | -| value_loss | 5.98e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17830 | -| time_elapsed | 96443 | -| total_timesteps | 2282240 | -| train/ | | -| approx_kl | 0.014180757 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.727 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 178290 | -| policy_gradient_loss | -0.0129 | -| std | 0.00839 | -| value_loss | 0.00637 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17831 | -| time_elapsed | 96448 | -| total_timesteps | 2282368 | -| train/ | | -| approx_kl | 0.018821772 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.00475 | -| n_updates | 178300 | -| policy_gradient_loss | 0.00404 | -| std | 0.00839 | -| value_loss | 2.79e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17832 | -| time_elapsed | 96453 | -| total_timesteps | 2282496 | -| train/ | | -| approx_kl | 0.034408294 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 178310 | -| policy_gradient_loss | -0.00442 | -| std | 0.00839 | -| value_loss | 3.76e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17833 | -| time_elapsed | 96458 | -| total_timesteps | 2282624 | -| train/ | | -| approx_kl | 0.0054764915 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 178320 | -| policy_gradient_loss | 0.00186 | -| std | 0.00839 | -| value_loss | 1.5e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17834 | -| time_elapsed | 96463 | -| total_timesteps | 2282752 | -| train/ | | -| approx_kl | 0.052749205 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | 0.0332 | -| n_updates | 178330 | -| policy_gradient_loss | 0.0128 | -| std | 0.00839 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 17835 | -| time_elapsed | 96468 | -| total_timesteps | 2282880 | -| train/ | | -| approx_kl | 0.008046855 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 178340 | -| policy_gradient_loss | 0.00471 | -| std | 0.00839 | -| value_loss | 7.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17836 | -| time_elapsed | 96473 | -| total_timesteps | 2283008 | -| train/ | | -| approx_kl | 0.040737245 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 178350 | -| policy_gradient_loss | 0.0117 | -| std | 0.00839 | -| value_loss | 5.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17837 | -| time_elapsed | 96483 | -| total_timesteps | 2283136 | -| train/ | | -| approx_kl | 0.04604788 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 178360 | -| policy_gradient_loss | -0.00225 | -| std | 0.00838 | -| value_loss | 0.00285 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17838 | -| time_elapsed | 96486 | -| total_timesteps | 2283264 | -| train/ | | -| approx_kl | 0.0674804 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | 0.142 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 178370 | -| policy_gradient_loss | 0.00998 | -| std | 0.00837 | -| value_loss | 6.56e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17839 | -| time_elapsed | 96490 | -| total_timesteps | 2283392 | -| train/ | | -| approx_kl | 0.066229194 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.36 | -| explained_variance | -0.324 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 178380 | -| policy_gradient_loss | 0.00372 | -| std | 0.00836 | -| value_loss | 2.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17840 | -| time_elapsed | 96496 | -| total_timesteps | 2283520 | -| train/ | | -| approx_kl | 0.006304864 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 178390 | -| policy_gradient_loss | 0.000533 | -| std | 0.00836 | -| value_loss | 9.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17841 | -| time_elapsed | 96502 | -| total_timesteps | 2283648 | -| train/ | | -| approx_kl | 0.045028586 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 178400 | -| policy_gradient_loss | 0.00841 | -| std | 0.00835 | -| value_loss | 5.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17842 | -| time_elapsed | 96506 | -| total_timesteps | 2283776 | -| train/ | | -| approx_kl | 0.057590976 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | 0.00501 | -| n_updates | 178410 | -| policy_gradient_loss | -0.00297 | -| std | 0.00835 | -| value_loss | 4.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17843 | -| time_elapsed | 96511 | -| total_timesteps | 2283904 | -| train/ | | -| approx_kl | 0.023646228 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.000687 | -| n_updates | 178420 | -| policy_gradient_loss | 0.000475 | -| std | 0.00835 | -| value_loss | 3.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17844 | -| time_elapsed | 96516 | -| total_timesteps | 2284032 | -| train/ | | -| approx_kl | 0.005262927 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 178430 | -| policy_gradient_loss | 0.00292 | -| std | 0.00833 | -| value_loss | 3.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17845 | -| time_elapsed | 96523 | -| total_timesteps | 2284160 | -| train/ | | -| approx_kl | 0.066352285 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 178440 | -| policy_gradient_loss | -0.0145 | -| std | 0.0083 | -| value_loss | 0.00169 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17846 | -| time_elapsed | 96528 | -| total_timesteps | 2284288 | -| train/ | | -| approx_kl | 0.443574 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.0892 | -| n_updates | 178450 | -| policy_gradient_loss | 0.0261 | -| std | 0.0083 | -| value_loss | 2.14e-06 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17847 | -| time_elapsed | 96531 | -| total_timesteps | 2284416 | -| train/ | | -| approx_kl | 4.610652e-05 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00245 | -| learning_rate | 0.0003 | -| loss | 0.000468 | -| n_updates | 178460 | -| policy_gradient_loss | 0.00173 | -| std | 0.00829 | -| value_loss | 7.28e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17848 | -| time_elapsed | 96537 | -| total_timesteps | 2284544 | -| train/ | | -| approx_kl | 0.008063684 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.000266 | -| n_updates | 178470 | -| policy_gradient_loss | 0.00315 | -| std | 0.0083 | -| value_loss | 4.7e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17849 | -| time_elapsed | 96542 | -| total_timesteps | 2284672 | -| train/ | | -| approx_kl | 0.00026045786 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0841 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 178480 | -| policy_gradient_loss | 0.00433 | -| std | 0.00829 | -| value_loss | 3.61e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17850 | -| time_elapsed | 96548 | -| total_timesteps | 2284800 | -| train/ | | -| approx_kl | 0.00750352 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 178490 | -| policy_gradient_loss | 6.23e-05 | -| std | 0.00828 | -| value_loss | 1.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 17851 | -| time_elapsed | 96553 | -| total_timesteps | 2284928 | -| train/ | | -| approx_kl | 0.024395196 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 178500 | -| policy_gradient_loss | 0.0313 | -| std | 0.00827 | -| value_loss | 2.31e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17852 | -| time_elapsed | 96559 | -| total_timesteps | 2285056 | -| train/ | | -| approx_kl | 0.04152636 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.18 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 178510 | -| policy_gradient_loss | 0.0177 | -| std | 0.00826 | -| value_loss | 9.73e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17853 | -| time_elapsed | 96568 | -| total_timesteps | 2285184 | -| train/ | | -| approx_kl | 0.0055759586 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 178520 | -| policy_gradient_loss | 0.00161 | -| std | 0.00826 | -| value_loss | 0.00353 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17854 | -| time_elapsed | 96572 | -| total_timesteps | 2285312 | -| train/ | | -| approx_kl | 0.006453974 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 178530 | -| policy_gradient_loss | 0.02 | -| std | 0.00826 | -| value_loss | 9.54e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17855 | -| time_elapsed | 96578 | -| total_timesteps | 2285440 | -| train/ | | -| approx_kl | 0.1253904 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.001 | -| learning_rate | 0.0003 | -| loss | 0.0545 | -| n_updates | 178540 | -| policy_gradient_loss | 0.0091 | -| std | 0.00826 | -| value_loss | 6.67e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17856 | -| time_elapsed | 96583 | -| total_timesteps | 2285568 | -| train/ | | -| approx_kl | 0.082586475 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 178550 | -| policy_gradient_loss | 0.0104 | -| std | 0.00826 | -| value_loss | 2.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17857 | -| time_elapsed | 96588 | -| total_timesteps | 2285696 | -| train/ | | -| approx_kl | 0.029970862 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | 0.000613 | -| n_updates | 178560 | -| policy_gradient_loss | 0.0152 | -| std | 0.00826 | -| value_loss | 3.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17858 | -| time_elapsed | 96593 | -| total_timesteps | 2285824 | -| train/ | | -| approx_kl | 0.018226918 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.000167 | -| n_updates | 178570 | -| policy_gradient_loss | 0.0156 | -| std | 0.00826 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 17859 | -| time_elapsed | 96597 | -| total_timesteps | 2285952 | -| train/ | | -| approx_kl | 0.0028027068 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 178580 | -| policy_gradient_loss | 0.00368 | -| std | 0.00826 | -| value_loss | 1.05e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17860 | -| time_elapsed | 96601 | -| total_timesteps | 2286080 | -| train/ | | -| approx_kl | 0.0028242958 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.000242 | -| n_updates | 178590 | -| policy_gradient_loss | 0.016 | -| std | 0.00825 | -| value_loss | 4.13e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17861 | -| time_elapsed | 96610 | -| total_timesteps | 2286208 | -| train/ | | -| approx_kl | 0.04678069 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 178600 | -| policy_gradient_loss | -0.0125 | -| std | 0.00824 | -| value_loss | 0.00147 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17862 | -| time_elapsed | 96616 | -| total_timesteps | 2286336 | -| train/ | | -| approx_kl | 0.013042608 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00997 | -| n_updates | 178610 | -| policy_gradient_loss | 0.00293 | -| std | 0.00824 | -| value_loss | 9.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17863 | -| time_elapsed | 96621 | -| total_timesteps | 2286464 | -| train/ | | -| approx_kl | 0.048684213 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 178620 | -| policy_gradient_loss | 0.0581 | -| std | 0.00823 | -| value_loss | 3.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17864 | -| time_elapsed | 96627 | -| total_timesteps | 2286592 | -| train/ | | -| approx_kl | 0.09442718 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 178630 | -| policy_gradient_loss | 0.0911 | -| std | 0.00823 | -| value_loss | 3.15e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17865 | -| time_elapsed | 96632 | -| total_timesteps | 2286720 | -| train/ | | -| approx_kl | 0.06769976 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.0506 | -| n_updates | 178640 | -| policy_gradient_loss | 0.0848 | -| std | 0.00823 | -| value_loss | 2.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17866 | -| time_elapsed | 96636 | -| total_timesteps | 2286848 | -| train/ | | -| approx_kl | 0.068777844 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.0859 | -| n_updates | 178650 | -| policy_gradient_loss | 0.0716 | -| std | 0.00824 | -| value_loss | 2.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 17867 | -| time_elapsed | 96641 | -| total_timesteps | 2286976 | -| train/ | | -| approx_kl | 0.019753564 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.00311 | -| n_updates | 178660 | -| policy_gradient_loss | 0.0195 | -| std | 0.00824 | -| value_loss | 1.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17868 | -| time_elapsed | 96647 | -| total_timesteps | 2287104 | -| train/ | | -| approx_kl | 0.13994962 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 178670 | -| policy_gradient_loss | 0.0142 | -| std | 0.00824 | -| value_loss | 9.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17869 | -| time_elapsed | 96660 | -| total_timesteps | 2287232 | -| train/ | | -| approx_kl | 0.046073318 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -8.2 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 178680 | -| policy_gradient_loss | -0.0104 | -| std | 0.00823 | -| value_loss | 0.00387 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17870 | -| time_elapsed | 96666 | -| total_timesteps | 2287360 | -| train/ | | -| approx_kl | 0.12515709 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | 0.0556 | -| n_updates | 178690 | -| policy_gradient_loss | 0.0307 | -| std | 0.00823 | -| value_loss | 9.27e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17871 | -| time_elapsed | 96670 | -| total_timesteps | 2287488 | -| train/ | | -| approx_kl | 0.0020088255 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00303 | -| learning_rate | 0.0003 | -| loss | -1.94e-06 | -| n_updates | 178700 | -| policy_gradient_loss | 0.00973 | -| std | 0.00825 | -| value_loss | 2.48e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17872 | -| time_elapsed | 96676 | -| total_timesteps | 2287616 | -| train/ | | -| approx_kl | 0.012075316 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00558 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 178710 | -| policy_gradient_loss | 0.0603 | -| std | 0.00826 | -| value_loss | 0.000112 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17873 | -| time_elapsed | 96682 | -| total_timesteps | 2287744 | -| train/ | | -| approx_kl | 0.008931122 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.16 | -| learning_rate | 0.0003 | -| loss | -0.000305 | -| n_updates | 178720 | -| policy_gradient_loss | 0.0181 | -| std | 0.00826 | -| value_loss | 4.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 17874 | -| time_elapsed | 96688 | -| total_timesteps | 2287872 | -| train/ | | -| approx_kl | 0.10355905 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0042 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 178730 | -| policy_gradient_loss | 0.0103 | -| std | 0.00826 | -| value_loss | 7.81e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17875 | -| time_elapsed | 96693 | -| total_timesteps | 2288000 | -| train/ | | -| approx_kl | 0.07642997 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0457 | -| n_updates | 178740 | -| policy_gradient_loss | 0.0257 | -| std | 0.00826 | -| value_loss | 1.59e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17876 | -| time_elapsed | 96698 | -| total_timesteps | 2288128 | -| train/ | | -| approx_kl | 0.033093184 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00567 | -| learning_rate | 0.0003 | -| loss | 0.00984 | -| n_updates | 178750 | -| policy_gradient_loss | 0.0222 | -| std | 0.00826 | -| value_loss | 7.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17877 | -| time_elapsed | 96709 | -| total_timesteps | 2288256 | -| train/ | | -| approx_kl | 0.037305187 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.786 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 178760 | -| policy_gradient_loss | 0.00189 | -| std | 0.00826 | -| value_loss | 0.00488 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17878 | -| time_elapsed | 96713 | -| total_timesteps | 2288384 | -| train/ | | -| approx_kl | 0.0915875 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 178770 | -| policy_gradient_loss | 0.0171 | -| std | 0.00826 | -| value_loss | 4.19e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17879 | -| time_elapsed | 96716 | -| total_timesteps | 2288512 | -| train/ | | -| approx_kl | 0.12046279 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00688 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 178780 | -| policy_gradient_loss | 0.0153 | -| std | 0.00826 | -| value_loss | 6.39e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17880 | -| time_elapsed | 96719 | -| total_timesteps | 2288640 | -| train/ | | -| approx_kl | 0.021881966 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 178790 | -| policy_gradient_loss | -0.00166 | -| std | 0.00825 | -| value_loss | 2.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17881 | -| time_elapsed | 96724 | -| total_timesteps | 2288768 | -| train/ | | -| approx_kl | 0.010028379 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 178800 | -| policy_gradient_loss | 0.00168 | -| std | 0.00825 | -| value_loss | 3.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 17882 | -| time_elapsed | 96729 | -| total_timesteps | 2288896 | -| train/ | | -| approx_kl | 0.07786855 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 178810 | -| policy_gradient_loss | -0.0146 | -| std | 0.00824 | -| value_loss | 1.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17883 | -| time_elapsed | 96733 | -| total_timesteps | 2289024 | -| train/ | | -| approx_kl | 0.014438307 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 178820 | -| policy_gradient_loss | -0.000905 | -| std | 0.00824 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17884 | -| time_elapsed | 96744 | -| total_timesteps | 2289152 | -| train/ | | -| approx_kl | 0.018368669 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 178830 | -| policy_gradient_loss | -0.00907 | -| std | 0.00824 | -| value_loss | 0.000183 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17885 | -| time_elapsed | 96749 | -| total_timesteps | 2289280 | -| train/ | | -| approx_kl | 0.023378443 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00794 | -| n_updates | 178840 | -| policy_gradient_loss | -0.00283 | -| std | 0.00824 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17886 | -| time_elapsed | 96755 | -| total_timesteps | 2289408 | -| train/ | | -| approx_kl | 0.0058590733 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 178850 | -| policy_gradient_loss | 0.00698 | -| std | 0.00824 | -| value_loss | 4.67e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17887 | -| time_elapsed | 96761 | -| total_timesteps | 2289536 | -| train/ | | -| approx_kl | 0.043503273 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 178860 | -| policy_gradient_loss | 0.00782 | -| std | 0.00824 | -| value_loss | 3.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17888 | -| time_elapsed | 96767 | -| total_timesteps | 2289664 | -| train/ | | -| approx_kl | 0.08570629 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 178870 | -| policy_gradient_loss | 0.0526 | -| std | 0.00823 | -| value_loss | 2.18e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17889 | -| time_elapsed | 96773 | -| total_timesteps | 2289792 | -| train/ | | -| approx_kl | 0.0033658398 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | 0.00766 | -| n_updates | 178880 | -| policy_gradient_loss | 0.0023 | -| std | 0.00823 | -| value_loss | 1.39e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 17890 | -| time_elapsed | 96779 | -| total_timesteps | 2289920 | -| train/ | | -| approx_kl | 0.021420278 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | -0.00779 | -| n_updates | 178890 | -| policy_gradient_loss | 0.0255 | -| std | 0.00823 | -| value_loss | 1.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17891 | -| time_elapsed | 96783 | -| total_timesteps | 2290048 | -| train/ | | -| approx_kl | 0.46106568 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.204 | -| n_updates | 178900 | -| policy_gradient_loss | 0.122 | -| std | 0.00823 | -| value_loss | 6.97e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17892 | -| time_elapsed | 96792 | -| total_timesteps | 2290176 | -| train/ | | -| approx_kl | 0.10023991 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.812 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 178910 | -| policy_gradient_loss | 0.00325 | -| std | 0.00823 | -| value_loss | 0.004 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17893 | -| time_elapsed | 96796 | -| total_timesteps | 2290304 | -| train/ | | -| approx_kl | 0.09174179 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 178920 | -| policy_gradient_loss | 0.0189 | -| std | 0.00823 | -| value_loss | 5.27e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17894 | -| time_elapsed | 96801 | -| total_timesteps | 2290432 | -| train/ | | -| approx_kl | 0.0065970304 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | 0.000827 | -| n_updates | 178930 | -| policy_gradient_loss | 0.000453 | -| std | 0.00821 | -| value_loss | 9.57e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17895 | -| time_elapsed | 96806 | -| total_timesteps | 2290560 | -| train/ | | -| approx_kl | 0.00745038 | -| clip_fraction | 0.0578 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 178940 | -| policy_gradient_loss | -0.00609 | -| std | 0.00819 | -| value_loss | 2.95e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17896 | -| time_elapsed | 96812 | -| total_timesteps | 2290688 | -| train/ | | -| approx_kl | 0.006558999 | -| clip_fraction | 0.0273 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00295 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 178950 | -| policy_gradient_loss | -0.000633 | -| std | 0.00818 | -| value_loss | 6.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17897 | -| time_elapsed | 96816 | -| total_timesteps | 2290816 | -| train/ | | -| approx_kl | 0.019436441 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0722 | -| learning_rate | 0.0003 | -| loss | -0.0318 | -| n_updates | 178960 | -| policy_gradient_loss | 0.000824 | -| std | 0.00818 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 17898 | -| time_elapsed | 96821 | -| total_timesteps | 2290944 | -| train/ | | -| approx_kl | 0.062246945 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 178970 | -| policy_gradient_loss | 0.0174 | -| std | 0.00818 | -| value_loss | 2.6e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17899 | -| time_elapsed | 96825 | -| total_timesteps | 2291072 | -| train/ | | -| approx_kl | 0.00013077026 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | -0.000897 | -| n_updates | 178980 | -| policy_gradient_loss | 0.0174 | -| std | 0.00818 | -| value_loss | 1.71e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17900 | -| time_elapsed | 96835 | -| total_timesteps | 2291200 | -| train/ | | -| approx_kl | 0.27866048 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.599 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 178990 | -| policy_gradient_loss | -0.0084 | -| std | 0.00819 | -| value_loss | 0.00104 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17901 | -| time_elapsed | 96840 | -| total_timesteps | 2291328 | -| train/ | | -| approx_kl | 0.034555092 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -250 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 179000 | -| policy_gradient_loss | -0.00679 | -| std | 0.00819 | -| value_loss | 4.47e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17902 | -| time_elapsed | 96845 | -| total_timesteps | 2291456 | -| train/ | | -| approx_kl | 0.030834585 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -77.5 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 179010 | -| policy_gradient_loss | -0.0147 | -| std | 0.00818 | -| value_loss | 2.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17903 | -| time_elapsed | 96851 | -| total_timesteps | 2291584 | -| train/ | | -| approx_kl | 0.025528187 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0771 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 179020 | -| policy_gradient_loss | -0.00725 | -| std | 0.00818 | -| value_loss | 8.91e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17904 | -| time_elapsed | 96856 | -| total_timesteps | 2291712 | -| train/ | | -| approx_kl | 0.15212362 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00533 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 179030 | -| policy_gradient_loss | 0.0119 | -| std | 0.00818 | -| value_loss | 8.69e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17905 | -| time_elapsed | 96859 | -| total_timesteps | 2291840 | -| train/ | | -| approx_kl | 0.072291195 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 179040 | -| policy_gradient_loss | 0.0257 | -| std | 0.00818 | -| value_loss | 1.84e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 17906 | -| time_elapsed | 96864 | -| total_timesteps | 2291968 | -| train/ | | -| approx_kl | 0.20267294 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 179050 | -| policy_gradient_loss | 0.0906 | -| std | 0.00818 | -| value_loss | 1.32e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17907 | -| time_elapsed | 96869 | -| total_timesteps | 2292096 | -| train/ | | -| approx_kl | 0.15747789 | -| clip_fraction | 0.624 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.0847 | -| n_updates | 179060 | -| policy_gradient_loss | 0.0947 | -| std | 0.00818 | -| value_loss | 9.44e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17908 | -| time_elapsed | 96878 | -| total_timesteps | 2292224 | -| train/ | | -| approx_kl | 0.017383447 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.796 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 179070 | -| policy_gradient_loss | 0.00355 | -| std | 0.00818 | -| value_loss | 0.00454 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17909 | -| time_elapsed | 96883 | -| total_timesteps | 2292352 | -| train/ | | -| approx_kl | 0.07148385 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0995 | -| learning_rate | 0.0003 | -| loss | 0.0625 | -| n_updates | 179080 | -| policy_gradient_loss | 0.044 | -| std | 0.00818 | -| value_loss | 1.56e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17910 | -| time_elapsed | 96886 | -| total_timesteps | 2292480 | -| train/ | | -| approx_kl | 0.27152982 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 179090 | -| policy_gradient_loss | -0.00491 | -| std | 0.00818 | -| value_loss | 3.6e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17911 | -| time_elapsed | 96890 | -| total_timesteps | 2292608 | -| train/ | | -| approx_kl | 0.032085694 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 179100 | -| policy_gradient_loss | 0.00535 | -| std | 0.00818 | -| value_loss | 3.66e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17912 | -| time_elapsed | 96896 | -| total_timesteps | 2292736 | -| train/ | | -| approx_kl | 0.12365168 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 179110 | -| policy_gradient_loss | 0.00887 | -| std | 0.00819 | -| value_loss | 7.9e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17913 | -| time_elapsed | 96900 | -| total_timesteps | 2292864 | -| train/ | | -| approx_kl | 0.009173103 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00494 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 179120 | -| policy_gradient_loss | 0.0135 | -| std | 0.00819 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 17914 | -| time_elapsed | 96905 | -| total_timesteps | 2292992 | -| train/ | | -| approx_kl | 0.052814804 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0044 | -| n_updates | 179130 | -| policy_gradient_loss | 0.0067 | -| std | 0.00819 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17915 | -| time_elapsed | 96909 | -| total_timesteps | 2293120 | -| train/ | | -| approx_kl | 0.0035003494 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.00453 | -| n_updates | 179140 | -| policy_gradient_loss | 0.00501 | -| std | 0.00818 | -| value_loss | 7.35e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17916 | -| time_elapsed | 96920 | -| total_timesteps | 2293248 | -| train/ | | -| approx_kl | 0.30706123 | -| clip_fraction | 0.65 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.286 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 179150 | -| policy_gradient_loss | 0.0231 | -| std | 0.00818 | -| value_loss | 0.00151 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17917 | -| time_elapsed | 96926 | -| total_timesteps | 2293376 | -| train/ | | -| approx_kl | 0.07283595 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 179160 | -| policy_gradient_loss | 0.0038 | -| std | 0.00818 | -| value_loss | 1.78e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17918 | -| time_elapsed | 96930 | -| total_timesteps | 2293504 | -| train/ | | -| approx_kl | 0.02261321 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -31.5 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 179170 | -| policy_gradient_loss | -0.0102 | -| std | 0.00818 | -| value_loss | 7.81e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17919 | -| time_elapsed | 96935 | -| total_timesteps | 2293632 | -| train/ | | -| approx_kl | 0.12870674 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -13.9 | -| learning_rate | 0.0003 | -| loss | 0.0693 | -| n_updates | 179180 | -| policy_gradient_loss | 0.0235 | -| std | 0.00818 | -| value_loss | 2.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17920 | -| time_elapsed | 96939 | -| total_timesteps | 2293760 | -| train/ | | -| approx_kl | 0.034329962 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -5.37e-05 | -| n_updates | 179190 | -| policy_gradient_loss | 0.037 | -| std | 0.00818 | -| value_loss | 1.89e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 17921 | -| time_elapsed | 96943 | -| total_timesteps | 2293888 | -| train/ | | -| approx_kl | 0.014412725 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -5.1 | -| learning_rate | 0.0003 | -| loss | -0.0083 | -| n_updates | 179200 | -| policy_gradient_loss | -0.000872 | -| std | 0.00818 | -| value_loss | 2.45e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17922 | -| time_elapsed | 96947 | -| total_timesteps | 2294016 | -| train/ | | -| approx_kl | 0.008174419 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 179210 | -| policy_gradient_loss | 0.00916 | -| std | 0.0082 | -| value_loss | 2.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17923 | -| time_elapsed | 96960 | -| total_timesteps | 2294144 | -| train/ | | -| approx_kl | 0.013328019 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0297 | -| n_updates | 179220 | -| policy_gradient_loss | 0.00359 | -| std | 0.00822 | -| value_loss | 0.000313 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17924 | -| time_elapsed | 96964 | -| total_timesteps | 2294272 | -| train/ | | -| approx_kl | 8.3145685e-05 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.379 | -| learning_rate | 0.0003 | -| loss | 0.000471 | -| n_updates | 179230 | -| policy_gradient_loss | 0.0175 | -| std | 0.00823 | -| value_loss | 8.82e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17925 | -| time_elapsed | 96969 | -| total_timesteps | 2294400 | -| train/ | | -| approx_kl | 0.12669273 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 179240 | -| policy_gradient_loss | 0.0131 | -| std | 0.00823 | -| value_loss | 4.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17926 | -| time_elapsed | 96974 | -| total_timesteps | 2294528 | -| train/ | | -| approx_kl | 0.011522267 | -| clip_fraction | 0.0852 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.578 | -| learning_rate | 0.0003 | -| loss | -0.00643 | -| n_updates | 179250 | -| policy_gradient_loss | -0.00371 | -| std | 0.00823 | -| value_loss | 1.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17927 | -| time_elapsed | 96979 | -| total_timesteps | 2294656 | -| train/ | | -| approx_kl | 0.008102097 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0947 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 179260 | -| policy_gradient_loss | -0.00108 | -| std | 0.00822 | -| value_loss | 8.5e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17928 | -| time_elapsed | 96983 | -| total_timesteps | 2294784 | -| train/ | | -| approx_kl | 0.0066857054 | -| clip_fraction | 0.0391 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | -0.00195 | -| n_updates | 179270 | -| policy_gradient_loss | -0.000986 | -| std | 0.00821 | -| value_loss | 4.91e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 17929 | -| time_elapsed | 96987 | -| total_timesteps | 2294912 | -| train/ | | -| approx_kl | 0.016606007 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 179280 | -| policy_gradient_loss | 0.0147 | -| std | 0.00821 | -| value_loss | 2.91e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17930 | -| time_elapsed | 96991 | -| total_timesteps | 2295040 | -| train/ | | -| approx_kl | 0.07536861 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 179290 | -| policy_gradient_loss | 0.0201 | -| std | 0.0082 | -| value_loss | 1.83e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17931 | -| time_elapsed | 97000 | -| total_timesteps | 2295168 | -| train/ | | -| approx_kl | 0.012412107 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 179300 | -| policy_gradient_loss | -0.0171 | -| std | 0.00819 | -| value_loss | 0.00258 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17932 | -| time_elapsed | 97006 | -| total_timesteps | 2295296 | -| train/ | | -| approx_kl | 0.0045643514 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 179310 | -| policy_gradient_loss | 0.00547 | -| std | 0.00819 | -| value_loss | 7.57e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17933 | -| time_elapsed | 97011 | -| total_timesteps | 2295424 | -| train/ | | -| approx_kl | 0.00010940572 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | 0.000923 | -| n_updates | 179320 | -| policy_gradient_loss | 0.00139 | -| std | 0.00819 | -| value_loss | 5.79e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17934 | -| time_elapsed | 97016 | -| total_timesteps | 2295552 | -| train/ | | -| approx_kl | 0.034770336 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 179330 | -| policy_gradient_loss | 0.0406 | -| std | 0.0082 | -| value_loss | 3.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17935 | -| time_elapsed | 97020 | -| total_timesteps | 2295680 | -| train/ | | -| approx_kl | 0.015226893 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0661 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 179340 | -| policy_gradient_loss | 0.00636 | -| std | 0.0082 | -| value_loss | 2.83e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17936 | -| time_elapsed | 97025 | -| total_timesteps | 2295808 | -| train/ | | -| approx_kl | 0.12316301 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0721 | -| n_updates | 179350 | -| policy_gradient_loss | 0.0117 | -| std | 0.00819 | -| value_loss | 1.69e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 17937 | -| time_elapsed | 97027 | -| total_timesteps | 2295936 | -| train/ | | -| approx_kl | 0.002530049 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.000418 | -| n_updates | 179360 | -| policy_gradient_loss | 0.0149 | -| std | 0.00819 | -| value_loss | 2.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17938 | -| time_elapsed | 97032 | -| total_timesteps | 2296064 | -| train/ | | -| approx_kl | 0.09238914 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 179370 | -| policy_gradient_loss | 0.0316 | -| std | 0.00819 | -| value_loss | 1.29e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17939 | -| time_elapsed | 97040 | -| total_timesteps | 2296192 | -| train/ | | -| approx_kl | 0.005901308 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -5.67 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 179380 | -| policy_gradient_loss | -0.0138 | -| std | 0.0082 | -| value_loss | 0.00335 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17940 | -| time_elapsed | 97044 | -| total_timesteps | 2296320 | -| train/ | | -| approx_kl | 0.03538397 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00888 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 179390 | -| policy_gradient_loss | 0.0496 | -| std | 0.00821 | -| value_loss | 1.28e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17941 | -| time_elapsed | 97050 | -| total_timesteps | 2296448 | -| train/ | | -| approx_kl | 0.0034074504 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 179400 | -| policy_gradient_loss | 0.0196 | -| std | 0.00821 | -| value_loss | 2.95e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17942 | -| time_elapsed | 97056 | -| total_timesteps | 2296576 | -| train/ | | -| approx_kl | 0.4605463 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | 0.0734 | -| n_updates | 179410 | -| policy_gradient_loss | 0.0286 | -| std | 0.00821 | -| value_loss | 4.59e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17943 | -| time_elapsed | 97060 | -| total_timesteps | 2296704 | -| train/ | | -| approx_kl | 0.06586717 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 179420 | -| policy_gradient_loss | -0.00687 | -| std | 0.00821 | -| value_loss | 1.55e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17944 | -| time_elapsed | 97064 | -| total_timesteps | 2296832 | -| train/ | | -| approx_kl | 0.020718314 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | 0.00331 | -| n_updates | 179430 | -| policy_gradient_loss | 0.0042 | -| std | 0.00821 | -| value_loss | 1.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 17945 | -| time_elapsed | 97069 | -| total_timesteps | 2296960 | -| train/ | | -| approx_kl | 0.03717352 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.00137 | -| n_updates | 179440 | -| policy_gradient_loss | 0.00167 | -| std | 0.00821 | -| value_loss | 8.46e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17946 | -| time_elapsed | 97074 | -| total_timesteps | 2297088 | -| train/ | | -| approx_kl | 0.061805684 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 179450 | -| policy_gradient_loss | 0.00665 | -| std | 0.00821 | -| value_loss | 6.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17947 | -| time_elapsed | 97082 | -| total_timesteps | 2297216 | -| train/ | | -| approx_kl | 0.013254255 | -| clip_fraction | 0.568 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 179460 | -| policy_gradient_loss | 0.0295 | -| std | 0.00821 | -| value_loss | 0.000238 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17948 | -| time_elapsed | 97088 | -| total_timesteps | 2297344 | -| train/ | | -| approx_kl | 0.10449384 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 179470 | -| policy_gradient_loss | 0.0144 | -| std | 0.00821 | -| value_loss | 1.79e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17949 | -| time_elapsed | 97094 | -| total_timesteps | 2297472 | -| train/ | | -| approx_kl | 0.4756089 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 179480 | -| policy_gradient_loss | 0.043 | -| std | 0.00821 | -| value_loss | 5.4e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17950 | -| time_elapsed | 97099 | -| total_timesteps | 2297600 | -| train/ | | -| approx_kl | 0.030005377 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 179490 | -| policy_gradient_loss | 0.00909 | -| std | 0.00821 | -| value_loss | 4.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17951 | -| time_elapsed | 97104 | -| total_timesteps | 2297728 | -| train/ | | -| approx_kl | 0.13401179 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.0826 | -| n_updates | 179500 | -| policy_gradient_loss | 0.0237 | -| std | 0.00825 | -| value_loss | 2.7e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17952 | -| time_elapsed | 97109 | -| total_timesteps | 2297856 | -| train/ | | -| approx_kl | 0.007450999 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 179510 | -| policy_gradient_loss | 0.000946 | -| std | 0.00825 | -| value_loss | 1.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 17953 | -| time_elapsed | 97113 | -| total_timesteps | 2297984 | -| train/ | | -| approx_kl | 0.017281555 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 179520 | -| policy_gradient_loss | 0.0148 | -| std | 0.00824 | -| value_loss | 1.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17954 | -| time_elapsed | 97117 | -| total_timesteps | 2298112 | -| train/ | | -| approx_kl | 0.16275243 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0913 | -| n_updates | 179530 | -| policy_gradient_loss | 0.093 | -| std | 0.00824 | -| value_loss | 7.23e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17955 | -| time_elapsed | 97129 | -| total_timesteps | 2298240 | -| train/ | | -| approx_kl | 0.0011876244 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 179540 | -| policy_gradient_loss | 0.00119 | -| std | 0.00824 | -| value_loss | 0.00181 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17956 | -| time_elapsed | 97133 | -| total_timesteps | 2298368 | -| train/ | | -| approx_kl | 0.009820439 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 179550 | -| policy_gradient_loss | -0.00244 | -| std | 0.00824 | -| value_loss | 1.01e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17957 | -| time_elapsed | 97139 | -| total_timesteps | 2298496 | -| train/ | | -| approx_kl | 0.0432391 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 179560 | -| policy_gradient_loss | -0.0106 | -| std | 0.00823 | -| value_loss | 8.37e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17958 | -| time_elapsed | 97143 | -| total_timesteps | 2298624 | -| train/ | | -| approx_kl | 0.033534802 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 179570 | -| policy_gradient_loss | 0.00852 | -| std | 0.00823 | -| value_loss | 6.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17959 | -| time_elapsed | 97148 | -| total_timesteps | 2298752 | -| train/ | | -| approx_kl | 0.028398775 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 179580 | -| policy_gradient_loss | 0.00619 | -| std | 0.00823 | -| value_loss | 4.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 17960 | -| time_elapsed | 97153 | -| total_timesteps | 2298880 | -| train/ | | -| approx_kl | 0.025838438 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.00804 | -| n_updates | 179590 | -| policy_gradient_loss | 0.0039 | -| std | 0.00823 | -| value_loss | 2.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17961 | -| time_elapsed | 97159 | -| total_timesteps | 2299008 | -| train/ | | -| approx_kl | 0.030110799 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 179600 | -| policy_gradient_loss | 0.00817 | -| std | 0.00823 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17962 | -| time_elapsed | 97172 | -| total_timesteps | 2299136 | -| train/ | | -| approx_kl | 0.09625937 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.16 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 179610 | -| policy_gradient_loss | -0.00925 | -| std | 0.00823 | -| value_loss | 0.00255 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17963 | -| time_elapsed | 97177 | -| total_timesteps | 2299264 | -| train/ | | -| approx_kl | 0.029208308 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.677 | -| learning_rate | 0.0003 | -| loss | 0.0061 | -| n_updates | 179620 | -| policy_gradient_loss | 0.00823 | -| std | 0.00824 | -| value_loss | 2.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17964 | -| time_elapsed | 97182 | -| total_timesteps | 2299392 | -| train/ | | -| approx_kl | 0.09057071 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -4.69 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 179630 | -| policy_gradient_loss | 0.0203 | -| std | 0.00824 | -| value_loss | 8.54e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17965 | -| time_elapsed | 97187 | -| total_timesteps | 2299520 | -| train/ | | -| approx_kl | 0.20734677 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 179640 | -| policy_gradient_loss | 0.0749 | -| std | 0.00824 | -| value_loss | 3e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17966 | -| time_elapsed | 97193 | -| total_timesteps | 2299648 | -| train/ | | -| approx_kl | 0.044236183 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.339 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 179650 | -| policy_gradient_loss | 0.0181 | -| std | 0.00824 | -| value_loss | 1.49e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17967 | -| time_elapsed | 97198 | -| total_timesteps | 2299776 | -| train/ | | -| approx_kl | 0.50249076 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 179660 | -| policy_gradient_loss | 0.0512 | -| std | 0.00824 | -| value_loss | 1.13e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17968 | -| time_elapsed | 97203 | -| total_timesteps | 2299904 | -| train/ | | -| approx_kl | 0.018196195 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0906 | -| learning_rate | 0.0003 | -| loss | 0.00687 | -| n_updates | 179670 | -| policy_gradient_loss | 0.00444 | -| std | 0.00823 | -| value_loss | 9e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17969 | -| time_elapsed | 97208 | -| total_timesteps | 2300032 | -| train/ | | -| approx_kl | 0.006881802 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | -0.00911 | -| n_updates | 179680 | -| policy_gradient_loss | 0.00114 | -| std | 0.00823 | -| value_loss | 2.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17970 | -| time_elapsed | 97219 | -| total_timesteps | 2300160 | -| train/ | | -| approx_kl | 0.07475991 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 179690 | -| policy_gradient_loss | -0.00695 | -| std | 0.00823 | -| value_loss | 0.00193 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17971 | -| time_elapsed | 97224 | -| total_timesteps | 2300288 | -| train/ | | -| approx_kl | 0.13822897 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.205 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 179700 | -| policy_gradient_loss | 0.0234 | -| std | 0.00823 | -| value_loss | 2.58e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17972 | -| time_elapsed | 97229 | -| total_timesteps | 2300416 | -| train/ | | -| approx_kl | 0.027780341 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00625 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 179710 | -| policy_gradient_loss | 0.0448 | -| std | 0.00824 | -| value_loss | 3.85e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17973 | -| time_elapsed | 97235 | -| total_timesteps | 2300544 | -| train/ | | -| approx_kl | 0.04221563 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 179720 | -| policy_gradient_loss | 0.0133 | -| std | 0.00822 | -| value_loss | 2.11e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17974 | -| time_elapsed | 97240 | -| total_timesteps | 2300672 | -| train/ | | -| approx_kl | 0.23742396 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | 0.216 | -| n_updates | 179730 | -| policy_gradient_loss | 0.0668 | -| std | 0.00822 | -| value_loss | 6.77e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17975 | -| time_elapsed | 97246 | -| total_timesteps | 2300800 | -| train/ | | -| approx_kl | 0.031023916 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00264 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 179740 | -| policy_gradient_loss | 0.0511 | -| std | 0.00821 | -| value_loss | 1.8e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 17976 | -| time_elapsed | 97249 | -| total_timesteps | 2300928 | -| train/ | | -| approx_kl | 0.17534724 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.0918 | -| n_updates | 179750 | -| policy_gradient_loss | 0.0335 | -| std | 0.00821 | -| value_loss | 1.12e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17977 | -| time_elapsed | 97253 | -| total_timesteps | 2301056 | -| train/ | | -| approx_kl | 0.032280575 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 179760 | -| policy_gradient_loss | 0.0363 | -| std | 0.00822 | -| value_loss | 9.33e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17978 | -| time_elapsed | 97261 | -| total_timesteps | 2301184 | -| train/ | | -| approx_kl | 0.12768345 | -| clip_fraction | 0.582 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.666 | -| learning_rate | 0.0003 | -| loss | 0.00715 | -| n_updates | 179770 | -| policy_gradient_loss | 0.00153 | -| std | 0.00822 | -| value_loss | 0.000694 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17979 | -| time_elapsed | 97267 | -| total_timesteps | 2301312 | -| train/ | | -| approx_kl | 0.09023143 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.0732 | -| n_updates | 179780 | -| policy_gradient_loss | 0.0874 | -| std | 0.00822 | -| value_loss | 7.22e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17980 | -| time_elapsed | 97271 | -| total_timesteps | 2301440 | -| train/ | | -| approx_kl | 0.01568314 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00175 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 179790 | -| policy_gradient_loss | 0.021 | -| std | 0.00822 | -| value_loss | 1.55e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17981 | -| time_elapsed | 97275 | -| total_timesteps | 2301568 | -| train/ | | -| approx_kl | 0.36193433 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 179800 | -| policy_gradient_loss | 0.0408 | -| std | 0.00822 | -| value_loss | 1.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17982 | -| time_elapsed | 97280 | -| total_timesteps | 2301696 | -| train/ | | -| approx_kl | 0.027947169 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.00431 | -| n_updates | 179810 | -| policy_gradient_loss | 0.00255 | -| std | 0.00822 | -| value_loss | 7.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17983 | -| time_elapsed | 97285 | -| total_timesteps | 2301824 | -| train/ | | -| approx_kl | 0.031375457 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 179820 | -| policy_gradient_loss | 0.00772 | -| std | 0.00822 | -| value_loss | 4.64e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 17984 | -| time_elapsed | 97289 | -| total_timesteps | 2301952 | -| train/ | | -| approx_kl | 0.0053187083 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.000951 | -| n_updates | 179830 | -| policy_gradient_loss | 0.00322 | -| std | 0.00823 | -| value_loss | 5.71e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17985 | -| time_elapsed | 97294 | -| total_timesteps | 2302080 | -| train/ | | -| approx_kl | 0.05152985 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 179840 | -| policy_gradient_loss | 0.00845 | -| std | 0.00824 | -| value_loss | 2.04e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17986 | -| time_elapsed | 97301 | -| total_timesteps | 2302208 | -| train/ | | -| approx_kl | 0.19371785 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | 0.00843 | -| n_updates | 179850 | -| policy_gradient_loss | 0.000505 | -| std | 0.00825 | -| value_loss | 8.13e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17987 | -| time_elapsed | 97307 | -| total_timesteps | 2302336 | -| train/ | | -| approx_kl | 0.11753603 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -4.06 | -| learning_rate | 0.0003 | -| loss | 0.097 | -| n_updates | 179860 | -| policy_gradient_loss | 0.0532 | -| std | 0.00825 | -| value_loss | 3.59e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17988 | -| time_elapsed | 97311 | -| total_timesteps | 2302464 | -| train/ | | -| approx_kl | 0.026853193 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -17.7 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 179870 | -| policy_gradient_loss | 0.00896 | -| std | 0.00824 | -| value_loss | 1.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17989 | -| time_elapsed | 97316 | -| total_timesteps | 2302592 | -| train/ | | -| approx_kl | 0.081890754 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.291 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 179880 | -| policy_gradient_loss | 0.0265 | -| std | 0.00824 | -| value_loss | 3.41e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17990 | -| time_elapsed | 97321 | -| total_timesteps | 2302720 | -| train/ | | -| approx_kl | 0.118618526 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00368 | -| learning_rate | 0.0003 | -| loss | 0.0594 | -| n_updates | 179890 | -| policy_gradient_loss | 0.0252 | -| std | 0.00824 | -| value_loss | 1.38e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17991 | -| time_elapsed | 97326 | -| total_timesteps | 2302848 | -| train/ | | -| approx_kl | 0.028721618 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | -0.00865 | -| n_updates | 179900 | -| policy_gradient_loss | 0.0435 | -| std | 0.00825 | -| value_loss | 1.15e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17992 | -| time_elapsed | 97331 | -| total_timesteps | 2302976 | -| train/ | | -| approx_kl | 0.15686025 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 179910 | -| policy_gradient_loss | 0.0306 | -| std | 0.00824 | -| value_loss | 1.01e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17993 | -| time_elapsed | 97336 | -| total_timesteps | 2303104 | -| train/ | | -| approx_kl | 0.0005797208 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 179920 | -| policy_gradient_loss | 0.00407 | -| std | 0.00824 | -| value_loss | 6.24e-12 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17994 | -| time_elapsed | 97347 | -| total_timesteps | 2303232 | -| train/ | | -| approx_kl | 0.017921068 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 179930 | -| policy_gradient_loss | 0.0213 | -| std | 0.00824 | -| value_loss | 0.00511 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17995 | -| time_elapsed | 97352 | -| total_timesteps | 2303360 | -| train/ | | -| approx_kl | 0.031125965 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 179940 | -| policy_gradient_loss | 0.016 | -| std | 0.00824 | -| value_loss | 4.15e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17996 | -| time_elapsed | 97357 | -| total_timesteps | 2303488 | -| train/ | | -| approx_kl | 0.019004181 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00687 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 179950 | -| policy_gradient_loss | 0.0186 | -| std | 0.00824 | -| value_loss | 3.15e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17997 | -| time_elapsed | 97362 | -| total_timesteps | 2303616 | -| train/ | | -| approx_kl | 0.0040820194 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | -0.00523 | -| n_updates | 179960 | -| policy_gradient_loss | 0.0141 | -| std | 0.00823 | -| value_loss | 2.22e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17998 | -| time_elapsed | 97366 | -| total_timesteps | 2303744 | -| train/ | | -| approx_kl | 0.06362812 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 179970 | -| policy_gradient_loss | 0.0323 | -| std | 0.00823 | -| value_loss | 1.45e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 17999 | -| time_elapsed | 97371 | -| total_timesteps | 2303872 | -| train/ | | -| approx_kl | 0.08264377 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.0337 | -| n_updates | 179980 | -| policy_gradient_loss | 0.015 | -| std | 0.00823 | -| value_loss | 1.05e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18000 | -| time_elapsed | 97376 | -| total_timesteps | 2304000 | -| train/ | | -| approx_kl | 0.00058396487 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 179990 | -| policy_gradient_loss | 0.0166 | -| std | 0.00822 | -| value_loss | 7e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18001 | -| time_elapsed | 97381 | -| total_timesteps | 2304128 | -| train/ | | -| approx_kl | 0.025955278 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00316 | -| learning_rate | 0.0003 | -| loss | -0.0284 | -| n_updates | 180000 | -| policy_gradient_loss | -0.0191 | -| std | 0.00822 | -| value_loss | 4.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18002 | -| time_elapsed | 97391 | -| total_timesteps | 2304256 | -| train/ | | -| approx_kl | 0.19867346 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | 0.0482 | -| n_updates | 180010 | -| policy_gradient_loss | 0.049 | -| std | 0.00822 | -| value_loss | 0.000494 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18003 | -| time_elapsed | 97396 | -| total_timesteps | 2304384 | -| train/ | | -| approx_kl | 0.1647613 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00889 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 180020 | -| policy_gradient_loss | 0.099 | -| std | 0.00822 | -| value_loss | 2.44e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18004 | -| time_elapsed | 97400 | -| total_timesteps | 2304512 | -| train/ | | -| approx_kl | 0.12103553 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00564 | -| learning_rate | 0.0003 | -| loss | 0.0976 | -| n_updates | 180030 | -| policy_gradient_loss | 0.119 | -| std | 0.00822 | -| value_loss | 8.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18005 | -| time_elapsed | 97403 | -| total_timesteps | 2304640 | -| train/ | | -| approx_kl | 0.025859568 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0095 | -| learning_rate | 0.0003 | -| loss | 0.00464 | -| n_updates | 180040 | -| policy_gradient_loss | 0.0188 | -| std | 0.00822 | -| value_loss | 5.16e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18006 | -| time_elapsed | 97408 | -| total_timesteps | 2304768 | -| train/ | | -| approx_kl | 0.3857317 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 180050 | -| policy_gradient_loss | 0.0416 | -| std | 0.00822 | -| value_loss | 3.91e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 18007 | -| time_elapsed | 97414 | -| total_timesteps | 2304896 | -| train/ | | -| approx_kl | 0.007445587 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 180060 | -| policy_gradient_loss | 0.00348 | -| std | 0.00823 | -| value_loss | 2.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18008 | -| time_elapsed | 97418 | -| total_timesteps | 2305024 | -| train/ | | -| approx_kl | 0.046375133 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0795 | -| learning_rate | 0.0003 | -| loss | 0.0381 | -| n_updates | 180070 | -| policy_gradient_loss | 0.0157 | -| std | 0.00822 | -| value_loss | 1.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18009 | -| time_elapsed | 97429 | -| total_timesteps | 2305152 | -| train/ | | -| approx_kl | 0.053138763 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | -0.00654 | -| n_updates | 180080 | -| policy_gradient_loss | -0.00551 | -| std | 0.00822 | -| value_loss | 0.001 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18010 | -| time_elapsed | 97434 | -| total_timesteps | 2305280 | -| train/ | | -| approx_kl | 0.0029641534 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 180090 | -| policy_gradient_loss | 0.0038 | -| std | 0.00821 | -| value_loss | 1.68e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18011 | -| time_elapsed | 97439 | -| total_timesteps | 2305408 | -| train/ | | -| approx_kl | 0.02334305 | -| clip_fraction | 0.539 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 180100 | -| policy_gradient_loss | 0.0869 | -| std | 0.0082 | -| value_loss | 7.4e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18012 | -| time_elapsed | 97444 | -| total_timesteps | 2305536 | -| train/ | | -| approx_kl | 0.06964714 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 180110 | -| policy_gradient_loss | 0.0799 | -| std | 0.0082 | -| value_loss | 8.14e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18013 | -| time_elapsed | 97449 | -| total_timesteps | 2305664 | -| train/ | | -| approx_kl | 0.083506815 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.0809 | -| n_updates | 180120 | -| policy_gradient_loss | 0.108 | -| std | 0.0082 | -| value_loss | 5.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18014 | -| time_elapsed | 97453 | -| total_timesteps | 2305792 | -| train/ | | -| approx_kl | 0.077154845 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 180130 | -| policy_gradient_loss | 0.0965 | -| std | 0.0082 | -| value_loss | 4.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 18015 | -| time_elapsed | 97457 | -| total_timesteps | 2305920 | -| train/ | | -| approx_kl | 0.019024756 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 180140 | -| policy_gradient_loss | 0.0199 | -| std | 0.0082 | -| value_loss | 3.95e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18016 | -| time_elapsed | 97462 | -| total_timesteps | 2306048 | -| train/ | | -| approx_kl | 0.10594272 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 180150 | -| policy_gradient_loss | 0.0135 | -| std | 0.0082 | -| value_loss | 2.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18017 | -| time_elapsed | 97471 | -| total_timesteps | 2306176 | -| train/ | | -| approx_kl | 0.041695975 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.544 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 180160 | -| policy_gradient_loss | -0.0135 | -| std | 0.0082 | -| value_loss | 0.00086 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18018 | -| time_elapsed | 97475 | -| total_timesteps | 2306304 | -| train/ | | -| approx_kl | 0.07147353 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 180170 | -| policy_gradient_loss | 0.0176 | -| std | 0.0082 | -| value_loss | 1.3e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18019 | -| time_elapsed | 97479 | -| total_timesteps | 2306432 | -| train/ | | -| approx_kl | 0.00033785636 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 180180 | -| policy_gradient_loss | 0.0199 | -| std | 0.00819 | -| value_loss | 3.25e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18020 | -| time_elapsed | 97483 | -| total_timesteps | 2306560 | -| train/ | | -| approx_kl | 0.4038733 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 180190 | -| policy_gradient_loss | 0.0463 | -| std | 0.00819 | -| value_loss | 2.79e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18021 | -| time_elapsed | 97488 | -| total_timesteps | 2306688 | -| train/ | | -| approx_kl | 0.026554562 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.000275 | -| n_updates | 180200 | -| policy_gradient_loss | 0.000826 | -| std | 0.00819 | -| value_loss | 2.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18022 | -| time_elapsed | 97493 | -| total_timesteps | 2306816 | -| train/ | | -| approx_kl | 0.005944582 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.00421 | -| n_updates | 180210 | -| policy_gradient_loss | 0.00271 | -| std | 0.0082 | -| value_loss | 1.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18023 | -| time_elapsed | 97498 | -| total_timesteps | 2306944 | -| train/ | | -| approx_kl | 0.065267175 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 180220 | -| policy_gradient_loss | 0.0105 | -| std | 0.0082 | -| value_loss | 8.62e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18024 | -| time_elapsed | 97502 | -| total_timesteps | 2307072 | -| train/ | | -| approx_kl | 0.029089289 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 180230 | -| policy_gradient_loss | 0.0359 | -| std | 0.00819 | -| value_loss | 4.88e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18025 | -| time_elapsed | 97510 | -| total_timesteps | 2307200 | -| train/ | | -| approx_kl | 0.37984866 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 180240 | -| policy_gradient_loss | 0.0608 | -| std | 0.00819 | -| value_loss | 0.0055 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18026 | -| time_elapsed | 97515 | -| total_timesteps | 2307328 | -| train/ | | -| approx_kl | 0.015100483 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 180250 | -| policy_gradient_loss | 0.00945 | -| std | 0.00819 | -| value_loss | 1.22e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18027 | -| time_elapsed | 97519 | -| total_timesteps | 2307456 | -| train/ | | -| approx_kl | 0.07074535 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.0074 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 180260 | -| policy_gradient_loss | 0.0195 | -| std | 0.00819 | -| value_loss | 1.11e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18028 | -| time_elapsed | 97523 | -| total_timesteps | 2307584 | -| train/ | | -| approx_kl | 0.2086494 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 180270 | -| policy_gradient_loss | 0.0154 | -| std | 0.00819 | -| value_loss | 6.22e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18029 | -| time_elapsed | 97528 | -| total_timesteps | 2307712 | -| train/ | | -| approx_kl | 0.04737571 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 180280 | -| policy_gradient_loss | 0.0273 | -| std | 0.00818 | -| value_loss | 4.08e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18030 | -| time_elapsed | 97533 | -| total_timesteps | 2307840 | -| train/ | | -| approx_kl | 0.1743185 | -| clip_fraction | 0.624 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 180290 | -| policy_gradient_loss | 0.0845 | -| std | 0.00818 | -| value_loss | 2.98e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18031 | -| time_elapsed | 97537 | -| total_timesteps | 2307968 | -| train/ | | -| approx_kl | 0.11365434 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0911 | -| n_updates | 180300 | -| policy_gradient_loss | 0.0861 | -| std | 0.00818 | -| value_loss | 2.06e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18032 | -| time_elapsed | 97542 | -| total_timesteps | 2308096 | -| train/ | | -| approx_kl | 0.13954057 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 180310 | -| policy_gradient_loss | 0.116 | -| std | 0.00818 | -| value_loss | 1.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18033 | -| time_elapsed | 97551 | -| total_timesteps | 2308224 | -| train/ | | -| approx_kl | 0.022923887 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | 1.02e-05 | -| n_updates | 180320 | -| policy_gradient_loss | 0.00722 | -| std | 0.00818 | -| value_loss | 0.00126 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18034 | -| time_elapsed | 97555 | -| total_timesteps | 2308352 | -| train/ | | -| approx_kl | 0.11799426 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00547 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 180330 | -| policy_gradient_loss | 0.0128 | -| std | 0.00817 | -| value_loss | 1.84e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18035 | -| time_elapsed | 97560 | -| total_timesteps | 2308480 | -| train/ | | -| approx_kl | 0.0145740835 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 180340 | -| policy_gradient_loss | 0.0115 | -| std | 0.00816 | -| value_loss | 1.11e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18036 | -| time_elapsed | 97565 | -| total_timesteps | 2308608 | -| train/ | | -| approx_kl | 0.07334512 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.342 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 180350 | -| policy_gradient_loss | 0.0159 | -| std | 0.00816 | -| value_loss | 6.32e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18037 | -| time_elapsed | 97571 | -| total_timesteps | 2308736 | -| train/ | | -| approx_kl | 0.013204208 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 180360 | -| policy_gradient_loss | -0.00307 | -| std | 0.00816 | -| value_loss | 3.44e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18038 | -| time_elapsed | 97577 | -| total_timesteps | 2308864 | -| train/ | | -| approx_kl | 0.0022258712 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 180370 | -| policy_gradient_loss | 0.0222 | -| std | 0.00815 | -| value_loss | 2.08e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18039 | -| time_elapsed | 97583 | -| total_timesteps | 2308992 | -| train/ | | -| approx_kl | 0.15947922 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 180380 | -| policy_gradient_loss | 0.0104 | -| std | 0.00815 | -| value_loss | 1.44e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18040 | -| time_elapsed | 97589 | -| total_timesteps | 2309120 | -| train/ | | -| approx_kl | 0.16200905 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 180390 | -| policy_gradient_loss | 0.0101 | -| std | 0.00813 | -| value_loss | 1.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18041 | -| time_elapsed | 97601 | -| total_timesteps | 2309248 | -| train/ | | -| approx_kl | 0.07109863 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.538 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 180400 | -| policy_gradient_loss | 0.00324 | -| std | 0.00813 | -| value_loss | 0.000878 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18042 | -| time_elapsed | 97607 | -| total_timesteps | 2309376 | -| train/ | | -| approx_kl | 0.26367483 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.000263 | -| learning_rate | 0.0003 | -| loss | 0.0805 | -| n_updates | 180410 | -| policy_gradient_loss | 0.014 | -| std | 0.00812 | -| value_loss | 4.73e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18043 | -| time_elapsed | 97611 | -| total_timesteps | 2309504 | -| train/ | | -| approx_kl | 0.020798657 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.00322 | -| n_updates | 180420 | -| policy_gradient_loss | -0.00109 | -| std | 0.00812 | -| value_loss | 1.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18044 | -| time_elapsed | 97616 | -| total_timesteps | 2309632 | -| train/ | | -| approx_kl | 0.006899303 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0952 | -| learning_rate | 0.0003 | -| loss | 6.57e-06 | -| n_updates | 180430 | -| policy_gradient_loss | 0.0165 | -| std | 0.00815 | -| value_loss | 2.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18045 | -| time_elapsed | 97621 | -| total_timesteps | 2309760 | -| train/ | | -| approx_kl | 0.025700537 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 180440 | -| policy_gradient_loss | 0.0392 | -| std | 0.00819 | -| value_loss | 1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 18046 | -| time_elapsed | 97625 | -| total_timesteps | 2309888 | -| train/ | | -| approx_kl | 0.009260326 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00994 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 180450 | -| policy_gradient_loss | 0.0161 | -| std | 0.0082 | -| value_loss | 6.55e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18047 | -| time_elapsed | 97631 | -| total_timesteps | 2310016 | -| train/ | | -| approx_kl | 0.12848654 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 180460 | -| policy_gradient_loss | 0.0243 | -| std | 0.0082 | -| value_loss | 1.46e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18048 | -| time_elapsed | 97642 | -| total_timesteps | 2310144 | -| train/ | | -| approx_kl | 0.3606597 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 180470 | -| policy_gradient_loss | 0.00969 | -| std | 0.00819 | -| value_loss | 0.000155 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18049 | -| time_elapsed | 97647 | -| total_timesteps | 2310272 | -| train/ | | -| approx_kl | 0.045660995 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.0032 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 180480 | -| policy_gradient_loss | 0.00874 | -| std | 0.00819 | -| value_loss | 3.13e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18050 | -| time_elapsed | 97652 | -| total_timesteps | 2310400 | -| train/ | | -| approx_kl | 0.0012261234 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00128 | -| learning_rate | 0.0003 | -| loss | -0.00045 | -| n_updates | 180490 | -| policy_gradient_loss | 0.00424 | -| std | 0.00819 | -| value_loss | 4.91e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18051 | -| time_elapsed | 97657 | -| total_timesteps | 2310528 | -| train/ | | -| approx_kl | 0.022262733 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 180500 | -| policy_gradient_loss | 0.0168 | -| std | 0.00819 | -| value_loss | 7.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18052 | -| time_elapsed | 97662 | -| total_timesteps | 2310656 | -| train/ | | -| approx_kl | 0.40937284 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00304 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 180510 | -| policy_gradient_loss | 0.043 | -| std | 0.00819 | -| value_loss | 4.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18053 | -| time_elapsed | 97665 | -| total_timesteps | 2310784 | -| train/ | | -| approx_kl | 0.045822076 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 180520 | -| policy_gradient_loss | 0.00627 | -| std | 0.0082 | -| value_loss | 1.19e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18054 | -| time_elapsed | 97669 | -| total_timesteps | 2310912 | -| train/ | | -| approx_kl | 0.0045028487 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.000824 | -| n_updates | 180530 | -| policy_gradient_loss | 0.0055 | -| std | 0.0082 | -| value_loss | 7.26e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18055 | -| time_elapsed | 97673 | -| total_timesteps | 2311040 | -| train/ | | -| approx_kl | 0.0039989823 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | -0.00914 | -| n_updates | 180540 | -| policy_gradient_loss | 0.00453 | -| std | 0.00819 | -| value_loss | 2.86e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18056 | -| time_elapsed | 97682 | -| total_timesteps | 2311168 | -| train/ | | -| approx_kl | 0.29389206 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 180550 | -| policy_gradient_loss | 0.0037 | -| std | 0.00819 | -| value_loss | 0.00196 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18057 | -| time_elapsed | 97687 | -| total_timesteps | 2311296 | -| train/ | | -| approx_kl | 0.012678625 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.00509 | -| n_updates | 180560 | -| policy_gradient_loss | 0.00808 | -| std | 0.00819 | -| value_loss | 3.24e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18058 | -| time_elapsed | 97693 | -| total_timesteps | 2311424 | -| train/ | | -| approx_kl | 0.0032164054 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00523 | -| learning_rate | 0.0003 | -| loss | -0.000979 | -| n_updates | 180570 | -| policy_gradient_loss | 0.00187 | -| std | 0.0082 | -| value_loss | 1.36e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18059 | -| time_elapsed | 97698 | -| total_timesteps | 2311552 | -| train/ | | -| approx_kl | 0.023500133 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0609 | -| learning_rate | 0.0003 | -| loss | 0.0341 | -| n_updates | 180580 | -| policy_gradient_loss | 0.0482 | -| std | 0.00821 | -| value_loss | 4.88e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18060 | -| time_elapsed | 97702 | -| total_timesteps | 2311680 | -| train/ | | -| approx_kl | 0.06908596 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00586 | -| learning_rate | 0.0003 | -| loss | 0.0686 | -| n_updates | 180590 | -| policy_gradient_loss | 0.0812 | -| std | 0.00822 | -| value_loss | 5.84e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18061 | -| time_elapsed | 97707 | -| total_timesteps | 2311808 | -| train/ | | -| approx_kl | 0.0140204225 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00865 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 180600 | -| policy_gradient_loss | 0.0128 | -| std | 0.00822 | -| value_loss | 3.54e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 18062 | -| time_elapsed | 97711 | -| total_timesteps | 2311936 | -| train/ | | -| approx_kl | 0.30832013 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 180610 | -| policy_gradient_loss | 0.0363 | -| std | 0.00822 | -| value_loss | 1.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18063 | -| time_elapsed | 97715 | -| total_timesteps | 2312064 | -| train/ | | -| approx_kl | 0.031131057 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 180620 | -| policy_gradient_loss | -0.00238 | -| std | 0.00822 | -| value_loss | 1.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18064 | -| time_elapsed | 97723 | -| total_timesteps | 2312192 | -| train/ | | -| approx_kl | 0.003271745 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | -0.00361 | -| n_updates | 180630 | -| policy_gradient_loss | -0.00253 | -| std | 0.00822 | -| value_loss | 0.00209 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18065 | -| time_elapsed | 97728 | -| total_timesteps | 2312320 | -| train/ | | -| approx_kl | 0.02560844 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | 0.00875 | -| n_updates | 180640 | -| policy_gradient_loss | 0.00596 | -| std | 0.00821 | -| value_loss | 2.11e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18066 | -| time_elapsed | 97733 | -| total_timesteps | 2312448 | -| train/ | | -| approx_kl | 0.004497143 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 180650 | -| policy_gradient_loss | 7.51e-05 | -| std | 0.00821 | -| value_loss | 4.06e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18067 | -| time_elapsed | 97738 | -| total_timesteps | 2312576 | -| train/ | | -| approx_kl | 3.2315496e-05 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | 7.42e-05 | -| n_updates | 180660 | -| policy_gradient_loss | 0.0219 | -| std | 0.00821 | -| value_loss | 3.48e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18068 | -| time_elapsed | 97741 | -| total_timesteps | 2312704 | -| train/ | | -| approx_kl | 0.13948935 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0847 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 180670 | -| policy_gradient_loss | 0.0494 | -| std | 0.00821 | -| value_loss | 2.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18069 | -| time_elapsed | 97747 | -| total_timesteps | 2312832 | -| train/ | | -| approx_kl | 0.073062964 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 180680 | -| policy_gradient_loss | 0.00822 | -| std | 0.00821 | -| value_loss | 1.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18070 | -| time_elapsed | 97752 | -| total_timesteps | 2312960 | -| train/ | | -| approx_kl | 0.020065237 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | -0.000322 | -| n_updates | 180690 | -| policy_gradient_loss | 0.00217 | -| std | 0.00821 | -| value_loss | 8.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18071 | -| time_elapsed | 97757 | -| total_timesteps | 2313088 | -| train/ | | -| approx_kl | 0.034585185 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 180700 | -| policy_gradient_loss | 0.00691 | -| std | 0.00821 | -| value_loss | 5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18072 | -| time_elapsed | 97768 | -| total_timesteps | 2313216 | -| train/ | | -| approx_kl | 0.024455283 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.738 | -| learning_rate | 0.0003 | -| loss | 0.00954 | -| n_updates | 180710 | -| policy_gradient_loss | 0.00989 | -| std | 0.00821 | -| value_loss | 0.00611 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18073 | -| time_elapsed | 97773 | -| total_timesteps | 2313344 | -| train/ | | -| approx_kl | 0.00230149 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 180720 | -| policy_gradient_loss | 0.0239 | -| std | 0.00821 | -| value_loss | 1.51e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18074 | -| time_elapsed | 97778 | -| total_timesteps | 2313472 | -| train/ | | -| approx_kl | 0.14968564 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00508 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 180730 | -| policy_gradient_loss | 0.0446 | -| std | 0.00821 | -| value_loss | 1.97e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18075 | -| time_elapsed | 97784 | -| total_timesteps | 2313600 | -| train/ | | -| approx_kl | 0.049888015 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | 0.0344 | -| n_updates | 180740 | -| policy_gradient_loss | 0.0132 | -| std | 0.0082 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18076 | -| time_elapsed | 97789 | -| total_timesteps | 2313728 | -| train/ | | -| approx_kl | 0.003967965 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 180750 | -| policy_gradient_loss | 0.00467 | -| std | 0.0082 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18077 | -| time_elapsed | 97793 | -| total_timesteps | 2313856 | -| train/ | | -| approx_kl | 0.0025682654 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 180760 | -| policy_gradient_loss | 0.0115 | -| std | 0.0082 | -| value_loss | 5.66e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18078 | -| time_elapsed | 97797 | -| total_timesteps | 2313984 | -| train/ | | -| approx_kl | 0.047092773 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 180770 | -| policy_gradient_loss | 0.0465 | -| std | 0.00819 | -| value_loss | 2.82e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18079 | -| time_elapsed | 97802 | -| total_timesteps | 2314112 | -| train/ | | -| approx_kl | 0.7835289 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.317 | -| n_updates | 180780 | -| policy_gradient_loss | 0.136 | -| std | 0.00819 | -| value_loss | 1.6e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18080 | -| time_elapsed | 97813 | -| total_timesteps | 2314240 | -| train/ | | -| approx_kl | 0.14085126 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -4.02 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 180790 | -| policy_gradient_loss | -0.00989 | -| std | 0.00819 | -| value_loss | 0.00272 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18081 | -| time_elapsed | 97817 | -| total_timesteps | 2314368 | -| train/ | | -| approx_kl | 0.096631534 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 180800 | -| policy_gradient_loss | 0.0257 | -| std | 0.00819 | -| value_loss | 2.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18082 | -| time_elapsed | 97822 | -| total_timesteps | 2314496 | -| train/ | | -| approx_kl | 0.11161569 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 180810 | -| policy_gradient_loss | 0.00639 | -| std | 0.00819 | -| value_loss | 1.53e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18083 | -| time_elapsed | 97826 | -| total_timesteps | 2314624 | -| train/ | | -| approx_kl | 0.4571011 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -2.66 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 180820 | -| policy_gradient_loss | 0.0267 | -| std | 0.00819 | -| value_loss | 2.72e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18084 | -| time_elapsed | 97832 | -| total_timesteps | 2314752 | -| train/ | | -| approx_kl | 0.013705969 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 180830 | -| policy_gradient_loss | 0.00025 | -| std | 0.00819 | -| value_loss | 1.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 18085 | -| time_elapsed | 97838 | -| total_timesteps | 2314880 | -| train/ | | -| approx_kl | 0.04242629 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 180840 | -| policy_gradient_loss | 0.018 | -| std | 0.00819 | -| value_loss | 1.25e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18086 | -| time_elapsed | 97842 | -| total_timesteps | 2315008 | -| train/ | | -| approx_kl | 0.06764424 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.07 | -| learning_rate | 0.0003 | -| loss | 0.0631 | -| n_updates | 180850 | -| policy_gradient_loss | 0.0536 | -| std | 0.00819 | -| value_loss | 8.17e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18087 | -| time_elapsed | 97853 | -| total_timesteps | 2315136 | -| train/ | | -| approx_kl | 0.031993534 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 180860 | -| policy_gradient_loss | -0.00984 | -| std | 0.00818 | -| value_loss | 2.67e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18088 | -| time_elapsed | 97859 | -| total_timesteps | 2315264 | -| train/ | | -| approx_kl | 0.60366166 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.589 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 180870 | -| policy_gradient_loss | 0.0875 | -| std | 0.00818 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18089 | -| time_elapsed | 97864 | -| total_timesteps | 2315392 | -| train/ | | -| approx_kl | 0.0047484636 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | -0.000397 | -| n_updates | 180880 | -| policy_gradient_loss | 0.0185 | -| std | 0.00818 | -| value_loss | 2.56e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18090 | -| time_elapsed | 97870 | -| total_timesteps | 2315520 | -| train/ | | -| approx_kl | 0.05845034 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 180890 | -| policy_gradient_loss | 0.0138 | -| std | 0.00818 | -| value_loss | 1.13e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18091 | -| time_elapsed | 97876 | -| total_timesteps | 2315648 | -| train/ | | -| approx_kl | 2.9637944e-05 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.00024 | -| n_updates | 180900 | -| policy_gradient_loss | 0.0175 | -| std | 0.00817 | -| value_loss | 6.44e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18092 | -| time_elapsed | 97880 | -| total_timesteps | 2315776 | -| train/ | | -| approx_kl | 0.36411124 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 180910 | -| policy_gradient_loss | 0.0399 | -| std | 0.00817 | -| value_loss | 6.85e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 18093 | -| time_elapsed | 97884 | -| total_timesteps | 2315904 | -| train/ | | -| approx_kl | 0.026559584 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 180920 | -| policy_gradient_loss | -0.00353 | -| std | 0.00817 | -| value_loss | 3.42e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18094 | -| time_elapsed | 97888 | -| total_timesteps | 2316032 | -| train/ | | -| approx_kl | 0.03343452 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 180930 | -| policy_gradient_loss | 0.0115 | -| std | 0.00818 | -| value_loss | 2.34e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18095 | -| time_elapsed | 97898 | -| total_timesteps | 2316160 | -| train/ | | -| approx_kl | 0.117758736 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -3.47 | -| learning_rate | 0.0003 | -| loss | -0.00839 | -| n_updates | 180940 | -| policy_gradient_loss | -0.0101 | -| std | 0.00819 | -| value_loss | 0.00245 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18096 | -| time_elapsed | 97903 | -| total_timesteps | 2316288 | -| train/ | | -| approx_kl | 0.08314162 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 180950 | -| policy_gradient_loss | 0.0215 | -| std | 0.00819 | -| value_loss | 3.36e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18097 | -| time_elapsed | 97907 | -| total_timesteps | 2316416 | -| train/ | | -| approx_kl | 0.21310547 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 180960 | -| policy_gradient_loss | 0.0914 | -| std | 0.00819 | -| value_loss | 1.71e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18098 | -| time_elapsed | 97912 | -| total_timesteps | 2316544 | -| train/ | | -| approx_kl | 0.04173982 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 180970 | -| policy_gradient_loss | 0.0203 | -| std | 0.0082 | -| value_loss | 1.27e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18099 | -| time_elapsed | 97917 | -| total_timesteps | 2316672 | -| train/ | | -| approx_kl | 0.14373733 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.0815 | -| n_updates | 180980 | -| policy_gradient_loss | 0.0224 | -| std | 0.00819 | -| value_loss | 8.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18100 | -| time_elapsed | 97922 | -| total_timesteps | 2316800 | -| train/ | | -| approx_kl | 0.016211722 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 180990 | -| policy_gradient_loss | 0.0156 | -| std | 0.00819 | -| value_loss | 5.84e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18101 | -| time_elapsed | 97926 | -| total_timesteps | 2316928 | -| train/ | | -| approx_kl | 0.08343534 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.00437 | -| n_updates | 181000 | -| policy_gradient_loss | 0.01 | -| std | 0.00819 | -| value_loss | 5.1e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18102 | -| time_elapsed | 97931 | -| total_timesteps | 2317056 | -| train/ | | -| approx_kl | 0.0995548 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 181010 | -| policy_gradient_loss | 0.0153 | -| std | 0.00819 | -| value_loss | 2.87e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18103 | -| time_elapsed | 97942 | -| total_timesteps | 2317184 | -| train/ | | -| approx_kl | 0.029660977 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 181020 | -| policy_gradient_loss | -0.0121 | -| std | 0.00819 | -| value_loss | 0.000145 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18104 | -| time_elapsed | 97947 | -| total_timesteps | 2317312 | -| train/ | | -| approx_kl | 0.051313184 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.294 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 181030 | -| policy_gradient_loss | 0.00778 | -| std | 0.00819 | -| value_loss | 2.22e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18105 | -| time_elapsed | 97951 | -| total_timesteps | 2317440 | -| train/ | | -| approx_kl | 0.1052435 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 181040 | -| policy_gradient_loss | 0.0155 | -| std | 0.0082 | -| value_loss | 1.84e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18106 | -| time_elapsed | 97956 | -| total_timesteps | 2317568 | -| train/ | | -| approx_kl | 0.028789246 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.00624 | -| n_updates | 181050 | -| policy_gradient_loss | 0.00739 | -| std | 0.0082 | -| value_loss | 3.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18107 | -| time_elapsed | 97959 | -| total_timesteps | 2317696 | -| train/ | | -| approx_kl | 0.081010126 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0602 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 181060 | -| policy_gradient_loss | 0.0226 | -| std | 0.0082 | -| value_loss | 2.31e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18108 | -| time_elapsed | 97964 | -| total_timesteps | 2317824 | -| train/ | | -| approx_kl | 0.22235116 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 181070 | -| policy_gradient_loss | 0.0803 | -| std | 0.0082 | -| value_loss | 1.92e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 18109 | -| time_elapsed | 97968 | -| total_timesteps | 2317952 | -| train/ | | -| approx_kl | 0.11272003 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | 0.0842 | -| n_updates | 181080 | -| policy_gradient_loss | 0.0735 | -| std | 0.0082 | -| value_loss | 6.37e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18110 | -| time_elapsed | 97972 | -| total_timesteps | 2318080 | -| train/ | | -| approx_kl | 0.092153266 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0493 | -| n_updates | 181090 | -| policy_gradient_loss | 0.0629 | -| std | 0.00821 | -| value_loss | 4.14e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18111 | -| time_elapsed | 97982 | -| total_timesteps | 2318208 | -| train/ | | -| approx_kl | 0.03350503 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 181100 | -| policy_gradient_loss | -0.00231 | -| std | 0.00821 | -| value_loss | 0.000141 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18112 | -| time_elapsed | 97986 | -| total_timesteps | 2318336 | -| train/ | | -| approx_kl | 0.103743866 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0601 | -| n_updates | 181110 | -| policy_gradient_loss | 0.0168 | -| std | 0.00821 | -| value_loss | 2.98e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18113 | -| time_elapsed | 97991 | -| total_timesteps | 2318464 | -| train/ | | -| approx_kl | 0.01438842 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00519 | -| learning_rate | 0.0003 | -| loss | -0.00975 | -| n_updates | 181120 | -| policy_gradient_loss | 0.0122 | -| std | 0.00821 | -| value_loss | 2.84e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18114 | -| time_elapsed | 97997 | -| total_timesteps | 2318592 | -| train/ | | -| approx_kl | 0.19095264 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 181130 | -| policy_gradient_loss | 0.1 | -| std | 0.00821 | -| value_loss | 2.08e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18115 | -| time_elapsed | 98001 | -| total_timesteps | 2318720 | -| train/ | | -| approx_kl | 0.10236751 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.0787 | -| n_updates | 181140 | -| policy_gradient_loss | 0.0896 | -| std | 0.00822 | -| value_loss | 1.36e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18116 | -| time_elapsed | 98005 | -| total_timesteps | 2318848 | -| train/ | | -| approx_kl | 0.020635216 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 181150 | -| policy_gradient_loss | 0.0161 | -| std | 0.00822 | -| value_loss | 1.06e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18117 | -| time_elapsed | 98008 | -| total_timesteps | 2318976 | -| train/ | | -| approx_kl | 0.3755263 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 181160 | -| policy_gradient_loss | 0.0392 | -| std | 0.00822 | -| value_loss | 7.84e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18118 | -| time_elapsed | 98011 | -| total_timesteps | 2319104 | -| train/ | | -| approx_kl | 0.031556077 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 181170 | -| policy_gradient_loss | -0.00107 | -| std | 0.00822 | -| value_loss | 5.31e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18119 | -| time_elapsed | 98018 | -| total_timesteps | 2319232 | -| train/ | | -| approx_kl | 0.054686163 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 181180 | -| policy_gradient_loss | -0.00317 | -| std | 0.00822 | -| value_loss | 3.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18120 | -| time_elapsed | 98023 | -| total_timesteps | 2319360 | -| train/ | | -| approx_kl | 0.014410736 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00453 | -| n_updates | 181190 | -| policy_gradient_loss | 0.0151 | -| std | 0.00822 | -| value_loss | 5.79e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18121 | -| time_elapsed | 98028 | -| total_timesteps | 2319488 | -| train/ | | -| approx_kl | 0.015061822 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00807 | -| learning_rate | 0.0003 | -| loss | 0.00763 | -| n_updates | 181200 | -| policy_gradient_loss | 0.0212 | -| std | 0.00821 | -| value_loss | 5.53e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18122 | -| time_elapsed | 98034 | -| total_timesteps | 2319616 | -| train/ | | -| approx_kl | 0.13236023 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | -0.000758 | -| n_updates | 181210 | -| policy_gradient_loss | -0.00158 | -| std | 0.00821 | -| value_loss | 3.61e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18123 | -| time_elapsed | 98039 | -| total_timesteps | 2319744 | -| train/ | | -| approx_kl | 0.22986928 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 181220 | -| policy_gradient_loss | 0.0888 | -| std | 0.0082 | -| value_loss | 9.91e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 18124 | -| time_elapsed | 98044 | -| total_timesteps | 2319872 | -| train/ | | -| approx_kl | 0.1499847 | -| clip_fraction | 0.664 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00915 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 181230 | -| policy_gradient_loss | 0.0995 | -| std | 0.00821 | -| value_loss | 9.35e-11 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18125 | -| time_elapsed | 98049 | -| total_timesteps | 2320000 | -| train/ | | -| approx_kl | 0.028113727 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 181240 | -| policy_gradient_loss | 0.0215 | -| std | 0.00821 | -| value_loss | 6.65e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18126 | -| time_elapsed | 98055 | -| total_timesteps | 2320128 | -| train/ | | -| approx_kl | 0.35727605 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00403 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 181250 | -| policy_gradient_loss | 0.0471 | -| std | 0.00821 | -| value_loss | 3.39e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18127 | -| time_elapsed | 98065 | -| total_timesteps | 2320256 | -| train/ | | -| approx_kl | 0.043207638 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 181260 | -| policy_gradient_loss | 0.00719 | -| std | 0.00821 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18128 | -| time_elapsed | 98069 | -| total_timesteps | 2320384 | -| train/ | | -| approx_kl | 0.020484837 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 181270 | -| policy_gradient_loss | -0.00563 | -| std | 0.00821 | -| value_loss | 2.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18129 | -| time_elapsed | 98073 | -| total_timesteps | 2320512 | -| train/ | | -| approx_kl | 0.031815268 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00672 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 181280 | -| policy_gradient_loss | 0.00696 | -| std | 0.00821 | -| value_loss | 2.68e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18130 | -| time_elapsed | 98076 | -| total_timesteps | 2320640 | -| train/ | | -| approx_kl | 0.025053428 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 181290 | -| policy_gradient_loss | 0.00582 | -| std | 0.00821 | -| value_loss | 1.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18131 | -| time_elapsed | 98080 | -| total_timesteps | 2320768 | -| train/ | | -| approx_kl | 0.026699927 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 181300 | -| policy_gradient_loss | -0.00981 | -| std | 0.0082 | -| value_loss | 9.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18132 | -| time_elapsed | 98086 | -| total_timesteps | 2320896 | -| train/ | | -| approx_kl | 0.025441572 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 181310 | -| policy_gradient_loss | 0.0075 | -| std | 0.00817 | -| value_loss | 2.13e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18133 | -| time_elapsed | 98090 | -| total_timesteps | 2321024 | -| train/ | | -| approx_kl | 0.0010136897 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -6.45 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 181320 | -| policy_gradient_loss | 0.000577 | -| std | 0.00814 | -| value_loss | 0.000125 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18134 | -| time_elapsed | 98100 | -| total_timesteps | 2321152 | -| train/ | | -| approx_kl | 0.06478202 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -2.95 | -| learning_rate | 0.0003 | -| loss | 0.00463 | -| n_updates | 181330 | -| policy_gradient_loss | -0.00364 | -| std | 0.00813 | -| value_loss | 0.0107 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18135 | -| time_elapsed | 98105 | -| total_timesteps | 2321280 | -| train/ | | -| approx_kl | 0.09850501 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 181340 | -| policy_gradient_loss | 0.00924 | -| std | 0.00812 | -| value_loss | 0.000146 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18136 | -| time_elapsed | 98109 | -| total_timesteps | 2321408 | -| train/ | | -| approx_kl | 0.02267436 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | -0.00606 | -| n_updates | 181350 | -| policy_gradient_loss | 0.0213 | -| std | 0.00811 | -| value_loss | 8.35e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18137 | -| time_elapsed | 98115 | -| total_timesteps | 2321536 | -| train/ | | -| approx_kl | 0.22567374 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.27 | -| n_updates | 181360 | -| policy_gradient_loss | 0.141 | -| std | 0.00811 | -| value_loss | 8.76e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18138 | -| time_elapsed | 98120 | -| total_timesteps | 2321664 | -| train/ | | -| approx_kl | 0.042021476 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 181370 | -| policy_gradient_loss | 0.0237 | -| std | 0.00811 | -| value_loss | 7.09e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18139 | -| time_elapsed | 98124 | -| total_timesteps | 2321792 | -| train/ | | -| approx_kl | 0.4105028 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 181380 | -| policy_gradient_loss | 0.036 | -| std | 0.00811 | -| value_loss | 5.65e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18140 | -| time_elapsed | 98129 | -| total_timesteps | 2321920 | -| train/ | | -| approx_kl | 0.009216903 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 181390 | -| policy_gradient_loss | 1.46e-05 | -| std | 0.00811 | -| value_loss | 4.74e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18141 | -| time_elapsed | 98132 | -| total_timesteps | 2322048 | -| train/ | | -| approx_kl | 0.048154313 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 181400 | -| policy_gradient_loss | 0.00952 | -| std | 0.00811 | -| value_loss | 2.32e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18142 | -| time_elapsed | 98143 | -| total_timesteps | 2322176 | -| train/ | | -| approx_kl | 0.017971652 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -5.01 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 181410 | -| policy_gradient_loss | -0.0115 | -| std | 0.00811 | -| value_loss | 0.00267 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18143 | -| time_elapsed | 98148 | -| total_timesteps | 2322304 | -| train/ | | -| approx_kl | 0.004423842 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.000139 | -| n_updates | 181420 | -| policy_gradient_loss | 0.00377 | -| std | 0.00814 | -| value_loss | 6.5e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18144 | -| time_elapsed | 98153 | -| total_timesteps | 2322432 | -| train/ | | -| approx_kl | 0.21874541 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.0081 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 181430 | -| policy_gradient_loss | 0.0447 | -| std | 0.00816 | -| value_loss | 3.49e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18145 | -| time_elapsed | 98158 | -| total_timesteps | 2322560 | -| train/ | | -| approx_kl | 0.0510208 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00058 | -| n_updates | 181440 | -| policy_gradient_loss | -0.00383 | -| std | 0.00816 | -| value_loss | 7.32e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18146 | -| time_elapsed | 98163 | -| total_timesteps | 2322688 | -| train/ | | -| approx_kl | 0.027272144 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.000377 | -| n_updates | 181450 | -| policy_gradient_loss | 0.00117 | -| std | 0.00817 | -| value_loss | 6.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18147 | -| time_elapsed | 98168 | -| total_timesteps | 2322816 | -| train/ | | -| approx_kl | 0.032220997 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 181460 | -| policy_gradient_loss | 0.000995 | -| std | 0.00817 | -| value_loss | 5.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18148 | -| time_elapsed | 98172 | -| total_timesteps | 2322944 | -| train/ | | -| approx_kl | 0.036211237 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.00172 | -| n_updates | 181470 | -| policy_gradient_loss | 0.00104 | -| std | 0.00817 | -| value_loss | 5.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18149 | -| time_elapsed | 98176 | -| total_timesteps | 2323072 | -| train/ | | -| approx_kl | 0.034881204 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 181480 | -| policy_gradient_loss | 0.00559 | -| std | 0.00817 | -| value_loss | 4.35e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18150 | -| time_elapsed | 98183 | -| total_timesteps | 2323200 | -| train/ | | -| approx_kl | 0.0046494757 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.798 | -| learning_rate | 0.0003 | -| loss | 0.00303 | -| n_updates | 181490 | -| policy_gradient_loss | 0.00163 | -| std | 0.00817 | -| value_loss | 0.00318 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18151 | -| time_elapsed | 98187 | -| total_timesteps | 2323328 | -| train/ | | -| approx_kl | 0.028685434 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 181500 | -| policy_gradient_loss | 0.0229 | -| std | 0.00816 | -| value_loss | 7.2e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18152 | -| time_elapsed | 98191 | -| total_timesteps | 2323456 | -| train/ | | -| approx_kl | 0.6422471 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -14 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 181510 | -| policy_gradient_loss | 0.0518 | -| std | 0.00817 | -| value_loss | 3.21e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18153 | -| time_elapsed | 98196 | -| total_timesteps | 2323584 | -| train/ | | -| approx_kl | 0.0058916 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00181 | -| learning_rate | 0.0003 | -| loss | -0.00564 | -| n_updates | 181520 | -| policy_gradient_loss | 0.0216 | -| std | 0.00817 | -| value_loss | 3.19e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18154 | -| time_elapsed | 98200 | -| total_timesteps | 2323712 | -| train/ | | -| approx_kl | 0.0514449 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 181530 | -| policy_gradient_loss | 0.0179 | -| std | 0.00816 | -| value_loss | 1.12e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18155 | -| time_elapsed | 98204 | -| total_timesteps | 2323840 | -| train/ | | -| approx_kl | 0.08488344 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 181540 | -| policy_gradient_loss | 0.0142 | -| std | 0.00816 | -| value_loss | 8.07e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18156 | -| time_elapsed | 98208 | -| total_timesteps | 2323968 | -| train/ | | -| approx_kl | 0.01585456 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 181550 | -| policy_gradient_loss | 0.0229 | -| std | 0.00816 | -| value_loss | 5.5e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18157 | -| time_elapsed | 98212 | -| total_timesteps | 2324096 | -| train/ | | -| approx_kl | 0.17019606 | -| clip_fraction | 0.624 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 181560 | -| policy_gradient_loss | 0.0821 | -| std | 0.00816 | -| value_loss | 5.35e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18158 | -| time_elapsed | 98224 | -| total_timesteps | 2324224 | -| train/ | | -| approx_kl | 0.22074921 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | 0.0646 | -| n_updates | 181570 | -| policy_gradient_loss | 0.0657 | -| std | 0.00816 | -| value_loss | 0.00214 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18159 | -| time_elapsed | 98229 | -| total_timesteps | 2324352 | -| train/ | | -| approx_kl | 0.15568894 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0857 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 181580 | -| policy_gradient_loss | 0.116 | -| std | 0.00816 | -| value_loss | 3.92e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18160 | -| time_elapsed | 98234 | -| total_timesteps | 2324480 | -| train/ | | -| approx_kl | 0.02314917 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00827 | -| learning_rate | 0.0003 | -| loss | 0.00829 | -| n_updates | 181590 | -| policy_gradient_loss | 0.0131 | -| std | 0.00816 | -| value_loss | 1.13e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18161 | -| time_elapsed | 98238 | -| total_timesteps | 2324608 | -| train/ | | -| approx_kl | 0.3564774 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00701 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 181600 | -| policy_gradient_loss | 0.0377 | -| std | 0.00815 | -| value_loss | 4.09e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18162 | -| time_elapsed | 98242 | -| total_timesteps | 2324736 | -| train/ | | -| approx_kl | 0.0107790865 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 181610 | -| policy_gradient_loss | 0.0061 | -| std | 0.00815 | -| value_loss | 2.44e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18163 | -| time_elapsed | 98246 | -| total_timesteps | 2324864 | -| train/ | | -| approx_kl | 0.04667346 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 181620 | -| policy_gradient_loss | 0.0096 | -| std | 0.00814 | -| value_loss | 2.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18164 | -| time_elapsed | 98251 | -| total_timesteps | 2324992 | -| train/ | | -| approx_kl | 0.007078279 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 181630 | -| policy_gradient_loss | 0.00231 | -| std | 0.00814 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18165 | -| time_elapsed | 98256 | -| total_timesteps | 2325120 | -| train/ | | -| approx_kl | 0.05636397 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 181640 | -| policy_gradient_loss | 0.0276 | -| std | 0.00814 | -| value_loss | 1.11e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18166 | -| time_elapsed | 98268 | -| total_timesteps | 2325248 | -| train/ | | -| approx_kl | 0.6810447 | -| clip_fraction | 0.694 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.895 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 181650 | -| policy_gradient_loss | 0.0737 | -| std | 0.00814 | -| value_loss | 0.00111 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18167 | -| time_elapsed | 98274 | -| total_timesteps | 2325376 | -| train/ | | -| approx_kl | 0.30608842 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00994 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 181660 | -| policy_gradient_loss | 0.0386 | -| std | 0.00814 | -| value_loss | 4.32e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18168 | -| time_elapsed | 98278 | -| total_timesteps | 2325504 | -| train/ | | -| approx_kl | 0.03134891 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00904 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 181670 | -| policy_gradient_loss | 0.00735 | -| std | 0.00814 | -| value_loss | 8.58e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18169 | -| time_elapsed | 98283 | -| total_timesteps | 2325632 | -| train/ | | -| approx_kl | 0.00026893336 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 181680 | -| policy_gradient_loss | 0.00038 | -| std | 0.00813 | -| value_loss | 5.05e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18170 | -| time_elapsed | 98287 | -| total_timesteps | 2325760 | -| train/ | | -| approx_kl | 0.022854965 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0971 | -| learning_rate | 0.0003 | -| loss | 0.00636 | -| n_updates | 181690 | -| policy_gradient_loss | 0.00356 | -| std | 0.00813 | -| value_loss | 2.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18171 | -| time_elapsed | 98292 | -| total_timesteps | 2325888 | -| train/ | | -| approx_kl | 0.006512889 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0955 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 181700 | -| policy_gradient_loss | 0.00341 | -| std | 0.00812 | -| value_loss | 9.43e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18172 | -| time_elapsed | 98297 | -| total_timesteps | 2326016 | -| train/ | | -| approx_kl | 0.03618695 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 181710 | -| policy_gradient_loss | 0.00465 | -| std | 0.00812 | -| value_loss | 7.59e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18173 | -| time_elapsed | 98308 | -| total_timesteps | 2326144 | -| train/ | | -| approx_kl | 0.05615091 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.644 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 181720 | -| policy_gradient_loss | -0.00825 | -| std | 0.00812 | -| value_loss | 0.000658 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18174 | -| time_elapsed | 98313 | -| total_timesteps | 2326272 | -| train/ | | -| approx_kl | 0.024844814 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.538 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 181730 | -| policy_gradient_loss | 0.000579 | -| std | 0.00812 | -| value_loss | 6.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18175 | -| time_elapsed | 98318 | -| total_timesteps | 2326400 | -| train/ | | -| approx_kl | 0.090344205 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 181740 | -| policy_gradient_loss | 0.0113 | -| std | 0.00812 | -| value_loss | 6.38e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18176 | -| time_elapsed | 98323 | -| total_timesteps | 2326528 | -| train/ | | -| approx_kl | 0.23919417 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | 0.0856 | -| n_updates | 181750 | -| policy_gradient_loss | 0.0602 | -| std | 0.00812 | -| value_loss | 1.04e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18177 | -| time_elapsed | 98328 | -| total_timesteps | 2326656 | -| train/ | | -| approx_kl | 0.13683243 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | 0.0827 | -| n_updates | 181760 | -| policy_gradient_loss | 0.0769 | -| std | 0.00812 | -| value_loss | 7.44e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18178 | -| time_elapsed | 98333 | -| total_timesteps | 2326784 | -| train/ | | -| approx_kl | 0.10074811 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 181770 | -| policy_gradient_loss | 0.113 | -| std | 0.00812 | -| value_loss | 7.31e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18179 | -| time_elapsed | 98338 | -| total_timesteps | 2326912 | -| train/ | | -| approx_kl | 0.10297694 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0688 | -| n_updates | 181780 | -| policy_gradient_loss | 0.107 | -| std | 0.00812 | -| value_loss | 4.16e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18180 | -| time_elapsed | 98346 | -| total_timesteps | 2327040 | -| train/ | | -| approx_kl | 0.11025217 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0812 | -| learning_rate | 0.0003 | -| loss | 0.0992 | -| n_updates | 181790 | -| policy_gradient_loss | 0.0994 | -| std | 0.00813 | -| value_loss | 2.13e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18181 | -| time_elapsed | 98355 | -| total_timesteps | 2327168 | -| train/ | | -| approx_kl | 0.18670276 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | 0.00799 | -| n_updates | 181800 | -| policy_gradient_loss | 0.00828 | -| std | 0.00813 | -| value_loss | 0.000594 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18182 | -| time_elapsed | 98360 | -| total_timesteps | 2327296 | -| train/ | | -| approx_kl | 0.03421672 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 181810 | -| policy_gradient_loss | 0.00502 | -| std | 0.00812 | -| value_loss | 2.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18183 | -| time_elapsed | 98364 | -| total_timesteps | 2327424 | -| train/ | | -| approx_kl | 0.20075315 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0835 | -| n_updates | 181820 | -| policy_gradient_loss | 0.0292 | -| std | 0.00813 | -| value_loss | 3.37e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18184 | -| time_elapsed | 98368 | -| total_timesteps | 2327552 | -| train/ | | -| approx_kl | 0.00042813644 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00377 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 181830 | -| policy_gradient_loss | 0.00338 | -| std | 0.00813 | -| value_loss | 2.4e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18185 | -| time_elapsed | 98373 | -| total_timesteps | 2327680 | -| train/ | | -| approx_kl | 0.052004643 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00616 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 181840 | -| policy_gradient_loss | 0.0628 | -| std | 0.00813 | -| value_loss | 1.88e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18186 | -| time_elapsed | 98376 | -| total_timesteps | 2327808 | -| train/ | | -| approx_kl | 0.14449829 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00952 | -| learning_rate | 0.0003 | -| loss | 0.0651 | -| n_updates | 181850 | -| policy_gradient_loss | 0.0271 | -| std | 0.00813 | -| value_loss | 1.41e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18187 | -| time_elapsed | 98381 | -| total_timesteps | 2327936 | -| train/ | | -| approx_kl | 0.035038747 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 181860 | -| policy_gradient_loss | 0.0507 | -| std | 0.00813 | -| value_loss | 1.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18188 | -| time_elapsed | 98385 | -| total_timesteps | 2328064 | -| train/ | | -| approx_kl | 0.032423403 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 181870 | -| policy_gradient_loss | 0.0246 | -| std | 0.00813 | -| value_loss | 8.61e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18189 | -| time_elapsed | 98393 | -| total_timesteps | 2328192 | -| train/ | | -| approx_kl | 0.024315879 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 181880 | -| policy_gradient_loss | -0.0104 | -| std | 0.00813 | -| value_loss | 0.000198 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18190 | -| time_elapsed | 98397 | -| total_timesteps | 2328320 | -| train/ | | -| approx_kl | 0.045989804 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 181890 | -| policy_gradient_loss | 0.0384 | -| std | 0.00813 | -| value_loss | 1.82e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18191 | -| time_elapsed | 98401 | -| total_timesteps | 2328448 | -| train/ | | -| approx_kl | 0.12503833 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.000724 | -| learning_rate | 0.0003 | -| loss | 0.0588 | -| n_updates | 181900 | -| policy_gradient_loss | 0.0305 | -| std | 0.00813 | -| value_loss | 2.69e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18192 | -| time_elapsed | 98404 | -| total_timesteps | 2328576 | -| train/ | | -| approx_kl | 0.032043837 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00986 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 181910 | -| policy_gradient_loss | 0.0496 | -| std | 0.00813 | -| value_loss | 1.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18193 | -| time_elapsed | 98408 | -| total_timesteps | 2328704 | -| train/ | | -| approx_kl | 0.012770011 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | -0.0018 | -| n_updates | 181920 | -| policy_gradient_loss | 0.0148 | -| std | 0.00813 | -| value_loss | 1.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18194 | -| time_elapsed | 98413 | -| total_timesteps | 2328832 | -| train/ | | -| approx_kl | 0.15134692 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 181930 | -| policy_gradient_loss | 0.0475 | -| std | 0.00813 | -| value_loss | 6.44e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18195 | -| time_elapsed | 98419 | -| total_timesteps | 2328960 | -| train/ | | -| approx_kl | 0.00065405946 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 181940 | -| policy_gradient_loss | -0.00161 | -| std | 0.00813 | -| value_loss | 5.45e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18196 | -| time_elapsed | 98424 | -| total_timesteps | 2329088 | -| train/ | | -| approx_kl | 0.0509816 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 181950 | -| policy_gradient_loss | 0.055 | -| std | 0.00813 | -| value_loss | 5.19e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18197 | -| time_elapsed | 98434 | -| total_timesteps | 2329216 | -| train/ | | -| approx_kl | 0.017721647 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.227 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 181960 | -| policy_gradient_loss | -0.0133 | -| std | 0.00813 | -| value_loss | 0.00101 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18198 | -| time_elapsed | 98439 | -| total_timesteps | 2329344 | -| train/ | | -| approx_kl | 0.010656334 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.942 | -| learning_rate | 0.0003 | -| loss | 0.00507 | -| n_updates | 181970 | -| policy_gradient_loss | 0.00245 | -| std | 0.00813 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18199 | -| time_elapsed | 98445 | -| total_timesteps | 2329472 | -| train/ | | -| approx_kl | 0.027244626 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00282 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 181980 | -| policy_gradient_loss | 0.0387 | -| std | 0.00813 | -| value_loss | 4.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18200 | -| time_elapsed | 98452 | -| total_timesteps | 2329600 | -| train/ | | -| approx_kl | 0.014123047 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0588 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 181990 | -| policy_gradient_loss | -0.00632 | -| std | 0.00814 | -| value_loss | 6.13e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18201 | -| time_elapsed | 98458 | -| total_timesteps | 2329728 | -| train/ | | -| approx_kl | 0.05885618 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00859 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 182000 | -| policy_gradient_loss | 0.00932 | -| std | 0.00816 | -| value_loss | 5.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18202 | -| time_elapsed | 98464 | -| total_timesteps | 2329856 | -| train/ | | -| approx_kl | 0.24168396 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.237 | -| n_updates | 182010 | -| policy_gradient_loss | 0.135 | -| std | 0.00817 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18203 | -| time_elapsed | 98469 | -| total_timesteps | 2329984 | -| train/ | | -| approx_kl | 0.032904785 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00625 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 182020 | -| policy_gradient_loss | 0.0186 | -| std | 0.00817 | -| value_loss | 2.67e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18204 | -| time_elapsed | 98474 | -| total_timesteps | 2330112 | -| train/ | | -| approx_kl | 0.00031210482 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 182030 | -| policy_gradient_loss | 0.0205 | -| std | 0.00818 | -| value_loss | 1.49e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18205 | -| time_elapsed | 98484 | -| total_timesteps | 2330240 | -| train/ | | -| approx_kl | 0.36818597 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.949 | -| learning_rate | 0.0003 | -| loss | 0.0838 | -| n_updates | 182040 | -| policy_gradient_loss | 0.0223 | -| std | 0.00818 | -| value_loss | 0.000388 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18206 | -| time_elapsed | 98488 | -| total_timesteps | 2330368 | -| train/ | | -| approx_kl | 0.021145247 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -7.89 | -| learning_rate | 0.0003 | -| loss | 0.00451 | -| n_updates | 182050 | -| policy_gradient_loss | 0.00348 | -| std | 0.00817 | -| value_loss | 3.55e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18207 | -| time_elapsed | 98494 | -| total_timesteps | 2330496 | -| train/ | | -| approx_kl | 0.0029573753 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 182060 | -| policy_gradient_loss | 0.00194 | -| std | 0.00817 | -| value_loss | 6.36e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18208 | -| time_elapsed | 98498 | -| total_timesteps | 2330624 | -| train/ | | -| approx_kl | 0.0010398985 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 182070 | -| policy_gradient_loss | 0.00347 | -| std | 0.00817 | -| value_loss | 2e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18209 | -| time_elapsed | 98502 | -| total_timesteps | 2330752 | -| train/ | | -| approx_kl | 2.626609e-05 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.000383 | -| learning_rate | 0.0003 | -| loss | 0.000337 | -| n_updates | 182080 | -| policy_gradient_loss | 0.0037 | -| std | 0.00817 | -| value_loss | 4.8e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18210 | -| time_elapsed | 98506 | -| total_timesteps | 2330880 | -| train/ | | -| approx_kl | 0.025452811 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 182090 | -| policy_gradient_loss | 9.32e-05 | -| std | 0.00817 | -| value_loss | 3.18e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18211 | -| time_elapsed | 98509 | -| total_timesteps | 2331008 | -| train/ | | -| approx_kl | 0.0341461 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.00749 | -| n_updates | 182100 | -| policy_gradient_loss | 0.00347 | -| std | 0.00816 | -| value_loss | 2.56e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18212 | -| time_elapsed | 98520 | -| total_timesteps | 2331136 | -| train/ | | -| approx_kl | 0.009231025 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | 0.000273 | -| n_updates | 182110 | -| policy_gradient_loss | 0.00103 | -| std | 0.00816 | -| value_loss | 4.65e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18213 | -| time_elapsed | 98525 | -| total_timesteps | 2331264 | -| train/ | | -| approx_kl | 0.027190207 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.105 | -| learning_rate | 0.0003 | -| loss | -0.00562 | -| n_updates | 182120 | -| policy_gradient_loss | 0.0114 | -| std | 0.00816 | -| value_loss | 4.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18214 | -| time_elapsed | 98530 | -| total_timesteps | 2331392 | -| train/ | | -| approx_kl | 0.010137774 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00592 | -| learning_rate | 0.0003 | -| loss | 0.00526 | -| n_updates | 182130 | -| policy_gradient_loss | 0.0253 | -| std | 0.00821 | -| value_loss | 5.5e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18215 | -| time_elapsed | 98536 | -| total_timesteps | 2331520 | -| train/ | | -| approx_kl | 0.12502977 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -33.8 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 182140 | -| policy_gradient_loss | 0.00311 | -| std | 0.00823 | -| value_loss | 3.2e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18216 | -| time_elapsed | 98542 | -| total_timesteps | 2331648 | -| train/ | | -| approx_kl | 0.013310755 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 182150 | -| policy_gradient_loss | 0.0159 | -| std | 0.00824 | -| value_loss | 5.01e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18217 | -| time_elapsed | 98546 | -| total_timesteps | 2331776 | -| train/ | | -| approx_kl | 0.15356798 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 182160 | -| policy_gradient_loss | 0.083 | -| std | 0.00825 | -| value_loss | 2.56e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18218 | -| time_elapsed | 98552 | -| total_timesteps | 2331904 | -| train/ | | -| approx_kl | 0.026546415 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0871 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 182170 | -| policy_gradient_loss | 0.00874 | -| std | 0.00825 | -| value_loss | 1.26e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18219 | -| time_elapsed | 98557 | -| total_timesteps | 2332032 | -| train/ | | -| approx_kl | 0.34691724 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 182180 | -| policy_gradient_loss | 0.0344 | -| std | 0.00825 | -| value_loss | 9.53e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18220 | -| time_elapsed | 98566 | -| total_timesteps | 2332160 | -| train/ | | -| approx_kl | 0.00433165 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 182190 | -| policy_gradient_loss | -0.00657 | -| std | 0.00825 | -| value_loss | 0.000137 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18221 | -| time_elapsed | 98573 | -| total_timesteps | 2332288 | -| train/ | | -| approx_kl | 0.01979576 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 182200 | -| policy_gradient_loss | 0.00683 | -| std | 0.00825 | -| value_loss | 2.02e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18222 | -| time_elapsed | 98578 | -| total_timesteps | 2332416 | -| train/ | | -| approx_kl | 0.0033913343 | -| clip_fraction | 0.0984 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00377 | -| learning_rate | 0.0003 | -| loss | -0.000951 | -| n_updates | 182210 | -| policy_gradient_loss | 0.00222 | -| std | 0.00825 | -| value_loss | 1.57e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18223 | -| time_elapsed | 98584 | -| total_timesteps | 2332544 | -| train/ | | -| approx_kl | 0.05252316 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 182220 | -| policy_gradient_loss | 0.00738 | -| std | 0.00825 | -| value_loss | 3.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18224 | -| time_elapsed | 98589 | -| total_timesteps | 2332672 | -| train/ | | -| approx_kl | 0.032129563 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00256 | -| learning_rate | 0.0003 | -| loss | -0.00909 | -| n_updates | 182230 | -| policy_gradient_loss | 0.019 | -| std | 0.00825 | -| value_loss | 2.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18225 | -| time_elapsed | 98595 | -| total_timesteps | 2332800 | -| train/ | | -| approx_kl | 0.08508174 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 182240 | -| policy_gradient_loss | 0.0479 | -| std | 0.00825 | -| value_loss | 9.67e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 18226 | -| time_elapsed | 98601 | -| total_timesteps | 2332928 | -| train/ | | -| approx_kl | 0.010314465 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.056 | -| learning_rate | 0.0003 | -| loss | 0.00377 | -| n_updates | 182250 | -| policy_gradient_loss | 0.00423 | -| std | 0.00824 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18227 | -| time_elapsed | 98606 | -| total_timesteps | 2333056 | -| train/ | | -| approx_kl | 0.044342775 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 182260 | -| policy_gradient_loss | 0.0111 | -| std | 0.00824 | -| value_loss | 4.93e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18228 | -| time_elapsed | 98616 | -| total_timesteps | 2333184 | -| train/ | | -| approx_kl | 0.00093234284 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 182270 | -| policy_gradient_loss | -0.0117 | -| std | 0.00823 | -| value_loss | 0.00686 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18229 | -| time_elapsed | 98620 | -| total_timesteps | 2333312 | -| train/ | | -| approx_kl | 0.057183236 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00219 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 182280 | -| policy_gradient_loss | 0.0018 | -| std | 0.00823 | -| value_loss | 1.95e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18230 | -| time_elapsed | 98625 | -| total_timesteps | 2333440 | -| train/ | | -| approx_kl | 0.010246992 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00194 | -| learning_rate | 0.0003 | -| loss | -0.000967 | -| n_updates | 182290 | -| policy_gradient_loss | 0.00208 | -| std | 0.00823 | -| value_loss | 3.9e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18231 | -| time_elapsed | 98630 | -| total_timesteps | 2333568 | -| train/ | | -| approx_kl | 0.04904588 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | 0.00173 | -| n_updates | 182300 | -| policy_gradient_loss | 0.0149 | -| std | 0.00823 | -| value_loss | 1.05e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18232 | -| time_elapsed | 98636 | -| total_timesteps | 2333696 | -| train/ | | -| approx_kl | 0.05577977 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0623 | -| n_updates | 182310 | -| policy_gradient_loss | 0.0303 | -| std | 0.00823 | -| value_loss | 4.55e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18233 | -| time_elapsed | 98641 | -| total_timesteps | 2333824 | -| train/ | | -| approx_kl | 3.678724e-08 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -3.75e-05 | -| n_updates | 182320 | -| policy_gradient_loss | 0.00459 | -| std | 0.00823 | -| value_loss | 3.78e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18234 | -| time_elapsed | 98647 | -| total_timesteps | 2333952 | -| train/ | | -| approx_kl | 0.0047397916 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.00905 | -| n_updates | 182330 | -| policy_gradient_loss | 0.00489 | -| std | 0.00823 | -| value_loss | 2.36e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18235 | -| time_elapsed | 98652 | -| total_timesteps | 2334080 | -| train/ | | -| approx_kl | 0.017893378 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00999 | -| n_updates | 182340 | -| policy_gradient_loss | 0.0272 | -| std | 0.00823 | -| value_loss | 1.39e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18236 | -| time_elapsed | 98659 | -| total_timesteps | 2334208 | -| train/ | | -| approx_kl | 0.08225866 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | 0.0329 | -| n_updates | 182350 | -| policy_gradient_loss | 0.0207 | -| std | 0.00823 | -| value_loss | 0.000731 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18237 | -| time_elapsed | 98664 | -| total_timesteps | 2334336 | -| train/ | | -| approx_kl | 0.0036956724 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0054 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 182360 | -| policy_gradient_loss | 0.00519 | -| std | 0.00823 | -| value_loss | 3.3e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18238 | -| time_elapsed | 98670 | -| total_timesteps | 2334464 | -| train/ | | -| approx_kl | 3.0961353e-05 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00345 | -| learning_rate | 0.0003 | -| loss | -0.000206 | -| n_updates | 182370 | -| policy_gradient_loss | 0.00794 | -| std | 0.00823 | -| value_loss | 4.38e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18239 | -| time_elapsed | 98675 | -| total_timesteps | 2334592 | -| train/ | | -| approx_kl | 0.23512313 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 182380 | -| policy_gradient_loss | -0.00274 | -| std | 0.00823 | -| value_loss | 3.08e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18240 | -| time_elapsed | 98679 | -| total_timesteps | 2334720 | -| train/ | | -| approx_kl | 0.010992756 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 182390 | -| policy_gradient_loss | 0.0085 | -| std | 0.00823 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18241 | -| time_elapsed | 98683 | -| total_timesteps | 2334848 | -| train/ | | -| approx_kl | 0.15864292 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 182400 | -| policy_gradient_loss | 0.119 | -| std | 0.00823 | -| value_loss | 1.41e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 18242 | -| time_elapsed | 98688 | -| total_timesteps | 2334976 | -| train/ | | -| approx_kl | 0.10486955 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.09 | -| n_updates | 182410 | -| policy_gradient_loss | 0.0847 | -| std | 0.00823 | -| value_loss | 1.36e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18243 | -| time_elapsed | 98693 | -| total_timesteps | 2335104 | -| train/ | | -| approx_kl | 0.019133288 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 182420 | -| policy_gradient_loss | 0.0139 | -| std | 0.00823 | -| value_loss | 6.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18244 | -| time_elapsed | 98704 | -| total_timesteps | 2335232 | -| train/ | | -| approx_kl | 0.008878058 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 182430 | -| policy_gradient_loss | -0.0134 | -| std | 0.00823 | -| value_loss | 0.00465 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18245 | -| time_elapsed | 98709 | -| total_timesteps | 2335360 | -| train/ | | -| approx_kl | 0.03483883 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0901 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 182440 | -| policy_gradient_loss | 0.0199 | -| std | 0.00823 | -| value_loss | 0.000195 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18246 | -| time_elapsed | 98713 | -| total_timesteps | 2335488 | -| train/ | | -| approx_kl | 0.35823682 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00468 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 182450 | -| policy_gradient_loss | 0.0453 | -| std | 0.00823 | -| value_loss | 3.14e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18247 | -| time_elapsed | 98718 | -| total_timesteps | 2335616 | -| train/ | | -| approx_kl | 0.008238269 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 182460 | -| policy_gradient_loss | -1.44e-05 | -| std | 0.00823 | -| value_loss | 1.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18248 | -| time_elapsed | 98723 | -| total_timesteps | 2335744 | -| train/ | | -| approx_kl | 0.000442354 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.00306 | -| n_updates | 182470 | -| policy_gradient_loss | 0.000655 | -| std | 0.00823 | -| value_loss | 1.03e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18249 | -| time_elapsed | 98727 | -| total_timesteps | 2335872 | -| train/ | | -| approx_kl | 6.025657e-07 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.000143 | -| n_updates | 182480 | -| policy_gradient_loss | -0.0022 | -| std | 0.00823 | -| value_loss | 8.08e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18250 | -| time_elapsed | 98732 | -| total_timesteps | 2336000 | -| train/ | | -| approx_kl | 1.9413419e-05 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.000648 | -| n_updates | 182490 | -| policy_gradient_loss | 0.0033 | -| std | 0.00822 | -| value_loss | 5.52e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18251 | -| time_elapsed | 98735 | -| total_timesteps | 2336128 | -| train/ | | -| approx_kl | 0.031436823 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00449 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 182500 | -| policy_gradient_loss | -0.00152 | -| std | 0.00822 | -| value_loss | 2.32e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18252 | -| time_elapsed | 98745 | -| total_timesteps | 2336256 | -| train/ | | -| approx_kl | 0.030603118 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.865 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 182510 | -| policy_gradient_loss | -0.00186 | -| std | 0.00822 | -| value_loss | 0.00167 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18253 | -| time_elapsed | 98748 | -| total_timesteps | 2336384 | -| train/ | | -| approx_kl | 0.030878328 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00268 | -| learning_rate | 0.0003 | -| loss | -0.00783 | -| n_updates | 182520 | -| policy_gradient_loss | -0.00437 | -| std | 0.00822 | -| value_loss | 6.87e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18254 | -| time_elapsed | 98752 | -| total_timesteps | 2336512 | -| train/ | | -| approx_kl | 0.0001423657 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00012 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 182530 | -| policy_gradient_loss | 0.0015 | -| std | 0.00822 | -| value_loss | 2.7e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18255 | -| time_elapsed | 98757 | -| total_timesteps | 2336640 | -| train/ | | -| approx_kl | 0.028333822 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.091 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 182540 | -| policy_gradient_loss | -0.00262 | -| std | 0.00822 | -| value_loss | 2.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18256 | -| time_elapsed | 98760 | -| total_timesteps | 2336768 | -| train/ | | -| approx_kl | 0.030506313 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 182550 | -| policy_gradient_loss | 0.00948 | -| std | 0.00822 | -| value_loss | 3.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18257 | -| time_elapsed | 98766 | -| total_timesteps | 2336896 | -| train/ | | -| approx_kl | 0.037329603 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 182560 | -| policy_gradient_loss | 0.0112 | -| std | 0.00822 | -| value_loss | 3.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18258 | -| time_elapsed | 98770 | -| total_timesteps | 2337024 | -| train/ | | -| approx_kl | 0.03129571 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 182570 | -| policy_gradient_loss | -0.0118 | -| std | 0.00822 | -| value_loss | 1.48e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18259 | -| time_elapsed | 98782 | -| total_timesteps | 2337152 | -| train/ | | -| approx_kl | 0.008807254 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 182580 | -| policy_gradient_loss | -0.00558 | -| std | 0.00822 | -| value_loss | 0.00199 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18260 | -| time_elapsed | 98786 | -| total_timesteps | 2337280 | -| train/ | | -| approx_kl | 0.036645852 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | 0.0159 | -| n_updates | 182590 | -| policy_gradient_loss | 0.00589 | -| std | 0.00822 | -| value_loss | 9.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18261 | -| time_elapsed | 98790 | -| total_timesteps | 2337408 | -| train/ | | -| approx_kl | 0.026759775 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 182600 | -| policy_gradient_loss | 0.0058 | -| std | 0.00822 | -| value_loss | 4.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18262 | -| time_elapsed | 98795 | -| total_timesteps | 2337536 | -| train/ | | -| approx_kl | 0.03039676 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.367 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 182610 | -| policy_gradient_loss | 0.00862 | -| std | 0.00822 | -| value_loss | 2.79e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18263 | -| time_elapsed | 98798 | -| total_timesteps | 2337664 | -| train/ | | -| approx_kl | 0.0047975676 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.00447 | -| n_updates | 182620 | -| policy_gradient_loss | 0.00197 | -| std | 0.00822 | -| value_loss | 3.3e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18264 | -| time_elapsed | 98802 | -| total_timesteps | 2337792 | -| train/ | | -| approx_kl | 0.0217169 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 182630 | -| policy_gradient_loss | 0.0987 | -| std | 0.00822 | -| value_loss | 1.03e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 18265 | -| time_elapsed | 98808 | -| total_timesteps | 2337920 | -| train/ | | -| approx_kl | 0.0075370017 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 4.17e-05 | -| n_updates | 182640 | -| policy_gradient_loss | 0.0217 | -| std | 0.00822 | -| value_loss | 7.49e-08 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18266 | -| time_elapsed | 98812 | -| total_timesteps | 2338048 | -| train/ | | -| approx_kl | 0.401105 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 182650 | -| policy_gradient_loss | 0.0376 | -| std | 0.00822 | -| value_loss | 6.11e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18267 | -| time_elapsed | 98822 | -| total_timesteps | 2338176 | -| train/ | | -| approx_kl | 0.002771461 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.697 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 182660 | -| policy_gradient_loss | -0.00946 | -| std | 0.00822 | -| value_loss | 0.00783 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18268 | -| time_elapsed | 98827 | -| total_timesteps | 2338304 | -| train/ | | -| approx_kl | 0.037876282 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0656 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 182670 | -| policy_gradient_loss | 0.0369 | -| std | 0.00821 | -| value_loss | 7.01e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18269 | -| time_elapsed | 98831 | -| total_timesteps | 2338432 | -| train/ | | -| approx_kl | 0.53363806 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | 0.403 | -| n_updates | 182680 | -| policy_gradient_loss | 0.124 | -| std | 0.0082 | -| value_loss | 0.000252 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18270 | -| time_elapsed | 98836 | -| total_timesteps | 2338560 | -| train/ | | -| approx_kl | 0.015277859 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | 0.00805 | -| n_updates | 182690 | -| policy_gradient_loss | 0.01 | -| std | 0.0082 | -| value_loss | 1.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18271 | -| time_elapsed | 98841 | -| total_timesteps | 2338688 | -| train/ | | -| approx_kl | 0.040438466 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | -0.000692 | -| n_updates | 182700 | -| policy_gradient_loss | 0.00964 | -| std | 0.0082 | -| value_loss | 4.61e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18272 | -| time_elapsed | 98846 | -| total_timesteps | 2338816 | -| train/ | | -| approx_kl | 4.3713953e-05 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.000244 | -| n_updates | 182710 | -| policy_gradient_loss | 0.0197 | -| std | 0.0082 | -| value_loss | 3.41e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18273 | -| time_elapsed | 98850 | -| total_timesteps | 2338944 | -| train/ | | -| approx_kl | 0.033018984 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 182720 | -| policy_gradient_loss | -0.0102 | -| std | 0.00819 | -| value_loss | 2.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18274 | -| time_elapsed | 98855 | -| total_timesteps | 2339072 | -| train/ | | -| approx_kl | 0.031391796 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 182730 | -| policy_gradient_loss | -0.00576 | -| std | 0.0082 | -| value_loss | 1.81e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18275 | -| time_elapsed | 98862 | -| total_timesteps | 2339200 | -| train/ | | -| approx_kl | 0.0817807 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.785 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 182740 | -| policy_gradient_loss | 0.009 | -| std | 0.0082 | -| value_loss | 0.00426 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18276 | -| time_elapsed | 98870 | -| total_timesteps | 2339328 | -| train/ | | -| approx_kl | 0.03883563 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -4.09 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 182750 | -| policy_gradient_loss | 0.0083 | -| std | 0.0082 | -| value_loss | 2.4e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18277 | -| time_elapsed | 98877 | -| total_timesteps | 2339456 | -| train/ | | -| approx_kl | 0.057569362 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0511 | -| n_updates | 182760 | -| policy_gradient_loss | 0.0202 | -| std | 0.00817 | -| value_loss | 2.77e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18278 | -| time_elapsed | 98883 | -| total_timesteps | 2339584 | -| train/ | | -| approx_kl | 0.016166003 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.00602 | -| n_updates | 182770 | -| policy_gradient_loss | 0.00141 | -| std | 0.00815 | -| value_loss | 5.93e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18279 | -| time_elapsed | 98887 | -| total_timesteps | 2339712 | -| train/ | | -| approx_kl | 0.013173975 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00879 | -| learning_rate | 0.0003 | -| loss | 0.000899 | -| n_updates | 182780 | -| policy_gradient_loss | 0.0147 | -| std | 0.00815 | -| value_loss | 7.17e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18280 | -| time_elapsed | 98892 | -| total_timesteps | 2339840 | -| train/ | | -| approx_kl | 0.1633098 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 182790 | -| policy_gradient_loss | 0.0835 | -| std | 0.00815 | -| value_loss | 1.83e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18281 | -| time_elapsed | 98896 | -| total_timesteps | 2339968 | -| train/ | | -| approx_kl | 0.10777536 | -| clip_fraction | 0.636 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 182800 | -| policy_gradient_loss | 0.105 | -| std | 0.00815 | -| value_loss | 1.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18282 | -| time_elapsed | 98901 | -| total_timesteps | 2340096 | -| train/ | | -| approx_kl | 0.024690647 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 182810 | -| policy_gradient_loss | 0.0208 | -| std | 0.00814 | -| value_loss | 1.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18283 | -| time_elapsed | 98911 | -| total_timesteps | 2340224 | -| train/ | | -| approx_kl | 0.29498172 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | 0.0411 | -| n_updates | 182820 | -| policy_gradient_loss | 0.0106 | -| std | 0.00814 | -| value_loss | 0.00101 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18284 | -| time_elapsed | 98917 | -| total_timesteps | 2340352 | -| train/ | | -| approx_kl | 0.24002014 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00712 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 182830 | -| policy_gradient_loss | 0.0393 | -| std | 0.00814 | -| value_loss | 6.67e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18285 | -| time_elapsed | 98921 | -| total_timesteps | 2340480 | -| train/ | | -| approx_kl | 0.0035604183 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00967 | -| learning_rate | 0.0003 | -| loss | -0.00313 | -| n_updates | 182840 | -| policy_gradient_loss | 0.00523 | -| std | 0.00814 | -| value_loss | 1.62e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18286 | -| time_elapsed | 98926 | -| total_timesteps | 2340608 | -| train/ | | -| approx_kl | 0.057869956 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 182850 | -| policy_gradient_loss | 0.00771 | -| std | 0.00814 | -| value_loss | 1.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18287 | -| time_elapsed | 98932 | -| total_timesteps | 2340736 | -| train/ | | -| approx_kl | 0.15869337 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 182860 | -| policy_gradient_loss | 0.0252 | -| std | 0.00813 | -| value_loss | 7.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18288 | -| time_elapsed | 98937 | -| total_timesteps | 2340864 | -| train/ | | -| approx_kl | 0.30782655 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 182870 | -| policy_gradient_loss | 0.0366 | -| std | 0.00813 | -| value_loss | 4.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 18289 | -| time_elapsed | 98942 | -| total_timesteps | 2340992 | -| train/ | | -| approx_kl | 0.02503017 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.00203 | -| n_updates | 182880 | -| policy_gradient_loss | 0.00151 | -| std | 0.00813 | -| value_loss | 3.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18290 | -| time_elapsed | 98948 | -| total_timesteps | 2341120 | -| train/ | | -| approx_kl | 0.025312306 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 182890 | -| policy_gradient_loss | 0.000619 | -| std | 0.00813 | -| value_loss | 2.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18291 | -| time_elapsed | 98959 | -| total_timesteps | 2341248 | -| train/ | | -| approx_kl | 0.07834981 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 182900 | -| policy_gradient_loss | -0.0104 | -| std | 0.00813 | -| value_loss | 0.000242 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18292 | -| time_elapsed | 98964 | -| total_timesteps | 2341376 | -| train/ | | -| approx_kl | 0.19272369 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | 0.0694 | -| n_updates | 182910 | -| policy_gradient_loss | 0.0242 | -| std | 0.00813 | -| value_loss | 1.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18293 | -| time_elapsed | 98968 | -| total_timesteps | 2341504 | -| train/ | | -| approx_kl | 0.049220808 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 182920 | -| policy_gradient_loss | 0.0466 | -| std | 0.00813 | -| value_loss | 7.35e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18294 | -| time_elapsed | 98974 | -| total_timesteps | 2341632 | -| train/ | | -| approx_kl | 0.02527409 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00227 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 182930 | -| policy_gradient_loss | 0.014 | -| std | 0.00813 | -| value_loss | 5.1e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18295 | -| time_elapsed | 98978 | -| total_timesteps | 2341760 | -| train/ | | -| approx_kl | 0.00028807065 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.00208 | -| n_updates | 182940 | -| policy_gradient_loss | 0.0613 | -| std | 0.00813 | -| value_loss | 2.53e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18296 | -| time_elapsed | 98983 | -| total_timesteps | 2341888 | -| train/ | | -| approx_kl | 0.016807925 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 182950 | -| policy_gradient_loss | 0.0229 | -| std | 0.00813 | -| value_loss | 1.62e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18297 | -| time_elapsed | 98987 | -| total_timesteps | 2342016 | -| train/ | | -| approx_kl | 0.22943565 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 182960 | -| policy_gradient_loss | 0.118 | -| std | 0.00813 | -| value_loss | 1.66e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18298 | -| time_elapsed | 98998 | -| total_timesteps | 2342144 | -| train/ | | -| approx_kl | 0.03862885 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.781 | -| learning_rate | 0.0003 | -| loss | -0.00975 | -| n_updates | 182970 | -| policy_gradient_loss | -0.011 | -| std | 0.00813 | -| value_loss | 0.00447 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18299 | -| time_elapsed | 99003 | -| total_timesteps | 2342272 | -| train/ | | -| approx_kl | 0.022603212 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.359 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 182980 | -| policy_gradient_loss | -0.00614 | -| std | 0.00813 | -| value_loss | 2.05e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18300 | -| time_elapsed | 99009 | -| total_timesteps | 2342400 | -| train/ | | -| approx_kl | 2.7120113e-06 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00583 | -| learning_rate | 0.0003 | -| loss | -0.000171 | -| n_updates | 182990 | -| policy_gradient_loss | 0.00244 | -| std | 0.00813 | -| value_loss | 1.29e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18301 | -| time_elapsed | 99014 | -| total_timesteps | 2342528 | -| train/ | | -| approx_kl | 0.030769926 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0606 | -| learning_rate | 0.0003 | -| loss | 0.00671 | -| n_updates | 183000 | -| policy_gradient_loss | 0.00298 | -| std | 0.00813 | -| value_loss | 7.96e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18302 | -| time_elapsed | 99019 | -| total_timesteps | 2342656 | -| train/ | | -| approx_kl | 0.02943091 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 183010 | -| policy_gradient_loss | -0.00201 | -| std | 0.00813 | -| value_loss | 6.36e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18303 | -| time_elapsed | 99024 | -| total_timesteps | 2342784 | -| train/ | | -| approx_kl | 0.006082154 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 183020 | -| policy_gradient_loss | 0.00274 | -| std | 0.00813 | -| value_loss | 5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 18304 | -| time_elapsed | 99029 | -| total_timesteps | 2342912 | -| train/ | | -| approx_kl | 0.025849145 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 183030 | -| policy_gradient_loss | 0.0959 | -| std | 0.00813 | -| value_loss | 2.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18305 | -| time_elapsed | 99034 | -| total_timesteps | 2343040 | -| train/ | | -| approx_kl | 0.054660402 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.0501 | -| n_updates | 183040 | -| policy_gradient_loss | 0.0758 | -| std | 0.00813 | -| value_loss | 2.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18306 | -| time_elapsed | 99044 | -| total_timesteps | 2343168 | -| train/ | | -| approx_kl | 0.008073672 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.874 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 183050 | -| policy_gradient_loss | -0.00696 | -| std | 0.00813 | -| value_loss | 0.00174 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18307 | -| time_elapsed | 99050 | -| total_timesteps | 2343296 | -| train/ | | -| approx_kl | 0.062335365 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.0395 | -| n_updates | 183060 | -| policy_gradient_loss | 0.0137 | -| std | 0.00813 | -| value_loss | 1.31e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18308 | -| time_elapsed | 99056 | -| total_timesteps | 2343424 | -| train/ | | -| approx_kl | 0.019431941 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00415 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 183070 | -| policy_gradient_loss | 0.00173 | -| std | 0.00813 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18309 | -| time_elapsed | 99062 | -| total_timesteps | 2343552 | -| train/ | | -| approx_kl | 0.026083859 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 183080 | -| policy_gradient_loss | 0.00453 | -| std | 0.00813 | -| value_loss | 1.1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18310 | -| time_elapsed | 99067 | -| total_timesteps | 2343680 | -| train/ | | -| approx_kl | 0.0064237327 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 183090 | -| policy_gradient_loss | 0.00579 | -| std | 0.00813 | -| value_loss | 6.94e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18311 | -| time_elapsed | 99071 | -| total_timesteps | 2343808 | -| train/ | | -| approx_kl | 0.00057939254 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0679 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 183100 | -| policy_gradient_loss | 0.000831 | -| std | 0.00813 | -| value_loss | 4.62e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18312 | -| time_elapsed | 99077 | -| total_timesteps | 2343936 | -| train/ | | -| approx_kl | 0.0038755913 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 183110 | -| policy_gradient_loss | 0.00447 | -| std | 0.00813 | -| value_loss | 2.63e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18313 | -| time_elapsed | 99083 | -| total_timesteps | 2344064 | -| train/ | | -| approx_kl | 0.022690905 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 183120 | -| policy_gradient_loss | 0.0722 | -| std | 0.00813 | -| value_loss | 2.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18314 | -| time_elapsed | 99091 | -| total_timesteps | 2344192 | -| train/ | | -| approx_kl | 0.11186093 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | 0.0377 | -| n_updates | 183130 | -| policy_gradient_loss | 0.0441 | -| std | 0.00813 | -| value_loss | 0.000306 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18315 | -| time_elapsed | 99096 | -| total_timesteps | 2344320 | -| train/ | | -| approx_kl | 0.18961947 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00832 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 183140 | -| policy_gradient_loss | 0.1 | -| std | 0.00813 | -| value_loss | 1.31e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18316 | -| time_elapsed | 99101 | -| total_timesteps | 2344448 | -| train/ | | -| approx_kl | 0.024840554 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00493 | -| learning_rate | 0.0003 | -| loss | 0.00342 | -| n_updates | 183150 | -| policy_gradient_loss | 0.0142 | -| std | 0.00813 | -| value_loss | 5.12e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18317 | -| time_elapsed | 99104 | -| total_timesteps | 2344576 | -| train/ | | -| approx_kl | 0.11093181 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 183160 | -| policy_gradient_loss | 0.0151 | -| std | 0.00813 | -| value_loss | 2.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18318 | -| time_elapsed | 99107 | -| total_timesteps | 2344704 | -| train/ | | -| approx_kl | 0.013181593 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 183170 | -| policy_gradient_loss | 0.0108 | -| std | 0.00813 | -| value_loss | 1.64e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18319 | -| time_elapsed | 99111 | -| total_timesteps | 2344832 | -| train/ | | -| approx_kl | 0.06834236 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 183180 | -| policy_gradient_loss | 0.0137 | -| std | 0.00813 | -| value_loss | 1.32e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 18320 | -| time_elapsed | 99116 | -| total_timesteps | 2344960 | -| train/ | | -| approx_kl | 0.003635798 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.00184 | -| n_updates | 183190 | -| policy_gradient_loss | 0.00448 | -| std | 0.00814 | -| value_loss | 9.62e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18321 | -| time_elapsed | 99122 | -| total_timesteps | 2345088 | -| train/ | | -| approx_kl | 0.14328867 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0869 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 183200 | -| policy_gradient_loss | 0.0979 | -| std | 0.00814 | -| value_loss | 5.1e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18322 | -| time_elapsed | 99130 | -| total_timesteps | 2345216 | -| train/ | | -| approx_kl | 0.0443293 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -3.38 | -| learning_rate | 0.0003 | -| loss | 0.00865 | -| n_updates | 183210 | -| policy_gradient_loss | 0.00896 | -| std | 0.00814 | -| value_loss | 0.00281 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18323 | -| time_elapsed | 99135 | -| total_timesteps | 2345344 | -| train/ | | -| approx_kl | 0.0013396912 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | -0.000279 | -| n_updates | 183220 | -| policy_gradient_loss | 0.0154 | -| std | 0.00814 | -| value_loss | 9.6e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18324 | -| time_elapsed | 99140 | -| total_timesteps | 2345472 | -| train/ | | -| approx_kl | 0.5818911 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | 0.302 | -| n_updates | 183230 | -| policy_gradient_loss | 0.121 | -| std | 0.00814 | -| value_loss | 5.74e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18325 | -| time_elapsed | 99145 | -| total_timesteps | 2345600 | -| train/ | | -| approx_kl | 0.02097886 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.469 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 183240 | -| policy_gradient_loss | -0.0016 | -| std | 0.00814 | -| value_loss | 4.29e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18326 | -| time_elapsed | 99150 | -| total_timesteps | 2345728 | -| train/ | | -| approx_kl | 0.009421784 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 183250 | -| policy_gradient_loss | -0.00117 | -| std | 0.00814 | -| value_loss | 1.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18327 | -| time_elapsed | 99155 | -| total_timesteps | 2345856 | -| train/ | | -| approx_kl | 0.016665097 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.074 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 183260 | -| policy_gradient_loss | 0.0159 | -| std | 0.00814 | -| value_loss | 1.51e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 18328 | -| time_elapsed | 99159 | -| total_timesteps | 2345984 | -| train/ | | -| approx_kl | 0.05618517 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 183270 | -| policy_gradient_loss | 0.011 | -| std | 0.00814 | -| value_loss | 8.06e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18329 | -| time_elapsed | 99163 | -| total_timesteps | 2346112 | -| train/ | | -| approx_kl | 0.08945737 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 183280 | -| policy_gradient_loss | 0.02 | -| std | 0.00814 | -| value_loss | 5.43e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18330 | -| time_elapsed | 99174 | -| total_timesteps | 2346240 | -| train/ | | -| approx_kl | 0.028292134 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -9.6e-05 | -| n_updates | 183290 | -| policy_gradient_loss | -0.00271 | -| std | 0.00813 | -| value_loss | 0.00322 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18331 | -| time_elapsed | 99179 | -| total_timesteps | 2346368 | -| train/ | | -| approx_kl | 0.031844184 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 183300 | -| policy_gradient_loss | 0.0216 | -| std | 0.00813 | -| value_loss | 1.32e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18332 | -| time_elapsed | 99184 | -| total_timesteps | 2346496 | -| train/ | | -| approx_kl | 0.016912483 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00669 | -| learning_rate | 0.0003 | -| loss | 0.00483 | -| n_updates | 183310 | -| policy_gradient_loss | 0.0157 | -| std | 0.00813 | -| value_loss | 1.26e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18333 | -| time_elapsed | 99188 | -| total_timesteps | 2346624 | -| train/ | | -| approx_kl | 0.175087 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.561 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 183320 | -| policy_gradient_loss | 0.0181 | -| std | 0.00813 | -| value_loss | 1.14e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18334 | -| time_elapsed | 99195 | -| total_timesteps | 2346752 | -| train/ | | -| approx_kl | 0.055975348 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00529 | -| learning_rate | 0.0003 | -| loss | 0.00846 | -| n_updates | 183330 | -| policy_gradient_loss | 0.0547 | -| std | 0.00812 | -| value_loss | 4.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18335 | -| time_elapsed | 99200 | -| total_timesteps | 2346880 | -| train/ | | -| approx_kl | 0.11986169 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 183340 | -| policy_gradient_loss | 0.021 | -| std | 0.00812 | -| value_loss | 3.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18336 | -| time_elapsed | 99204 | -| total_timesteps | 2347008 | -| train/ | | -| approx_kl | 0.036286708 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 183350 | -| policy_gradient_loss | 0.051 | -| std | 0.00812 | -| value_loss | 1.84e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18337 | -| time_elapsed | 99216 | -| total_timesteps | 2347136 | -| train/ | | -| approx_kl | 0.003614447 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 183360 | -| policy_gradient_loss | -0.011 | -| std | 0.00811 | -| value_loss | 0.00153 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18338 | -| time_elapsed | 99221 | -| total_timesteps | 2347264 | -| train/ | | -| approx_kl | 0.028479613 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.426 | -| learning_rate | 0.0003 | -| loss | 0.0056 | -| n_updates | 183370 | -| policy_gradient_loss | 0.00369 | -| std | 0.00809 | -| value_loss | 7.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18339 | -| time_elapsed | 99226 | -| total_timesteps | 2347392 | -| train/ | | -| approx_kl | 0.041136242 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.74 | -| learning_rate | 0.0003 | -| loss | 0.0093 | -| n_updates | 183380 | -| policy_gradient_loss | 0.00391 | -| std | 0.00809 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18340 | -| time_elapsed | 99230 | -| total_timesteps | 2347520 | -| train/ | | -| approx_kl | 0.0052103824 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.273 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 183390 | -| policy_gradient_loss | 0.00289 | -| std | 0.00808 | -| value_loss | 8.14e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18341 | -| time_elapsed | 99235 | -| total_timesteps | 2347648 | -| train/ | | -| approx_kl | 0.0004318552 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 183400 | -| policy_gradient_loss | 0.02 | -| std | 0.00808 | -| value_loss | 8.9e-07 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18342 | -| time_elapsed | 99240 | -| total_timesteps | 2347776 | -| train/ | | -| approx_kl | 0.759573 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | 0.285 | -| n_updates | 183410 | -| policy_gradient_loss | 0.125 | -| std | 0.00808 | -| value_loss | 7.75e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 18343 | -| time_elapsed | 99244 | -| total_timesteps | 2347904 | -| train/ | | -| approx_kl | 0.015392677 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.00487 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 183420 | -| policy_gradient_loss | -0.00248 | -| std | 0.00808 | -| value_loss | 2.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18344 | -| time_elapsed | 99248 | -| total_timesteps | 2348032 | -| train/ | | -| approx_kl | 0.009609977 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0561 | -| learning_rate | 0.0003 | -| loss | -0.00372 | -| n_updates | 183430 | -| policy_gradient_loss | -0.00242 | -| std | 0.00808 | -| value_loss | 1.3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18345 | -| time_elapsed | 99259 | -| total_timesteps | 2348160 | -| train/ | | -| approx_kl | 0.20327449 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.235 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 183440 | -| policy_gradient_loss | 0.00158 | -| std | 0.00808 | -| value_loss | 0.00284 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18346 | -| time_elapsed | 99264 | -| total_timesteps | 2348288 | -| train/ | | -| approx_kl | 0.0028361669 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.334 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 183450 | -| policy_gradient_loss | 0.00219 | -| std | 0.00808 | -| value_loss | 1.3e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18347 | -| time_elapsed | 99269 | -| total_timesteps | 2348416 | -| train/ | | -| approx_kl | 0.050657116 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.0095 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 183460 | -| policy_gradient_loss | 0.0463 | -| std | 0.00807 | -| value_loss | 1.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18348 | -| time_elapsed | 99274 | -| total_timesteps | 2348544 | -| train/ | | -| approx_kl | 0.03385951 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 183470 | -| policy_gradient_loss | 0.0261 | -| std | 0.00807 | -| value_loss | 1.01e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18349 | -| time_elapsed | 99280 | -| total_timesteps | 2348672 | -| train/ | | -| approx_kl | 0.008074509 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 0.00765 | -| n_updates | 183480 | -| policy_gradient_loss | 0.0768 | -| std | 0.00807 | -| value_loss | 0.00192 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18350 | -| time_elapsed | 99285 | -| total_timesteps | 2348800 | -| train/ | | -| approx_kl | 0.002075437 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.00437 | -| n_updates | 183490 | -| policy_gradient_loss | 0.0226 | -| std | 0.00806 | -| value_loss | 0.00209 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 18351 | -| time_elapsed | 99290 | -| total_timesteps | 2348928 | -| train/ | | -| approx_kl | 0.06664508 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00578 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 183500 | -| policy_gradient_loss | 0.0209 | -| std | 0.00806 | -| value_loss | 0.000204 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18352 | -| time_elapsed | 99294 | -| total_timesteps | 2349056 | -| train/ | | -| approx_kl | 0.3924 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 183510 | -| policy_gradient_loss | 0.0345 | -| std | 0.00806 | -| value_loss | 0.000171 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18353 | -| time_elapsed | 99302 | -| total_timesteps | 2349184 | -| train/ | | -| approx_kl | 0.037565924 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 183520 | -| policy_gradient_loss | -0.012 | -| std | 0.00806 | -| value_loss | 0.00372 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18354 | -| time_elapsed | 99308 | -| total_timesteps | 2349312 | -| train/ | | -| approx_kl | 0.055418 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0882 | -| learning_rate | 0.0003 | -| loss | 0.00929 | -| n_updates | 183530 | -| policy_gradient_loss | 0.000403 | -| std | 0.00806 | -| value_loss | 4.78e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18355 | -| time_elapsed | 99312 | -| total_timesteps | 2349440 | -| train/ | | -| approx_kl | 0.03273385 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0643 | -| learning_rate | 0.0003 | -| loss | 0.00358 | -| n_updates | 183540 | -| policy_gradient_loss | 0.00276 | -| std | 0.00806 | -| value_loss | 3.91e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18356 | -| time_elapsed | 99316 | -| total_timesteps | 2349568 | -| train/ | | -| approx_kl | 0.023555793 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.00999 | -| n_updates | 183550 | -| policy_gradient_loss | 0.00572 | -| std | 0.00806 | -| value_loss | 2.39e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18357 | -| time_elapsed | 99322 | -| total_timesteps | 2349696 | -| train/ | | -| approx_kl | 0.04176876 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | -0.00823 | -| n_updates | 183560 | -| policy_gradient_loss | -0.00474 | -| std | 0.00806 | -| value_loss | 1.78e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18358 | -| time_elapsed | 99328 | -| total_timesteps | 2349824 | -| train/ | | -| approx_kl | 0.01763631 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.00716 | -| n_updates | 183570 | -| policy_gradient_loss | 0.0063 | -| std | 0.00806 | -| value_loss | 1.09e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18359 | -| time_elapsed | 99333 | -| total_timesteps | 2349952 | -| train/ | | -| approx_kl | 0.061006404 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0892 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 183580 | -| policy_gradient_loss | 0.0147 | -| std | 0.00805 | -| value_loss | 6.79e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18360 | -| time_elapsed | 99337 | -| total_timesteps | 2350080 | -| train/ | | -| approx_kl | 0.629856 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.266 | -| n_updates | 183590 | -| policy_gradient_loss | 0.151 | -| std | 0.00805 | -| value_loss | 4.82e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18361 | -| time_elapsed | 99345 | -| total_timesteps | 2350208 | -| train/ | | -| approx_kl | 0.013809164 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.638 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 183600 | -| policy_gradient_loss | -0.00705 | -| std | 0.00805 | -| value_loss | 0.00109 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18362 | -| time_elapsed | 99348 | -| total_timesteps | 2350336 | -| train/ | | -| approx_kl | 0.002809978 | -| clip_fraction | 0.0281 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 183610 | -| policy_gradient_loss | -0.00165 | -| std | 0.00804 | -| value_loss | 3.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18363 | -| time_elapsed | 99352 | -| total_timesteps | 2350464 | -| train/ | | -| approx_kl | 0.016724955 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00143 | -| learning_rate | 0.0003 | -| loss | -0.00451 | -| n_updates | 183620 | -| policy_gradient_loss | -0.00494 | -| std | 0.00803 | -| value_loss | 1.26e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18364 | -| time_elapsed | 99358 | -| total_timesteps | 2350592 | -| train/ | | -| approx_kl | 0.010694383 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.00398 | -| n_updates | 183630 | -| policy_gradient_loss | 0.00162 | -| std | 0.00804 | -| value_loss | 8.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18365 | -| time_elapsed | 99364 | -| total_timesteps | 2350720 | -| train/ | | -| approx_kl | 0.01642752 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | -0.000291 | -| n_updates | 183640 | -| policy_gradient_loss | 0.0194 | -| std | 0.00804 | -| value_loss | 7.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18366 | -| time_elapsed | 99368 | -| total_timesteps | 2350848 | -| train/ | | -| approx_kl | 0.23028435 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 183650 | -| policy_gradient_loss | 0.127 | -| std | 0.00804 | -| value_loss | 5.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 18367 | -| time_elapsed | 99373 | -| total_timesteps | 2350976 | -| train/ | | -| approx_kl | 0.03922852 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 183660 | -| policy_gradient_loss | 0.018 | -| std | 0.00804 | -| value_loss | 3.32e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18368 | -| time_elapsed | 99376 | -| total_timesteps | 2351104 | -| train/ | | -| approx_kl | 0.3349865 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 183670 | -| policy_gradient_loss | 0.0345 | -| std | 0.00804 | -| value_loss | 2.14e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18369 | -| time_elapsed | 99386 | -| total_timesteps | 2351232 | -| train/ | | -| approx_kl | 0.007997312 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.147 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 183680 | -| policy_gradient_loss | -0.0132 | -| std | 0.00804 | -| value_loss | 0.0021 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18370 | -| time_elapsed | 99391 | -| total_timesteps | 2351360 | -| train/ | | -| approx_kl | 0.17628731 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 183690 | -| policy_gradient_loss | 0.0307 | -| std | 0.00803 | -| value_loss | 3.69e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18371 | -| time_elapsed | 99395 | -| total_timesteps | 2351488 | -| train/ | | -| approx_kl | 0.058953635 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -17.5 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 183700 | -| policy_gradient_loss | 0.00361 | -| std | 0.00802 | -| value_loss | 0.000394 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18372 | -| time_elapsed | 99399 | -| total_timesteps | 2351616 | -| train/ | | -| approx_kl | 0.41532513 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 183710 | -| policy_gradient_loss | 0.039 | -| std | 0.00802 | -| value_loss | 0.000436 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18373 | -| time_elapsed | 99403 | -| total_timesteps | 2351744 | -| train/ | | -| approx_kl | 0.03321813 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00447 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 183720 | -| policy_gradient_loss | 0.00582 | -| std | 0.00802 | -| value_loss | 8.53e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18374 | -| time_elapsed | 99409 | -| total_timesteps | 2351872 | -| train/ | | -| approx_kl | 0.0065286136 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00813 | -| learning_rate | 0.0003 | -| loss | 0.000199 | -| n_updates | 183730 | -| policy_gradient_loss | 0.00676 | -| std | 0.00802 | -| value_loss | 3.5e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18375 | -| time_elapsed | 99415 | -| total_timesteps | 2352000 | -| train/ | | -| approx_kl | 0.052267723 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.00801 | -| n_updates | 183740 | -| policy_gradient_loss | -0.000768 | -| std | 0.00802 | -| value_loss | 2.45e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18376 | -| time_elapsed | 99419 | -| total_timesteps | 2352128 | -| train/ | | -| approx_kl | 0.007999581 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00352 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 183750 | -| policy_gradient_loss | -8.92e-05 | -| std | 0.00802 | -| value_loss | 0.000142 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18377 | -| time_elapsed | 99429 | -| total_timesteps | 2352256 | -| train/ | | -| approx_kl | 0.055161845 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 183760 | -| policy_gradient_loss | 0.0355 | -| std | 0.00802 | -| value_loss | 0.00182 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18378 | -| time_elapsed | 99433 | -| total_timesteps | 2352384 | -| train/ | | -| approx_kl | 0.04803198 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 183770 | -| policy_gradient_loss | 0.013 | -| std | 0.00802 | -| value_loss | 1.24e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18379 | -| time_elapsed | 99438 | -| total_timesteps | 2352512 | -| train/ | | -| approx_kl | 0.3990941 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 183780 | -| policy_gradient_loss | 0.0373 | -| std | 0.00802 | -| value_loss | 7.44e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18380 | -| time_elapsed | 99444 | -| total_timesteps | 2352640 | -| train/ | | -| approx_kl | 0.008014876 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00509 | -| n_updates | 183790 | -| policy_gradient_loss | 0.00298 | -| std | 0.00802 | -| value_loss | 4.26e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18381 | -| time_elapsed | 99449 | -| total_timesteps | 2352768 | -| train/ | | -| approx_kl | 0.0669242 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 183800 | -| policy_gradient_loss | 0.0195 | -| std | 0.00802 | -| value_loss | 2.59e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 18382 | -| time_elapsed | 99454 | -| total_timesteps | 2352896 | -| train/ | | -| approx_kl | 0.023038296 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 183810 | -| policy_gradient_loss | 0.000501 | -| std | 0.00802 | -| value_loss | 2.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18383 | -| time_elapsed | 99457 | -| total_timesteps | 2353024 | -| train/ | | -| approx_kl | 0.03597479 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.00489 | -| n_updates | 183820 | -| policy_gradient_loss | 0.00107 | -| std | 0.00802 | -| value_loss | 1.56e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18384 | -| time_elapsed | 99469 | -| total_timesteps | 2353152 | -| train/ | | -| approx_kl | 0.01091065 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 183830 | -| policy_gradient_loss | 0.00164 | -| std | 0.00802 | -| value_loss | 0.00431 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18385 | -| time_elapsed | 99473 | -| total_timesteps | 2353280 | -| train/ | | -| approx_kl | 0.044950996 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 183840 | -| policy_gradient_loss | 0.0195 | -| std | 0.00803 | -| value_loss | 0.00016 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18386 | -| time_elapsed | 99477 | -| total_timesteps | 2353408 | -| train/ | | -| approx_kl | 0.37838274 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.000125 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 183850 | -| policy_gradient_loss | 0.04 | -| std | 0.00803 | -| value_loss | 4.88e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18387 | -| time_elapsed | 99482 | -| total_timesteps | 2353536 | -| train/ | | -| approx_kl | 0.023877826 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0036 | -| n_updates | 183860 | -| policy_gradient_loss | 0.00373 | -| std | 0.00803 | -| value_loss | 2.71e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18388 | -| time_elapsed | 99487 | -| total_timesteps | 2353664 | -| train/ | | -| approx_kl | 0.0046999995 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | -0.00921 | -| n_updates | 183870 | -| policy_gradient_loss | 0.00392 | -| std | 0.00803 | -| value_loss | 1.9e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18389 | -| time_elapsed | 99492 | -| total_timesteps | 2353792 | -| train/ | | -| approx_kl | 0.060591877 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 183880 | -| policy_gradient_loss | 0.00714 | -| std | 0.00804 | -| value_loss | 1.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18390 | -| time_elapsed | 99497 | -| total_timesteps | 2353920 | -| train/ | | -| approx_kl | 0.027116505 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 183890 | -| policy_gradient_loss | 0.0318 | -| std | 0.00804 | -| value_loss | 7.28e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18391 | -| time_elapsed | 99502 | -| total_timesteps | 2354048 | -| train/ | | -| approx_kl | 0.6587004 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.331 | -| n_updates | 183900 | -| policy_gradient_loss | 0.14 | -| std | 0.00804 | -| value_loss | 6.18e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18392 | -| time_elapsed | 99511 | -| total_timesteps | 2354176 | -| train/ | | -| approx_kl | 0.022570673 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 183910 | -| policy_gradient_loss | 0.00946 | -| std | 0.00804 | -| value_loss | 0.00112 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18393 | -| time_elapsed | 99517 | -| total_timesteps | 2354304 | -| train/ | | -| approx_kl | 0.0007601874 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.0023 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 183920 | -| policy_gradient_loss | 0.00742 | -| std | 0.00804 | -| value_loss | 1.01e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18394 | -| time_elapsed | 99522 | -| total_timesteps | 2354432 | -| train/ | | -| approx_kl | 0.2736534 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 183930 | -| policy_gradient_loss | 0.0436 | -| std | 0.00804 | -| value_loss | 2.68e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18395 | -| time_elapsed | 99527 | -| total_timesteps | 2354560 | -| train/ | | -| approx_kl | 0.3127083 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 183940 | -| policy_gradient_loss | 0.0443 | -| std | 0.00803 | -| value_loss | 4.37e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18396 | -| time_elapsed | 99532 | -| total_timesteps | 2354688 | -| train/ | | -| approx_kl | 0.061110936 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 183950 | -| policy_gradient_loss | 0.0263 | -| std | 0.00803 | -| value_loss | 2.23e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18397 | -| time_elapsed | 99537 | -| total_timesteps | 2354816 | -| train/ | | -| approx_kl | 0.10380385 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 183960 | -| policy_gradient_loss | 0.0542 | -| std | 0.00803 | -| value_loss | 2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 18398 | -| time_elapsed | 99543 | -| total_timesteps | 2354944 | -| train/ | | -| approx_kl | 0.026910393 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.00565 | -| n_updates | 183970 | -| policy_gradient_loss | 0.0294 | -| std | 0.00803 | -| value_loss | 1.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18399 | -| time_elapsed | 99548 | -| total_timesteps | 2355072 | -| train/ | | -| approx_kl | 0.14988568 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 183980 | -| policy_gradient_loss | 0.056 | -| std | 0.00803 | -| value_loss | 9.97e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18400 | -| time_elapsed | 99555 | -| total_timesteps | 2355200 | -| train/ | | -| approx_kl | 0.02270159 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 183990 | -| policy_gradient_loss | -0.0105 | -| std | 0.00803 | -| value_loss | 0.00179 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18401 | -| time_elapsed | 99560 | -| total_timesteps | 2355328 | -| train/ | | -| approx_kl | 0.0101753585 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00212 | -| learning_rate | 0.0003 | -| loss | 0.00785 | -| n_updates | 184000 | -| policy_gradient_loss | 0.0118 | -| std | 0.00804 | -| value_loss | 1.19e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18402 | -| time_elapsed | 99565 | -| total_timesteps | 2355456 | -| train/ | | -| approx_kl | 0.0032102051 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00276 | -| learning_rate | 0.0003 | -| loss | 0.00943 | -| n_updates | 184010 | -| policy_gradient_loss | 0.00248 | -| std | 0.00804 | -| value_loss | 1.27e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18403 | -| time_elapsed | 99568 | -| total_timesteps | 2355584 | -| train/ | | -| approx_kl | 0.075594805 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | 0.0481 | -| n_updates | 184020 | -| policy_gradient_loss | 0.0344 | -| std | 0.00804 | -| value_loss | 1.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18404 | -| time_elapsed | 99571 | -| total_timesteps | 2355712 | -| train/ | | -| approx_kl | 0.043776587 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00834 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 184030 | -| policy_gradient_loss | 0.0352 | -| std | 0.00805 | -| value_loss | 0.000196 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18405 | -| time_elapsed | 99575 | -| total_timesteps | 2355840 | -| train/ | | -| approx_kl | 0.6706314 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.714 | -| learning_rate | 0.0003 | -| loss | 0.394 | -| n_updates | 184040 | -| policy_gradient_loss | 0.178 | -| std | 0.00806 | -| value_loss | 0.000903 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18406 | -| time_elapsed | 99579 | -| total_timesteps | 2355968 | -| train/ | | -| approx_kl | 0.027635256 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0634 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 184050 | -| policy_gradient_loss | 0.00182 | -| std | 0.00806 | -| value_loss | 0.000129 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18407 | -| time_elapsed | 99584 | -| total_timesteps | 2356096 | -| train/ | | -| approx_kl | 0.01680943 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.00256 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 184060 | -| policy_gradient_loss | 0.0123 | -| std | 0.00806 | -| value_loss | 3.43e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18408 | -| time_elapsed | 99595 | -| total_timesteps | 2356224 | -| train/ | | -| approx_kl | 0.16217564 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | 0.0932 | -| n_updates | 184070 | -| policy_gradient_loss | 0.0708 | -| std | 0.00806 | -| value_loss | 0.00212 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18409 | -| time_elapsed | 99599 | -| total_timesteps | 2356352 | -| train/ | | -| approx_kl | 0.14724064 | -| clip_fraction | 0.669 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.0963 | -| n_updates | 184080 | -| policy_gradient_loss | 0.0941 | -| std | 0.00806 | -| value_loss | 1.16e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18410 | -| time_elapsed | 99604 | -| total_timesteps | 2356480 | -| train/ | | -| approx_kl | 0.022389472 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | 0.00835 | -| n_updates | 184090 | -| policy_gradient_loss | 0.0204 | -| std | 0.00806 | -| value_loss | 5.85e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18411 | -| time_elapsed | 99609 | -| total_timesteps | 2356608 | -| train/ | | -| approx_kl | 0.0003235829 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.00369 | -| n_updates | 184100 | -| policy_gradient_loss | -0.000172 | -| std | 0.00806 | -| value_loss | 4.55e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18412 | -| time_elapsed | 99614 | -| total_timesteps | 2356736 | -| train/ | | -| approx_kl | 0.11566402 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 184110 | -| policy_gradient_loss | 0.0992 | -| std | 0.00806 | -| value_loss | 3.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18413 | -| time_elapsed | 99619 | -| total_timesteps | 2356864 | -| train/ | | -| approx_kl | 0.12761705 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 184120 | -| policy_gradient_loss | 0.148 | -| std | 0.00806 | -| value_loss | 2.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18414 | -| time_elapsed | 99624 | -| total_timesteps | 2356992 | -| train/ | | -| approx_kl | 0.021189954 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 184130 | -| policy_gradient_loss | 0.0172 | -| std | 0.00806 | -| value_loss | 2.15e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18415 | -| time_elapsed | 99628 | -| total_timesteps | 2357120 | -| train/ | | -| approx_kl | 0.00024985475 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.000156 | -| n_updates | 184140 | -| policy_gradient_loss | 0.0237 | -| std | 0.00806 | -| value_loss | 5.52e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18416 | -| time_elapsed | 99637 | -| total_timesteps | 2357248 | -| train/ | | -| approx_kl | 0.024792625 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -5.04 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 184150 | -| policy_gradient_loss | -0.0177 | -| std | 0.00805 | -| value_loss | 0.0037 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18417 | -| time_elapsed | 99641 | -| total_timesteps | 2357376 | -| train/ | | -| approx_kl | 0.21297225 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 184160 | -| policy_gradient_loss | 0.126 | -| std | 0.00805 | -| value_loss | 5.05e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18418 | -| time_elapsed | 99645 | -| total_timesteps | 2357504 | -| train/ | | -| approx_kl | 0.03003427 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 184170 | -| policy_gradient_loss | 0.0156 | -| std | 0.00805 | -| value_loss | 2.69e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18419 | -| time_elapsed | 99650 | -| total_timesteps | 2357632 | -| train/ | | -| approx_kl | 0.0015139589 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.00808 | -| n_updates | 184180 | -| policy_gradient_loss | 0.00347 | -| std | 0.00805 | -| value_loss | 1.87e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18420 | -| time_elapsed | 99655 | -| total_timesteps | 2357760 | -| train/ | | -| approx_kl | 0.11242904 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 184190 | -| policy_gradient_loss | 0.109 | -| std | 0.00805 | -| value_loss | 1.22e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 18421 | -| time_elapsed | 99659 | -| total_timesteps | 2357888 | -| train/ | | -| approx_kl | 0.10591412 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.0844 | -| n_updates | 184200 | -| policy_gradient_loss | 0.111 | -| std | 0.00805 | -| value_loss | 7.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18422 | -| time_elapsed | 99663 | -| total_timesteps | 2358016 | -| train/ | | -| approx_kl | 0.019820873 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 184210 | -| policy_gradient_loss | 0.0142 | -| std | 0.00805 | -| value_loss | 7.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18423 | -| time_elapsed | 99675 | -| total_timesteps | 2358144 | -| train/ | | -| approx_kl | 0.015552216 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 184220 | -| policy_gradient_loss | 0.0011 | -| std | 0.00805 | -| value_loss | 0.00385 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18424 | -| time_elapsed | 99680 | -| total_timesteps | 2358272 | -| train/ | | -| approx_kl | 0.18602441 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 184230 | -| policy_gradient_loss | 0.0311 | -| std | 0.00805 | -| value_loss | 3.33e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18425 | -| time_elapsed | 99686 | -| total_timesteps | 2358400 | -| train/ | | -| approx_kl | 0.00427696 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.00755 | -| n_updates | 184240 | -| policy_gradient_loss | 0.066 | -| std | 0.00805 | -| value_loss | 7.24e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18426 | -| time_elapsed | 99689 | -| total_timesteps | 2358528 | -| train/ | | -| approx_kl | 0.023750033 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.807 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 184250 | -| policy_gradient_loss | 0.0221 | -| std | 0.00805 | -| value_loss | 9.84e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18427 | -| time_elapsed | 99694 | -| total_timesteps | 2358656 | -| train/ | | -| approx_kl | 0.2165587 | -| clip_fraction | 0.664 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 184260 | -| policy_gradient_loss | 0.078 | -| std | 0.00805 | -| value_loss | 3.42e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18428 | -| time_elapsed | 99699 | -| total_timesteps | 2358784 | -| train/ | | -| approx_kl | 0.033788722 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 184270 | -| policy_gradient_loss | 0.00534 | -| std | 0.00805 | -| value_loss | 2.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 18429 | -| time_elapsed | 99703 | -| total_timesteps | 2358912 | -| train/ | | -| approx_kl | 0.10685364 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.0652 | -| n_updates | 184280 | -| policy_gradient_loss | 0.0165 | -| std | 0.00805 | -| value_loss | 6.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18430 | -| time_elapsed | 99707 | -| total_timesteps | 2359040 | -| train/ | | -| approx_kl | 0.007500082 | -| clip_fraction | 0.0586 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.318 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 184290 | -| policy_gradient_loss | -0.0058 | -| std | 0.00806 | -| value_loss | 5.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18431 | -| time_elapsed | 99718 | -| total_timesteps | 2359168 | -| train/ | | -| approx_kl | 0.011116039 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 184300 | -| policy_gradient_loss | -0.0135 | -| std | 0.00806 | -| value_loss | 0.00267 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18432 | -| time_elapsed | 99723 | -| total_timesteps | 2359296 | -| train/ | | -| approx_kl | 0.04728549 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.508 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 184310 | -| policy_gradient_loss | 0.0227 | -| std | 0.00805 | -| value_loss | 3.51e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18433 | -| time_elapsed | 99728 | -| total_timesteps | 2359424 | -| train/ | | -| approx_kl | 0.09720451 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.0668 | -| n_updates | 184320 | -| policy_gradient_loss | 0.0586 | -| std | 0.00805 | -| value_loss | 8.97e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18434 | -| time_elapsed | 99732 | -| total_timesteps | 2359552 | -| train/ | | -| approx_kl | 0.02570779 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0857 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 184330 | -| policy_gradient_loss | 0.032 | -| std | 0.00805 | -| value_loss | 5.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18435 | -| time_elapsed | 99737 | -| total_timesteps | 2359680 | -| train/ | | -| approx_kl | 0.55502546 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 184340 | -| policy_gradient_loss | 0.148 | -| std | 0.00805 | -| value_loss | 3.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18436 | -| time_elapsed | 99741 | -| total_timesteps | 2359808 | -| train/ | | -| approx_kl | 0.005499958 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0818 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 184350 | -| policy_gradient_loss | 0.0172 | -| std | 0.00805 | -| value_loss | 2.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 18437 | -| time_elapsed | 99746 | -| total_timesteps | 2359936 | -| train/ | | -| approx_kl | 0.13278073 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | 0.08 | -| n_updates | 184360 | -| policy_gradient_loss | 0.0224 | -| std | 0.00803 | -| value_loss | 5.16e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18438 | -| time_elapsed | 99751 | -| total_timesteps | 2360064 | -| train/ | | -| approx_kl | 0.022539986 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -23 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 184370 | -| policy_gradient_loss | 0.0138 | -| std | 0.00802 | -| value_loss | 7.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18439 | -| time_elapsed | 99760 | -| total_timesteps | 2360192 | -| train/ | | -| approx_kl | 0.005858412 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.988 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 184380 | -| policy_gradient_loss | 0.00597 | -| std | 0.00801 | -| value_loss | 0.00268 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18440 | -| time_elapsed | 99764 | -| total_timesteps | 2360320 | -| train/ | | -| approx_kl | 0.020415757 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 184390 | -| policy_gradient_loss | 0.0167 | -| std | 0.00801 | -| value_loss | 6.1e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18441 | -| time_elapsed | 99769 | -| total_timesteps | 2360448 | -| train/ | | -| approx_kl | 0.3459523 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | 0.295 | -| n_updates | 184400 | -| policy_gradient_loss | 0.175 | -| std | 0.00801 | -| value_loss | 3.19e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18442 | -| time_elapsed | 99774 | -| total_timesteps | 2360576 | -| train/ | | -| approx_kl | 0.059167918 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 184410 | -| policy_gradient_loss | 0.014 | -| std | 0.00801 | -| value_loss | 1.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18443 | -| time_elapsed | 99779 | -| total_timesteps | 2360704 | -| train/ | | -| approx_kl | 0.21338534 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 184420 | -| policy_gradient_loss | -0.00789 | -| std | 0.00802 | -| value_loss | 1.52e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18444 | -| time_elapsed | 99783 | -| total_timesteps | 2360832 | -| train/ | | -| approx_kl | 0.05408626 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 184430 | -| policy_gradient_loss | 0.0148 | -| std | 0.00802 | -| value_loss | 8.25e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 18445 | -| time_elapsed | 99787 | -| total_timesteps | 2360960 | -| train/ | | -| approx_kl | 0.28169918 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 184440 | -| policy_gradient_loss | 0.118 | -| std | 0.00802 | -| value_loss | 6.69e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18446 | -| time_elapsed | 99791 | -| total_timesteps | 2361088 | -| train/ | | -| approx_kl | 0.13650374 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 184450 | -| policy_gradient_loss | 0.152 | -| std | 0.00802 | -| value_loss | 5.15e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18447 | -| time_elapsed | 99801 | -| total_timesteps | 2361216 | -| train/ | | -| approx_kl | 0.0032332633 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | -0.0235 | -| n_updates | 184460 | -| policy_gradient_loss | -0.0134 | -| std | 0.00803 | -| value_loss | 0.000758 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18448 | -| time_elapsed | 99806 | -| total_timesteps | 2361344 | -| train/ | | -| approx_kl | 0.08892451 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 184470 | -| policy_gradient_loss | 0.021 | -| std | 0.00803 | -| value_loss | 0.000118 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18449 | -| time_elapsed | 99811 | -| total_timesteps | 2361472 | -| train/ | | -| approx_kl | 0.15275377 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.0534 | -| n_updates | 184480 | -| policy_gradient_loss | 0.0322 | -| std | 0.00803 | -| value_loss | 2.86e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18450 | -| time_elapsed | 99816 | -| total_timesteps | 2361600 | -| train/ | | -| approx_kl | 0.0026537539 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -339 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 184490 | -| policy_gradient_loss | -0.00178 | -| std | 0.00803 | -| value_loss | 1.1e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18451 | -| time_elapsed | 99822 | -| total_timesteps | 2361728 | -| train/ | | -| approx_kl | 1.2053642e-05 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -2.17 | -| learning_rate | 0.0003 | -| loss | 0.000583 | -| n_updates | 184500 | -| policy_gradient_loss | -0.00183 | -| std | 0.00804 | -| value_loss | 1.4e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18452 | -| time_elapsed | 99826 | -| total_timesteps | 2361856 | -| train/ | | -| approx_kl | 0.042266265 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.0197 | -| n_updates | 184510 | -| policy_gradient_loss | 0.0493 | -| std | 0.00804 | -| value_loss | 1.4e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 18453 | -| time_elapsed | 99830 | -| total_timesteps | 2361984 | -| train/ | | -| approx_kl | 5.668495e-06 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00977 | -| learning_rate | 0.0003 | -| loss | 0.000319 | -| n_updates | 184520 | -| policy_gradient_loss | 0.0639 | -| std | 0.00805 | -| value_loss | 9.79e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18454 | -| time_elapsed | 99835 | -| total_timesteps | 2362112 | -| train/ | | -| approx_kl | 0.08564643 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.00685 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 184530 | -| policy_gradient_loss | 0.111 | -| std | 0.00805 | -| value_loss | 7.12e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18455 | -| time_elapsed | 99846 | -| total_timesteps | 2362240 | -| train/ | | -| approx_kl | 0.015949506 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.26 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 184540 | -| policy_gradient_loss | -0.0164 | -| std | 0.00805 | -| value_loss | 0.00242 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18456 | -| time_elapsed | 99851 | -| total_timesteps | 2362368 | -| train/ | | -| approx_kl | 0.0090315305 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 184550 | -| policy_gradient_loss | 0.0261 | -| std | 0.00805 | -| value_loss | 7.82e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18457 | -| time_elapsed | 99856 | -| total_timesteps | 2362496 | -| train/ | | -| approx_kl | 0.18295945 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 184560 | -| policy_gradient_loss | 0.0557 | -| std | 0.00805 | -| value_loss | 1.77e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18458 | -| time_elapsed | 99861 | -| total_timesteps | 2362624 | -| train/ | | -| approx_kl | 0.039161343 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.327 | -| learning_rate | 0.0003 | -| loss | 0.00504 | -| n_updates | 184570 | -| policy_gradient_loss | 0.0211 | -| std | 0.00805 | -| value_loss | 9.66e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18459 | -| time_elapsed | 99867 | -| total_timesteps | 2362752 | -| train/ | | -| approx_kl | 0.6693524 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.313 | -| n_updates | 184580 | -| policy_gradient_loss | 0.29 | -| std | 0.00805 | -| value_loss | 5.64e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 18460 | -| time_elapsed | 99872 | -| total_timesteps | 2362880 | -| train/ | | -| approx_kl | 0.15989664 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 184590 | -| policy_gradient_loss | 0.00781 | -| std | 0.00805 | -| value_loss | 7.61e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18461 | -| time_elapsed | 99876 | -| total_timesteps | 2363008 | -| train/ | | -| approx_kl | 0.04924735 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 184600 | -| policy_gradient_loss | 0.0173 | -| std | 0.00805 | -| value_loss | 1.53e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18462 | -| time_elapsed | 99888 | -| total_timesteps | 2363136 | -| train/ | | -| approx_kl | 0.16107826 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 184610 | -| policy_gradient_loss | -0.000141 | -| std | 0.00806 | -| value_loss | 0.00234 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18463 | -| time_elapsed | 99894 | -| total_timesteps | 2363264 | -| train/ | | -| approx_kl | 0.006968325 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 184620 | -| policy_gradient_loss | 0.000604 | -| std | 0.00806 | -| value_loss | 1.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18464 | -| time_elapsed | 99898 | -| total_timesteps | 2363392 | -| train/ | | -| approx_kl | 0.047203414 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.094 | -| learning_rate | 0.0003 | -| loss | 0.00425 | -| n_updates | 184630 | -| policy_gradient_loss | 0.000258 | -| std | 0.00806 | -| value_loss | 4.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18465 | -| time_elapsed | 99903 | -| total_timesteps | 2363520 | -| train/ | | -| approx_kl | 0.007907163 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 184640 | -| policy_gradient_loss | 0.0386 | -| std | 0.00807 | -| value_loss | 3.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18466 | -| time_elapsed | 99907 | -| total_timesteps | 2363648 | -| train/ | | -| approx_kl | 0.22742513 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.978 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 184650 | -| policy_gradient_loss | 0.0154 | -| std | 0.00808 | -| value_loss | 5.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18467 | -| time_elapsed | 99913 | -| total_timesteps | 2363776 | -| train/ | | -| approx_kl | 0.050284818 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0973 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 184660 | -| policy_gradient_loss | 0.0602 | -| std | 0.00808 | -| value_loss | 2.64e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 18468 | -| time_elapsed | 99919 | -| total_timesteps | 2363904 | -| train/ | | -| approx_kl | 0.013463216 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0907 | -| learning_rate | 0.0003 | -| loss | -0.00518 | -| n_updates | 184670 | -| policy_gradient_loss | 0.0108 | -| std | 0.00808 | -| value_loss | 1.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18469 | -| time_elapsed | 99925 | -| total_timesteps | 2364032 | -| train/ | | -| approx_kl | 0.029865392 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 184680 | -| policy_gradient_loss | 0.0207 | -| std | 0.00808 | -| value_loss | 1.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18470 | -| time_elapsed | 99934 | -| total_timesteps | 2364160 | -| train/ | | -| approx_kl | 0.014307136 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 184690 | -| policy_gradient_loss | -0.00349 | -| std | 0.00808 | -| value_loss | 0.000995 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18471 | -| time_elapsed | 99938 | -| total_timesteps | 2364288 | -| train/ | | -| approx_kl | 0.013522916 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.00568 | -| n_updates | 184700 | -| policy_gradient_loss | 0.0364 | -| std | 0.00807 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18472 | -| time_elapsed | 99943 | -| total_timesteps | 2364416 | -| train/ | | -| approx_kl | 0.054948412 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 184710 | -| policy_gradient_loss | -0.00364 | -| std | 0.00806 | -| value_loss | 4.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18473 | -| time_elapsed | 99948 | -| total_timesteps | 2364544 | -| train/ | | -| approx_kl | 0.008331943 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 184720 | -| policy_gradient_loss | 0.0378 | -| std | 0.00805 | -| value_loss | 3.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18474 | -| time_elapsed | 99953 | -| total_timesteps | 2364672 | -| train/ | | -| approx_kl | 0.007726776 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 184730 | -| policy_gradient_loss | 0.00556 | -| std | 0.00805 | -| value_loss | 3.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18475 | -| time_elapsed | 99957 | -| total_timesteps | 2364800 | -| train/ | | -| approx_kl | 0.054048624 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 184740 | -| policy_gradient_loss | 0.0293 | -| std | 0.00804 | -| value_loss | 2.04e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18476 | -| time_elapsed | 99961 | -| total_timesteps | 2364928 | -| train/ | | -| approx_kl | 0.2731956 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.000506 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 184750 | -| policy_gradient_loss | 0.132 | -| std | 0.00803 | -| value_loss | 2.27e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18477 | -| time_elapsed | 99966 | -| total_timesteps | 2365056 | -| train/ | | -| approx_kl | 0.03851065 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 184760 | -| policy_gradient_loss | 0.0216 | -| std | 0.00801 | -| value_loss | 7.55e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18478 | -| time_elapsed | 99974 | -| total_timesteps | 2365184 | -| train/ | | -| approx_kl | 0.04127835 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | -0.0219 | -| n_updates | 184770 | -| policy_gradient_loss | -0.0169 | -| std | 0.008 | -| value_loss | 0.00604 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18479 | -| time_elapsed | 99978 | -| total_timesteps | 2365312 | -| train/ | | -| approx_kl | 0.043546755 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0722 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 184780 | -| policy_gradient_loss | 0.017 | -| std | 0.008 | -| value_loss | 3.27e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18480 | -| time_elapsed | 99981 | -| total_timesteps | 2365440 | -| train/ | | -| approx_kl | 0.081199564 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 184790 | -| policy_gradient_loss | 0.0256 | -| std | 0.008 | -| value_loss | 5.17e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18481 | -| time_elapsed | 99986 | -| total_timesteps | 2365568 | -| train/ | | -| approx_kl | 0.11490241 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0746 | -| learning_rate | 0.0003 | -| loss | 0.0494 | -| n_updates | 184800 | -| policy_gradient_loss | 0.0199 | -| std | 0.00799 | -| value_loss | 2.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18482 | -| time_elapsed | 99991 | -| total_timesteps | 2365696 | -| train/ | | -| approx_kl | 0.020432897 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 184810 | -| policy_gradient_loss | 0.000409 | -| std | 0.00799 | -| value_loss | 1.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18483 | -| time_elapsed | 99995 | -| total_timesteps | 2365824 | -| train/ | | -| approx_kl | 0.14497474 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0708 | -| n_updates | 184820 | -| policy_gradient_loss | 0.0136 | -| std | 0.00799 | -| value_loss | 1.16e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 18484 | -| time_elapsed | 99999 | -| total_timesteps | 2365952 | -| train/ | | -| approx_kl | 0.14297447 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 184830 | -| policy_gradient_loss | 0.0139 | -| std | 0.00797 | -| value_loss | 2.34e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18485 | -| time_elapsed | 100004 | -| total_timesteps | 2366080 | -| train/ | | -| approx_kl | 0.15296075 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -97.7 | -| learning_rate | 0.0003 | -| loss | 0.00676 | -| n_updates | 184840 | -| policy_gradient_loss | -0.00159 | -| std | 0.00797 | -| value_loss | 4.68e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18486 | -| time_elapsed | 100014 | -| total_timesteps | 2366208 | -| train/ | | -| approx_kl | 0.0010935897 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.938 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 184850 | -| policy_gradient_loss | 0.0437 | -| std | 0.00797 | -| value_loss | 0.000758 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18487 | -| time_elapsed | 100019 | -| total_timesteps | 2366336 | -| train/ | | -| approx_kl | 0.009142714 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | 0.0072 | -| n_updates | 184860 | -| policy_gradient_loss | 0.0221 | -| std | 0.00797 | -| value_loss | 3.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18488 | -| time_elapsed | 100024 | -| total_timesteps | 2366464 | -| train/ | | -| approx_kl | 0.07891617 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00364 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 184870 | -| policy_gradient_loss | 0.0205 | -| std | 0.00797 | -| value_loss | 5.94e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18489 | -| time_elapsed | 100029 | -| total_timesteps | 2366592 | -| train/ | | -| approx_kl | 0.0050225207 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.00657 | -| n_updates | 184880 | -| policy_gradient_loss | 0.00769 | -| std | 0.00797 | -| value_loss | 4.12e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18490 | -| time_elapsed | 100035 | -| total_timesteps | 2366720 | -| train/ | | -| approx_kl | 0.044997327 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 184890 | -| policy_gradient_loss | 0.0217 | -| std | 0.00797 | -| value_loss | 2.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18491 | -| time_elapsed | 100040 | -| total_timesteps | 2366848 | -| train/ | | -| approx_kl | 0.37313667 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 184900 | -| policy_gradient_loss | 0.041 | -| std | 0.00796 | -| value_loss | 1.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18492 | -| time_elapsed | 100044 | -| total_timesteps | 2366976 | -| train/ | | -| approx_kl | 0.027573671 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 184910 | -| policy_gradient_loss | 6.03e-05 | -| std | 0.00796 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18493 | -| time_elapsed | 100049 | -| total_timesteps | 2367104 | -| train/ | | -| approx_kl | 0.0025430168 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 184920 | -| policy_gradient_loss | 0.0138 | -| std | 0.00797 | -| value_loss | 5.97e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18494 | -| time_elapsed | 100059 | -| total_timesteps | 2367232 | -| train/ | | -| approx_kl | 0.20127463 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -1.77 | -| learning_rate | 0.0003 | -| loss | -0.000824 | -| n_updates | 184930 | -| policy_gradient_loss | 0.0192 | -| std | 0.00797 | -| value_loss | 0.00273 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18495 | -| time_elapsed | 100063 | -| total_timesteps | 2367360 | -| train/ | | -| approx_kl | 0.08884063 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 184940 | -| policy_gradient_loss | 0.0152 | -| std | 0.00798 | -| value_loss | 3.43e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18496 | -| time_elapsed | 100069 | -| total_timesteps | 2367488 | -| train/ | | -| approx_kl | 0.101873055 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00166 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 184950 | -| policy_gradient_loss | 0.0188 | -| std | 0.00798 | -| value_loss | 5.3e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18497 | -| time_elapsed | 100074 | -| total_timesteps | 2367616 | -| train/ | | -| approx_kl | 0.0058785155 | -| clip_fraction | 0.0312 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0734 | -| learning_rate | 0.0003 | -| loss | -0.00297 | -| n_updates | 184960 | -| policy_gradient_loss | -0.00139 | -| std | 0.00797 | -| value_loss | 2.67e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18498 | -| time_elapsed | 100080 | -| total_timesteps | 2367744 | -| train/ | | -| approx_kl | 0.11256264 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 184970 | -| policy_gradient_loss | 0.0214 | -| std | 0.00797 | -| value_loss | 1.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18499 | -| time_elapsed | 100085 | -| total_timesteps | 2367872 | -| train/ | | -| approx_kl | 0.040136326 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | 0.00995 | -| n_updates | 184980 | -| policy_gradient_loss | 0.0139 | -| std | 0.00798 | -| value_loss | 9.08e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18500 | -| time_elapsed | 100090 | -| total_timesteps | 2368000 | -| train/ | | -| approx_kl | 0.0016097878 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 184990 | -| policy_gradient_loss | 0.019 | -| std | 0.00797 | -| value_loss | 5.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18501 | -| time_elapsed | 100095 | -| total_timesteps | 2368128 | -| train/ | | -| approx_kl | 0.048904315 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00494 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 185000 | -| policy_gradient_loss | 0.0288 | -| std | 0.00796 | -| value_loss | 3.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18502 | -| time_elapsed | 100106 | -| total_timesteps | 2368256 | -| train/ | | -| approx_kl | 0.025028447 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.808 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 185010 | -| policy_gradient_loss | 0.0141 | -| std | 0.00795 | -| value_loss | 0.00427 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18503 | -| time_elapsed | 100111 | -| total_timesteps | 2368384 | -| train/ | | -| approx_kl | 0.032333385 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.21 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 185020 | -| policy_gradient_loss | 0.0045 | -| std | 0.00795 | -| value_loss | 2.19e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18504 | -| time_elapsed | 100115 | -| total_timesteps | 2368512 | -| train/ | | -| approx_kl | 0.062214494 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00184 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 185030 | -| policy_gradient_loss | -0.000985 | -| std | 0.00795 | -| value_loss | 3.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18505 | -| time_elapsed | 100119 | -| total_timesteps | 2368640 | -| train/ | | -| approx_kl | 0.007967362 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 185040 | -| policy_gradient_loss | 0.000732 | -| std | 0.00795 | -| value_loss | 4.32e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18506 | -| time_elapsed | 100124 | -| total_timesteps | 2368768 | -| train/ | | -| approx_kl | 0.0018328233 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0773 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 185050 | -| policy_gradient_loss | 0.00295 | -| std | 0.00796 | -| value_loss | 2.58e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18507 | -| time_elapsed | 100129 | -| total_timesteps | 2368896 | -| train/ | | -| approx_kl | 0.024170227 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | 0.0505 | -| n_updates | 185060 | -| policy_gradient_loss | 0.0628 | -| std | 0.00796 | -| value_loss | 1.81e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18508 | -| time_elapsed | 100134 | -| total_timesteps | 2369024 | -| train/ | | -| approx_kl | 0.07571865 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 185070 | -| policy_gradient_loss | 0.105 | -| std | 0.00794 | -| value_loss | 1.77e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18509 | -| time_elapsed | 100143 | -| total_timesteps | 2369152 | -| train/ | | -| approx_kl | 0.01330566 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.00895 | -| n_updates | 185080 | -| policy_gradient_loss | -0.0046 | -| std | 0.00793 | -| value_loss | 0.00183 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18510 | -| time_elapsed | 100147 | -| total_timesteps | 2369280 | -| train/ | | -| approx_kl | 0.007195304 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.601 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 185090 | -| policy_gradient_loss | 0.000236 | -| std | 0.00793 | -| value_loss | 1.25e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18511 | -| time_elapsed | 100152 | -| total_timesteps | 2369408 | -| train/ | | -| approx_kl | 0.06001286 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 0.0365 | -| n_updates | 185100 | -| policy_gradient_loss | 0.00907 | -| std | 0.00792 | -| value_loss | 1.58e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18512 | -| time_elapsed | 100156 | -| total_timesteps | 2369536 | -| train/ | | -| approx_kl | 0.027047666 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.847 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 185110 | -| policy_gradient_loss | 0.0265 | -| std | 0.00793 | -| value_loss | 4.06e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18513 | -| time_elapsed | 100160 | -| total_timesteps | 2369664 | -| train/ | | -| approx_kl | 0.07888238 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.0557 | -| n_updates | 185120 | -| policy_gradient_loss | 0.0408 | -| std | 0.00792 | -| value_loss | 2.54e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18514 | -| time_elapsed | 100164 | -| total_timesteps | 2369792 | -| train/ | | -| approx_kl | 0.3345595 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.0652 | -| n_updates | 185130 | -| policy_gradient_loss | 0.000667 | -| std | 0.00792 | -| value_loss | 6.33e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18515 | -| time_elapsed | 100169 | -| total_timesteps | 2369920 | -| train/ | | -| approx_kl | 0.0033656745 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 185140 | -| policy_gradient_loss | 0.0144 | -| std | 0.00792 | -| value_loss | 3.47e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18516 | -| time_elapsed | 100173 | -| total_timesteps | 2370048 | -| train/ | | -| approx_kl | 0.35691643 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 185150 | -| policy_gradient_loss | 0.0378 | -| std | 0.00792 | -| value_loss | 2.76e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18517 | -| time_elapsed | 100183 | -| total_timesteps | 2370176 | -| train/ | | -| approx_kl | 0.014207074 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.94 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 185160 | -| policy_gradient_loss | -0.0149 | -| std | 0.00792 | -| value_loss | 0.000282 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18518 | -| time_elapsed | 100187 | -| total_timesteps | 2370304 | -| train/ | | -| approx_kl | 0.16420302 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0859 | -| n_updates | 185170 | -| policy_gradient_loss | 0.032 | -| std | 0.00792 | -| value_loss | 2.03e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18519 | -| time_elapsed | 100192 | -| total_timesteps | 2370432 | -| train/ | | -| approx_kl | 0.00085490895 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.889 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 185180 | -| policy_gradient_loss | -0.00306 | -| std | 0.00792 | -| value_loss | 5.06e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18520 | -| time_elapsed | 100196 | -| total_timesteps | 2370560 | -| train/ | | -| approx_kl | 0.041767232 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 185190 | -| policy_gradient_loss | 0.0443 | -| std | 0.00792 | -| value_loss | 3.24e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18521 | -| time_elapsed | 100200 | -| total_timesteps | 2370688 | -| train/ | | -| approx_kl | 0.0314845 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00973 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 185200 | -| policy_gradient_loss | 0.0182 | -| std | 0.00792 | -| value_loss | 2.78e-09 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18522 | -| time_elapsed | 100203 | -| total_timesteps | 2370816 | -| train/ | | -| approx_kl | 0.00043063844 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00657 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 185210 | -| policy_gradient_loss | 0.0679 | -| std | 0.00792 | -| value_loss | 1.62e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18523 | -| time_elapsed | 100207 | -| total_timesteps | 2370944 | -| train/ | | -| approx_kl | 0.078351535 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.0815 | -| n_updates | 185220 | -| policy_gradient_loss | 0.124 | -| std | 0.00792 | -| value_loss | 1.23e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18524 | -| time_elapsed | 100212 | -| total_timesteps | 2371072 | -| train/ | | -| approx_kl | 0.064007044 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.00672 | -| n_updates | 185230 | -| policy_gradient_loss | 0.0156 | -| std | 0.00792 | -| value_loss | 1.01e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18525 | -| time_elapsed | 100221 | -| total_timesteps | 2371200 | -| train/ | | -| approx_kl | 0.08576692 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.695 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 185240 | -| policy_gradient_loss | -0.008 | -| std | 0.00792 | -| value_loss | 0.000899 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18526 | -| time_elapsed | 100225 | -| total_timesteps | 2371328 | -| train/ | | -| approx_kl | 0.0074250735 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 185250 | -| policy_gradient_loss | 0.00835 | -| std | 0.00792 | -| value_loss | 7.93e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18527 | -| time_elapsed | 100229 | -| total_timesteps | 2371456 | -| train/ | | -| approx_kl | 0.055391688 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0159 | -| n_updates | 185260 | -| policy_gradient_loss | 0.00473 | -| std | 0.00792 | -| value_loss | 6.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18528 | -| time_elapsed | 100233 | -| total_timesteps | 2371584 | -| train/ | | -| approx_kl | 0.031563383 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 185270 | -| policy_gradient_loss | 0.00758 | -| std | 0.00792 | -| value_loss | 3.13e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18529 | -| time_elapsed | 100238 | -| total_timesteps | 2371712 | -| train/ | | -| approx_kl | 0.01169432 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0888 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 185280 | -| policy_gradient_loss | 0.0364 | -| std | 0.00792 | -| value_loss | 1.66e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18530 | -| time_elapsed | 100244 | -| total_timesteps | 2371840 | -| train/ | | -| approx_kl | 0.1708746 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 185290 | -| policy_gradient_loss | 0.0255 | -| std | 0.00792 | -| value_loss | 1.38e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 18531 | -| time_elapsed | 100249 | -| total_timesteps | 2371968 | -| train/ | | -| approx_kl | 0.063455716 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 185300 | -| policy_gradient_loss | 0.0429 | -| std | 0.00792 | -| value_loss | 1.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18532 | -| time_elapsed | 100253 | -| total_timesteps | 2372096 | -| train/ | | -| approx_kl | 0.14231142 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0676 | -| n_updates | 185310 | -| policy_gradient_loss | 0.0313 | -| std | 0.00792 | -| value_loss | 6.35e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18533 | -| time_elapsed | 100262 | -| total_timesteps | 2372224 | -| train/ | | -| approx_kl | 0.0064850356 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 185320 | -| policy_gradient_loss | 0.0332 | -| std | 0.00792 | -| value_loss | 0.000251 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18534 | -| time_elapsed | 100266 | -| total_timesteps | 2372352 | -| train/ | | -| approx_kl | 0.15285756 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 185330 | -| policy_gradient_loss | 0.149 | -| std | 0.00792 | -| value_loss | 1.57e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18535 | -| time_elapsed | 100271 | -| total_timesteps | 2372480 | -| train/ | | -| approx_kl | 0.0066603078 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00711 | -| learning_rate | 0.0003 | -| loss | 0.00471 | -| n_updates | 185340 | -| policy_gradient_loss | 0.0169 | -| std | 0.00791 | -| value_loss | 2.59e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18536 | -| time_elapsed | 100276 | -| total_timesteps | 2372608 | -| train/ | | -| approx_kl | 0.012516265 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 185350 | -| policy_gradient_loss | 0.0151 | -| std | 0.00791 | -| value_loss | 8.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18537 | -| time_elapsed | 100282 | -| total_timesteps | 2372736 | -| train/ | | -| approx_kl | 0.089872755 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.0632 | -| n_updates | 185360 | -| policy_gradient_loss | 0.0303 | -| std | 0.0079 | -| value_loss | 6.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18538 | -| time_elapsed | 100288 | -| total_timesteps | 2372864 | -| train/ | | -| approx_kl | 0.004736429 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.00726 | -| n_updates | 185370 | -| policy_gradient_loss | 0.00627 | -| std | 0.0079 | -| value_loss | 4.38e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 18539 | -| time_elapsed | 100293 | -| total_timesteps | 2372992 | -| train/ | | -| approx_kl | 0.1097092 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0941 | -| n_updates | 185380 | -| policy_gradient_loss | 0.0871 | -| std | 0.0079 | -| value_loss | 2.58e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18540 | -| time_elapsed | 100298 | -| total_timesteps | 2373120 | -| train/ | | -| approx_kl | 0.021923903 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.00949 | -| n_updates | 185390 | -| policy_gradient_loss | 0.0168 | -| std | 0.0079 | -| value_loss | 1.71e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18541 | -| time_elapsed | 100309 | -| total_timesteps | 2373248 | -| train/ | | -| approx_kl | 0.09233166 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 185400 | -| policy_gradient_loss | -0.0147 | -| std | 0.0079 | -| value_loss | 0.00208 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18542 | -| time_elapsed | 100312 | -| total_timesteps | 2373376 | -| train/ | | -| approx_kl | 0.021829862 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -3.2 | -| learning_rate | 0.0003 | -| loss | -0.00768 | -| n_updates | 185410 | -| policy_gradient_loss | 0.013 | -| std | 0.0079 | -| value_loss | 2.75e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18543 | -| time_elapsed | 100317 | -| total_timesteps | 2373504 | -| train/ | | -| approx_kl | 0.0028144182 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.00355 | -| n_updates | 185420 | -| policy_gradient_loss | 0.0112 | -| std | 0.00791 | -| value_loss | 6.7e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18544 | -| time_elapsed | 100321 | -| total_timesteps | 2373632 | -| train/ | | -| approx_kl | 0.00811464 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.00943 | -| n_updates | 185430 | -| policy_gradient_loss | 0.0188 | -| std | 0.00791 | -| value_loss | 4.05e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18545 | -| time_elapsed | 100326 | -| total_timesteps | 2373760 | -| train/ | | -| approx_kl | 0.08256256 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 185440 | -| policy_gradient_loss | 0.0352 | -| std | 0.00791 | -| value_loss | 2.66e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18546 | -| time_elapsed | 100331 | -| total_timesteps | 2373888 | -| train/ | | -| approx_kl | 0.15124056 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | 0.0934 | -| n_updates | 185450 | -| policy_gradient_loss | 0.0341 | -| std | 0.00791 | -| value_loss | 6.58e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18547 | -| time_elapsed | 100336 | -| total_timesteps | 2374016 | -| train/ | | -| approx_kl | 0.03759363 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.00556 | -| n_updates | 185460 | -| policy_gradient_loss | 0.0597 | -| std | 0.00791 | -| value_loss | 8.64e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18548 | -| time_elapsed | 100347 | -| total_timesteps | 2374144 | -| train/ | | -| approx_kl | 0.029725254 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.00543 | -| n_updates | 185470 | -| policy_gradient_loss | -0.00573 | -| std | 0.0079 | -| value_loss | 0.00154 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18549 | -| time_elapsed | 100354 | -| total_timesteps | 2374272 | -| train/ | | -| approx_kl | 0.09635305 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 185480 | -| policy_gradient_loss | 0.0196 | -| std | 0.00789 | -| value_loss | 1.9e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18550 | -| time_elapsed | 100358 | -| total_timesteps | 2374400 | -| train/ | | -| approx_kl | 0.093176894 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00293 | -| learning_rate | 0.0003 | -| loss | 0.0565 | -| n_updates | 185490 | -| policy_gradient_loss | 0.0384 | -| std | 0.00789 | -| value_loss | 2.72e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18551 | -| time_elapsed | 100363 | -| total_timesteps | 2374528 | -| train/ | | -| approx_kl | 0.10649346 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 185500 | -| policy_gradient_loss | 0.00778 | -| std | 0.00789 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18552 | -| time_elapsed | 100367 | -| total_timesteps | 2374656 | -| train/ | | -| approx_kl | 0.00773419 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.00308 | -| n_updates | 185510 | -| policy_gradient_loss | 0.00852 | -| std | 0.00789 | -| value_loss | 8.87e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18553 | -| time_elapsed | 100372 | -| total_timesteps | 2374784 | -| train/ | | -| approx_kl | 0.13502587 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 185520 | -| policy_gradient_loss | 0.0948 | -| std | 0.0079 | -| value_loss | 1.79e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 18554 | -| time_elapsed | 100377 | -| total_timesteps | 2374912 | -| train/ | | -| approx_kl | 0.40359905 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00065 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 185530 | -| policy_gradient_loss | 0.123 | -| std | 0.00787 | -| value_loss | 0.000313 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18555 | -| time_elapsed | 100383 | -| total_timesteps | 2375040 | -| train/ | | -| approx_kl | 0.16976565 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 185540 | -| policy_gradient_loss | 0.116 | -| std | 0.00786 | -| value_loss | 0.00158 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18556 | -| time_elapsed | 100393 | -| total_timesteps | 2375168 | -| train/ | | -| approx_kl | 0.004518056 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.763 | -| learning_rate | 0.0003 | -| loss | -0.00507 | -| n_updates | 185550 | -| policy_gradient_loss | 0.00819 | -| std | 0.00785 | -| value_loss | 0.00501 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18557 | -| time_elapsed | 100398 | -| total_timesteps | 2375296 | -| train/ | | -| approx_kl | 0.005834993 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.00596 | -| n_updates | 185560 | -| policy_gradient_loss | 0.00703 | -| std | 0.00785 | -| value_loss | 6.65e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18558 | -| time_elapsed | 100402 | -| total_timesteps | 2375424 | -| train/ | | -| approx_kl | 0.05433305 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0523 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 185570 | -| policy_gradient_loss | 0.022 | -| std | 0.00785 | -| value_loss | 4.44e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18559 | -| time_elapsed | 100406 | -| total_timesteps | 2375552 | -| train/ | | -| approx_kl | 0.51037943 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.25 | -| n_updates | 185580 | -| policy_gradient_loss | 0.0636 | -| std | 0.00785 | -| value_loss | 2.95e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18560 | -| time_elapsed | 100412 | -| total_timesteps | 2375680 | -| train/ | | -| approx_kl | 0.009216491 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 185590 | -| policy_gradient_loss | 0.0025 | -| std | 0.00784 | -| value_loss | 1.74e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18561 | -| time_elapsed | 100416 | -| total_timesteps | 2375808 | -| train/ | | -| approx_kl | 0.00038768072 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | 0.00209 | -| n_updates | 185600 | -| policy_gradient_loss | 0.00275 | -| std | 0.00784 | -| value_loss | 1.47e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18562 | -| time_elapsed | 100421 | -| total_timesteps | 2375936 | -| train/ | | -| approx_kl | 0.004396797 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -0.00269 | -| n_updates | 185610 | -| policy_gradient_loss | 0.00386 | -| std | 0.00784 | -| value_loss | 8.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18563 | -| time_elapsed | 100427 | -| total_timesteps | 2376064 | -| train/ | | -| approx_kl | 0.058389675 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.0359 | -| n_updates | 185620 | -| policy_gradient_loss | 0.0143 | -| std | 0.00784 | -| value_loss | 5.65e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18564 | -| time_elapsed | 100436 | -| total_timesteps | 2376192 | -| train/ | | -| approx_kl | 0.0031627757 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 185630 | -| policy_gradient_loss | -0.0176 | -| std | 0.00784 | -| value_loss | 0.000346 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18565 | -| time_elapsed | 100440 | -| total_timesteps | 2376320 | -| train/ | | -| approx_kl | 0.062214717 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 185640 | -| policy_gradient_loss | 0.00305 | -| std | 0.00784 | -| value_loss | 5.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18566 | -| time_elapsed | 100444 | -| total_timesteps | 2376448 | -| train/ | | -| approx_kl | 0.009022071 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.273 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 185650 | -| policy_gradient_loss | 0.0017 | -| std | 0.00784 | -| value_loss | 3.82e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18567 | -| time_elapsed | 100448 | -| total_timesteps | 2376576 | -| train/ | | -| approx_kl | 0.0005387706 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | 0.00621 | -| n_updates | 185660 | -| policy_gradient_loss | 0.00195 | -| std | 0.00784 | -| value_loss | 3.83e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18568 | -| time_elapsed | 100453 | -| total_timesteps | 2376704 | -| train/ | | -| approx_kl | 0.03940463 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 185670 | -| policy_gradient_loss | 0.00781 | -| std | 0.00784 | -| value_loss | 2.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18569 | -| time_elapsed | 100458 | -| total_timesteps | 2376832 | -| train/ | | -| approx_kl | 0.027061362 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.00715 | -| n_updates | 185680 | -| policy_gradient_loss | 0.00355 | -| std | 0.00784 | -| value_loss | 1.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18570 | -| time_elapsed | 100464 | -| total_timesteps | 2376960 | -| train/ | | -| approx_kl | 0.031869605 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 185690 | -| policy_gradient_loss | -0.0119 | -| std | 0.00783 | -| value_loss | 1.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18571 | -| time_elapsed | 100469 | -| total_timesteps | 2377088 | -| train/ | | -| approx_kl | 0.034952395 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 185700 | -| policy_gradient_loss | 0.00765 | -| std | 0.00783 | -| value_loss | 6.79e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18572 | -| time_elapsed | 100479 | -| total_timesteps | 2377216 | -| train/ | | -| approx_kl | 0.029387712 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0748 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 185710 | -| policy_gradient_loss | -0.0114 | -| std | 0.00784 | -| value_loss | 0.00191 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18573 | -| time_elapsed | 100485 | -| total_timesteps | 2377344 | -| train/ | | -| approx_kl | 0.0060951053 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 185720 | -| policy_gradient_loss | 0.0221 | -| std | 0.00784 | -| value_loss | 4.35e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18574 | -| time_elapsed | 100490 | -| total_timesteps | 2377472 | -| train/ | | -| approx_kl | 0.3746069 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00129 | -| learning_rate | 0.0003 | -| loss | 0.26 | -| n_updates | 185730 | -| policy_gradient_loss | 0.161 | -| std | 0.00784 | -| value_loss | 7.15e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18575 | -| time_elapsed | 100495 | -| total_timesteps | 2377600 | -| train/ | | -| approx_kl | 0.11777297 | -| clip_fraction | 0.646 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.0874 | -| n_updates | 185740 | -| policy_gradient_loss | 0.0744 | -| std | 0.00784 | -| value_loss | 3.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18576 | -| time_elapsed | 100499 | -| total_timesteps | 2377728 | -| train/ | | -| approx_kl | 0.112033084 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.0932 | -| n_updates | 185750 | -| policy_gradient_loss | 0.107 | -| std | 0.00784 | -| value_loss | 2.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18577 | -| time_elapsed | 100504 | -| total_timesteps | 2377856 | -| train/ | | -| approx_kl | 0.10323126 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 185760 | -| policy_gradient_loss | 0.108 | -| std | 0.00784 | -| value_loss | 2.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18578 | -| time_elapsed | 100510 | -| total_timesteps | 2377984 | -| train/ | | -| approx_kl | 0.09809503 | -| clip_fraction | 0.671 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 185770 | -| policy_gradient_loss | 0.109 | -| std | 0.00784 | -| value_loss | 1.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18579 | -| time_elapsed | 100514 | -| total_timesteps | 2378112 | -| train/ | | -| approx_kl | 0.08950724 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 185780 | -| policy_gradient_loss | 0.0962 | -| std | 0.00784 | -| value_loss | 1.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18580 | -| time_elapsed | 100527 | -| total_timesteps | 2378240 | -| train/ | | -| approx_kl | 0.027133625 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 185790 | -| policy_gradient_loss | 0.000471 | -| std | 0.00784 | -| value_loss | 0.000395 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18581 | -| time_elapsed | 100532 | -| total_timesteps | 2378368 | -| train/ | | -| approx_kl | 0.08499808 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -6.08 | -| learning_rate | 0.0003 | -| loss | 0.0574 | -| n_updates | 185800 | -| policy_gradient_loss | 0.029 | -| std | 0.00785 | -| value_loss | 1.68e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18582 | -| time_elapsed | 100537 | -| total_timesteps | 2378496 | -| train/ | | -| approx_kl | 0.14364713 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.0935 | -| n_updates | 185810 | -| policy_gradient_loss | 0.0279 | -| std | 0.00785 | -| value_loss | 5.63e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18583 | -| time_elapsed | 100541 | -| total_timesteps | 2378624 | -| train/ | | -| approx_kl | 0.52241683 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0489 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 185820 | -| policy_gradient_loss | 0.0457 | -| std | 0.00786 | -| value_loss | 4.18e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18584 | -| time_elapsed | 100546 | -| total_timesteps | 2378752 | -| train/ | | -| approx_kl | 0.028524164 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 185830 | -| policy_gradient_loss | -0.000769 | -| std | 0.00786 | -| value_loss | 3.01e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 18585 | -| time_elapsed | 100550 | -| total_timesteps | 2378880 | -| train/ | | -| approx_kl | 0.03760308 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | -0.000931 | -| n_updates | 185840 | -| policy_gradient_loss | -0.00104 | -| std | 0.00786 | -| value_loss | 2.11e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18586 | -| time_elapsed | 100555 | -| total_timesteps | 2379008 | -| train/ | | -| approx_kl | 0.033308793 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.00095 | -| n_updates | 185850 | -| policy_gradient_loss | 0.000541 | -| std | 0.00786 | -| value_loss | 1.64e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18587 | -| time_elapsed | 100566 | -| total_timesteps | 2379136 | -| train/ | | -| approx_kl | 0.0023009018 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.953 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 185860 | -| policy_gradient_loss | -0.00606 | -| std | 0.00786 | -| value_loss | 0.000551 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18588 | -| time_elapsed | 100573 | -| total_timesteps | 2379264 | -| train/ | | -| approx_kl | 0.34768695 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.153 | -| learning_rate | 0.0003 | -| loss | 0.0974 | -| n_updates | 185870 | -| policy_gradient_loss | 0.0287 | -| std | 0.00786 | -| value_loss | 8.78e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18589 | -| time_elapsed | 100578 | -| total_timesteps | 2379392 | -| train/ | | -| approx_kl | 0.12761971 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00151 | -| learning_rate | 0.0003 | -| loss | 0.08 | -| n_updates | 185880 | -| policy_gradient_loss | 0.0394 | -| std | 0.0079 | -| value_loss | 6.07e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18590 | -| time_elapsed | 100583 | -| total_timesteps | 2379520 | -| train/ | | -| approx_kl | 0.018159606 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 185890 | -| policy_gradient_loss | 0.0275 | -| std | 0.00792 | -| value_loss | 1.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18591 | -| time_elapsed | 100587 | -| total_timesteps | 2379648 | -| train/ | | -| approx_kl | 0.014685941 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00584 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 185900 | -| policy_gradient_loss | 0.00948 | -| std | 0.00793 | -| value_loss | 3.4e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18592 | -| time_elapsed | 100590 | -| total_timesteps | 2379776 | -| train/ | | -| approx_kl | 0.12539472 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0658 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 185910 | -| policy_gradient_loss | 0.04 | -| std | 0.00793 | -| value_loss | 2.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18593 | -| time_elapsed | 100594 | -| total_timesteps | 2379904 | -| train/ | | -| approx_kl | 0.033456817 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 185920 | -| policy_gradient_loss | 0.0464 | -| std | 0.00793 | -| value_loss | 1.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18594 | -| time_elapsed | 100600 | -| total_timesteps | 2380032 | -| train/ | | -| approx_kl | 0.17790866 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0843 | -| n_updates | 185930 | -| policy_gradient_loss | 0.0302 | -| std | 0.00793 | -| value_loss | 8.78e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18595 | -| time_elapsed | 100611 | -| total_timesteps | 2380160 | -| train/ | | -| approx_kl | 0.026765259 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.863 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 185940 | -| policy_gradient_loss | -0.0161 | -| std | 0.00793 | -| value_loss | 0.00264 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18596 | -| time_elapsed | 100616 | -| total_timesteps | 2380288 | -| train/ | | -| approx_kl | 0.019296793 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 185950 | -| policy_gradient_loss | 0.0415 | -| std | 0.00793 | -| value_loss | 2.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18597 | -| time_elapsed | 100621 | -| total_timesteps | 2380416 | -| train/ | | -| approx_kl | 0.22266367 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00302 | -| learning_rate | 0.0003 | -| loss | 0.086 | -| n_updates | 185960 | -| policy_gradient_loss | 0.0332 | -| std | 0.00793 | -| value_loss | 2.38e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18598 | -| time_elapsed | 100624 | -| total_timesteps | 2380544 | -| train/ | | -| approx_kl | 0.04139032 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 185970 | -| policy_gradient_loss | 0.0504 | -| std | 0.00793 | -| value_loss | 3.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18599 | -| time_elapsed | 100628 | -| total_timesteps | 2380672 | -| train/ | | -| approx_kl | 0.013097944 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | 0.00175 | -| n_updates | 185980 | -| policy_gradient_loss | 0.0179 | -| std | 0.00793 | -| value_loss | 2.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18600 | -| time_elapsed | 100632 | -| total_timesteps | 2380800 | -| train/ | | -| approx_kl | 0.021406926 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | 0.00379 | -| n_updates | 185990 | -| policy_gradient_loss | 0.0341 | -| std | 0.00793 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18601 | -| time_elapsed | 100637 | -| total_timesteps | 2380928 | -| train/ | | -| approx_kl | 0.05209717 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.00938 | -| n_updates | 186000 | -| policy_gradient_loss | 0.00194 | -| std | 0.00793 | -| value_loss | 1.15e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18602 | -| time_elapsed | 100641 | -| total_timesteps | 2381056 | -| train/ | | -| approx_kl | 0.032431986 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.00779 | -| n_updates | 186010 | -| policy_gradient_loss | 0.00375 | -| std | 0.00793 | -| value_loss | 6.01e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18603 | -| time_elapsed | 100651 | -| total_timesteps | 2381184 | -| train/ | | -| approx_kl | 0.0147963185 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -5.87 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 186020 | -| policy_gradient_loss | -0.00934 | -| std | 0.00793 | -| value_loss | 0.00396 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18604 | -| time_elapsed | 100655 | -| total_timesteps | 2381312 | -| train/ | | -| approx_kl | 0.060511313 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 186030 | -| policy_gradient_loss | 0.0434 | -| std | 0.00793 | -| value_loss | 1.61e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18605 | -| time_elapsed | 100660 | -| total_timesteps | 2381440 | -| train/ | | -| approx_kl | 0.022102134 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.000661 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 186040 | -| policy_gradient_loss | 0.00642 | -| std | 0.00793 | -| value_loss | 2.25e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18606 | -| time_elapsed | 100664 | -| total_timesteps | 2381568 | -| train/ | | -| approx_kl | 0.11446629 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 186050 | -| policy_gradient_loss | 0.00644 | -| std | 0.00793 | -| value_loss | 9.55e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18607 | -| time_elapsed | 100669 | -| total_timesteps | 2381696 | -| train/ | | -| approx_kl | 0.04748001 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0982 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 186060 | -| policy_gradient_loss | 0.0337 | -| std | 0.00793 | -| value_loss | 4.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18608 | -| time_elapsed | 100673 | -| total_timesteps | 2381824 | -| train/ | | -| approx_kl | 0.10326967 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 186070 | -| policy_gradient_loss | 0.0283 | -| std | 0.00793 | -| value_loss | 3.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18609 | -| time_elapsed | 100678 | -| total_timesteps | 2381952 | -| train/ | | -| approx_kl | 0.006808879 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0725 | -| learning_rate | 0.0003 | -| loss | 0.00312 | -| n_updates | 186080 | -| policy_gradient_loss | 0.0283 | -| std | 0.00792 | -| value_loss | 7.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18610 | -| time_elapsed | 100683 | -| total_timesteps | 2382080 | -| train/ | | -| approx_kl | 0.33455053 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.348 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 186090 | -| policy_gradient_loss | 0.0412 | -| std | 0.00791 | -| value_loss | 4.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18611 | -| time_elapsed | 100691 | -| total_timesteps | 2382208 | -| train/ | | -| approx_kl | 0.008339694 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 186100 | -| policy_gradient_loss | -0.0069 | -| std | 0.00791 | -| value_loss | 0.00042 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18612 | -| time_elapsed | 100695 | -| total_timesteps | 2382336 | -| train/ | | -| approx_kl | 0.0030398774 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 186110 | -| policy_gradient_loss | 0.000209 | -| std | 0.00791 | -| value_loss | 7.32e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18613 | -| time_elapsed | 100699 | -| total_timesteps | 2382464 | -| train/ | | -| approx_kl | 0.14727704 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 186120 | -| policy_gradient_loss | 0.0212 | -| std | 0.00791 | -| value_loss | 3.42e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18614 | -| time_elapsed | 100702 | -| total_timesteps | 2382592 | -| train/ | | -| approx_kl | 0.0009326022 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.00601 | -| n_updates | 186130 | -| policy_gradient_loss | -0.00646 | -| std | 0.00791 | -| value_loss | 2.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18615 | -| time_elapsed | 100706 | -| total_timesteps | 2382720 | -| train/ | | -| approx_kl | 0.043624613 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0523 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 186140 | -| policy_gradient_loss | 0.0406 | -| std | 0.00792 | -| value_loss | 1.78e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18616 | -| time_elapsed | 100712 | -| total_timesteps | 2382848 | -| train/ | | -| approx_kl | 0.01714386 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 186150 | -| policy_gradient_loss | 0.00929 | -| std | 0.00792 | -| value_loss | 1.4e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18617 | -| time_elapsed | 100716 | -| total_timesteps | 2382976 | -| train/ | | -| approx_kl | 0.09166485 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.0405 | -| n_updates | 186160 | -| policy_gradient_loss | 0.00497 | -| std | 0.00793 | -| value_loss | 1.27e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18618 | -| time_elapsed | 100721 | -| total_timesteps | 2383104 | -| train/ | | -| approx_kl | 0.03878628 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.602 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 186170 | -| policy_gradient_loss | 0.00454 | -| std | 0.00793 | -| value_loss | 5.06e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18619 | -| time_elapsed | 100731 | -| total_timesteps | 2383232 | -| train/ | | -| approx_kl | 0.12546384 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | 0.0888 | -| n_updates | 186180 | -| policy_gradient_loss | 0.0523 | -| std | 0.00794 | -| value_loss | 0.000581 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18620 | -| time_elapsed | 100735 | -| total_timesteps | 2383360 | -| train/ | | -| approx_kl | 0.023431806 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | 0.00655 | -| n_updates | 186190 | -| policy_gradient_loss | 0.0114 | -| std | 0.00794 | -| value_loss | 1.27e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18621 | -| time_elapsed | 100738 | -| total_timesteps | 2383488 | -| train/ | | -| approx_kl | 0.0008630329 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00822 | -| learning_rate | 0.0003 | -| loss | 0.00255 | -| n_updates | 186200 | -| policy_gradient_loss | 0.0196 | -| std | 0.00794 | -| value_loss | 1.58e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18622 | -| time_elapsed | 100743 | -| total_timesteps | 2383616 | -| train/ | | -| approx_kl | 0.14224835 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.0485 | -| n_updates | 186210 | -| policy_gradient_loss | 0.0111 | -| std | 0.00794 | -| value_loss | 3.65e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18623 | -| time_elapsed | 100747 | -| total_timesteps | 2383744 | -| train/ | | -| approx_kl | 0.01103829 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.00505 | -| n_updates | 186220 | -| policy_gradient_loss | 0.0196 | -| std | 0.00795 | -| value_loss | 2.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18624 | -| time_elapsed | 100752 | -| total_timesteps | 2383872 | -| train/ | | -| approx_kl | 0.13888907 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -4.08 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 186230 | -| policy_gradient_loss | 0.0451 | -| std | 0.00795 | -| value_loss | 6.11e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18625 | -| time_elapsed | 100755 | -| total_timesteps | 2384000 | -| train/ | | -| approx_kl | 0.12727526 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0791 | -| n_updates | 186240 | -| policy_gradient_loss | 0.0819 | -| std | 0.00796 | -| value_loss | 1.43e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18626 | -| time_elapsed | 100761 | -| total_timesteps | 2384128 | -| train/ | | -| approx_kl | 0.115140185 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.0043 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 186250 | -| policy_gradient_loss | 0.12 | -| std | 0.00796 | -| value_loss | 9.17e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18627 | -| time_elapsed | 100771 | -| total_timesteps | 2384256 | -| train/ | | -| approx_kl | 0.06682778 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.756 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 186260 | -| policy_gradient_loss | 0.0615 | -| std | 0.00796 | -| value_loss | 0.00608 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18628 | -| time_elapsed | 100775 | -| total_timesteps | 2384384 | -| train/ | | -| approx_kl | 0.07315376 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | 0.0546 | -| n_updates | 186270 | -| policy_gradient_loss | 0.0904 | -| std | 0.00796 | -| value_loss | 2.9e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18629 | -| time_elapsed | 100779 | -| total_timesteps | 2384512 | -| train/ | | -| approx_kl | 0.019449048 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00745 | -| learning_rate | 0.0003 | -| loss | 0.000633 | -| n_updates | 186280 | -| policy_gradient_loss | 0.0199 | -| std | 0.00796 | -| value_loss | 5.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18630 | -| time_elapsed | 100781 | -| total_timesteps | 2384640 | -| train/ | | -| approx_kl | 0.028939236 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 186290 | -| policy_gradient_loss | -0.00732 | -| std | 0.00796 | -| value_loss | 3.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18631 | -| time_elapsed | 100786 | -| total_timesteps | 2384768 | -| train/ | | -| approx_kl | 0.089903876 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 186300 | -| policy_gradient_loss | 0.0997 | -| std | 0.00795 | -| value_loss | 1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 18632 | -| time_elapsed | 100790 | -| total_timesteps | 2384896 | -| train/ | | -| approx_kl | 0.06549386 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | 0.0442 | -| n_updates | 186310 | -| policy_gradient_loss | 0.0656 | -| std | 0.00795 | -| value_loss | 5.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18633 | -| time_elapsed | 100796 | -| total_timesteps | 2385024 | -| train/ | | -| approx_kl | 0.09973214 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | 0.067 | -| n_updates | 186320 | -| policy_gradient_loss | 0.0937 | -| std | 0.00796 | -| value_loss | 3.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18634 | -| time_elapsed | 100808 | -| total_timesteps | 2385152 | -| train/ | | -| approx_kl | 0.14011288 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.823 | -| learning_rate | 0.0003 | -| loss | 0.0521 | -| n_updates | 186330 | -| policy_gradient_loss | 0.048 | -| std | 0.00796 | -| value_loss | 0.00376 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18635 | -| time_elapsed | 100813 | -| total_timesteps | 2385280 | -| train/ | | -| approx_kl | 0.045602366 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 186340 | -| policy_gradient_loss | 0.0234 | -| std | 0.00795 | -| value_loss | 4.37e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18636 | -| time_elapsed | 100818 | -| total_timesteps | 2385408 | -| train/ | | -| approx_kl | 0.4908939 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.275 | -| learning_rate | 0.0003 | -| loss | 0.201 | -| n_updates | 186350 | -| policy_gradient_loss | 0.0507 | -| std | 0.00794 | -| value_loss | 4.77e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18637 | -| time_elapsed | 100823 | -| total_timesteps | 2385536 | -| train/ | | -| approx_kl | 0.01004665 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0708 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 186360 | -| policy_gradient_loss | 0.00334 | -| std | 0.00794 | -| value_loss | 5.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18638 | -| time_elapsed | 100828 | -| total_timesteps | 2385664 | -| train/ | | -| approx_kl | 0.002058453 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 186370 | -| policy_gradient_loss | 0.00373 | -| std | 0.00794 | -| value_loss | 1.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18639 | -| time_elapsed | 100833 | -| total_timesteps | 2385792 | -| train/ | | -| approx_kl | 0.05775606 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 186380 | -| policy_gradient_loss | 0.00414 | -| std | 0.00794 | -| value_loss | 4.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18640 | -| time_elapsed | 100838 | -| total_timesteps | 2385920 | -| train/ | | -| approx_kl | 0.030248981 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00659 | -| n_updates | 186390 | -| policy_gradient_loss | 0.0247 | -| std | 0.00794 | -| value_loss | 1.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18641 | -| time_elapsed | 100843 | -| total_timesteps | 2386048 | -| train/ | | -| approx_kl | 0.08435224 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.0911 | -| n_updates | 186400 | -| policy_gradient_loss | 0.0409 | -| std | 0.00795 | -| value_loss | 9.53e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18642 | -| time_elapsed | 100853 | -| total_timesteps | 2386176 | -| train/ | | -| approx_kl | 0.035676558 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 186410 | -| policy_gradient_loss | -0.0125 | -| std | 0.00795 | -| value_loss | 0.00413 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18643 | -| time_elapsed | 100859 | -| total_timesteps | 2386304 | -| train/ | | -| approx_kl | 0.12001915 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 186420 | -| policy_gradient_loss | 0.104 | -| std | 0.00795 | -| value_loss | 1.66e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18644 | -| time_elapsed | 100863 | -| total_timesteps | 2386432 | -| train/ | | -| approx_kl | 0.028455641 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00704 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 186430 | -| policy_gradient_loss | 0.0205 | -| std | 0.00795 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18645 | -| time_elapsed | 100868 | -| total_timesteps | 2386560 | -| train/ | | -| approx_kl | 0.030669043 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | -0.00904 | -| n_updates | 186440 | -| policy_gradient_loss | -0.00096 | -| std | 0.00795 | -| value_loss | 3.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18646 | -| time_elapsed | 100872 | -| total_timesteps | 2386688 | -| train/ | | -| approx_kl | 0.01076475 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 186450 | -| policy_gradient_loss | 0.0152 | -| std | 0.00795 | -| value_loss | 7.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18647 | -| time_elapsed | 100877 | -| total_timesteps | 2386816 | -| train/ | | -| approx_kl | 0.038652215 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 186460 | -| policy_gradient_loss | 0.00292 | -| std | 0.00795 | -| value_loss | 1.8e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18648 | -| time_elapsed | 100882 | -| total_timesteps | 2386944 | -| train/ | | -| approx_kl | 0.0012663449 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 186470 | -| policy_gradient_loss | 0.014 | -| std | 0.00795 | -| value_loss | 1.03e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18649 | -| time_elapsed | 100886 | -| total_timesteps | 2387072 | -| train/ | | -| approx_kl | 0.10438261 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 186480 | -| policy_gradient_loss | 0.0089 | -| std | 0.00794 | -| value_loss | 8.07e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18650 | -| time_elapsed | 100895 | -| total_timesteps | 2387200 | -| train/ | | -| approx_kl | 0.003380837 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 186490 | -| policy_gradient_loss | 0.00268 | -| std | 0.00794 | -| value_loss | 0.000515 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18651 | -| time_elapsed | 100899 | -| total_timesteps | 2387328 | -| train/ | | -| approx_kl | 0.030328186 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 186500 | -| policy_gradient_loss | 0.014 | -| std | 0.00794 | -| value_loss | 1.47e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18652 | -| time_elapsed | 100905 | -| total_timesteps | 2387456 | -| train/ | | -| approx_kl | 0.0016548708 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00828 | -| n_updates | 186510 | -| policy_gradient_loss | 0.0011 | -| std | 0.00794 | -| value_loss | 7.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18653 | -| time_elapsed | 100910 | -| total_timesteps | 2387584 | -| train/ | | -| approx_kl | 0.032017928 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 186520 | -| policy_gradient_loss | 0.0148 | -| std | 0.00794 | -| value_loss | 4.86e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18654 | -| time_elapsed | 100915 | -| total_timesteps | 2387712 | -| train/ | | -| approx_kl | 0.3509637 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 186530 | -| policy_gradient_loss | 0.0344 | -| std | 0.00794 | -| value_loss | 1.91e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18655 | -| time_elapsed | 100920 | -| total_timesteps | 2387840 | -| train/ | | -| approx_kl | 0.007756786 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.061 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 186540 | -| policy_gradient_loss | 0.00251 | -| std | 0.00794 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18656 | -| time_elapsed | 100925 | -| total_timesteps | 2387968 | -| train/ | | -| approx_kl | 0.049235713 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.00617 | -| n_updates | 186550 | -| policy_gradient_loss | -3.36e-06 | -| std | 0.00794 | -| value_loss | 9.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18657 | -| time_elapsed | 100930 | -| total_timesteps | 2388096 | -| train/ | | -| approx_kl | 0.030432716 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.0092 | -| n_updates | 186560 | -| policy_gradient_loss | -0.00349 | -| std | 0.00794 | -| value_loss | 6.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18658 | -| time_elapsed | 100941 | -| total_timesteps | 2388224 | -| train/ | | -| approx_kl | 0.059719685 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 186570 | -| policy_gradient_loss | -0.0158 | -| std | 0.00794 | -| value_loss | 7.75e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18659 | -| time_elapsed | 100946 | -| total_timesteps | 2388352 | -| train/ | | -| approx_kl | 0.0011770711 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00895 | -| learning_rate | 0.0003 | -| loss | -0.00393 | -| n_updates | 186580 | -| policy_gradient_loss | 0.00176 | -| std | 0.00794 | -| value_loss | 7.22e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18660 | -| time_elapsed | 100951 | -| total_timesteps | 2388480 | -| train/ | | -| approx_kl | 0.008494657 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 186590 | -| policy_gradient_loss | 0.00266 | -| std | 0.00795 | -| value_loss | 2.47e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18661 | -| time_elapsed | 100956 | -| total_timesteps | 2388608 | -| train/ | | -| approx_kl | 0.0013290998 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 186600 | -| policy_gradient_loss | 0.00544 | -| std | 0.00794 | -| value_loss | 2.02e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18662 | -| time_elapsed | 100960 | -| total_timesteps | 2388736 | -| train/ | | -| approx_kl | 0.038707092 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 186610 | -| policy_gradient_loss | 0.0093 | -| std | 0.00794 | -| value_loss | 5.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18663 | -| time_elapsed | 100964 | -| total_timesteps | 2388864 | -| train/ | | -| approx_kl | 0.010178328 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0499 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 186620 | -| policy_gradient_loss | -0.0024 | -| std | 0.00795 | -| value_loss | 8.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18664 | -| time_elapsed | 100969 | -| total_timesteps | 2388992 | -| train/ | | -| approx_kl | 0.008369939 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | -0.00506 | -| n_updates | 186630 | -| policy_gradient_loss | -0.00258 | -| std | 0.00795 | -| value_loss | 8.53e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18665 | -| time_elapsed | 100973 | -| total_timesteps | 2389120 | -| train/ | | -| approx_kl | 0.01672149 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 186640 | -| policy_gradient_loss | 0.0144 | -| std | 0.00795 | -| value_loss | 8.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18666 | -| time_elapsed | 100986 | -| total_timesteps | 2389248 | -| train/ | | -| approx_kl | 0.055893358 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.213 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 186650 | -| policy_gradient_loss | -0.00588 | -| std | 0.00795 | -| value_loss | 0.00166 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18667 | -| time_elapsed | 100991 | -| total_timesteps | 2389376 | -| train/ | | -| approx_kl | 0.037611205 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -66.7 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 186660 | -| policy_gradient_loss | 0.00217 | -| std | 0.00795 | -| value_loss | 3.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18668 | -| time_elapsed | 100997 | -| total_timesteps | 2389504 | -| train/ | | -| approx_kl | 0.034287617 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 186670 | -| policy_gradient_loss | 0.0035 | -| std | 0.00793 | -| value_loss | 7.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18669 | -| time_elapsed | 101001 | -| total_timesteps | 2389632 | -| train/ | | -| approx_kl | 0.038000647 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00279 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 186680 | -| policy_gradient_loss | 0.00606 | -| std | 0.00792 | -| value_loss | 9.34e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18670 | -| time_elapsed | 101006 | -| total_timesteps | 2389760 | -| train/ | | -| approx_kl | 0.03570834 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 186690 | -| policy_gradient_loss | 0.0116 | -| std | 0.00792 | -| value_loss | 1.88e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 18671 | -| time_elapsed | 101011 | -| total_timesteps | 2389888 | -| train/ | | -| approx_kl | 0.015680062 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.00175 | -| n_updates | 186700 | -| policy_gradient_loss | 0.0541 | -| std | 0.00792 | -| value_loss | 1.06e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18672 | -| time_elapsed | 101015 | -| total_timesteps | 2390016 | -| train/ | | -| approx_kl | 0.1897051 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 186710 | -| policy_gradient_loss | 0.0192 | -| std | 0.00792 | -| value_loss | 9.25e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18673 | -| time_elapsed | 101025 | -| total_timesteps | 2390144 | -| train/ | | -| approx_kl | 0.018215768 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 186720 | -| policy_gradient_loss | 0.0195 | -| std | 0.00792 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18674 | -| time_elapsed | 101029 | -| total_timesteps | 2390272 | -| train/ | | -| approx_kl | 0.018834073 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.0423 | -| learning_rate | 0.0003 | -| loss | -0.00885 | -| n_updates | 186730 | -| policy_gradient_loss | -0.00406 | -| std | 0.00791 | -| value_loss | 5.15e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18675 | -| time_elapsed | 101033 | -| total_timesteps | 2390400 | -| train/ | | -| approx_kl | 0.00082792155 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 186740 | -| policy_gradient_loss | 0.00331 | -| std | 0.00789 | -| value_loss | 8.44e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18676 | -| time_elapsed | 101038 | -| total_timesteps | 2390528 | -| train/ | | -| approx_kl | 0.00044810586 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.806 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 186750 | -| policy_gradient_loss | 0.00609 | -| std | 0.00788 | -| value_loss | 4.71e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18677 | -| time_elapsed | 101043 | -| total_timesteps | 2390656 | -| train/ | | -| approx_kl | 2.4652109e-05 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.302 | -| learning_rate | 0.0003 | -| loss | -0.000195 | -| n_updates | 186760 | -| policy_gradient_loss | 0.00359 | -| std | 0.00788 | -| value_loss | 2.62e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18678 | -| time_elapsed | 101047 | -| total_timesteps | 2390784 | -| train/ | | -| approx_kl | 0.00015132362 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 186770 | -| policy_gradient_loss | -0.00165 | -| std | 0.00788 | -| value_loss | 2.39e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18679 | -| time_elapsed | 101051 | -| total_timesteps | 2390912 | -| train/ | | -| approx_kl | 8.902885e-05 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.000755 | -| n_updates | 186780 | -| policy_gradient_loss | 0.00543 | -| std | 0.00788 | -| value_loss | 1.09e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18680 | -| time_elapsed | 101055 | -| total_timesteps | 2391040 | -| train/ | | -| approx_kl | 0.00011929497 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0549 | -| learning_rate | 0.0003 | -| loss | -0.000672 | -| n_updates | 186790 | -| policy_gradient_loss | 0.00881 | -| std | 0.00788 | -| value_loss | 6.83e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18681 | -| time_elapsed | 101068 | -| total_timesteps | 2391168 | -| train/ | | -| approx_kl | 0.015559617 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 186800 | -| policy_gradient_loss | -0.0138 | -| std | 0.00788 | -| value_loss | 0.00142 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18682 | -| time_elapsed | 101074 | -| total_timesteps | 2391296 | -| train/ | | -| approx_kl | 0.0037579178 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0946 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 186810 | -| policy_gradient_loss | 0.00659 | -| std | 0.00788 | -| value_loss | 0.000524 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18683 | -| time_elapsed | 101079 | -| total_timesteps | 2391424 | -| train/ | | -| approx_kl | 0.00014392566 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.861 | -| learning_rate | 0.0003 | -| loss | 1.76e-05 | -| n_updates | 186820 | -| policy_gradient_loss | 0.00609 | -| std | 0.00788 | -| value_loss | 2.38e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18684 | -| time_elapsed | 101084 | -| total_timesteps | 2391552 | -| train/ | | -| approx_kl | 0.00046995003 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00069 | -| learning_rate | 0.0003 | -| loss | -0.000607 | -| n_updates | 186830 | -| policy_gradient_loss | 0.00781 | -| std | 0.00788 | -| value_loss | 9.99e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18685 | -| time_elapsed | 101090 | -| total_timesteps | 2391680 | -| train/ | | -| approx_kl | 0.039152384 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.676 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 186840 | -| policy_gradient_loss | 0.0358 | -| std | 0.00789 | -| value_loss | 6.92e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18686 | -| time_elapsed | 101094 | -| total_timesteps | 2391808 | -| train/ | | -| approx_kl | 3.3993274e-07 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | -2.47e-05 | -| n_updates | 186850 | -| policy_gradient_loss | 0.069 | -| std | 0.00789 | -| value_loss | 2.1e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18687 | -| time_elapsed | 101099 | -| total_timesteps | 2391936 | -| train/ | | -| approx_kl | 0.025981348 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 186860 | -| policy_gradient_loss | 0.02 | -| std | 0.00789 | -| value_loss | 2.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18688 | -| time_elapsed | 101104 | -| total_timesteps | 2392064 | -| train/ | | -| approx_kl | 0.024248492 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.00915 | -| n_updates | 186870 | -| policy_gradient_loss | 0.0191 | -| std | 0.00789 | -| value_loss | 2.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18689 | -| time_elapsed | 101114 | -| total_timesteps | 2392192 | -| train/ | | -| approx_kl | 0.02442906 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 186880 | -| policy_gradient_loss | -0.00739 | -| std | 0.00789 | -| value_loss | 0.000133 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18690 | -| time_elapsed | 101119 | -| total_timesteps | 2392320 | -| train/ | | -| approx_kl | 0.1281423 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | 0.0411 | -| n_updates | 186890 | -| policy_gradient_loss | 0.0103 | -| std | 0.00789 | -| value_loss | 1.52e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18691 | -| time_elapsed | 101123 | -| total_timesteps | 2392448 | -| train/ | | -| approx_kl | 0.11460362 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | 0.0428 | -| n_updates | 186900 | -| policy_gradient_loss | 0.0196 | -| std | 0.00789 | -| value_loss | 3.98e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18692 | -| time_elapsed | 101127 | -| total_timesteps | 2392576 | -| train/ | | -| approx_kl | 0.0664758 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | 0.00749 | -| n_updates | 186910 | -| policy_gradient_loss | 0.00896 | -| std | 0.00788 | -| value_loss | 1.9e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18693 | -| time_elapsed | 101132 | -| total_timesteps | 2392704 | -| train/ | | -| approx_kl | 0.10093341 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.000239 | -| learning_rate | 0.0003 | -| loss | 0.0784 | -| n_updates | 186920 | -| policy_gradient_loss | 0.0316 | -| std | 0.00788 | -| value_loss | 6.97e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18694 | -| time_elapsed | 101135 | -| total_timesteps | 2392832 | -| train/ | | -| approx_kl | 0.028315675 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00537 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 186930 | -| policy_gradient_loss | 0.00166 | -| std | 0.00788 | -| value_loss | 3.3e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18695 | -| time_elapsed | 101139 | -| total_timesteps | 2392960 | -| train/ | | -| approx_kl | 0.0014832402 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00676 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 186940 | -| policy_gradient_loss | 0.0187 | -| std | 0.00788 | -| value_loss | 1.11e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18696 | -| time_elapsed | 101143 | -| total_timesteps | 2393088 | -| train/ | | -| approx_kl | 0.13463952 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | 0.0631 | -| n_updates | 186950 | -| policy_gradient_loss | 0.0125 | -| std | 0.00787 | -| value_loss | 1.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18697 | -| time_elapsed | 101150 | -| total_timesteps | 2393216 | -| train/ | | -| approx_kl | 0.047605418 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -6.34 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 186960 | -| policy_gradient_loss | -0.0141 | -| std | 0.00787 | -| value_loss | 0.00427 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18698 | -| time_elapsed | 101154 | -| total_timesteps | 2393344 | -| train/ | | -| approx_kl | 0.11544353 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 186970 | -| policy_gradient_loss | 0.0339 | -| std | 0.00787 | -| value_loss | 1.07e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18699 | -| time_elapsed | 101159 | -| total_timesteps | 2393472 | -| train/ | | -| approx_kl | 0.29561788 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00349 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 186980 | -| policy_gradient_loss | 0.119 | -| std | 0.00787 | -| value_loss | 8.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18700 | -| time_elapsed | 101165 | -| total_timesteps | 2393600 | -| train/ | | -| approx_kl | 0.12408347 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 186990 | -| policy_gradient_loss | 0.11 | -| std | 0.00787 | -| value_loss | 6.14e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18701 | -| time_elapsed | 101169 | -| total_timesteps | 2393728 | -| train/ | | -| approx_kl | 0.11443867 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0841 | -| n_updates | 187000 | -| policy_gradient_loss | 0.111 | -| std | 0.00787 | -| value_loss | 7.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18702 | -| time_elapsed | 101177 | -| total_timesteps | 2393856 | -| train/ | | -| approx_kl | 0.08459966 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 187010 | -| policy_gradient_loss | 0.107 | -| std | 0.00787 | -| value_loss | 1.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 18703 | -| time_elapsed | 101182 | -| total_timesteps | 2393984 | -| train/ | | -| approx_kl | 0.020761777 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.00288 | -| n_updates | 187020 | -| policy_gradient_loss | 0.0113 | -| std | 0.00788 | -| value_loss | 3.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18704 | -| time_elapsed | 101187 | -| total_timesteps | 2394112 | -| train/ | | -| approx_kl | 0.43740058 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 187030 | -| policy_gradient_loss | 0.051 | -| std | 0.00788 | -| value_loss | 6.65e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18705 | -| time_elapsed | 101198 | -| total_timesteps | 2394240 | -| train/ | | -| approx_kl | 0.023101583 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 187040 | -| policy_gradient_loss | -0.0141 | -| std | 0.00787 | -| value_loss | 7.4e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18706 | -| time_elapsed | 101202 | -| total_timesteps | 2394368 | -| train/ | | -| approx_kl | 4.484318e-06 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | -4.03e-05 | -| n_updates | 187050 | -| policy_gradient_loss | 0.00137 | -| std | 0.00787 | -| value_loss | 1.41e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18707 | -| time_elapsed | 101207 | -| total_timesteps | 2394496 | -| train/ | | -| approx_kl | 0.00021320861 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 187060 | -| policy_gradient_loss | -0.000125 | -| std | 0.00788 | -| value_loss | 4.67e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18708 | -| time_elapsed | 101212 | -| total_timesteps | 2394624 | -| train/ | | -| approx_kl | 0.0060986476 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | -0.00864 | -| n_updates | 187070 | -| policy_gradient_loss | 0.00273 | -| std | 0.00788 | -| value_loss | 2.39e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18709 | -| time_elapsed | 101218 | -| total_timesteps | 2394752 | -| train/ | | -| approx_kl | 0.06322047 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00361 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 187080 | -| policy_gradient_loss | 0.00157 | -| std | 0.00788 | -| value_loss | 5.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 18710 | -| time_elapsed | 101221 | -| total_timesteps | 2394880 | -| train/ | | -| approx_kl | 0.033934623 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 187090 | -| policy_gradient_loss | -0.000685 | -| std | 0.00788 | -| value_loss | 1.17e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18711 | -| time_elapsed | 101226 | -| total_timesteps | 2395008 | -| train/ | | -| approx_kl | 3.504008e-05 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | -0.000985 | -| n_updates | 187100 | -| policy_gradient_loss | 0.00215 | -| std | 0.00788 | -| value_loss | 8.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18712 | -| time_elapsed | 101238 | -| total_timesteps | 2395136 | -| train/ | | -| approx_kl | 0.047767695 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.00201 | -| n_updates | 187110 | -| policy_gradient_loss | 0.00102 | -| std | 0.00788 | -| value_loss | 0.00012 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18713 | -| time_elapsed | 101242 | -| total_timesteps | 2395264 | -| train/ | | -| approx_kl | 0.035958797 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.0645 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 187120 | -| policy_gradient_loss | 0.00534 | -| std | 0.00788 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18714 | -| time_elapsed | 101247 | -| total_timesteps | 2395392 | -| train/ | | -| approx_kl | 0.0051566497 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 187130 | -| policy_gradient_loss | 0.00273 | -| std | 0.00788 | -| value_loss | 1.12e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18715 | -| time_elapsed | 101251 | -| total_timesteps | 2395520 | -| train/ | | -| approx_kl | 0.03998703 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00246 | -| learning_rate | 0.0003 | -| loss | 0.00822 | -| n_updates | 187140 | -| policy_gradient_loss | 0.000784 | -| std | 0.00788 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18716 | -| time_elapsed | 101254 | -| total_timesteps | 2395648 | -| train/ | | -| approx_kl | 0.009457726 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 187150 | -| policy_gradient_loss | 0.00333 | -| std | 0.00788 | -| value_loss | 5.16e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18717 | -| time_elapsed | 101256 | -| total_timesteps | 2395776 | -| train/ | | -| approx_kl | 0.00040772697 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.000588 | -| n_updates | 187160 | -| policy_gradient_loss | 0.00641 | -| std | 0.00788 | -| value_loss | 2.98e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 18718 | -| time_elapsed | 101261 | -| total_timesteps | 2395904 | -| train/ | | -| approx_kl | 0.042005803 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | 0.00932 | -| n_updates | 187170 | -| policy_gradient_loss | 0.00351 | -| std | 0.00788 | -| value_loss | 3.23e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18719 | -| time_elapsed | 101266 | -| total_timesteps | 2396032 | -| train/ | | -| approx_kl | 0.036431648 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 187180 | -| policy_gradient_loss | 0.00671 | -| std | 0.00788 | -| value_loss | 1.66e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18720 | -| time_elapsed | 101276 | -| total_timesteps | 2396160 | -| train/ | | -| approx_kl | 0.0033776998 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.815 | -| learning_rate | 0.0003 | -| loss | -0.00906 | -| n_updates | 187190 | -| policy_gradient_loss | 8.43e-05 | -| std | 0.00788 | -| value_loss | 0.00105 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18721 | -| time_elapsed | 101282 | -| total_timesteps | 2396288 | -| train/ | | -| approx_kl | 0.08903333 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 187200 | -| policy_gradient_loss | 0.00635 | -| std | 0.00788 | -| value_loss | 4.35e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18722 | -| time_elapsed | 101286 | -| total_timesteps | 2396416 | -| train/ | | -| approx_kl | 0.17311585 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -2.39 | -| learning_rate | 0.0003 | -| loss | 0.0436 | -| n_updates | 187210 | -| policy_gradient_loss | 0.0278 | -| std | 0.00787 | -| value_loss | 1.95e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18723 | -| time_elapsed | 101291 | -| total_timesteps | 2396544 | -| train/ | | -| approx_kl | 0.0010087136 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 187220 | -| policy_gradient_loss | 0.00198 | -| std | 0.00787 | -| value_loss | 5.72e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18724 | -| time_elapsed | 101294 | -| total_timesteps | 2396672 | -| train/ | | -| approx_kl | 0.04639833 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.084 | -| learning_rate | 0.0003 | -| loss | 0.00699 | -| n_updates | 187230 | -| policy_gradient_loss | 0.0333 | -| std | 0.00787 | -| value_loss | 3.8e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18725 | -| time_elapsed | 101300 | -| total_timesteps | 2396800 | -| train/ | | -| approx_kl | 0.17524408 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.0528 | -| n_updates | 187240 | -| policy_gradient_loss | 0.0339 | -| std | 0.00788 | -| value_loss | 2.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18726 | -| time_elapsed | 101304 | -| total_timesteps | 2396928 | -| train/ | | -| approx_kl | 0.044851802 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.0279 | -| n_updates | 187250 | -| policy_gradient_loss | 0.0505 | -| std | 0.00789 | -| value_loss | 1.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18727 | -| time_elapsed | 101309 | -| total_timesteps | 2397056 | -| train/ | | -| approx_kl | 0.012651917 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -5.27 | -| learning_rate | 0.0003 | -| loss | -0.00834 | -| n_updates | 187260 | -| policy_gradient_loss | -0.00173 | -| std | 0.00789 | -| value_loss | 2e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18728 | -| time_elapsed | 101318 | -| total_timesteps | 2397184 | -| train/ | | -| approx_kl | 0.1941521 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.923 | -| learning_rate | 0.0003 | -| loss | 0.0461 | -| n_updates | 187270 | -| policy_gradient_loss | 0.0124 | -| std | 0.00789 | -| value_loss | 0.00233 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18729 | -| time_elapsed | 101324 | -| total_timesteps | 2397312 | -| train/ | | -| approx_kl | 0.040450882 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 187280 | -| policy_gradient_loss | 0.0475 | -| std | 0.0079 | -| value_loss | 5.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18730 | -| time_elapsed | 101329 | -| total_timesteps | 2397440 | -| train/ | | -| approx_kl | 0.013376484 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00419 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 187290 | -| policy_gradient_loss | 0.00943 | -| std | 0.0079 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18731 | -| time_elapsed | 101334 | -| total_timesteps | 2397568 | -| train/ | | -| approx_kl | 0.022434106 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.00624 | -| n_updates | 187300 | -| policy_gradient_loss | 0.047 | -| std | 0.0079 | -| value_loss | 4.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18732 | -| time_elapsed | 101339 | -| total_timesteps | 2397696 | -| train/ | | -| approx_kl | 0.0033705742 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | -0.000854 | -| n_updates | 187310 | -| policy_gradient_loss | 0.0683 | -| std | 0.0079 | -| value_loss | 2.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18733 | -| time_elapsed | 101344 | -| total_timesteps | 2397824 | -| train/ | | -| approx_kl | 0.005696604 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 187320 | -| policy_gradient_loss | 0.013 | -| std | 0.0079 | -| value_loss | 4.06e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18734 | -| time_elapsed | 101349 | -| total_timesteps | 2397952 | -| train/ | | -| approx_kl | 0.05612502 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0399 | -| n_updates | 187330 | -| policy_gradient_loss | 0.0339 | -| std | 0.00789 | -| value_loss | 3e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18735 | -| time_elapsed | 101353 | -| total_timesteps | 2398080 | -| train/ | | -| approx_kl | 0.24425521 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00468 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 187340 | -| policy_gradient_loss | 0.0878 | -| std | 0.00789 | -| value_loss | 1.3e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18736 | -| time_elapsed | 101364 | -| total_timesteps | 2398208 | -| train/ | | -| approx_kl | 0.0015245117 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 187350 | -| policy_gradient_loss | 0.0054 | -| std | 0.00789 | -| value_loss | 0.000436 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18737 | -| time_elapsed | 101368 | -| total_timesteps | 2398336 | -| train/ | | -| approx_kl | 0.13300063 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.83 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 187360 | -| policy_gradient_loss | 0.0372 | -| std | 0.00789 | -| value_loss | 4.11e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18738 | -| time_elapsed | 101373 | -| total_timesteps | 2398464 | -| train/ | | -| approx_kl | 0.00028970325 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00672 | -| learning_rate | 0.0003 | -| loss | -0.0009 | -| n_updates | 187370 | -| policy_gradient_loss | 0.00345 | -| std | 0.00788 | -| value_loss | 1.1e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18739 | -| time_elapsed | 101377 | -| total_timesteps | 2398592 | -| train/ | | -| approx_kl | 0.01651353 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -2.11 | -| learning_rate | 0.0003 | -| loss | -0.00412 | -| n_updates | 187380 | -| policy_gradient_loss | -0.00322 | -| std | 0.00788 | -| value_loss | 2.73e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18740 | -| time_elapsed | 101382 | -| total_timesteps | 2398720 | -| train/ | | -| approx_kl | 0.010571957 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00974 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 187390 | -| policy_gradient_loss | -0.00376 | -| std | 0.00788 | -| value_loss | 3.67e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18741 | -| time_elapsed | 101387 | -| total_timesteps | 2398848 | -| train/ | | -| approx_kl | 0.0149394935 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 187400 | -| policy_gradient_loss | 0.0136 | -| std | 0.00788 | -| value_loss | 3.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 18742 | -| time_elapsed | 101391 | -| total_timesteps | 2398976 | -| train/ | | -| approx_kl | 0.065826885 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00556 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 187410 | -| policy_gradient_loss | 0.0121 | -| std | 0.00789 | -| value_loss | 5.68e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18743 | -| time_elapsed | 101396 | -| total_timesteps | 2399104 | -| train/ | | -| approx_kl | 0.0046878317 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.00234 | -| n_updates | 187420 | -| policy_gradient_loss | 0.00454 | -| std | 0.00789 | -| value_loss | 4.09e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18744 | -| time_elapsed | 101408 | -| total_timesteps | 2399232 | -| train/ | | -| approx_kl | 0.2119858 | -| clip_fraction | 0.664 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -5.75 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 187430 | -| policy_gradient_loss | 0.0179 | -| std | 0.00789 | -| value_loss | 0.00353 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18745 | -| time_elapsed | 101413 | -| total_timesteps | 2399360 | -| train/ | | -| approx_kl | 0.15115665 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 187440 | -| policy_gradient_loss | 0.11 | -| std | 0.0079 | -| value_loss | 4.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18746 | -| time_elapsed | 101418 | -| total_timesteps | 2399488 | -| train/ | | -| approx_kl | 0.11308944 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00226 | -| learning_rate | 0.0003 | -| loss | 0.0846 | -| n_updates | 187450 | -| policy_gradient_loss | 0.113 | -| std | 0.0079 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18747 | -| time_elapsed | 101424 | -| total_timesteps | 2399616 | -| train/ | | -| approx_kl | 0.023776744 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.00263 | -| n_updates | 187460 | -| policy_gradient_loss | 0.0118 | -| std | 0.0079 | -| value_loss | 5.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18748 | -| time_elapsed | 101430 | -| total_timesteps | 2399744 | -| train/ | | -| approx_kl | 0.12156543 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0437 | -| n_updates | 187470 | -| policy_gradient_loss | 0.0105 | -| std | 0.0079 | -| value_loss | 3.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 18749 | -| time_elapsed | 101436 | -| total_timesteps | 2399872 | -| train/ | | -| approx_kl | 0.010005092 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0542 | -| learning_rate | 0.0003 | -| loss | 0.000192 | -| n_updates | 187480 | -| policy_gradient_loss | -0.000874 | -| std | 0.0079 | -| value_loss | 2.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18750 | -| time_elapsed | 101441 | -| total_timesteps | 2400000 | -| train/ | | -| approx_kl | 0.009912729 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 187490 | -| policy_gradient_loss | -0.00283 | -| std | 0.0079 | -| value_loss | 1.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18751 | -| time_elapsed | 101446 | -| total_timesteps | 2400128 | -| train/ | | -| approx_kl | 0.12623227 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00523 | -| learning_rate | 0.0003 | -| loss | 0.0566 | -| n_updates | 187500 | -| policy_gradient_loss | 0.0263 | -| std | 0.00791 | -| value_loss | 9.79e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18752 | -| time_elapsed | 101456 | -| total_timesteps | 2400256 | -| train/ | | -| approx_kl | 0.20683634 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | 0.059 | -| n_updates | 187510 | -| policy_gradient_loss | 0.0168 | -| std | 0.00791 | -| value_loss | 0.000138 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18753 | -| time_elapsed | 101461 | -| total_timesteps | 2400384 | -| train/ | | -| approx_kl | 0.0350337 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -6.52 | -| learning_rate | 0.0003 | -| loss | 0.00808 | -| n_updates | 187520 | -| policy_gradient_loss | 0.0331 | -| std | 0.00791 | -| value_loss | 1.75e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18754 | -| time_elapsed | 101467 | -| total_timesteps | 2400512 | -| train/ | | -| approx_kl | 0.013627683 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | 0.000177 | -| n_updates | 187530 | -| policy_gradient_loss | 0.021 | -| std | 0.00791 | -| value_loss | 4.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18755 | -| time_elapsed | 101471 | -| total_timesteps | 2400640 | -| train/ | | -| approx_kl | 0.020938668 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00757 | -| n_updates | 187540 | -| policy_gradient_loss | 0.0411 | -| std | 0.00791 | -| value_loss | 2.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18756 | -| time_elapsed | 101476 | -| total_timesteps | 2400768 | -| train/ | | -| approx_kl | 0.106869824 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 187550 | -| policy_gradient_loss | 0.0239 | -| std | 0.00791 | -| value_loss | 3.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 18757 | -| time_elapsed | 101480 | -| total_timesteps | 2400896 | -| train/ | | -| approx_kl | 0.027190164 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0947 | -| learning_rate | 0.0003 | -| loss | 0.00475 | -| n_updates | 187560 | -| policy_gradient_loss | 0.0452 | -| std | 0.00791 | -| value_loss | 1.44e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18758 | -| time_elapsed | 101484 | -| total_timesteps | 2401024 | -| train/ | | -| approx_kl | 0.00030304538 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 3.28e-05 | -| n_updates | 187570 | -| policy_gradient_loss | 0.0626 | -| std | 0.0079 | -| value_loss | 1.57e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18759 | -| time_elapsed | 101495 | -| total_timesteps | 2401152 | -| train/ | | -| approx_kl | 0.038206812 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.232 | -| learning_rate | 0.0003 | -| loss | -0.0093 | -| n_updates | 187580 | -| policy_gradient_loss | 0.00364 | -| std | 0.00789 | -| value_loss | 0.00143 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18760 | -| time_elapsed | 101501 | -| total_timesteps | 2401280 | -| train/ | | -| approx_kl | 0.0051450753 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.276 | -| learning_rate | 0.0003 | -| loss | -0.00999 | -| n_updates | 187590 | -| policy_gradient_loss | 0.0478 | -| std | 0.00789 | -| value_loss | 7.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18761 | -| time_elapsed | 101506 | -| total_timesteps | 2401408 | -| train/ | | -| approx_kl | 0.092923395 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.000791 | -| learning_rate | 0.0003 | -| loss | 0.0565 | -| n_updates | 187600 | -| policy_gradient_loss | 0.105 | -| std | 0.00789 | -| value_loss | 3.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18762 | -| time_elapsed | 101511 | -| total_timesteps | 2401536 | -| train/ | | -| approx_kl | 0.067786254 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0891 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 187610 | -| policy_gradient_loss | 0.0306 | -| std | 0.00791 | -| value_loss | 1.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18763 | -| time_elapsed | 101516 | -| total_timesteps | 2401664 | -| train/ | | -| approx_kl | 0.08465841 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 187620 | -| policy_gradient_loss | 0.0162 | -| std | 0.00792 | -| value_loss | 2.13e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18764 | -| time_elapsed | 101520 | -| total_timesteps | 2401792 | -| train/ | | -| approx_kl | 0.0005242727 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 187630 | -| policy_gradient_loss | 0.0188 | -| std | 0.00792 | -| value_loss | 1.14e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 18765 | -| time_elapsed | 101525 | -| total_timesteps | 2401920 | -| train/ | | -| approx_kl | 0.13320628 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.0448 | -| n_updates | 187640 | -| policy_gradient_loss | 0.0133 | -| std | 0.00793 | -| value_loss | 7.5e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18766 | -| time_elapsed | 101530 | -| total_timesteps | 2402048 | -| train/ | | -| approx_kl | 0.016878977 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | -0.00571 | -| n_updates | 187650 | -| policy_gradient_loss | 0.0177 | -| std | 0.00793 | -| value_loss | 4.95e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18767 | -| time_elapsed | 101538 | -| total_timesteps | 2402176 | -| train/ | | -| approx_kl | 0.02390343 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | -0.00878 | -| n_updates | 187660 | -| policy_gradient_loss | -0.00565 | -| std | 0.00793 | -| value_loss | 0.00482 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18768 | -| time_elapsed | 101542 | -| total_timesteps | 2402304 | -| train/ | | -| approx_kl | 0.12502931 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.0728 | -| n_updates | 187670 | -| policy_gradient_loss | 0.0162 | -| std | 0.00793 | -| value_loss | 1.96e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18769 | -| time_elapsed | 101548 | -| total_timesteps | 2402432 | -| train/ | | -| approx_kl | 0.012716533 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.0085 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 187680 | -| policy_gradient_loss | 0.0143 | -| std | 0.00792 | -| value_loss | 1.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18770 | -| time_elapsed | 101552 | -| total_timesteps | 2402560 | -| train/ | | -| approx_kl | 0.07868281 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.0373 | -| n_updates | 187690 | -| policy_gradient_loss | 0.0197 | -| std | 0.00792 | -| value_loss | 9.02e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18771 | -| time_elapsed | 101557 | -| total_timesteps | 2402688 | -| train/ | | -| approx_kl | 0.0041984515 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.00478 | -| n_updates | 187700 | -| policy_gradient_loss | 0.0061 | -| std | 0.00792 | -| value_loss | 5.79e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18772 | -| time_elapsed | 101563 | -| total_timesteps | 2402816 | -| train/ | | -| approx_kl | 0.041252427 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 187710 | -| policy_gradient_loss | 0.0142 | -| std | 0.00792 | -| value_loss | 4.13e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 18773 | -| time_elapsed | 101568 | -| total_timesteps | 2402944 | -| train/ | | -| approx_kl | 0.00025238097 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.000747 | -| n_updates | 187720 | -| policy_gradient_loss | 0.0203 | -| std | 0.00792 | -| value_loss | 2.53e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18774 | -| time_elapsed | 101572 | -| total_timesteps | 2403072 | -| train/ | | -| approx_kl | 0.00015550805 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 187730 | -| policy_gradient_loss | -0.0019 | -| std | 0.00793 | -| value_loss | 1.79e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18775 | -| time_elapsed | 101579 | -| total_timesteps | 2403200 | -| train/ | | -| approx_kl | 0.1930905 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | 0.0758 | -| n_updates | 187740 | -| policy_gradient_loss | 0.066 | -| std | 0.00793 | -| value_loss | 0.00539 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18776 | -| time_elapsed | 101584 | -| total_timesteps | 2403328 | -| train/ | | -| approx_kl | 0.064658076 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | 0.00898 | -| n_updates | 187750 | -| policy_gradient_loss | 0.0145 | -| std | 0.00793 | -| value_loss | 4.37e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18777 | -| time_elapsed | 101590 | -| total_timesteps | 2403456 | -| train/ | | -| approx_kl | 0.014394414 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | 0.00184 | -| n_updates | 187760 | -| policy_gradient_loss | 0.000833 | -| std | 0.00793 | -| value_loss | 0.000177 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18778 | -| time_elapsed | 101595 | -| total_timesteps | 2403584 | -| train/ | | -| approx_kl | 0.0040873173 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -3.52 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 187770 | -| policy_gradient_loss | 0.00143 | -| std | 0.00793 | -| value_loss | 3.9e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18779 | -| time_elapsed | 101599 | -| total_timesteps | 2403712 | -| train/ | | -| approx_kl | 5.993666e-05 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00118 | -| learning_rate | 0.0003 | -| loss | 0.000396 | -| n_updates | 187780 | -| policy_gradient_loss | 0.00783 | -| std | 0.00792 | -| value_loss | 2.32e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18780 | -| time_elapsed | 101604 | -| total_timesteps | 2403840 | -| train/ | | -| approx_kl | 0.041613713 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0969 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 187790 | -| policy_gradient_loss | 0.029 | -| std | 0.00792 | -| value_loss | 1.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18781 | -| time_elapsed | 101609 | -| total_timesteps | 2403968 | -| train/ | | -| approx_kl | 0.21413895 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.0574 | -| n_updates | 187800 | -| policy_gradient_loss | 0.0311 | -| std | 0.00792 | -| value_loss | 6.4e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18782 | -| time_elapsed | 101613 | -| total_timesteps | 2404096 | -| train/ | | -| approx_kl | 0.0008229236 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 187810 | -| policy_gradient_loss | 0.00628 | -| std | 0.00792 | -| value_loss | 4.33e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18783 | -| time_elapsed | 101624 | -| total_timesteps | 2404224 | -| train/ | | -| approx_kl | 0.025560148 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.895 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 187820 | -| policy_gradient_loss | 0.0256 | -| std | 0.00792 | -| value_loss | 0.00151 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18784 | -| time_elapsed | 101629 | -| total_timesteps | 2404352 | -| train/ | | -| approx_kl | 0.18407218 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -3.58 | -| learning_rate | 0.0003 | -| loss | 0.0533 | -| n_updates | 187830 | -| policy_gradient_loss | 0.0167 | -| std | 0.00792 | -| value_loss | 8.24e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18785 | -| time_elapsed | 101633 | -| total_timesteps | 2404480 | -| train/ | | -| approx_kl | 0.00015717 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 187840 | -| policy_gradient_loss | 0.00124 | -| std | 0.00792 | -| value_loss | 1.93e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18786 | -| time_elapsed | 101637 | -| total_timesteps | 2404608 | -| train/ | | -| approx_kl | 7.594982e-05 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | -0.000588 | -| n_updates | 187850 | -| policy_gradient_loss | 0.0065 | -| std | 0.00792 | -| value_loss | 1.34e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18787 | -| time_elapsed | 101643 | -| total_timesteps | 2404736 | -| train/ | | -| approx_kl | 0.00010355376 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 187860 | -| policy_gradient_loss | 0.00111 | -| std | 0.00792 | -| value_loss | 1.02e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18788 | -| time_elapsed | 101648 | -| total_timesteps | 2404864 | -| train/ | | -| approx_kl | 0.00010198448 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 187870 | -| policy_gradient_loss | 0.00138 | -| std | 0.00793 | -| value_loss | 6.74e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18789 | -| time_elapsed | 101654 | -| total_timesteps | 2404992 | -| train/ | | -| approx_kl | 0.054388676 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 187880 | -| policy_gradient_loss | 0.0616 | -| std | 0.00792 | -| value_loss | 3.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18790 | -| time_elapsed | 101658 | -| total_timesteps | 2405120 | -| train/ | | -| approx_kl | 0.025805041 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 187890 | -| policy_gradient_loss | 0.0177 | -| std | 0.00792 | -| value_loss | 2.75e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18791 | -| time_elapsed | 101670 | -| total_timesteps | 2405248 | -| train/ | | -| approx_kl | 0.05590223 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 187900 | -| policy_gradient_loss | -0.0184 | -| std | 0.00792 | -| value_loss | 0.000382 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18792 | -| time_elapsed | 101675 | -| total_timesteps | 2405376 | -| train/ | | -| approx_kl | 0.0132807605 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | -0.000269 | -| n_updates | 187910 | -| policy_gradient_loss | 0.038 | -| std | 0.00792 | -| value_loss | 5.65e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18793 | -| time_elapsed | 101681 | -| total_timesteps | 2405504 | -| train/ | | -| approx_kl | 0.21216236 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 187920 | -| policy_gradient_loss | 0.0315 | -| std | 0.00792 | -| value_loss | 4.24e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18794 | -| time_elapsed | 101685 | -| total_timesteps | 2405632 | -| train/ | | -| approx_kl | 0.00031366805 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0692 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 187930 | -| policy_gradient_loss | 0.00178 | -| std | 0.00792 | -| value_loss | 3.21e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18795 | -| time_elapsed | 101689 | -| total_timesteps | 2405760 | -| train/ | | -| approx_kl | 4.135864e-05 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.000268 | -| n_updates | 187940 | -| policy_gradient_loss | 0.0131 | -| std | 0.00791 | -| value_loss | 2.7e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 18796 | -| time_elapsed | 101692 | -| total_timesteps | 2405888 | -| train/ | | -| approx_kl | 0.00014729844 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | -0.000387 | -| n_updates | 187950 | -| policy_gradient_loss | 0.0103 | -| std | 0.0079 | -| value_loss | 3.55e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18797 | -| time_elapsed | 101697 | -| total_timesteps | 2406016 | -| train/ | | -| approx_kl | 7.0731156e-05 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 187960 | -| policy_gradient_loss | -0.00239 | -| std | 0.0079 | -| value_loss | 8.92e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18798 | -| time_elapsed | 101709 | -| total_timesteps | 2406144 | -| train/ | | -| approx_kl | 0.006244209 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 187970 | -| policy_gradient_loss | -0.00534 | -| std | 0.0079 | -| value_loss | 0.000175 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18799 | -| time_elapsed | 101715 | -| total_timesteps | 2406272 | -| train/ | | -| approx_kl | 0.09131585 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 187980 | -| policy_gradient_loss | 0.027 | -| std | 0.00789 | -| value_loss | 4.01e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18800 | -| time_elapsed | 101722 | -| total_timesteps | 2406400 | -| train/ | | -| approx_kl | 0.02752495 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.542 | -| learning_rate | 0.0003 | -| loss | 0.0134 | -| n_updates | 187990 | -| policy_gradient_loss | 0.0664 | -| std | 0.00789 | -| value_loss | 4.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18801 | -| time_elapsed | 101727 | -| total_timesteps | 2406528 | -| train/ | | -| approx_kl | 0.18306012 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -5.26 | -| learning_rate | 0.0003 | -| loss | 0.0375 | -| n_updates | 188000 | -| policy_gradient_loss | 0.0182 | -| std | 0.00789 | -| value_loss | 1.73e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18802 | -| time_elapsed | 101732 | -| total_timesteps | 2406656 | -| train/ | | -| approx_kl | 0.043521285 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00457 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 188010 | -| policy_gradient_loss | 0.0597 | -| std | 0.00789 | -| value_loss | 1.3e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18803 | -| time_elapsed | 101736 | -| total_timesteps | 2406784 | -| train/ | | -| approx_kl | 0.038807847 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 188020 | -| policy_gradient_loss | 0.0219 | -| std | 0.00789 | -| value_loss | 9.86e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 18804 | -| time_elapsed | 101741 | -| total_timesteps | 2406912 | -| train/ | | -| approx_kl | 0.080554195 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.000328 | -| n_updates | 188030 | -| policy_gradient_loss | -0.00513 | -| std | 0.00789 | -| value_loss | 6.02e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18805 | -| time_elapsed | 101744 | -| total_timesteps | 2407040 | -| train/ | | -| approx_kl | 0.0074928836 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 188040 | -| policy_gradient_loss | 0.0586 | -| std | 0.00789 | -| value_loss | 3.2e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18806 | -| time_elapsed | 101750 | -| total_timesteps | 2407168 | -| train/ | | -| approx_kl | 0.06421032 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 188050 | -| policy_gradient_loss | 0.0279 | -| std | 0.00791 | -| value_loss | 0.00176 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18807 | -| time_elapsed | 101754 | -| total_timesteps | 2407296 | -| train/ | | -| approx_kl | 0.0032435218 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 188060 | -| policy_gradient_loss | 0.0289 | -| std | 0.00791 | -| value_loss | 8.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18808 | -| time_elapsed | 101759 | -| total_timesteps | 2407424 | -| train/ | | -| approx_kl | 0.046347886 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00886 | -| learning_rate | 0.0003 | -| loss | 0.0284 | -| n_updates | 188070 | -| policy_gradient_loss | 0.0205 | -| std | 0.00791 | -| value_loss | 5.49e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18809 | -| time_elapsed | 101764 | -| total_timesteps | 2407552 | -| train/ | | -| approx_kl | 0.4432884 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.639 | -| learning_rate | 0.0003 | -| loss | 0.0967 | -| n_updates | 188080 | -| policy_gradient_loss | 0.0302 | -| std | 0.00791 | -| value_loss | 2.3e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18810 | -| time_elapsed | 101769 | -| total_timesteps | 2407680 | -| train/ | | -| approx_kl | 0.009765632 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 188090 | -| policy_gradient_loss | 0.000839 | -| std | 0.00791 | -| value_loss | 7.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18811 | -| time_elapsed | 101775 | -| total_timesteps | 2407808 | -| train/ | | -| approx_kl | 0.042767122 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 188100 | -| policy_gradient_loss | 0.0127 | -| std | 0.00792 | -| value_loss | 5.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 18812 | -| time_elapsed | 101780 | -| total_timesteps | 2407936 | -| train/ | | -| approx_kl | 0.026182607 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.00762 | -| n_updates | 188110 | -| policy_gradient_loss | 0.00398 | -| std | 0.00792 | -| value_loss | 8.32e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18813 | -| time_elapsed | 101784 | -| total_timesteps | 2408064 | -| train/ | | -| approx_kl | 0.0050531183 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | -0.000604 | -| n_updates | 188120 | -| policy_gradient_loss | 0.00371 | -| std | 0.00792 | -| value_loss | 3.76e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18814 | -| time_elapsed | 101793 | -| total_timesteps | 2408192 | -| train/ | | -| approx_kl | 0.0030137878 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.00285 | -| n_updates | 188130 | -| policy_gradient_loss | 0.00594 | -| std | 0.00792 | -| value_loss | 0.000522 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18815 | -| time_elapsed | 101798 | -| total_timesteps | 2408320 | -| train/ | | -| approx_kl | 0.04328259 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 188140 | -| policy_gradient_loss | 0.00738 | -| std | 0.00791 | -| value_loss | 1.14e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18816 | -| time_elapsed | 101803 | -| total_timesteps | 2408448 | -| train/ | | -| approx_kl | 0.03196331 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00983 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 188150 | -| policy_gradient_loss | 0.0127 | -| std | 0.00792 | -| value_loss | 1.23e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18817 | -| time_elapsed | 101807 | -| total_timesteps | 2408576 | -| train/ | | -| approx_kl | 4.4891145e-05 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 188160 | -| policy_gradient_loss | -0.00154 | -| std | 0.00792 | -| value_loss | 1.18e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18818 | -| time_elapsed | 101812 | -| total_timesteps | 2408704 | -| train/ | | -| approx_kl | 0.0064091 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 188170 | -| policy_gradient_loss | 0.00347 | -| std | 0.00792 | -| value_loss | 3.89e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18819 | -| time_elapsed | 101817 | -| total_timesteps | 2408832 | -| train/ | | -| approx_kl | 0.04836925 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 188180 | -| policy_gradient_loss | 0.00733 | -| std | 0.00792 | -| value_loss | 8.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 18820 | -| time_elapsed | 101822 | -| total_timesteps | 2408960 | -| train/ | | -| approx_kl | 0.029100161 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00299 | -| learning_rate | 0.0003 | -| loss | 0.00379 | -| n_updates | 188190 | -| policy_gradient_loss | 0.00274 | -| std | 0.00792 | -| value_loss | 2.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18821 | -| time_elapsed | 101827 | -| total_timesteps | 2409088 | -| train/ | | -| approx_kl | 0.0057736775 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 188200 | -| policy_gradient_loss | 0.00415 | -| std | 0.00792 | -| value_loss | 1.53e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18822 | -| time_elapsed | 101838 | -| total_timesteps | 2409216 | -| train/ | | -| approx_kl | 0.10664324 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 188210 | -| policy_gradient_loss | 0.00807 | -| std | 0.00792 | -| value_loss | 0.00319 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18823 | -| time_elapsed | 101843 | -| total_timesteps | 2409344 | -| train/ | | -| approx_kl | 0.06251511 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.0966 | -| n_updates | 188220 | -| policy_gradient_loss | 0.00791 | -| std | 0.00791 | -| value_loss | 2.39e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18824 | -| time_elapsed | 101848 | -| total_timesteps | 2409472 | -| train/ | | -| approx_kl | 0.0004987046 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.000179 | -| n_updates | 188230 | -| policy_gradient_loss | 0.0266 | -| std | 0.0079 | -| value_loss | 0.000265 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18825 | -| time_elapsed | 101855 | -| total_timesteps | 2409600 | -| train/ | | -| approx_kl | 0.14464065 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00756 | -| learning_rate | 0.0003 | -| loss | 0.0901 | -| n_updates | 188240 | -| policy_gradient_loss | 0.117 | -| std | 0.00788 | -| value_loss | 0.00709 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18826 | -| time_elapsed | 101860 | -| total_timesteps | 2409728 | -| train/ | | -| approx_kl | 0.12078872 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.0761 | -| n_updates | 188250 | -| policy_gradient_loss | 0.12 | -| std | 0.00788 | -| value_loss | 0.000586 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18827 | -| time_elapsed | 101864 | -| total_timesteps | 2409856 | -| train/ | | -| approx_kl | 0.08437054 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00312 | -| learning_rate | 0.0003 | -| loss | 0.0965 | -| n_updates | 188260 | -| policy_gradient_loss | 0.0807 | -| std | 0.00788 | -| value_loss | 0.000334 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18828 | -| time_elapsed | 101870 | -| total_timesteps | 2409984 | -| train/ | | -| approx_kl | 0.08266772 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 188270 | -| policy_gradient_loss | 0.0944 | -| std | 0.00788 | -| value_loss | 0.000193 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18829 | -| time_elapsed | 101875 | -| total_timesteps | 2410112 | -| train/ | | -| approx_kl | 0.022645347 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 188280 | -| policy_gradient_loss | 0.0205 | -| std | 0.00788 | -| value_loss | 0.000166 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18830 | -| time_elapsed | 101887 | -| total_timesteps | 2410240 | -| train/ | | -| approx_kl | 0.095909834 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | 0.0431 | -| n_updates | 188290 | -| policy_gradient_loss | 0.012 | -| std | 0.00788 | -| value_loss | 0.000827 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18831 | -| time_elapsed | 101891 | -| total_timesteps | 2410368 | -| train/ | | -| approx_kl | 0.098543055 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 188300 | -| policy_gradient_loss | -0.00156 | -| std | 0.00788 | -| value_loss | 4.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18832 | -| time_elapsed | 101895 | -| total_timesteps | 2410496 | -| train/ | | -| approx_kl | 0.015901761 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 188310 | -| policy_gradient_loss | 0.0172 | -| std | 0.00788 | -| value_loss | 3.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18833 | -| time_elapsed | 101899 | -| total_timesteps | 2410624 | -| train/ | | -| approx_kl | 0.070941985 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 188320 | -| policy_gradient_loss | 0.0461 | -| std | 0.00788 | -| value_loss | 2.91e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18834 | -| time_elapsed | 101903 | -| total_timesteps | 2410752 | -| train/ | | -| approx_kl | 0.16550888 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.0924 | -| n_updates | 188330 | -| policy_gradient_loss | 0.0338 | -| std | 0.00788 | -| value_loss | 1.73e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18835 | -| time_elapsed | 101909 | -| total_timesteps | 2410880 | -| train/ | | -| approx_kl | 0.0014648121 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 188340 | -| policy_gradient_loss | 0.00748 | -| std | 0.00787 | -| value_loss | 1.12e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18836 | -| time_elapsed | 101914 | -| total_timesteps | 2411008 | -| train/ | | -| approx_kl | 9.359792e-08 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0576 | -| learning_rate | 0.0003 | -| loss | -7.29e-05 | -| n_updates | 188350 | -| policy_gradient_loss | -0.00536 | -| std | 0.00787 | -| value_loss | 9.96e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18837 | -| time_elapsed | 101925 | -| total_timesteps | 2411136 | -| train/ | | -| approx_kl | 0.005465344 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.938 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 188360 | -| policy_gradient_loss | -0.00177 | -| std | 0.00788 | -| value_loss | 0.000303 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18838 | -| time_elapsed | 101932 | -| total_timesteps | 2411264 | -| train/ | | -| approx_kl | 0.04133762 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.196 | -| learning_rate | 0.0003 | -| loss | 0.00795 | -| n_updates | 188370 | -| policy_gradient_loss | 0.0155 | -| std | 0.00788 | -| value_loss | 4.17e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18839 | -| time_elapsed | 101938 | -| total_timesteps | 2411392 | -| train/ | | -| approx_kl | 0.0015109745 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | -0.000312 | -| n_updates | 188380 | -| policy_gradient_loss | 0.0187 | -| std | 0.00789 | -| value_loss | 1.4e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18840 | -| time_elapsed | 101944 | -| total_timesteps | 2411520 | -| train/ | | -| approx_kl | 0.0066394447 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00143 | -| learning_rate | 0.0003 | -| loss | 0.00322 | -| n_updates | 188390 | -| policy_gradient_loss | 0.0184 | -| std | 0.0079 | -| value_loss | 1.92e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18841 | -| time_elapsed | 101949 | -| total_timesteps | 2411648 | -| train/ | | -| approx_kl | 0.3538922 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 188400 | -| policy_gradient_loss | 0.126 | -| std | 0.0079 | -| value_loss | 4.98e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18842 | -| time_elapsed | 101954 | -| total_timesteps | 2411776 | -| train/ | | -| approx_kl | 0.14980379 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 188410 | -| policy_gradient_loss | 0.0954 | -| std | 0.0079 | -| value_loss | 2.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18843 | -| time_elapsed | 101960 | -| total_timesteps | 2411904 | -| train/ | | -| approx_kl | 0.14429095 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.0848 | -| n_updates | 188420 | -| policy_gradient_loss | 0.107 | -| std | 0.0079 | -| value_loss | 1.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18844 | -| time_elapsed | 101965 | -| total_timesteps | 2412032 | -| train/ | | -| approx_kl | 0.02459472 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 188430 | -| policy_gradient_loss | 0.0215 | -| std | 0.0079 | -| value_loss | 1.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18845 | -| time_elapsed | 101978 | -| total_timesteps | 2412160 | -| train/ | | -| approx_kl | 0.002903876 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.874 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 188440 | -| policy_gradient_loss | -0.0136 | -| std | 0.0079 | -| value_loss | 0.000518 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18846 | -| time_elapsed | 101983 | -| total_timesteps | 2412288 | -| train/ | | -| approx_kl | 0.03309147 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | 0.00682 | -| n_updates | 188450 | -| policy_gradient_loss | 0.0243 | -| std | 0.0079 | -| value_loss | 1.73e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18847 | -| time_elapsed | 101988 | -| total_timesteps | 2412416 | -| train/ | | -| approx_kl | 0.8445649 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | 0.441 | -| n_updates | 188460 | -| policy_gradient_loss | 0.174 | -| std | 0.0079 | -| value_loss | 4.12e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18848 | -| time_elapsed | 101993 | -| total_timesteps | 2412544 | -| train/ | | -| approx_kl | 0.0048872293 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 188470 | -| policy_gradient_loss | 0.0136 | -| std | 0.0079 | -| value_loss | 3.28e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18849 | -| time_elapsed | 101996 | -| total_timesteps | 2412672 | -| train/ | | -| approx_kl | 0.00015777675 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 188480 | -| policy_gradient_loss | 0.0224 | -| std | 0.00791 | -| value_loss | 2.23e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18850 | -| time_elapsed | 101999 | -| total_timesteps | 2412800 | -| train/ | | -| approx_kl | 0.30252352 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00772 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 188490 | -| policy_gradient_loss | 0.0373 | -| std | 0.00794 | -| value_loss | 0.000233 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 18851 | -| time_elapsed | 102004 | -| total_timesteps | 2412928 | -| train/ | | -| approx_kl | 0.027579874 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0918 | -| learning_rate | 0.0003 | -| loss | 0.00301 | -| n_updates | 188500 | -| policy_gradient_loss | 0.00172 | -| std | 0.00795 | -| value_loss | 4.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18852 | -| time_elapsed | 102010 | -| total_timesteps | 2413056 | -| train/ | | -| approx_kl | 0.029041432 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 188510 | -| policy_gradient_loss | -0.0114 | -| std | 0.00796 | -| value_loss | 4.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18853 | -| time_elapsed | 102019 | -| total_timesteps | 2413184 | -| train/ | | -| approx_kl | 0.0076061096 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.867 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 188520 | -| policy_gradient_loss | 0.00458 | -| std | 0.00796 | -| value_loss | 0.000661 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18854 | -| time_elapsed | 102025 | -| total_timesteps | 2413312 | -| train/ | | -| approx_kl | 0.123488896 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.0091 | -| learning_rate | 0.0003 | -| loss | 0.0914 | -| n_updates | 188530 | -| policy_gradient_loss | 0.0227 | -| std | 0.00795 | -| value_loss | 4.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18855 | -| time_elapsed | 102029 | -| total_timesteps | 2413440 | -| train/ | | -| approx_kl | 0.018109618 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | -0.00616 | -| n_updates | 188540 | -| policy_gradient_loss | 0.0109 | -| std | 0.00795 | -| value_loss | 2.79e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18856 | -| time_elapsed | 102034 | -| total_timesteps | 2413568 | -| train/ | | -| approx_kl | 0.18258001 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.837 | -| learning_rate | 0.0003 | -| loss | 0.077 | -| n_updates | 188550 | -| policy_gradient_loss | 0.0668 | -| std | 0.00795 | -| value_loss | 5.39e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18857 | -| time_elapsed | 102039 | -| total_timesteps | 2413696 | -| train/ | | -| approx_kl | 0.029280145 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0733 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 188560 | -| policy_gradient_loss | 0.0119 | -| std | 0.00795 | -| value_loss | 2.53e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18858 | -| time_elapsed | 102043 | -| total_timesteps | 2413824 | -| train/ | | -| approx_kl | 0.00056511024 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.000229 | -| n_updates | 188570 | -| policy_gradient_loss | 0.0255 | -| std | 0.00795 | -| value_loss | 1.8e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 18859 | -| time_elapsed | 102047 | -| total_timesteps | 2413952 | -| train/ | | -| approx_kl | 0.12214502 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.0651 | -| n_updates | 188580 | -| policy_gradient_loss | 0.0159 | -| std | 0.00795 | -| value_loss | 1.9e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18860 | -| time_elapsed | 102053 | -| total_timesteps | 2414080 | -| train/ | | -| approx_kl | 0.014821723 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.00332 | -| n_updates | 188590 | -| policy_gradient_loss | 0.0208 | -| std | 0.00795 | -| value_loss | 6.1e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18861 | -| time_elapsed | 102063 | -| total_timesteps | 2414208 | -| train/ | | -| approx_kl | 0.49112177 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | 0.0806 | -| n_updates | 188600 | -| policy_gradient_loss | 0.0539 | -| std | 0.00795 | -| value_loss | 0.00105 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18862 | -| time_elapsed | 102070 | -| total_timesteps | 2414336 | -| train/ | | -| approx_kl | 0.033333834 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.075 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 188610 | -| policy_gradient_loss | 0.0107 | -| std | 0.00794 | -| value_loss | 5.58e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18863 | -| time_elapsed | 102075 | -| total_timesteps | 2414464 | -| train/ | | -| approx_kl | 0.0039835777 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.443 | -| learning_rate | 0.0003 | -| loss | 0.000934 | -| n_updates | 188620 | -| policy_gradient_loss | 0.0159 | -| std | 0.00792 | -| value_loss | 3.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18864 | -| time_elapsed | 102079 | -| total_timesteps | 2414592 | -| train/ | | -| approx_kl | 0.0017441656 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.336 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 188630 | -| policy_gradient_loss | 0.00723 | -| std | 0.00792 | -| value_loss | 4.16e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18865 | -| time_elapsed | 102084 | -| total_timesteps | 2414720 | -| train/ | | -| approx_kl | 0.052410226 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.00323 | -| n_updates | 188640 | -| policy_gradient_loss | 0.00922 | -| std | 0.00792 | -| value_loss | 1.13e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18866 | -| time_elapsed | 102088 | -| total_timesteps | 2414848 | -| train/ | | -| approx_kl | 0.023652656 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.00715 | -| n_updates | 188650 | -| policy_gradient_loss | 0.0218 | -| std | 0.00792 | -| value_loss | 7.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 18867 | -| time_elapsed | 102093 | -| total_timesteps | 2414976 | -| train/ | | -| approx_kl | 0.20448293 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.0544 | -| n_updates | 188660 | -| policy_gradient_loss | 0.0182 | -| std | 0.00792 | -| value_loss | 5.97e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18868 | -| time_elapsed | 102096 | -| total_timesteps | 2415104 | -| train/ | | -| approx_kl | 8.808449e-06 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | -0.000263 | -| n_updates | 188670 | -| policy_gradient_loss | 0.00499 | -| std | 0.00792 | -| value_loss | 3.85e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18869 | -| time_elapsed | 102108 | -| total_timesteps | 2415232 | -| train/ | | -| approx_kl | 3.5723206e-05 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 188680 | -| policy_gradient_loss | -0.00265 | -| std | 0.00792 | -| value_loss | 1.52e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18870 | -| time_elapsed | 102113 | -| total_timesteps | 2415360 | -| train/ | | -| approx_kl | 0.04101335 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.922 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 188690 | -| policy_gradient_loss | 0.041 | -| std | 0.00791 | -| value_loss | 1.81e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18871 | -| time_elapsed | 102117 | -| total_timesteps | 2415488 | -| train/ | | -| approx_kl | 0.017769383 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -21.2 | -| learning_rate | 0.0003 | -| loss | -0.00778 | -| n_updates | 188700 | -| policy_gradient_loss | 0.00271 | -| std | 0.00791 | -| value_loss | 5.37e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18872 | -| time_elapsed | 102121 | -| total_timesteps | 2415616 | -| train/ | | -| approx_kl | 0.10824108 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 188710 | -| policy_gradient_loss | 0.00746 | -| std | 0.00791 | -| value_loss | 2.07e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18873 | -| time_elapsed | 102125 | -| total_timesteps | 2415744 | -| train/ | | -| approx_kl | 0.035625797 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 188720 | -| policy_gradient_loss | 0.0222 | -| std | 0.00791 | -| value_loss | 1.42e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.878 | -| time/ | | -| fps | 23 | -| iterations | 18874 | -| time_elapsed | 102130 | -| total_timesteps | 2415872 | -| train/ | | -| approx_kl | 0.20695423 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 188730 | -| policy_gradient_loss | 0.0973 | -| std | 0.00791 | -| value_loss | 1.15e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18875 | -| time_elapsed | 102134 | -| total_timesteps | 2416000 | -| train/ | | -| approx_kl | 0.036050748 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 188740 | -| policy_gradient_loss | 0.0167 | -| std | 0.00791 | -| value_loss | 6.83e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18876 | -| time_elapsed | 102138 | -| total_timesteps | 2416128 | -| train/ | | -| approx_kl | 0.032027513 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00472 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 188750 | -| policy_gradient_loss | -0.002 | -| std | 0.00791 | -| value_loss | 4.13e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18877 | -| time_elapsed | 102147 | -| total_timesteps | 2416256 | -| train/ | | -| approx_kl | 0.004682919 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 188760 | -| policy_gradient_loss | -0.00319 | -| std | 0.00791 | -| value_loss | 0.000854 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18878 | -| time_elapsed | 102151 | -| total_timesteps | 2416384 | -| train/ | | -| approx_kl | 0.032958113 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0159 | -| n_updates | 188770 | -| policy_gradient_loss | 0.00705 | -| std | 0.00791 | -| value_loss | 3.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18879 | -| time_elapsed | 102155 | -| total_timesteps | 2416512 | -| train/ | | -| approx_kl | 0.033232316 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 188780 | -| policy_gradient_loss | -0.00363 | -| std | 0.00791 | -| value_loss | 5.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18880 | -| time_elapsed | 102159 | -| total_timesteps | 2416640 | -| train/ | | -| approx_kl | 0.039394487 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 188790 | -| policy_gradient_loss | 0.0104 | -| std | 0.00791 | -| value_loss | 3.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18881 | -| time_elapsed | 102164 | -| total_timesteps | 2416768 | -| train/ | | -| approx_kl | 0.031934045 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 188800 | -| policy_gradient_loss | 0.00607 | -| std | 0.00791 | -| value_loss | 2.29e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 18882 | -| time_elapsed | 102168 | -| total_timesteps | 2416896 | -| train/ | | -| approx_kl | 0.0068784975 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | -0.00963 | -| n_updates | 188810 | -| policy_gradient_loss | 0.00333 | -| std | 0.0079 | -| value_loss | 1.93e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18883 | -| time_elapsed | 102172 | -| total_timesteps | 2417024 | -| train/ | | -| approx_kl | 0.030346518 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 188820 | -| policy_gradient_loss | 0.104 | -| std | 0.00791 | -| value_loss | 9.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18884 | -| time_elapsed | 102182 | -| total_timesteps | 2417152 | -| train/ | | -| approx_kl | 0.025287136 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 188830 | -| policy_gradient_loss | 0.0352 | -| std | 0.00791 | -| value_loss | 0.00324 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18885 | -| time_elapsed | 102188 | -| total_timesteps | 2417280 | -| train/ | | -| approx_kl | 0.091772124 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | 0.0847 | -| n_updates | 188840 | -| policy_gradient_loss | 0.107 | -| std | 0.00791 | -| value_loss | 5.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18886 | -| time_elapsed | 102193 | -| total_timesteps | 2417408 | -| train/ | | -| approx_kl | 0.09744388 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00859 | -| learning_rate | 0.0003 | -| loss | 0.0962 | -| n_updates | 188850 | -| policy_gradient_loss | 0.105 | -| std | 0.00791 | -| value_loss | 1.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18887 | -| time_elapsed | 102198 | -| total_timesteps | 2417536 | -| train/ | | -| approx_kl | 0.018924229 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00772 | -| learning_rate | 0.0003 | -| loss | -0.00665 | -| n_updates | 188860 | -| policy_gradient_loss | 0.0156 | -| std | 0.00791 | -| value_loss | 1.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18888 | -| time_elapsed | 102203 | -| total_timesteps | 2417664 | -| train/ | | -| approx_kl | 0.15265091 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.0681 | -| n_updates | 188870 | -| policy_gradient_loss | 0.0176 | -| std | 0.00791 | -| value_loss | 5.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18889 | -| time_elapsed | 102207 | -| total_timesteps | 2417792 | -| train/ | | -| approx_kl | 0.115390316 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 188880 | -| policy_gradient_loss | 0.00817 | -| std | 0.00792 | -| value_loss | 3.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 18890 | -| time_elapsed | 102211 | -| total_timesteps | 2417920 | -| train/ | | -| approx_kl | 0.13957624 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0868 | -| n_updates | 188890 | -| policy_gradient_loss | 0.0152 | -| std | 0.00797 | -| value_loss | 0.000109 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18891 | -| time_elapsed | 102216 | -| total_timesteps | 2418048 | -| train/ | | -| approx_kl | 0.08881698 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -13.5 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 188900 | -| policy_gradient_loss | 0.00174 | -| std | 0.00802 | -| value_loss | 0.000534 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18892 | -| time_elapsed | 102225 | -| total_timesteps | 2418176 | -| train/ | | -| approx_kl | 0.08270659 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 188910 | -| policy_gradient_loss | 0.00494 | -| std | 0.00805 | -| value_loss | 0.00168 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18893 | -| time_elapsed | 102231 | -| total_timesteps | 2418304 | -| train/ | | -| approx_kl | 0.052029666 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -2.79 | -| learning_rate | 0.0003 | -| loss | 0.0623 | -| n_updates | 188920 | -| policy_gradient_loss | 0.00834 | -| std | 0.00805 | -| value_loss | 0.000129 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18894 | -| time_elapsed | 102236 | -| total_timesteps | 2418432 | -| train/ | | -| approx_kl | 0.034651052 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.754 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 188930 | -| policy_gradient_loss | 0.0211 | -| std | 0.00806 | -| value_loss | 7.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18895 | -| time_elapsed | 102240 | -| total_timesteps | 2418560 | -| train/ | | -| approx_kl | 0.10768521 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0944 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 188940 | -| policy_gradient_loss | 0.0245 | -| std | 0.00806 | -| value_loss | 4.61e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18896 | -| time_elapsed | 102244 | -| total_timesteps | 2418688 | -| train/ | | -| approx_kl | 0.24085045 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 188950 | -| policy_gradient_loss | 0.0967 | -| std | 0.00806 | -| value_loss | 2.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18897 | -| time_elapsed | 102248 | -| total_timesteps | 2418816 | -| train/ | | -| approx_kl | 0.050046593 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 188960 | -| policy_gradient_loss | 0.015 | -| std | 0.00806 | -| value_loss | 2.37e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 18898 | -| time_elapsed | 102254 | -| total_timesteps | 2418944 | -| train/ | | -| approx_kl | 0.00014903629 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 7.49e-05 | -| n_updates | 188970 | -| policy_gradient_loss | 0.0205 | -| std | 0.00806 | -| value_loss | 2.46e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18899 | -| time_elapsed | 102259 | -| total_timesteps | 2419072 | -| train/ | | -| approx_kl | 0.15230584 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0661 | -| n_updates | 188980 | -| policy_gradient_loss | 0.0196 | -| std | 0.00806 | -| value_loss | 6.83e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18900 | -| time_elapsed | 102267 | -| total_timesteps | 2419200 | -| train/ | | -| approx_kl | 0.12204479 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | 0.0587 | -| n_updates | 188990 | -| policy_gradient_loss | 0.00708 | -| std | 0.00806 | -| value_loss | 0.00113 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18901 | -| time_elapsed | 102272 | -| total_timesteps | 2419328 | -| train/ | | -| approx_kl | 0.035788845 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 189000 | -| policy_gradient_loss | 0.0212 | -| std | 0.00806 | -| value_loss | 1.37e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18902 | -| time_elapsed | 102276 | -| total_timesteps | 2419456 | -| train/ | | -| approx_kl | 0.2694656 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.234 | -| n_updates | 189010 | -| policy_gradient_loss | 0.0748 | -| std | 0.00805 | -| value_loss | 4.34e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18903 | -| time_elapsed | 102280 | -| total_timesteps | 2419584 | -| train/ | | -| approx_kl | 0.004942877 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | -0.00762 | -| n_updates | 189020 | -| policy_gradient_loss | 0.00585 | -| std | 0.00805 | -| value_loss | 5.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18904 | -| time_elapsed | 102286 | -| total_timesteps | 2419712 | -| train/ | | -| approx_kl | 0.050587203 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 189030 | -| policy_gradient_loss | 0.0472 | -| std | 0.00805 | -| value_loss | 4.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18905 | -| time_elapsed | 102291 | -| total_timesteps | 2419840 | -| train/ | | -| approx_kl | 0.16226476 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 189040 | -| policy_gradient_loss | 0.0194 | -| std | 0.00805 | -| value_loss | 5.11e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 18906 | -| time_elapsed | 102294 | -| total_timesteps | 2419968 | -| train/ | | -| approx_kl | 0.00014623487 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -60.9 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 189050 | -| policy_gradient_loss | -0.00756 | -| std | 0.00805 | -| value_loss | 2.49e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18907 | -| time_elapsed | 102299 | -| total_timesteps | 2420096 | -| train/ | | -| approx_kl | 0.0066903653 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 189060 | -| policy_gradient_loss | 0.0811 | -| std | 0.00805 | -| value_loss | 3.05e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18908 | -| time_elapsed | 102310 | -| total_timesteps | 2420224 | -| train/ | | -| approx_kl | 0.2515599 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 189070 | -| policy_gradient_loss | 0.00795 | -| std | 0.00805 | -| value_loss | 0.000463 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18909 | -| time_elapsed | 102315 | -| total_timesteps | 2420352 | -| train/ | | -| approx_kl | 0.04375421 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.00231 | -| n_updates | 189080 | -| policy_gradient_loss | 0.0361 | -| std | 0.00804 | -| value_loss | 2.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18910 | -| time_elapsed | 102320 | -| total_timesteps | 2420480 | -| train/ | | -| approx_kl | 0.21206768 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00414 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 189090 | -| policy_gradient_loss | 0.0243 | -| std | 0.00805 | -| value_loss | 5.53e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18911 | -| time_elapsed | 102325 | -| total_timesteps | 2420608 | -| train/ | | -| approx_kl | 0.0012219264 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.000685 | -| n_updates | 189100 | -| policy_gradient_loss | 0.0091 | -| std | 0.00805 | -| value_loss | 2.9e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18912 | -| time_elapsed | 102330 | -| total_timesteps | 2420736 | -| train/ | | -| approx_kl | 0.059479676 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0834 | -| learning_rate | 0.0003 | -| loss | 0.0381 | -| n_updates | 189110 | -| policy_gradient_loss | 0.0562 | -| std | 0.00805 | -| value_loss | 2.98e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18913 | -| time_elapsed | 102334 | -| total_timesteps | 2420864 | -| train/ | | -| approx_kl | 0.1408289 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 189120 | -| policy_gradient_loss | 0.0202 | -| std | 0.00805 | -| value_loss | 1.84e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 18914 | -| time_elapsed | 102338 | -| total_timesteps | 2420992 | -| train/ | | -| approx_kl | 0.0009886231 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 189130 | -| policy_gradient_loss | 0.0073 | -| std | 0.00806 | -| value_loss | 9.04e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18915 | -| time_elapsed | 102344 | -| total_timesteps | 2421120 | -| train/ | | -| approx_kl | 8.381903e-08 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | -5.22e-05 | -| n_updates | 189140 | -| policy_gradient_loss | -0.000477 | -| std | 0.00806 | -| value_loss | 7.58e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18916 | -| time_elapsed | 102355 | -| total_timesteps | 2421248 | -| train/ | | -| approx_kl | 0.0016618562 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 189150 | -| policy_gradient_loss | 0.00302 | -| std | 0.00805 | -| value_loss | 6.1e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18917 | -| time_elapsed | 102360 | -| total_timesteps | 2421376 | -| train/ | | -| approx_kl | 0.000501432 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.33 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 189160 | -| policy_gradient_loss | 0.00618 | -| std | 0.00805 | -| value_loss | 3.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18918 | -| time_elapsed | 102364 | -| total_timesteps | 2421504 | -| train/ | | -| approx_kl | 0.046505142 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 189170 | -| policy_gradient_loss | 0.0465 | -| std | 0.00805 | -| value_loss | 1.19e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18919 | -| time_elapsed | 102369 | -| total_timesteps | 2421632 | -| train/ | | -| approx_kl | 0.2248786 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 189180 | -| policy_gradient_loss | 0.048 | -| std | 0.00804 | -| value_loss | 8.36e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18920 | -| time_elapsed | 102373 | -| total_timesteps | 2421760 | -| train/ | | -| approx_kl | 0.0006679408 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 189190 | -| policy_gradient_loss | 0.00215 | -| std | 0.00804 | -| value_loss | 6.59e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 18921 | -| time_elapsed | 102378 | -| total_timesteps | 2421888 | -| train/ | | -| approx_kl | 3.000861e-05 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.000424 | -| n_updates | 189200 | -| policy_gradient_loss | 0.00482 | -| std | 0.00804 | -| value_loss | 4.13e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18922 | -| time_elapsed | 102382 | -| total_timesteps | 2422016 | -| train/ | | -| approx_kl | 0.04961951 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 189210 | -| policy_gradient_loss | 0.0535 | -| std | 0.00804 | -| value_loss | 3.41e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18923 | -| time_elapsed | 102392 | -| total_timesteps | 2422144 | -| train/ | | -| approx_kl | 0.02105549 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 189220 | -| policy_gradient_loss | 0.0336 | -| std | 0.00804 | -| value_loss | 0.0015 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18924 | -| time_elapsed | 102397 | -| total_timesteps | 2422272 | -| train/ | | -| approx_kl | 0.18668868 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 189230 | -| policy_gradient_loss | 0.0188 | -| std | 0.00804 | -| value_loss | 9.42e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18925 | -| time_elapsed | 102401 | -| total_timesteps | 2422400 | -| train/ | | -| approx_kl | 0.037205696 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.811 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 189240 | -| policy_gradient_loss | 0.0349 | -| std | 0.00803 | -| value_loss | 7.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18926 | -| time_elapsed | 102407 | -| total_timesteps | 2422528 | -| train/ | | -| approx_kl | 0.17462263 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -235 | -| learning_rate | 0.0003 | -| loss | 0.00713 | -| n_updates | 189250 | -| policy_gradient_loss | 0.00379 | -| std | 0.00804 | -| value_loss | 1.31e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18927 | -| time_elapsed | 102412 | -| total_timesteps | 2422656 | -| train/ | | -| approx_kl | 0.00013372116 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.000244 | -| n_updates | 189260 | -| policy_gradient_loss | 0.0202 | -| std | 0.00804 | -| value_loss | 1.09e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18928 | -| time_elapsed | 102417 | -| total_timesteps | 2422784 | -| train/ | | -| approx_kl | 0.060635973 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 189270 | -| policy_gradient_loss | 0.0429 | -| std | 0.00802 | -| value_loss | 1.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 18929 | -| time_elapsed | 102421 | -| total_timesteps | 2422912 | -| train/ | | -| approx_kl | 0.25891668 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.203 | -| n_updates | 189280 | -| policy_gradient_loss | 0.128 | -| std | 0.00801 | -| value_loss | 9.11e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18930 | -| time_elapsed | 102426 | -| total_timesteps | 2423040 | -| train/ | | -| approx_kl | 0.11519583 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 189290 | -| policy_gradient_loss | 0.0844 | -| std | 0.00801 | -| value_loss | 1.77e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18931 | -| time_elapsed | 102435 | -| total_timesteps | 2423168 | -| train/ | | -| approx_kl | 0.5220873 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | 0.0728 | -| n_updates | 189300 | -| policy_gradient_loss | 0.0495 | -| std | 0.00801 | -| value_loss | 0.00305 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18932 | -| time_elapsed | 102440 | -| total_timesteps | 2423296 | -| train/ | | -| approx_kl | 0.22325037 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 189310 | -| policy_gradient_loss | 0.102 | -| std | 0.00801 | -| value_loss | 2.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18933 | -| time_elapsed | 102444 | -| total_timesteps | 2423424 | -| train/ | | -| approx_kl | 0.13199371 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00216 | -| learning_rate | 0.0003 | -| loss | 0.0849 | -| n_updates | 189320 | -| policy_gradient_loss | 0.0972 | -| std | 0.00801 | -| value_loss | 1.43e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18934 | -| time_elapsed | 102448 | -| total_timesteps | 2423552 | -| train/ | | -| approx_kl | 0.092492536 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -86 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 189330 | -| policy_gradient_loss | -0.00871 | -| std | 0.00801 | -| value_loss | 4.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18935 | -| time_elapsed | 102453 | -| total_timesteps | 2423680 | -| train/ | | -| approx_kl | 0.10939291 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | 0.0761 | -| n_updates | 189340 | -| policy_gradient_loss | 0.0654 | -| std | 0.00801 | -| value_loss | 6.2e-08 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18936 | -| time_elapsed | 102458 | -| total_timesteps | 2423808 | -| train/ | | -| approx_kl | 0.107211 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -2.24 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 189350 | -| policy_gradient_loss | 0.0716 | -| std | 0.00801 | -| value_loss | 1.38e-09 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 18937 | -| time_elapsed | 102462 | -| total_timesteps | 2423936 | -| train/ | | -| approx_kl | 0.019475374 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00946 | -| learning_rate | 0.0003 | -| loss | 0.00648 | -| n_updates | 189360 | -| policy_gradient_loss | 0.0147 | -| std | 0.00801 | -| value_loss | 3.45e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18938 | -| time_elapsed | 102467 | -| total_timesteps | 2424064 | -| train/ | | -| approx_kl | 0.35666615 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 189370 | -| policy_gradient_loss | 0.0405 | -| std | 0.00801 | -| value_loss | 2.33e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18939 | -| time_elapsed | 102473 | -| total_timesteps | 2424192 | -| train/ | | -| approx_kl | 0.008737711 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 189380 | -| policy_gradient_loss | 0.00634 | -| std | 0.00801 | -| value_loss | 0.00235 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18940 | -| time_elapsed | 102476 | -| total_timesteps | 2424320 | -| train/ | | -| approx_kl | 0.019453902 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 189390 | -| policy_gradient_loss | -0.00884 | -| std | 0.00801 | -| value_loss | 0.000104 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18941 | -| time_elapsed | 102479 | -| total_timesteps | 2424448 | -| train/ | | -| approx_kl | 0.10490538 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00803 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 189400 | -| policy_gradient_loss | 0.0108 | -| std | 0.00801 | -| value_loss | 1.36e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18942 | -| time_elapsed | 102482 | -| total_timesteps | 2424576 | -| train/ | | -| approx_kl | 0.07784997 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0344 | -| n_updates | 189410 | -| policy_gradient_loss | 0.0285 | -| std | 0.00801 | -| value_loss | 8.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18943 | -| time_elapsed | 102486 | -| total_timesteps | 2424704 | -| train/ | | -| approx_kl | 0.20469376 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 189420 | -| policy_gradient_loss | 0.0929 | -| std | 0.00801 | -| value_loss | 6.21e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18944 | -| time_elapsed | 102490 | -| total_timesteps | 2424832 | -| train/ | | -| approx_kl | 0.040803272 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 189430 | -| policy_gradient_loss | 0.0152 | -| std | 0.00801 | -| value_loss | 4.48e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 18945 | -| time_elapsed | 102495 | -| total_timesteps | 2424960 | -| train/ | | -| approx_kl | 0.08286458 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 189440 | -| policy_gradient_loss | 0.0118 | -| std | 0.00802 | -| value_loss | 2.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18946 | -| time_elapsed | 102501 | -| total_timesteps | 2425088 | -| train/ | | -| approx_kl | 0.112268135 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0871 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 189450 | -| policy_gradient_loss | 0.0205 | -| std | 0.00801 | -| value_loss | 8.04e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18947 | -| time_elapsed | 102512 | -| total_timesteps | 2425216 | -| train/ | | -| approx_kl | 0.0041385656 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 189460 | -| policy_gradient_loss | -0.00497 | -| std | 0.00801 | -| value_loss | 0.000126 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18948 | -| time_elapsed | 102516 | -| total_timesteps | 2425344 | -| train/ | | -| approx_kl | 0.018766355 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -275 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 189470 | -| policy_gradient_loss | 0.00325 | -| std | 0.00801 | -| value_loss | 1.75e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18949 | -| time_elapsed | 102520 | -| total_timesteps | 2425472 | -| train/ | | -| approx_kl | 0.014671088 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.000221 | -| n_updates | 189480 | -| policy_gradient_loss | 0.0135 | -| std | 0.00801 | -| value_loss | 2.58e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18950 | -| time_elapsed | 102524 | -| total_timesteps | 2425600 | -| train/ | | -| approx_kl | 0.11120045 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -1.57 | -| learning_rate | 0.0003 | -| loss | 0.0418 | -| n_updates | 189490 | -| policy_gradient_loss | 0.0258 | -| std | 0.00801 | -| value_loss | 5.74e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18951 | -| time_elapsed | 102528 | -| total_timesteps | 2425728 | -| train/ | | -| approx_kl | 0.09439213 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 189500 | -| policy_gradient_loss | 0.0146 | -| std | 0.00801 | -| value_loss | 0.000513 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18952 | -| time_elapsed | 102532 | -| total_timesteps | 2425856 | -| train/ | | -| approx_kl | 0.022645282 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00987 | -| n_updates | 189510 | -| policy_gradient_loss | 0.000986 | -| std | 0.00802 | -| value_loss | 2.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 18953 | -| time_elapsed | 102535 | -| total_timesteps | 2425984 | -| train/ | | -| approx_kl | 0.33599502 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.261 | -| n_updates | 189520 | -| policy_gradient_loss | 0.0805 | -| std | 0.00801 | -| value_loss | 4.43e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18954 | -| time_elapsed | 102539 | -| total_timesteps | 2426112 | -| train/ | | -| approx_kl | 4.422851e-06 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | 0.000283 | -| n_updates | 189530 | -| policy_gradient_loss | -0.00156 | -| std | 0.00801 | -| value_loss | 2.43e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18955 | -| time_elapsed | 102547 | -| total_timesteps | 2426240 | -| train/ | | -| approx_kl | 0.0019514654 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.819 | -| learning_rate | 0.0003 | -| loss | -0.0205 | -| n_updates | 189540 | -| policy_gradient_loss | -0.0113 | -| std | 0.008 | -| value_loss | 0.00452 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18956 | -| time_elapsed | 102552 | -| total_timesteps | 2426368 | -| train/ | | -| approx_kl | 2.022367e-06 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | 0.000643 | -| n_updates | 189550 | -| policy_gradient_loss | 0.0125 | -| std | 0.00801 | -| value_loss | 0.000295 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18957 | -| time_elapsed | 102556 | -| total_timesteps | 2426496 | -| train/ | | -| approx_kl | 0.7929972 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | 0.433 | -| n_updates | 189560 | -| policy_gradient_loss | 0.197 | -| std | 0.00802 | -| value_loss | 0.000427 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18958 | -| time_elapsed | 102562 | -| total_timesteps | 2426624 | -| train/ | | -| approx_kl | 0.00763137 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -260 | -| learning_rate | 0.0003 | -| loss | -0.000673 | -| n_updates | 189570 | -| policy_gradient_loss | 0.00949 | -| std | 0.00802 | -| value_loss | 3.3e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18959 | -| time_elapsed | 102566 | -| total_timesteps | 2426752 | -| train/ | | -| approx_kl | 0.21408443 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.224 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 189580 | -| policy_gradient_loss | 0.111 | -| std | 0.00802 | -| value_loss | 3.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 18960 | -| time_elapsed | 102571 | -| total_timesteps | 2426880 | -| train/ | | -| approx_kl | 0.031021774 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 189590 | -| policy_gradient_loss | 0.0182 | -| std | 0.00802 | -| value_loss | 2.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18961 | -| time_elapsed | 102574 | -| total_timesteps | 2427008 | -| train/ | | -| approx_kl | 0.124817796 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.0716 | -| n_updates | 189600 | -| policy_gradient_loss | 0.0193 | -| std | 0.00802 | -| value_loss | 2.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18962 | -| time_elapsed | 102587 | -| total_timesteps | 2427136 | -| train/ | | -| approx_kl | 0.015660087 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 189610 | -| policy_gradient_loss | -0.00778 | -| std | 0.00802 | -| value_loss | 0.000198 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18963 | -| time_elapsed | 102591 | -| total_timesteps | 2427264 | -| train/ | | -| approx_kl | 0.04577254 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.503 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 189620 | -| policy_gradient_loss | 0.0178 | -| std | 0.00802 | -| value_loss | 5.35e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18964 | -| time_elapsed | 102595 | -| total_timesteps | 2427392 | -| train/ | | -| approx_kl | 0.002160035 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 189630 | -| policy_gradient_loss | 0.0232 | -| std | 0.00802 | -| value_loss | 2.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18965 | -| time_elapsed | 102599 | -| total_timesteps | 2427520 | -| train/ | | -| approx_kl | 0.01005829 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | 0.00643 | -| n_updates | 189640 | -| policy_gradient_loss | 0.019 | -| std | 0.00802 | -| value_loss | 1.44e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18966 | -| time_elapsed | 102603 | -| total_timesteps | 2427648 | -| train/ | | -| approx_kl | 0.013667144 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | -0.00302 | -| n_updates | 189650 | -| policy_gradient_loss | 0.0166 | -| std | 0.00802 | -| value_loss | 4.44e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18967 | -| time_elapsed | 102607 | -| total_timesteps | 2427776 | -| train/ | | -| approx_kl | 0.08832669 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 189660 | -| policy_gradient_loss | 0.0227 | -| std | 0.00802 | -| value_loss | 3.07e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 18968 | -| time_elapsed | 102612 | -| total_timesteps | 2427904 | -| train/ | | -| approx_kl | 0.0036164797 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.00768 | -| n_updates | 189670 | -| policy_gradient_loss | 0.00487 | -| std | 0.00802 | -| value_loss | 2.16e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18969 | -| time_elapsed | 102615 | -| total_timesteps | 2428032 | -| train/ | | -| approx_kl | 0.037375458 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.00813 | -| n_updates | 189680 | -| policy_gradient_loss | 0.0124 | -| std | 0.00802 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18970 | -| time_elapsed | 102624 | -| total_timesteps | 2428160 | -| train/ | | -| approx_kl | 0.0049891993 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 189690 | -| policy_gradient_loss | -0.0138 | -| std | 0.00802 | -| value_loss | 4.05e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18971 | -| time_elapsed | 102629 | -| total_timesteps | 2428288 | -| train/ | | -| approx_kl | 0.12212521 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.0178 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 189700 | -| policy_gradient_loss | 0.112 | -| std | 0.00802 | -| value_loss | 5.31e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18972 | -| time_elapsed | 102633 | -| total_timesteps | 2428416 | -| train/ | | -| approx_kl | 0.09467592 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00748 | -| learning_rate | 0.0003 | -| loss | 0.0681 | -| n_updates | 189710 | -| policy_gradient_loss | 0.101 | -| std | 0.00802 | -| value_loss | 3.69e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18973 | -| time_elapsed | 102636 | -| total_timesteps | 2428544 | -| train/ | | -| approx_kl | 0.020466069 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 189720 | -| policy_gradient_loss | 0.0186 | -| std | 0.00802 | -| value_loss | 2.58e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18974 | -| time_elapsed | 102640 | -| total_timesteps | 2428672 | -| train/ | | -| approx_kl | 0.12209581 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | 0.0586 | -| n_updates | 189730 | -| policy_gradient_loss | 0.0138 | -| std | 0.00802 | -| value_loss | 1.88e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18975 | -| time_elapsed | 102645 | -| total_timesteps | 2428800 | -| train/ | | -| approx_kl | 0.00892386 | -| clip_fraction | 0.0711 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0843 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 189740 | -| policy_gradient_loss | -0.0031 | -| std | 0.00801 | -| value_loss | 9.95e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18976 | -| time_elapsed | 102648 | -| total_timesteps | 2428928 | -| train/ | | -| approx_kl | 0.008201219 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0829 | -| learning_rate | 0.0003 | -| loss | 0.000523 | -| n_updates | 189750 | -| policy_gradient_loss | 0.000167 | -| std | 0.00801 | -| value_loss | 6.03e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18977 | -| time_elapsed | 102652 | -| total_timesteps | 2429056 | -| train/ | | -| approx_kl | 0.015153535 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 189760 | -| policy_gradient_loss | 0.00806 | -| std | 0.00801 | -| value_loss | 3.53e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18978 | -| time_elapsed | 102661 | -| total_timesteps | 2429184 | -| train/ | | -| approx_kl | 0.19234875 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 189770 | -| policy_gradient_loss | 0.0218 | -| std | 0.00802 | -| value_loss | 8.92e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18979 | -| time_elapsed | 102665 | -| total_timesteps | 2429312 | -| train/ | | -| approx_kl | 0.13562927 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 189780 | -| policy_gradient_loss | 0.101 | -| std | 0.00802 | -| value_loss | 1.51e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18980 | -| time_elapsed | 102669 | -| total_timesteps | 2429440 | -| train/ | | -| approx_kl | 0.0982475 | -| clip_fraction | 0.646 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00225 | -| learning_rate | 0.0003 | -| loss | 0.0789 | -| n_updates | 189790 | -| policy_gradient_loss | 0.0885 | -| std | 0.00802 | -| value_loss | 3.83e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18981 | -| time_elapsed | 102672 | -| total_timesteps | 2429568 | -| train/ | | -| approx_kl | 0.09238349 | -| clip_fraction | 0.65 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.000568 | -| learning_rate | 0.0003 | -| loss | 0.0757 | -| n_updates | 189800 | -| policy_gradient_loss | 0.0911 | -| std | 0.00802 | -| value_loss | 2.16e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18982 | -| time_elapsed | 102677 | -| total_timesteps | 2429696 | -| train/ | | -| approx_kl | 0.10077474 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0998 | -| n_updates | 189810 | -| policy_gradient_loss | 0.0982 | -| std | 0.00802 | -| value_loss | 1.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18983 | -| time_elapsed | 102681 | -| total_timesteps | 2429824 | -| train/ | | -| approx_kl | 0.019061137 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.00229 | -| n_updates | 189820 | -| policy_gradient_loss | 0.0194 | -| std | 0.00802 | -| value_loss | 1.2e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 18984 | -| time_elapsed | 102685 | -| total_timesteps | 2429952 | -| train/ | | -| approx_kl | 0.42490208 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 189830 | -| policy_gradient_loss | 0.0423 | -| std | 0.00803 | -| value_loss | 8.04e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18985 | -| time_elapsed | 102690 | -| total_timesteps | 2430080 | -| train/ | | -| approx_kl | 0.0351791 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.00743 | -| n_updates | 189840 | -| policy_gradient_loss | 0.00418 | -| std | 0.00803 | -| value_loss | 6.07e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18986 | -| time_elapsed | 102697 | -| total_timesteps | 2430208 | -| train/ | | -| approx_kl | 0.0605954 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 189850 | -| policy_gradient_loss | -0.00162 | -| std | 0.00803 | -| value_loss | 0.00226 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18987 | -| time_elapsed | 102702 | -| total_timesteps | 2430336 | -| train/ | | -| approx_kl | 0.022868846 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | 0.00237 | -| n_updates | 189860 | -| policy_gradient_loss | 0.0187 | -| std | 0.00803 | -| value_loss | 6.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18988 | -| time_elapsed | 102706 | -| total_timesteps | 2430464 | -| train/ | | -| approx_kl | 0.102752976 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00972 | -| learning_rate | 0.0003 | -| loss | 0.0411 | -| n_updates | 189870 | -| policy_gradient_loss | 0.0256 | -| std | 0.00802 | -| value_loss | 7.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18989 | -| time_elapsed | 102711 | -| total_timesteps | 2430592 | -| train/ | | -| approx_kl | 0.09839575 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.0539 | -| n_updates | 189880 | -| policy_gradient_loss | 0.021 | -| std | 0.00802 | -| value_loss | 4.52e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18990 | -| time_elapsed | 102717 | -| total_timesteps | 2430720 | -| train/ | | -| approx_kl | 0.07790908 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 189890 | -| policy_gradient_loss | 0.0158 | -| std | 0.00802 | -| value_loss | 3.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18991 | -| time_elapsed | 102722 | -| total_timesteps | 2430848 | -| train/ | | -| approx_kl | 0.020718195 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.00266 | -| n_updates | 189900 | -| policy_gradient_loss | 0.0182 | -| std | 0.00802 | -| value_loss | 1.11e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 18992 | -| time_elapsed | 102727 | -| total_timesteps | 2430976 | -| train/ | | -| approx_kl | 0.18750691 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 189910 | -| policy_gradient_loss | 0.112 | -| std | 0.00802 | -| value_loss | 9.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18993 | -| time_elapsed | 102731 | -| total_timesteps | 2431104 | -| train/ | | -| approx_kl | 0.03886689 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 189920 | -| policy_gradient_loss | 0.025 | -| std | 0.00803 | -| value_loss | 7.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18994 | -| time_elapsed | 102743 | -| total_timesteps | 2431232 | -| train/ | | -| approx_kl | 0.029827632 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.426 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 189930 | -| policy_gradient_loss | -0.0153 | -| std | 0.00803 | -| value_loss | 0.00149 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18995 | -| time_elapsed | 102749 | -| total_timesteps | 2431360 | -| train/ | | -| approx_kl | 0.061538838 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -30.8 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 189940 | -| policy_gradient_loss | -7.09e-05 | -| std | 0.00803 | -| value_loss | 5.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18996 | -| time_elapsed | 102753 | -| total_timesteps | 2431488 | -| train/ | | -| approx_kl | 0.005022487 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.66 | -| learning_rate | 0.0003 | -| loss | 0.00297 | -| n_updates | 189950 | -| policy_gradient_loss | 0.00718 | -| std | 0.00803 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18997 | -| time_elapsed | 102758 | -| total_timesteps | 2431616 | -| train/ | | -| approx_kl | 0.03727554 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.00981 | -| n_updates | 189960 | -| policy_gradient_loss | 0.0123 | -| std | 0.00803 | -| value_loss | 6.89e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18998 | -| time_elapsed | 102762 | -| total_timesteps | 2431744 | -| train/ | | -| approx_kl | 0.08460185 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -3.8 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 189970 | -| policy_gradient_loss | 0.0111 | -| std | 0.00802 | -| value_loss | 3.3e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 18999 | -| time_elapsed | 102765 | -| total_timesteps | 2431872 | -| train/ | | -| approx_kl | 0.011015443 | -| clip_fraction | 0.075 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00774 | -| learning_rate | 0.0003 | -| loss | -0.000892 | -| n_updates | 189980 | -| policy_gradient_loss | -0.000509 | -| std | 0.00802 | -| value_loss | 6.84e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19000 | -| time_elapsed | 102768 | -| total_timesteps | 2432000 | -| train/ | | -| approx_kl | 0.017379206 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00753 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 189990 | -| policy_gradient_loss | 0.0174 | -| std | 0.00802 | -| value_loss | 5.83e-11 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19001 | -| time_elapsed | 102772 | -| total_timesteps | 2432128 | -| train/ | | -| approx_kl | 0.2032821 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.000158 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 190000 | -| policy_gradient_loss | 0.083 | -| std | 0.00803 | -| value_loss | 2.65e-10 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19002 | -| time_elapsed | 102779 | -| total_timesteps | 2432256 | -| train/ | | -| approx_kl | 0.17959847 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | 0.0423 | -| n_updates | 190010 | -| policy_gradient_loss | 0.0239 | -| std | 0.00803 | -| value_loss | 9.54e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19003 | -| time_elapsed | 102784 | -| total_timesteps | 2432384 | -| train/ | | -| approx_kl | 0.08322342 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -8.07 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 190020 | -| policy_gradient_loss | 0.0109 | -| std | 0.00803 | -| value_loss | 6.42e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19004 | -| time_elapsed | 102788 | -| total_timesteps | 2432512 | -| train/ | | -| approx_kl | 0.48277554 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | 0.0983 | -| n_updates | 190030 | -| policy_gradient_loss | 0.0282 | -| std | 0.00803 | -| value_loss | 4.06e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19005 | -| time_elapsed | 102792 | -| total_timesteps | 2432640 | -| train/ | | -| approx_kl | 0.009748034 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.931 | -| learning_rate | 0.0003 | -| loss | -0.00099 | -| n_updates | 190040 | -| policy_gradient_loss | 0.00188 | -| std | 0.00803 | -| value_loss | 1.97e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19006 | -| time_elapsed | 102797 | -| total_timesteps | 2432768 | -| train/ | | -| approx_kl | 0.0003581727 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.409 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 190050 | -| policy_gradient_loss | 0.00323 | -| std | 0.00803 | -| value_loss | 9.34e-12 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19007 | -| time_elapsed | 102802 | -| total_timesteps | 2432896 | -| train/ | | -| approx_kl | 0.005026747 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 190060 | -| policy_gradient_loss | 0.0048 | -| std | 0.00803 | -| value_loss | 5.44e-12 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19008 | -| time_elapsed | 102806 | -| total_timesteps | 2433024 | -| train/ | | -| approx_kl | 0.02742358 | -| clip_fraction | 0.608 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 190070 | -| policy_gradient_loss | 0.0728 | -| std | 0.00802 | -| value_loss | 1.39e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19009 | -| time_elapsed | 102816 | -| total_timesteps | 2433152 | -| train/ | | -| approx_kl | 0.14534602 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.146 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 190080 | -| policy_gradient_loss | 0.0194 | -| std | 0.00802 | -| value_loss | 0.00181 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19010 | -| time_elapsed | 102820 | -| total_timesteps | 2433280 | -| train/ | | -| approx_kl | 0.18117733 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0606 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 190090 | -| policy_gradient_loss | 0.0994 | -| std | 0.00802 | -| value_loss | 2.58e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19011 | -| time_elapsed | 102825 | -| total_timesteps | 2433408 | -| train/ | | -| approx_kl | 0.109770164 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00702 | -| learning_rate | 0.0003 | -| loss | 0.0623 | -| n_updates | 190100 | -| policy_gradient_loss | 0.0832 | -| std | 0.00803 | -| value_loss | 1.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19012 | -| time_elapsed | 102830 | -| total_timesteps | 2433536 | -| train/ | | -| approx_kl | 0.027214235 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 190110 | -| policy_gradient_loss | 0.0199 | -| std | 0.00803 | -| value_loss | 1.42e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19013 | -| time_elapsed | 102835 | -| total_timesteps | 2433664 | -| train/ | | -| approx_kl | 0.3590024 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0523 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 190120 | -| policy_gradient_loss | 0.0452 | -| std | 0.00803 | -| value_loss | 8.68e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19014 | -| time_elapsed | 102841 | -| total_timesteps | 2433792 | -| train/ | | -| approx_kl | 0.03180368 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 190130 | -| policy_gradient_loss | 0.00276 | -| std | 0.00803 | -| value_loss | 6.3e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 19015 | -| time_elapsed | 102845 | -| total_timesteps | 2433920 | -| train/ | | -| approx_kl | 0.03143727 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.00925 | -| n_updates | 190140 | -| policy_gradient_loss | 0.00409 | -| std | 0.00803 | -| value_loss | 3.87e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19016 | -| time_elapsed | 102849 | -| total_timesteps | 2434048 | -| train/ | | -| approx_kl | 0.029178735 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 190150 | -| policy_gradient_loss | 0.0122 | -| std | 0.00803 | -| value_loss | 2.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19017 | -| time_elapsed | 102857 | -| total_timesteps | 2434176 | -| train/ | | -| approx_kl | 0.051928993 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.796 | -| learning_rate | 0.0003 | -| loss | -0.00882 | -| n_updates | 190160 | -| policy_gradient_loss | -0.0118 | -| std | 0.00802 | -| value_loss | 0.00539 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19018 | -| time_elapsed | 102861 | -| total_timesteps | 2434304 | -| train/ | | -| approx_kl | 0.008328801 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | 0.00387 | -| n_updates | 190170 | -| policy_gradient_loss | 0.0133 | -| std | 0.00802 | -| value_loss | 2.36e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19019 | -| time_elapsed | 102867 | -| total_timesteps | 2434432 | -| train/ | | -| approx_kl | 0.11338958 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00277 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 190180 | -| policy_gradient_loss | 0.0235 | -| std | 0.00803 | -| value_loss | 0.00016 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19020 | -| time_elapsed | 102871 | -| total_timesteps | 2434560 | -| train/ | | -| approx_kl | 0.37502152 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00354 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 190190 | -| policy_gradient_loss | 0.0379 | -| std | 0.00803 | -| value_loss | 1.3e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19021 | -| time_elapsed | 102876 | -| total_timesteps | 2434688 | -| train/ | | -| approx_kl | 0.022923617 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 190200 | -| policy_gradient_loss | 0.00663 | -| std | 0.00803 | -| value_loss | 5.57e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19022 | -| time_elapsed | 102880 | -| total_timesteps | 2434816 | -| train/ | | -| approx_kl | 0.0039411723 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 190210 | -| policy_gradient_loss | 0.00127 | -| std | 0.00804 | -| value_loss | 5.02e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19023 | -| time_elapsed | 102884 | -| total_timesteps | 2434944 | -| train/ | | -| approx_kl | 0.028145144 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 190220 | -| policy_gradient_loss | 0.00159 | -| std | 0.00806 | -| value_loss | 4.54e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19024 | -| time_elapsed | 102889 | -| total_timesteps | 2435072 | -| train/ | | -| approx_kl | 0.0055773673 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00909 | -| learning_rate | 0.0003 | -| loss | 8.37e-05 | -| n_updates | 190230 | -| policy_gradient_loss | 0.0198 | -| std | 0.00806 | -| value_loss | 3.73e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19025 | -| time_elapsed | 102896 | -| total_timesteps | 2435200 | -| train/ | | -| approx_kl | 0.04813476 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.721 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 190240 | -| policy_gradient_loss | -0.00816 | -| std | 0.00806 | -| value_loss | 0.00103 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19026 | -| time_elapsed | 102900 | -| total_timesteps | 2435328 | -| train/ | | -| approx_kl | 0.0006984598 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 190250 | -| policy_gradient_loss | 0.0151 | -| std | 0.00806 | -| value_loss | 1.88e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19027 | -| time_elapsed | 102904 | -| total_timesteps | 2435456 | -| train/ | | -| approx_kl | 0.00063742977 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 190260 | -| policy_gradient_loss | 0.00233 | -| std | 0.00805 | -| value_loss | 4.97e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19028 | -| time_elapsed | 102909 | -| total_timesteps | 2435584 | -| train/ | | -| approx_kl | 0.028398424 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00723 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 190270 | -| policy_gradient_loss | 0.00886 | -| std | 0.00805 | -| value_loss | 7.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19029 | -| time_elapsed | 102914 | -| total_timesteps | 2435712 | -| train/ | | -| approx_kl | 0.30880284 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0516 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 190280 | -| policy_gradient_loss | 0.0334 | -| std | 0.00805 | -| value_loss | 5.9e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19030 | -| time_elapsed | 102919 | -| total_timesteps | 2435840 | -| train/ | | -| approx_kl | 0.026906624 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.000536 | -| n_updates | 190290 | -| policy_gradient_loss | 0.00107 | -| std | 0.00805 | -| value_loss | 4e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 19031 | -| time_elapsed | 102924 | -| total_timesteps | 2435968 | -| train/ | | -| approx_kl | 1.937244e-05 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.000551 | -| n_updates | 190300 | -| policy_gradient_loss | -8.39e-06 | -| std | 0.00805 | -| value_loss | 2.6e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19032 | -| time_elapsed | 102930 | -| total_timesteps | 2436096 | -| train/ | | -| approx_kl | 0.040120754 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 190310 | -| policy_gradient_loss | 0.00556 | -| std | 0.00806 | -| value_loss | 1.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19033 | -| time_elapsed | 102936 | -| total_timesteps | 2436224 | -| train/ | | -| approx_kl | 0.01844382 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 190320 | -| policy_gradient_loss | -0.00637 | -| std | 0.00806 | -| value_loss | 0.000663 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19034 | -| time_elapsed | 102941 | -| total_timesteps | 2436352 | -| train/ | | -| approx_kl | 0.065936014 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.285 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 190330 | -| policy_gradient_loss | 0.0261 | -| std | 0.00809 | -| value_loss | 4.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19035 | -| time_elapsed | 102946 | -| total_timesteps | 2436480 | -| train/ | | -| approx_kl | 0.07925473 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.749 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 190340 | -| policy_gradient_loss | 0.00472 | -| std | 0.00809 | -| value_loss | 1.05e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19036 | -| time_elapsed | 102951 | -| total_timesteps | 2436608 | -| train/ | | -| approx_kl | 0.00052657165 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.449 | -| learning_rate | 0.0003 | -| loss | 0.00274 | -| n_updates | 190350 | -| policy_gradient_loss | 0.0129 | -| std | 0.00809 | -| value_loss | 5.36e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19037 | -| time_elapsed | 102956 | -| total_timesteps | 2436736 | -| train/ | | -| approx_kl | 0.30339643 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 190360 | -| policy_gradient_loss | 0.13 | -| std | 0.00809 | -| value_loss | 1.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19038 | -| time_elapsed | 102962 | -| total_timesteps | 2436864 | -| train/ | | -| approx_kl | 0.043664012 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 190370 | -| policy_gradient_loss | 0.00668 | -| std | 0.00809 | -| value_loss | 5.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19039 | -| time_elapsed | 102967 | -| total_timesteps | 2436992 | -| train/ | | -| approx_kl | 0.026413724 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | -0.0092 | -| n_updates | 190380 | -| policy_gradient_loss | 0.00548 | -| std | 0.00808 | -| value_loss | 1.02e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19040 | -| time_elapsed | 102972 | -| total_timesteps | 2437120 | -| train/ | | -| approx_kl | 0.0020792997 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -2.16 | -| learning_rate | 0.0003 | -| loss | -0.0024 | -| n_updates | 190390 | -| policy_gradient_loss | 0.00711 | -| std | 0.00808 | -| value_loss | 3.19e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19041 | -| time_elapsed | 102984 | -| total_timesteps | 2437248 | -| train/ | | -| approx_kl | 0.030128399 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | 0.00384 | -| n_updates | 190400 | -| policy_gradient_loss | 0.00384 | -| std | 0.00808 | -| value_loss | 0.00537 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19042 | -| time_elapsed | 102990 | -| total_timesteps | 2437376 | -| train/ | | -| approx_kl | 0.012377145 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | 0.00529 | -| n_updates | 190410 | -| policy_gradient_loss | 0.0269 | -| std | 0.00809 | -| value_loss | 6.14e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19043 | -| time_elapsed | 102995 | -| total_timesteps | 2437504 | -| train/ | | -| approx_kl | 0.19035201 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00926 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 190420 | -| policy_gradient_loss | 0.109 | -| std | 0.00809 | -| value_loss | 9.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19044 | -| time_elapsed | 103000 | -| total_timesteps | 2437632 | -| train/ | | -| approx_kl | 0.032261934 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 190430 | -| policy_gradient_loss | 0.0196 | -| std | 0.00809 | -| value_loss | 5.35e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19045 | -| time_elapsed | 103006 | -| total_timesteps | 2437760 | -| train/ | | -| approx_kl | 0.38741592 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0836 | -| learning_rate | 0.0003 | -| loss | 0.0994 | -| n_updates | 190440 | -| policy_gradient_loss | 0.0334 | -| std | 0.00809 | -| value_loss | 3.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19046 | -| time_elapsed | 103011 | -| total_timesteps | 2437888 | -| train/ | | -| approx_kl | 0.007606238 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 5.06e-05 | -| n_updates | 190450 | -| policy_gradient_loss | 0.00315 | -| std | 0.00809 | -| value_loss | 2.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19047 | -| time_elapsed | 103016 | -| total_timesteps | 2438016 | -| train/ | | -| approx_kl | 0.036603887 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0995 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 190460 | -| policy_gradient_loss | 0.0023 | -| std | 0.00809 | -| value_loss | 2.36e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19048 | -| time_elapsed | 103028 | -| total_timesteps | 2438144 | -| train/ | | -| approx_kl | 0.0222793 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.144 | -| learning_rate | 0.0003 | -| loss | -0.0281 | -| n_updates | 190470 | -| policy_gradient_loss | -0.0186 | -| std | 0.00808 | -| value_loss | 0.00196 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19049 | -| time_elapsed | 103034 | -| total_timesteps | 2438272 | -| train/ | | -| approx_kl | 0.014147976 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.245 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 190480 | -| policy_gradient_loss | 0.00535 | -| std | 0.00808 | -| value_loss | 3.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19050 | -| time_elapsed | 103038 | -| total_timesteps | 2438400 | -| train/ | | -| approx_kl | 0.070780955 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -2.04 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 190490 | -| policy_gradient_loss | 0.00976 | -| std | 0.00808 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19051 | -| time_elapsed | 103042 | -| total_timesteps | 2438528 | -| train/ | | -| approx_kl | 0.005210364 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -11.9 | -| learning_rate | 0.0003 | -| loss | 0.00801 | -| n_updates | 190500 | -| policy_gradient_loss | 0.00105 | -| std | 0.00808 | -| value_loss | 3.06e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19052 | -| time_elapsed | 103046 | -| total_timesteps | 2438656 | -| train/ | | -| approx_kl | 0.1504744 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | 0.0776 | -| n_updates | 190510 | -| policy_gradient_loss | 0.0661 | -| std | 0.00808 | -| value_loss | 8.32e-10 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19053 | -| time_elapsed | 103049 | -| total_timesteps | 2438784 | -| train/ | | -| approx_kl | 0.12283045 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.315 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 190520 | -| policy_gradient_loss | 0.0951 | -| std | 0.00808 | -| value_loss | 4.54e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 19054 | -| time_elapsed | 103054 | -| total_timesteps | 2438912 | -| train/ | | -| approx_kl | 0.021514762 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.00347 | -| n_updates | 190530 | -| policy_gradient_loss | 0.00981 | -| std | 0.00809 | -| value_loss | 1.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19055 | -| time_elapsed | 103060 | -| total_timesteps | 2439040 | -| train/ | | -| approx_kl | 0.015775729 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.464 | -| learning_rate | 0.0003 | -| loss | 0.00582 | -| n_updates | 190540 | -| policy_gradient_loss | 0.0282 | -| std | 0.00809 | -| value_loss | 9.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19056 | -| time_elapsed | 103070 | -| total_timesteps | 2439168 | -| train/ | | -| approx_kl | 0.30729932 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -3.77 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 190550 | -| policy_gradient_loss | 0.000103 | -| std | 0.00809 | -| value_loss | 0.0037 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19057 | -| time_elapsed | 103075 | -| total_timesteps | 2439296 | -| train/ | | -| approx_kl | 0.020343702 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.00171 | -| n_updates | 190560 | -| policy_gradient_loss | 0.00307 | -| std | 0.00809 | -| value_loss | 3.89e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19058 | -| time_elapsed | 103080 | -| total_timesteps | 2439424 | -| train/ | | -| approx_kl | 0.03171534 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 190570 | -| policy_gradient_loss | 0.00472 | -| std | 0.0081 | -| value_loss | 6.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19059 | -| time_elapsed | 103083 | -| total_timesteps | 2439552 | -| train/ | | -| approx_kl | 0.00624848 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 190580 | -| policy_gradient_loss | -8.97e-05 | -| std | 0.0081 | -| value_loss | 4.4e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19060 | -| time_elapsed | 103087 | -| total_timesteps | 2439680 | -| train/ | | -| approx_kl | 0.04257336 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 190590 | -| policy_gradient_loss | 0.00302 | -| std | 0.00811 | -| value_loss | 7.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19061 | -| time_elapsed | 103090 | -| total_timesteps | 2439808 | -| train/ | | -| approx_kl | 0.008113541 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.00956 | -| learning_rate | 0.0003 | -| loss | -0.00968 | -| n_updates | 190600 | -| policy_gradient_loss | -0.00108 | -| std | 0.00811 | -| value_loss | 2.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19062 | -| time_elapsed | 103094 | -| total_timesteps | 2439936 | -| train/ | | -| approx_kl | 0.017683972 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | 0.0257 | -| n_updates | 190610 | -| policy_gradient_loss | 0.0664 | -| std | 0.00812 | -| value_loss | 1.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19063 | -| time_elapsed | 103098 | -| total_timesteps | 2440064 | -| train/ | | -| approx_kl | 0.074003704 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 190620 | -| policy_gradient_loss | 0.0979 | -| std | 0.00812 | -| value_loss | 1.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19064 | -| time_elapsed | 103108 | -| total_timesteps | 2440192 | -| train/ | | -| approx_kl | 0.14954135 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | 0.0362 | -| n_updates | 190630 | -| policy_gradient_loss | 0.0366 | -| std | 0.00812 | -| value_loss | 8.62e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19065 | -| time_elapsed | 103113 | -| total_timesteps | 2440320 | -| train/ | | -| approx_kl | 0.087366864 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.815 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 190640 | -| policy_gradient_loss | 0.0234 | -| std | 0.00812 | -| value_loss | 1.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19066 | -| time_elapsed | 103117 | -| total_timesteps | 2440448 | -| train/ | | -| approx_kl | 0.47772822 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | 0.0781 | -| n_updates | 190650 | -| policy_gradient_loss | 0.0254 | -| std | 0.00812 | -| value_loss | 2.5e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19067 | -| time_elapsed | 103121 | -| total_timesteps | 2440576 | -| train/ | | -| approx_kl | 0.011940591 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0812 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 190660 | -| policy_gradient_loss | 0.00333 | -| std | 0.00812 | -| value_loss | 1.26e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19068 | -| time_elapsed | 103127 | -| total_timesteps | 2440704 | -| train/ | | -| approx_kl | 0.00031627342 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 190670 | -| policy_gradient_loss | 0.00284 | -| std | 0.00812 | -| value_loss | 8.26e-10 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19069 | -| time_elapsed | 103133 | -| total_timesteps | 2440832 | -| train/ | | -| approx_kl | 0.031009365 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.06 | -| learning_rate | 0.0003 | -| loss | -0.0362 | -| n_updates | 190680 | -| policy_gradient_loss | -0.0187 | -| std | 0.00813 | -| value_loss | 5.6e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19070 | -| time_elapsed | 103137 | -| total_timesteps | 2440960 | -| train/ | | -| approx_kl | 0.043467943 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0826 | -| learning_rate | 0.0003 | -| loss | 0.0067 | -| n_updates | 190690 | -| policy_gradient_loss | 0.00363 | -| std | 0.00813 | -| value_loss | 3.18e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19071 | -| time_elapsed | 103143 | -| total_timesteps | 2441088 | -| train/ | | -| approx_kl | 0.032863732 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 190700 | -| policy_gradient_loss | 0.00802 | -| std | 0.00813 | -| value_loss | 2.14e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19072 | -| time_elapsed | 103153 | -| total_timesteps | 2441216 | -| train/ | | -| approx_kl | 0.017004881 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.00918 | -| n_updates | 190710 | -| policy_gradient_loss | -0.000986 | -| std | 0.00812 | -| value_loss | 0.00026 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19073 | -| time_elapsed | 103158 | -| total_timesteps | 2441344 | -| train/ | | -| approx_kl | 0.040310457 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 190720 | -| policy_gradient_loss | 0.00581 | -| std | 0.00812 | -| value_loss | 1.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19074 | -| time_elapsed | 103163 | -| total_timesteps | 2441472 | -| train/ | | -| approx_kl | 0.004585521 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00654 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 190730 | -| policy_gradient_loss | 0.00152 | -| std | 0.00812 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19075 | -| time_elapsed | 103169 | -| total_timesteps | 2441600 | -| train/ | | -| approx_kl | 0.058164556 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 190740 | -| policy_gradient_loss | 0.00466 | -| std | 0.0081 | -| value_loss | 6.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19076 | -| time_elapsed | 103174 | -| total_timesteps | 2441728 | -| train/ | | -| approx_kl | 0.066721395 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00269 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 190750 | -| policy_gradient_loss | 0.00281 | -| std | 0.00809 | -| value_loss | 8.47e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19077 | -| time_elapsed | 103179 | -| total_timesteps | 2441856 | -| train/ | | -| approx_kl | 0.020428263 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | 0.00445 | -| n_updates | 190760 | -| policy_gradient_loss | 0.0037 | -| std | 0.00808 | -| value_loss | 5.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19078 | -| time_elapsed | 103184 | -| total_timesteps | 2441984 | -| train/ | | -| approx_kl | 0.029677633 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 190770 | -| policy_gradient_loss | 0.00812 | -| std | 0.00808 | -| value_loss | 3.35e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19079 | -| time_elapsed | 103190 | -| total_timesteps | 2442112 | -| train/ | | -| approx_kl | 0.03192158 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 190780 | -| policy_gradient_loss | 0.00875 | -| std | 0.00808 | -| value_loss | 2.15e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19080 | -| time_elapsed | 103201 | -| total_timesteps | 2442240 | -| train/ | | -| approx_kl | 0.011324642 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 190790 | -| policy_gradient_loss | -0.0115 | -| std | 0.00808 | -| value_loss | 2.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19081 | -| time_elapsed | 103206 | -| total_timesteps | 2442368 | -| train/ | | -| approx_kl | 0.041077815 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.00731 | -| learning_rate | 0.0003 | -| loss | 0.00908 | -| n_updates | 190800 | -| policy_gradient_loss | 0.0209 | -| std | 0.00809 | -| value_loss | 8.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19082 | -| time_elapsed | 103210 | -| total_timesteps | 2442496 | -| train/ | | -| approx_kl | 0.07544096 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.00293 | -| learning_rate | 0.0003 | -| loss | 0.0636 | -| n_updates | 190810 | -| policy_gradient_loss | 0.0452 | -| std | 0.00809 | -| value_loss | 2.21e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19083 | -| time_elapsed | 103216 | -| total_timesteps | 2442624 | -| train/ | | -| approx_kl | 0.13596693 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | 0.0816 | -| n_updates | 190820 | -| policy_gradient_loss | 0.0222 | -| std | 0.00809 | -| value_loss | 1.51e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19084 | -| time_elapsed | 103221 | -| total_timesteps | 2442752 | -| train/ | | -| approx_kl | 0.00042446982 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | 0.000342 | -| n_updates | 190830 | -| policy_gradient_loss | 0.0196 | -| std | 0.00808 | -| value_loss | 9.59e-09 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19085 | -| time_elapsed | 103226 | -| total_timesteps | 2442880 | -| train/ | | -| approx_kl | 0.332519 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 190840 | -| policy_gradient_loss | 0.0339 | -| std | 0.00808 | -| value_loss | 6.82e-09 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19086 | -| time_elapsed | 103230 | -| total_timesteps | 2443008 | -| train/ | | -| approx_kl | 0.027034173 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.00932 | -| n_updates | 190850 | -| policy_gradient_loss | 0.00465 | -| std | 0.00808 | -| value_loss | 3.66e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19087 | -| time_elapsed | 103242 | -| total_timesteps | 2443136 | -| train/ | | -| approx_kl | 0.030892871 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 190860 | -| policy_gradient_loss | -0.00845 | -| std | 0.00808 | -| value_loss | 0.00206 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19088 | -| time_elapsed | 103246 | -| total_timesteps | 2443264 | -| train/ | | -| approx_kl | 0.10372292 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 190870 | -| policy_gradient_loss | 0.0125 | -| std | 0.00808 | -| value_loss | 3.67e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19089 | -| time_elapsed | 103249 | -| total_timesteps | 2443392 | -| train/ | | -| approx_kl | 0.094842225 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 190880 | -| policy_gradient_loss | 0.0193 | -| std | 0.00809 | -| value_loss | 5.44e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19090 | -| time_elapsed | 103253 | -| total_timesteps | 2443520 | -| train/ | | -| approx_kl | 0.34674746 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0775 | -| n_updates | 190890 | -| policy_gradient_loss | 0.0204 | -| std | 0.00809 | -| value_loss | 5.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19091 | -| time_elapsed | 103256 | -| total_timesteps | 2443648 | -| train/ | | -| approx_kl | 0.011714592 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 190900 | -| policy_gradient_loss | -0.00215 | -| std | 0.0081 | -| value_loss | 2.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19092 | -| time_elapsed | 103261 | -| total_timesteps | 2443776 | -| train/ | | -| approx_kl | 0.06452054 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 190910 | -| policy_gradient_loss | 0.00604 | -| std | 0.00811 | -| value_loss | 2.63e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19093 | -| time_elapsed | 103264 | -| total_timesteps | 2443904 | -| train/ | | -| approx_kl | 0.030870462 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 190920 | -| policy_gradient_loss | 0.0105 | -| std | 0.00811 | -| value_loss | 3.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19094 | -| time_elapsed | 103268 | -| total_timesteps | 2444032 | -| train/ | | -| approx_kl | 0.10766426 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.096 | -| n_updates | 190930 | -| policy_gradient_loss | 0.0343 | -| std | 0.00811 | -| value_loss | 1.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19095 | -| time_elapsed | 103275 | -| total_timesteps | 2444160 | -| train/ | | -| approx_kl | 0.021655412 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.017 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 190940 | -| policy_gradient_loss | -0.00989 | -| std | 0.00812 | -| value_loss | 0.0018 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19096 | -| time_elapsed | 103279 | -| total_timesteps | 2444288 | -| train/ | | -| approx_kl | 0.17797363 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00484 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 190950 | -| policy_gradient_loss | 0.101 | -| std | 0.00812 | -| value_loss | 2.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19097 | -| time_elapsed | 103284 | -| total_timesteps | 2444416 | -| train/ | | -| approx_kl | 0.02890382 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.00993 | -| n_updates | 190960 | -| policy_gradient_loss | 0.0157 | -| std | 0.00812 | -| value_loss | 6.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19098 | -| time_elapsed | 103289 | -| total_timesteps | 2444544 | -| train/ | | -| approx_kl | 0.44304243 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 190970 | -| policy_gradient_loss | 0.06 | -| std | 0.00812 | -| value_loss | 3.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19099 | -| time_elapsed | 103296 | -| total_timesteps | 2444672 | -| train/ | | -| approx_kl | 0.006809285 | -| clip_fraction | 0.128 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 190980 | -| policy_gradient_loss | 0.00252 | -| std | 0.00812 | -| value_loss | 2.3e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19100 | -| time_elapsed | 103301 | -| total_timesteps | 2444800 | -| train/ | | -| approx_kl | 0.0417097 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 190990 | -| policy_gradient_loss | 0.00439 | -| std | 0.00812 | -| value_loss | 1.76e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19101 | -| time_elapsed | 103304 | -| total_timesteps | 2444928 | -| train/ | | -| approx_kl | 0.0069697117 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 191000 | -| policy_gradient_loss | 0.00514 | -| std | 0.00812 | -| value_loss | 9.08e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19102 | -| time_elapsed | 103309 | -| total_timesteps | 2445056 | -| train/ | | -| approx_kl | 0.0022122422 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 191010 | -| policy_gradient_loss | 0.00565 | -| std | 0.00812 | -| value_loss | 6.27e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19103 | -| time_elapsed | 103314 | -| total_timesteps | 2445184 | -| train/ | | -| approx_kl | 0.0032110242 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.000711 | -| n_updates | 191020 | -| policy_gradient_loss | 0.00717 | -| std | 0.00811 | -| value_loss | 0.000113 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19104 | -| time_elapsed | 103319 | -| total_timesteps | 2445312 | -| train/ | | -| approx_kl | 0.40339684 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.468 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 191030 | -| policy_gradient_loss | 0.0471 | -| std | 0.00811 | -| value_loss | 6.35e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19105 | -| time_elapsed | 103324 | -| total_timesteps | 2445440 | -| train/ | | -| approx_kl | 0.03098852 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00144 | -| learning_rate | 0.0003 | -| loss | 0.00582 | -| n_updates | 191040 | -| policy_gradient_loss | 0.00325 | -| std | 0.00811 | -| value_loss | 5.99e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19106 | -| time_elapsed | 103329 | -| total_timesteps | 2445568 | -| train/ | | -| approx_kl | 0.030524567 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 191050 | -| policy_gradient_loss | 0.00569 | -| std | 0.00811 | -| value_loss | 2.79e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19107 | -| time_elapsed | 103333 | -| total_timesteps | 2445696 | -| train/ | | -| approx_kl | 0.0348678 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 191060 | -| policy_gradient_loss | 0.00857 | -| std | 0.00811 | -| value_loss | 1.82e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19108 | -| time_elapsed | 103335 | -| total_timesteps | 2445824 | -| train/ | | -| approx_kl | 0.046704676 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 191070 | -| policy_gradient_loss | 0.0126 | -| std | 0.00811 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19109 | -| time_elapsed | 103338 | -| total_timesteps | 2445952 | -| train/ | | -| approx_kl | 0.033393085 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.000856 | -| n_updates | 191080 | -| policy_gradient_loss | -0.000518 | -| std | 0.00811 | -| value_loss | 8.69e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19110 | -| time_elapsed | 103342 | -| total_timesteps | 2446080 | -| train/ | | -| approx_kl | 0.029194595 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 191090 | -| policy_gradient_loss | 0.00617 | -| std | 0.00811 | -| value_loss | 5.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19111 | -| time_elapsed | 103350 | -| total_timesteps | 2446208 | -| train/ | | -| approx_kl | 0.03876285 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.000686 | -| n_updates | 191100 | -| policy_gradient_loss | -0.00336 | -| std | 0.00811 | -| value_loss | 5.74e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19112 | -| time_elapsed | 103355 | -| total_timesteps | 2446336 | -| train/ | | -| approx_kl | 0.0007144618 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.00452 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 191110 | -| policy_gradient_loss | 0.0207 | -| std | 0.00814 | -| value_loss | 4.33e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19113 | -| time_elapsed | 103360 | -| total_timesteps | 2446464 | -| train/ | | -| approx_kl | 0.12642795 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.479 | -| learning_rate | 0.0003 | -| loss | 0.0731 | -| n_updates | 191120 | -| policy_gradient_loss | 0.021 | -| std | 0.00816 | -| value_loss | 2.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19114 | -| time_elapsed | 103365 | -| total_timesteps | 2446592 | -| train/ | | -| approx_kl | 0.017225076 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | -6.94e-05 | -| n_updates | 191130 | -| policy_gradient_loss | 0.0128 | -| std | 0.00817 | -| value_loss | 1.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19115 | -| time_elapsed | 103370 | -| total_timesteps | 2446720 | -| train/ | | -| approx_kl | 0.07625229 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 191140 | -| policy_gradient_loss | 0.013 | -| std | 0.00817 | -| value_loss | 9.18e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19116 | -| time_elapsed | 103375 | -| total_timesteps | 2446848 | -| train/ | | -| approx_kl | 0.00012846664 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | -0.000409 | -| n_updates | 191150 | -| policy_gradient_loss | 0.0139 | -| std | 0.00818 | -| value_loss | 5.28e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19117 | -| time_elapsed | 103380 | -| total_timesteps | 2446976 | -| train/ | | -| approx_kl | 0.11320187 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 191160 | -| policy_gradient_loss | 0.0158 | -| std | 0.00819 | -| value_loss | 1.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19118 | -| time_elapsed | 103384 | -| total_timesteps | 2447104 | -| train/ | | -| approx_kl | 0.009785618 | -| clip_fraction | 0.0664 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.000609 | -| n_updates | 191170 | -| policy_gradient_loss | -0.000416 | -| std | 0.00821 | -| value_loss | 2.76e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19119 | -| time_elapsed | 103395 | -| total_timesteps | 2447232 | -| train/ | | -| approx_kl | 0.3418094 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 191180 | -| policy_gradient_loss | -0.000123 | -| std | 0.00823 | -| value_loss | 0.0052 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19120 | -| time_elapsed | 103399 | -| total_timesteps | 2447360 | -| train/ | | -| approx_kl | 0.00407411 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.00876 | -| n_updates | 191190 | -| policy_gradient_loss | 0.00465 | -| std | 0.00823 | -| value_loss | 2.11e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19121 | -| time_elapsed | 103404 | -| total_timesteps | 2447488 | -| train/ | | -| approx_kl | 0.017689874 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0957 | -| learning_rate | 0.0003 | -| loss | 0.0059 | -| n_updates | 191200 | -| policy_gradient_loss | 0.0288 | -| std | 0.00823 | -| value_loss | 2.66e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19122 | -| time_elapsed | 103409 | -| total_timesteps | 2447616 | -| train/ | | -| approx_kl | 0.081830665 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -10 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 191210 | -| policy_gradient_loss | 0.0177 | -| std | 0.00823 | -| value_loss | 3.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19123 | -| time_elapsed | 103415 | -| total_timesteps | 2447744 | -| train/ | | -| approx_kl | 0.23592784 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | 0.0728 | -| n_updates | 191220 | -| policy_gradient_loss | 0.00576 | -| std | 0.00823 | -| value_loss | 3.09e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19124 | -| time_elapsed | 103418 | -| total_timesteps | 2447872 | -| train/ | | -| approx_kl | 0.0038455287 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 191230 | -| policy_gradient_loss | 0.0228 | -| std | 0.00823 | -| value_loss | 7.77e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19125 | -| time_elapsed | 103423 | -| total_timesteps | 2448000 | -| train/ | | -| approx_kl | 0.1192516 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | 0.0689 | -| n_updates | 191240 | -| policy_gradient_loss | 0.0673 | -| std | 0.00823 | -| value_loss | 1.45e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19126 | -| time_elapsed | 103428 | -| total_timesteps | 2448128 | -| train/ | | -| approx_kl | 0.08540595 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.0483 | -| n_updates | 191250 | -| policy_gradient_loss | 0.0204 | -| std | 0.00826 | -| value_loss | 2.27e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19127 | -| time_elapsed | 103436 | -| total_timesteps | 2448256 | -| train/ | | -| approx_kl | 0.0054770987 | -| clip_fraction | 0.0344 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.865 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 191260 | -| policy_gradient_loss | -0.0135 | -| std | 0.00827 | -| value_loss | 0.00249 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19128 | -| time_elapsed | 103441 | -| total_timesteps | 2448384 | -| train/ | | -| approx_kl | 0.02055014 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.559 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 191270 | -| policy_gradient_loss | 0.00275 | -| std | 0.00828 | -| value_loss | 8.88e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19129 | -| time_elapsed | 103445 | -| total_timesteps | 2448512 | -| train/ | | -| approx_kl | 0.014224136 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -3.45 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 191280 | -| policy_gradient_loss | 0.00555 | -| std | 0.00828 | -| value_loss | 1.06e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19130 | -| time_elapsed | 103449 | -| total_timesteps | 2448640 | -| train/ | | -| approx_kl | 0.41371825 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0701 | -| learning_rate | 0.0003 | -| loss | 0.0969 | -| n_updates | 191290 | -| policy_gradient_loss | 0.0339 | -| std | 0.00829 | -| value_loss | 3.59e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19131 | -| time_elapsed | 103454 | -| total_timesteps | 2448768 | -| train/ | | -| approx_kl | 0.010273267 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.339 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 191300 | -| policy_gradient_loss | 0.00502 | -| std | 0.00829 | -| value_loss | 1.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 19132 | -| time_elapsed | 103460 | -| total_timesteps | 2448896 | -| train/ | | -| approx_kl | 0.05198651 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.575 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 191310 | -| policy_gradient_loss | 0.0141 | -| std | 0.00829 | -| value_loss | 5.45e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19133 | -| time_elapsed | 103465 | -| total_timesteps | 2449024 | -| train/ | | -| approx_kl | 0.5028793 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | 0.204 | -| n_updates | 191320 | -| policy_gradient_loss | 0.075 | -| std | 0.00829 | -| value_loss | 9.09e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19134 | -| time_elapsed | 103474 | -| total_timesteps | 2449152 | -| train/ | | -| approx_kl | 0.032986008 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.0245 | -| n_updates | 191330 | -| policy_gradient_loss | -0.0023 | -| std | 0.00829 | -| value_loss | 0.000576 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19135 | -| time_elapsed | 103479 | -| total_timesteps | 2449280 | -| train/ | | -| approx_kl | 0.17535704 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.0231 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 191340 | -| policy_gradient_loss | 0.0608 | -| std | 0.0083 | -| value_loss | 0.000774 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19136 | -| time_elapsed | 103484 | -| total_timesteps | 2449408 | -| train/ | | -| approx_kl | 0.0039602784 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0679 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 191350 | -| policy_gradient_loss | 0.0554 | -| std | 0.0083 | -| value_loss | 3.27e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19137 | -| time_elapsed | 103490 | -| total_timesteps | 2449536 | -| train/ | | -| approx_kl | 0.06652567 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00232 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 191360 | -| policy_gradient_loss | 0.0778 | -| std | 0.0083 | -| value_loss | 7.91e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19138 | -| time_elapsed | 103495 | -| total_timesteps | 2449664 | -| train/ | | -| approx_kl | 0.0008173422 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | 0.000809 | -| n_updates | 191370 | -| policy_gradient_loss | 0.0172 | -| std | 0.0083 | -| value_loss | 2.48e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19139 | -| time_elapsed | 103499 | -| total_timesteps | 2449792 | -| train/ | | -| approx_kl | 0.04580432 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 191380 | -| policy_gradient_loss | 0.0101 | -| std | 0.0083 | -| value_loss | 1.62e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19140 | -| time_elapsed | 103504 | -| total_timesteps | 2449920 | -| train/ | | -| approx_kl | 0.10913182 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 191390 | -| policy_gradient_loss | 0.0184 | -| std | 0.0083 | -| value_loss | 2.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19141 | -| time_elapsed | 103509 | -| total_timesteps | 2450048 | -| train/ | | -| approx_kl | 0.020236779 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | 0.00784 | -| n_updates | 191400 | -| policy_gradient_loss | 0.025 | -| std | 0.0083 | -| value_loss | 3.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19142 | -| time_elapsed | 103519 | -| total_timesteps | 2450176 | -| train/ | | -| approx_kl | 0.07210171 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | 0.00855 | -| n_updates | 191410 | -| policy_gradient_loss | 0.00778 | -| std | 0.0083 | -| value_loss | 5.35e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19143 | -| time_elapsed | 103524 | -| total_timesteps | 2450304 | -| train/ | | -| approx_kl | 0.08335011 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00718 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 191420 | -| policy_gradient_loss | 0.0144 | -| std | 0.0083 | -| value_loss | 2.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19144 | -| time_elapsed | 103530 | -| total_timesteps | 2450432 | -| train/ | | -| approx_kl | 0.020198751 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 191430 | -| policy_gradient_loss | 0.0231 | -| std | 0.00831 | -| value_loss | 9.94e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19145 | -| time_elapsed | 103535 | -| total_timesteps | 2450560 | -| train/ | | -| approx_kl | 0.072816126 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 191440 | -| policy_gradient_loss | 0.0147 | -| std | 0.00831 | -| value_loss | 7.35e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19146 | -| time_elapsed | 103540 | -| total_timesteps | 2450688 | -| train/ | | -| approx_kl | 0.00012168987 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | -0.000299 | -| n_updates | 191450 | -| policy_gradient_loss | 0.0188 | -| std | 0.00831 | -| value_loss | 4.48e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19147 | -| time_elapsed | 103544 | -| total_timesteps | 2450816 | -| train/ | | -| approx_kl | 0.08466838 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | 0.0512 | -| n_updates | 191460 | -| policy_gradient_loss | 0.0112 | -| std | 0.0083 | -| value_loss | 3.12e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19148 | -| time_elapsed | 103549 | -| total_timesteps | 2450944 | -| train/ | | -| approx_kl | 0.015996821 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.07 | -| learning_rate | 0.0003 | -| loss | -0.00903 | -| n_updates | 191470 | -| policy_gradient_loss | 0.0148 | -| std | 0.0083 | -| value_loss | 1.7e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19149 | -| time_elapsed | 103554 | -| total_timesteps | 2451072 | -| train/ | | -| approx_kl | 0.20167089 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 191480 | -| policy_gradient_loss | 0.134 | -| std | 0.0083 | -| value_loss | 3.2e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19150 | -| time_elapsed | 103563 | -| total_timesteps | 2451200 | -| train/ | | -| approx_kl | 0.021953378 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | 0.00997 | -| n_updates | 191490 | -| policy_gradient_loss | 0.00666 | -| std | 0.0083 | -| value_loss | 0.00261 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19151 | -| time_elapsed | 103567 | -| total_timesteps | 2451328 | -| train/ | | -| approx_kl | 0.06785026 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.0977 | -| n_updates | 191500 | -| policy_gradient_loss | 0.0101 | -| std | 0.0083 | -| value_loss | 4.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19152 | -| time_elapsed | 103572 | -| total_timesteps | 2451456 | -| train/ | | -| approx_kl | 0.012105447 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00955 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 191510 | -| policy_gradient_loss | -0.00195 | -| std | 0.0083 | -| value_loss | 8.01e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19153 | -| time_elapsed | 103576 | -| total_timesteps | 2451584 | -| train/ | | -| approx_kl | 0.0016850745 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.000118 | -| n_updates | 191520 | -| policy_gradient_loss | 0.0195 | -| std | 0.00829 | -| value_loss | 2.33e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19154 | -| time_elapsed | 103580 | -| total_timesteps | 2451712 | -| train/ | | -| approx_kl | 0.5253778 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 191530 | -| policy_gradient_loss | 0.138 | -| std | 0.00829 | -| value_loss | 6.37e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19155 | -| time_elapsed | 103584 | -| total_timesteps | 2451840 | -| train/ | | -| approx_kl | 0.13801803 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00676 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 191540 | -| policy_gradient_loss | 0.00966 | -| std | 0.00828 | -| value_loss | 7.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 19156 | -| time_elapsed | 103588 | -| total_timesteps | 2451968 | -| train/ | | -| approx_kl | 0.011682346 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 191550 | -| policy_gradient_loss | 0.0195 | -| std | 0.00829 | -| value_loss | 1.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19157 | -| time_elapsed | 103593 | -| total_timesteps | 2452096 | -| train/ | | -| approx_kl | 0.03582238 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.382 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 191560 | -| policy_gradient_loss | 0.00583 | -| std | 0.0083 | -| value_loss | 2.7e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19158 | -| time_elapsed | 103605 | -| total_timesteps | 2452224 | -| train/ | | -| approx_kl | 0.04103094 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | 0.0516 | -| n_updates | 191570 | -| policy_gradient_loss | 0.00161 | -| std | 0.0083 | -| value_loss | 0.00066 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19159 | -| time_elapsed | 103610 | -| total_timesteps | 2452352 | -| train/ | | -| approx_kl | 0.006988596 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 191580 | -| policy_gradient_loss | 0.0159 | -| std | 0.0083 | -| value_loss | 7.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19160 | -| time_elapsed | 103615 | -| total_timesteps | 2452480 | -| train/ | | -| approx_kl | 0.16094545 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 191590 | -| policy_gradient_loss | 0.0828 | -| std | 0.0083 | -| value_loss | 1.68e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19161 | -| time_elapsed | 103620 | -| total_timesteps | 2452608 | -| train/ | | -| approx_kl | 0.10531043 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0997 | -| learning_rate | 0.0003 | -| loss | 0.0986 | -| n_updates | 191600 | -| policy_gradient_loss | 0.0783 | -| std | 0.0083 | -| value_loss | 1.03e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19162 | -| time_elapsed | 103625 | -| total_timesteps | 2452736 | -| train/ | | -| approx_kl | 0.08248258 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 191610 | -| policy_gradient_loss | 0.0978 | -| std | 0.0083 | -| value_loss | 5.8e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19163 | -| time_elapsed | 103629 | -| total_timesteps | 2452864 | -| train/ | | -| approx_kl | 0.09585328 | -| clip_fraction | 0.632 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | 0.0861 | -| n_updates | 191620 | -| policy_gradient_loss | 0.105 | -| std | 0.0083 | -| value_loss | 4.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19164 | -| time_elapsed | 103634 | -| total_timesteps | 2452992 | -| train/ | | -| approx_kl | 0.10911507 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 191630 | -| policy_gradient_loss | 0.0922 | -| std | 0.0083 | -| value_loss | 3.55e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19165 | -| time_elapsed | 103638 | -| total_timesteps | 2453120 | -| train/ | | -| approx_kl | 0.073779695 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0648 | -| n_updates | 191640 | -| policy_gradient_loss | 0.0775 | -| std | 0.00831 | -| value_loss | 1.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19166 | -| time_elapsed | 103650 | -| total_timesteps | 2453248 | -| train/ | | -| approx_kl | 0.13032071 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 191650 | -| policy_gradient_loss | 0.0185 | -| std | 0.00831 | -| value_loss | 0.000119 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19167 | -| time_elapsed | 103655 | -| total_timesteps | 2453376 | -| train/ | | -| approx_kl | 0.06408485 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 191660 | -| policy_gradient_loss | 0.0237 | -| std | 0.00831 | -| value_loss | 1.1e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19168 | -| time_elapsed | 103660 | -| total_timesteps | 2453504 | -| train/ | | -| approx_kl | 0.3835994 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 191670 | -| policy_gradient_loss | 0.0401 | -| std | 0.00831 | -| value_loss | 7.86e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19169 | -| time_elapsed | 103665 | -| total_timesteps | 2453632 | -| train/ | | -| approx_kl | 0.008353956 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.000655 | -| learning_rate | 0.0003 | -| loss | -0.0087 | -| n_updates | 191680 | -| policy_gradient_loss | 0.00154 | -| std | 0.00831 | -| value_loss | 1.85e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19170 | -| time_elapsed | 103670 | -| total_timesteps | 2453760 | -| train/ | | -| approx_kl | 0.00032229722 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 191690 | -| policy_gradient_loss | 0.000967 | -| std | 0.00831 | -| value_loss | 5.53e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19171 | -| time_elapsed | 103676 | -| total_timesteps | 2453888 | -| train/ | | -| approx_kl | 0.03247943 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.898 | -| learning_rate | 0.0003 | -| loss | 0.00833 | -| n_updates | 191700 | -| policy_gradient_loss | 0.00345 | -| std | 0.00831 | -| value_loss | 2.54e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19172 | -| time_elapsed | 103680 | -| total_timesteps | 2454016 | -| train/ | | -| approx_kl | 0.005954118 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 191710 | -| policy_gradient_loss | -9.16e-05 | -| std | 0.00832 | -| value_loss | 1.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19173 | -| time_elapsed | 103691 | -| total_timesteps | 2454144 | -| train/ | | -| approx_kl | 0.08274323 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | 0.0472 | -| n_updates | 191720 | -| policy_gradient_loss | 0.0253 | -| std | 0.00832 | -| value_loss | 0.000405 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19174 | -| time_elapsed | 103696 | -| total_timesteps | 2454272 | -| train/ | | -| approx_kl | 0.072278515 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | 0.00588 | -| n_updates | 191730 | -| policy_gradient_loss | -0.00356 | -| std | 0.00832 | -| value_loss | 6.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19175 | -| time_elapsed | 103700 | -| total_timesteps | 2454400 | -| train/ | | -| approx_kl | 0.01971046 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.00473 | -| n_updates | 191740 | -| policy_gradient_loss | 0.00418 | -| std | 0.00832 | -| value_loss | 2.13e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19176 | -| time_elapsed | 103704 | -| total_timesteps | 2454528 | -| train/ | | -| approx_kl | 0.0040765377 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 191750 | -| policy_gradient_loss | 0.00368 | -| std | 0.00832 | -| value_loss | 8.82e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19177 | -| time_elapsed | 103708 | -| total_timesteps | 2454656 | -| train/ | | -| approx_kl | 7.400755e-05 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 191760 | -| policy_gradient_loss | 0.0249 | -| std | 0.00832 | -| value_loss | 2.85e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19178 | -| time_elapsed | 103713 | -| total_timesteps | 2454784 | -| train/ | | -| approx_kl | 0.098073654 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | 0.0668 | -| n_updates | 191770 | -| policy_gradient_loss | 0.0356 | -| std | 0.00829 | -| value_loss | 0.00014 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19179 | -| time_elapsed | 103717 | -| total_timesteps | 2454912 | -| train/ | | -| approx_kl | 0.07143251 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 191780 | -| policy_gradient_loss | 0.00754 | -| std | 0.00828 | -| value_loss | 5.79e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19180 | -| time_elapsed | 103721 | -| total_timesteps | 2455040 | -| train/ | | -| approx_kl | 0.021864953 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00686 | -| learning_rate | 0.0003 | -| loss | 0.00514 | -| n_updates | 191790 | -| policy_gradient_loss | 0.00388 | -| std | 0.00828 | -| value_loss | 8.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19181 | -| time_elapsed | 103728 | -| total_timesteps | 2455168 | -| train/ | | -| approx_kl | 0.0017951741 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | -0.0241 | -| n_updates | 191800 | -| policy_gradient_loss | -0.00882 | -| std | 0.00828 | -| value_loss | 0.00146 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19182 | -| time_elapsed | 103732 | -| total_timesteps | 2455296 | -| train/ | | -| approx_kl | 0.0005645901 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | -0.000362 | -| n_updates | 191810 | -| policy_gradient_loss | 0.00554 | -| std | 0.00827 | -| value_loss | 0.000389 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19183 | -| time_elapsed | 103738 | -| total_timesteps | 2455424 | -| train/ | | -| approx_kl | 0.0013897149 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00922 | -| learning_rate | 0.0003 | -| loss | 0.00272 | -| n_updates | 191820 | -| policy_gradient_loss | 0.00241 | -| std | 0.00826 | -| value_loss | 0.000501 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19184 | -| time_elapsed | 103743 | -| total_timesteps | 2455552 | -| train/ | | -| approx_kl | 0.039188202 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00452 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 191830 | -| policy_gradient_loss | -0.00499 | -| std | 0.00825 | -| value_loss | 0.000195 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19185 | -| time_elapsed | 103747 | -| total_timesteps | 2455680 | -| train/ | | -| approx_kl | 0.0012155441 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -5.79 | -| learning_rate | 0.0003 | -| loss | -0.00118 | -| n_updates | 191840 | -| policy_gradient_loss | 0.0103 | -| std | 0.00825 | -| value_loss | 1.63e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19186 | -| time_elapsed | 103752 | -| total_timesteps | 2455808 | -| train/ | | -| approx_kl | 0.0024732105 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.00643 | -| n_updates | 191850 | -| policy_gradient_loss | 0.064 | -| std | 0.00825 | -| value_loss | 1.79e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 19187 | -| time_elapsed | 103757 | -| total_timesteps | 2455936 | -| train/ | | -| approx_kl | 0.058192097 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0428 | -| n_updates | 191860 | -| policy_gradient_loss | 0.124 | -| std | 0.00825 | -| value_loss | 4.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19188 | -| time_elapsed | 103761 | -| total_timesteps | 2456064 | -| train/ | | -| approx_kl | 0.09379743 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -3.72 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 191870 | -| policy_gradient_loss | 0.0519 | -| std | 0.00825 | -| value_loss | 1.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19189 | -| time_elapsed | 103770 | -| total_timesteps | 2456192 | -| train/ | | -| approx_kl | 0.104618125 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.7 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 191880 | -| policy_gradient_loss | -0.0111 | -| std | 0.00825 | -| value_loss | 0.00439 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19190 | -| time_elapsed | 103775 | -| total_timesteps | 2456320 | -| train/ | | -| approx_kl | 0.0019624494 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 191890 | -| policy_gradient_loss | -0.00297 | -| std | 0.00825 | -| value_loss | 3.72e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19191 | -| time_elapsed | 103779 | -| total_timesteps | 2456448 | -| train/ | | -| approx_kl | 0.024564747 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 191900 | -| policy_gradient_loss | -0.00585 | -| std | 0.00825 | -| value_loss | 1.02e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19192 | -| time_elapsed | 103783 | -| total_timesteps | 2456576 | -| train/ | | -| approx_kl | 0.037671 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 191910 | -| policy_gradient_loss | -0.00329 | -| std | 0.00826 | -| value_loss | 3.85e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19193 | -| time_elapsed | 103788 | -| total_timesteps | 2456704 | -| train/ | | -| approx_kl | 0.007404363 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | -0.000352 | -| n_updates | 191920 | -| policy_gradient_loss | 0.00808 | -| std | 0.00825 | -| value_loss | 1.98e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19194 | -| time_elapsed | 103792 | -| total_timesteps | 2456832 | -| train/ | | -| approx_kl | 0.05506065 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 191930 | -| policy_gradient_loss | 0.0123 | -| std | 0.00826 | -| value_loss | 1.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19195 | -| time_elapsed | 103796 | -| total_timesteps | 2456960 | -| train/ | | -| approx_kl | 0.009662187 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 191940 | -| policy_gradient_loss | 0.00292 | -| std | 0.00826 | -| value_loss | 5.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19196 | -| time_elapsed | 103801 | -| total_timesteps | 2457088 | -| train/ | | -| approx_kl | 0.034819882 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00176 | -| learning_rate | 0.0003 | -| loss | 0.00717 | -| n_updates | 191950 | -| policy_gradient_loss | 0.00167 | -| std | 0.00826 | -| value_loss | 9.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19197 | -| time_elapsed | 103811 | -| total_timesteps | 2457216 | -| train/ | | -| approx_kl | 0.060033675 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.69 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 191960 | -| policy_gradient_loss | -0.0125 | -| std | 0.00826 | -| value_loss | 0.00404 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19198 | -| time_elapsed | 103816 | -| total_timesteps | 2457344 | -| train/ | | -| approx_kl | 0.1868394 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.0551 | -| n_updates | 191970 | -| policy_gradient_loss | 0.0214 | -| std | 0.00826 | -| value_loss | 5.06e-06 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19199 | -| time_elapsed | 103820 | -| total_timesteps | 2457472 | -| train/ | | -| approx_kl | 0.00056914426 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | -0.00544 | -| n_updates | 191980 | -| policy_gradient_loss | -0.00255 | -| std | 0.00826 | -| value_loss | 1e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19200 | -| time_elapsed | 103825 | -| total_timesteps | 2457600 | -| train/ | | -| approx_kl | 1.0266434e-05 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.055 | -| learning_rate | 0.0003 | -| loss | -0.000365 | -| n_updates | 191990 | -| policy_gradient_loss | 0.00231 | -| std | 0.00826 | -| value_loss | 6.44e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19201 | -| time_elapsed | 103830 | -| total_timesteps | 2457728 | -| train/ | | -| approx_kl | 0.05114025 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 192000 | -| policy_gradient_loss | 0.0708 | -| std | 0.00826 | -| value_loss | 4.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19202 | -| time_elapsed | 103835 | -| total_timesteps | 2457856 | -| train/ | | -| approx_kl | 0.03242063 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 192010 | -| policy_gradient_loss | 0.023 | -| std | 0.00826 | -| value_loss | 3.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19203 | -| time_elapsed | 103839 | -| total_timesteps | 2457984 | -| train/ | | -| approx_kl | 0.19064504 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.056 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 192020 | -| policy_gradient_loss | 0.0302 | -| std | 0.00826 | -| value_loss | 2.03e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19204 | -| time_elapsed | 103843 | -| total_timesteps | 2458112 | -| train/ | | -| approx_kl | 0.0013196529 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 192030 | -| policy_gradient_loss | 0.0173 | -| std | 0.00826 | -| value_loss | 1.32e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19205 | -| time_elapsed | 103857 | -| total_timesteps | 2458240 | -| train/ | | -| approx_kl | 0.0037525082 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.739 | -| learning_rate | 0.0003 | -| loss | -0.00367 | -| n_updates | 192040 | -| policy_gradient_loss | 0.000318 | -| std | 0.00826 | -| value_loss | 0.00163 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19206 | -| time_elapsed | 103863 | -| total_timesteps | 2458368 | -| train/ | | -| approx_kl | 0.0008825236 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.494 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 192050 | -| policy_gradient_loss | 0.00842 | -| std | 0.00826 | -| value_loss | 1.74e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19207 | -| time_elapsed | 103867 | -| total_timesteps | 2458496 | -| train/ | | -| approx_kl | 7.3377974e-05 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | -0.00077 | -| n_updates | 192060 | -| policy_gradient_loss | 0.00244 | -| std | 0.00826 | -| value_loss | 1.2e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19208 | -| time_elapsed | 103872 | -| total_timesteps | 2458624 | -| train/ | | -| approx_kl | 5.6535937e-05 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0828 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 192070 | -| policy_gradient_loss | -0.000505 | -| std | 0.00826 | -| value_loss | 9.31e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19209 | -| time_elapsed | 103877 | -| total_timesteps | 2458752 | -| train/ | | -| approx_kl | 0.00016886136 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 192080 | -| policy_gradient_loss | 0.00356 | -| std | 0.00826 | -| value_loss | 5.83e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19210 | -| time_elapsed | 103882 | -| total_timesteps | 2458880 | -| train/ | | -| approx_kl | 0.057727013 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 192090 | -| policy_gradient_loss | 0.0611 | -| std | 0.00826 | -| value_loss | 4.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19211 | -| time_elapsed | 103887 | -| total_timesteps | 2459008 | -| train/ | | -| approx_kl | 0.0005712402 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.000171 | -| n_updates | 192100 | -| policy_gradient_loss | 0.055 | -| std | 0.00825 | -| value_loss | 6.01e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19212 | -| time_elapsed | 103898 | -| total_timesteps | 2459136 | -| train/ | | -| approx_kl | 0.022002822 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.0253 | -| n_updates | 192110 | -| policy_gradient_loss | 0.00481 | -| std | 0.00824 | -| value_loss | 0.00221 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19213 | -| time_elapsed | 103903 | -| total_timesteps | 2459264 | -| train/ | | -| approx_kl | 0.10134572 | -| clip_fraction | 0.621 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 192120 | -| policy_gradient_loss | 0.0632 | -| std | 0.00823 | -| value_loss | 2.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19214 | -| time_elapsed | 103907 | -| total_timesteps | 2459392 | -| train/ | | -| approx_kl | 0.047593545 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0995 | -| learning_rate | 0.0003 | -| loss | -0.00761 | -| n_updates | 192130 | -| policy_gradient_loss | 0.00484 | -| std | 0.00823 | -| value_loss | 7.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19215 | -| time_elapsed | 103911 | -| total_timesteps | 2459520 | -| train/ | | -| approx_kl | 0.10440407 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 192140 | -| policy_gradient_loss | 0.016 | -| std | 0.00823 | -| value_loss | 3.41e-09 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19216 | -| time_elapsed | 103916 | -| total_timesteps | 2459648 | -| train/ | | -| approx_kl | 0.395014 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.28 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 192150 | -| policy_gradient_loss | 0.0339 | -| std | 0.00824 | -| value_loss | 8.17e-09 | --------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19217 | -| time_elapsed | 103919 | -| total_timesteps | 2459776 | -| train/ | | -| approx_kl | 0.0290576 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0841 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 192160 | -| policy_gradient_loss | 0.00651 | -| std | 0.00824 | -| value_loss | 2.45e-08 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19218 | -| time_elapsed | 103924 | -| total_timesteps | 2459904 | -| train/ | | -| approx_kl | 9.0846326e-05 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00974 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 192170 | -| policy_gradient_loss | -0.00318 | -| std | 0.00824 | -| value_loss | 1.41e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19219 | -| time_elapsed | 103928 | -| total_timesteps | 2460032 | -| train/ | | -| approx_kl | 0.0064841984 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0663 | -| learning_rate | 0.0003 | -| loss | -0.00477 | -| n_updates | 192180 | -| policy_gradient_loss | 0.00516 | -| std | 0.00823 | -| value_loss | 1.01e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19220 | -| time_elapsed | 103939 | -| total_timesteps | 2460160 | -| train/ | | -| approx_kl | 0.0095243845 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.819 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 192190 | -| policy_gradient_loss | -0.00427 | -| std | 0.00823 | -| value_loss | 0.0047 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19221 | -| time_elapsed | 103945 | -| total_timesteps | 2460288 | -| train/ | | -| approx_kl | 0.060256798 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | 0.0341 | -| n_updates | 192200 | -| policy_gradient_loss | 0.0116 | -| std | 0.00823 | -| value_loss | 4.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19222 | -| time_elapsed | 103950 | -| total_timesteps | 2460416 | -| train/ | | -| approx_kl | 0.011737598 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | -0.00939 | -| n_updates | 192210 | -| policy_gradient_loss | 0.00168 | -| std | 0.00822 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19223 | -| time_elapsed | 103956 | -| total_timesteps | 2460544 | -| train/ | | -| approx_kl | 0.051306985 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 192220 | -| policy_gradient_loss | 0.0115 | -| std | 0.00823 | -| value_loss | 6.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19224 | -| time_elapsed | 103961 | -| total_timesteps | 2460672 | -| train/ | | -| approx_kl | 0.011895264 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0885 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 192230 | -| policy_gradient_loss | 0.00557 | -| std | 0.00823 | -| value_loss | 6.76e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19225 | -| time_elapsed | 103965 | -| total_timesteps | 2460800 | -| train/ | | -| approx_kl | 9.5609576e-05 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.000979 | -| n_updates | 192240 | -| policy_gradient_loss | 0.00613 | -| std | 0.00823 | -| value_loss | 7.3e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19226 | -| time_elapsed | 103971 | -| total_timesteps | 2460928 | -| train/ | | -| approx_kl | 0.025834404 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.542 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 192250 | -| policy_gradient_loss | 0.00076 | -| std | 0.00823 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19227 | -| time_elapsed | 103976 | -| total_timesteps | 2461056 | -| train/ | | -| approx_kl | 0.045507085 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 192260 | -| policy_gradient_loss | 0.0074 | -| std | 0.00823 | -| value_loss | 7.53e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19228 | -| time_elapsed | 103983 | -| total_timesteps | 2461184 | -| train/ | | -| approx_kl | 0.09236606 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 192270 | -| policy_gradient_loss | -0.00609 | -| std | 0.00823 | -| value_loss | 0.000466 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19229 | -| time_elapsed | 103988 | -| total_timesteps | 2461312 | -| train/ | | -| approx_kl | 0.014286685 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.00575 | -| n_updates | 192280 | -| policy_gradient_loss | 0.0249 | -| std | 0.00823 | -| value_loss | 1.52e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19230 | -| time_elapsed | 103992 | -| total_timesteps | 2461440 | -| train/ | | -| approx_kl | 0.07741166 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 192290 | -| policy_gradient_loss | 0.0134 | -| std | 0.00823 | -| value_loss | 3.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19231 | -| time_elapsed | 103996 | -| total_timesteps | 2461568 | -| train/ | | -| approx_kl | 0.39134496 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0943 | -| n_updates | 192300 | -| policy_gradient_loss | 0.0334 | -| std | 0.00823 | -| value_loss | 2.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19232 | -| time_elapsed | 104001 | -| total_timesteps | 2461696 | -| train/ | | -| approx_kl | 0.009861536 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.00115 | -| n_updates | 192310 | -| policy_gradient_loss | 0.00497 | -| std | 0.00823 | -| value_loss | 1.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19233 | -| time_elapsed | 104006 | -| total_timesteps | 2461824 | -| train/ | | -| approx_kl | 0.05129847 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 192320 | -| policy_gradient_loss | 0.013 | -| std | 0.00822 | -| value_loss | 9.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19234 | -| time_elapsed | 104009 | -| total_timesteps | 2461952 | -| train/ | | -| approx_kl | 0.008040558 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | -0.00725 | -| n_updates | 192330 | -| policy_gradient_loss | 0.00342 | -| std | 0.00822 | -| value_loss | 6.72e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19235 | -| time_elapsed | 104014 | -| total_timesteps | 2462080 | -| train/ | | -| approx_kl | 0.05251517 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 192340 | -| policy_gradient_loss | 0.01 | -| std | 0.00822 | -| value_loss | 4.17e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19236 | -| time_elapsed | 104021 | -| total_timesteps | 2462208 | -| train/ | | -| approx_kl | 0.04999323 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 192350 | -| policy_gradient_loss | -0.00819 | -| std | 0.00822 | -| value_loss | 0.00314 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19237 | -| time_elapsed | 104027 | -| total_timesteps | 2462336 | -| train/ | | -| approx_kl | 0.010763649 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 192360 | -| policy_gradient_loss | 0.00511 | -| std | 0.00822 | -| value_loss | 1.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19238 | -| time_elapsed | 104032 | -| total_timesteps | 2462464 | -| train/ | | -| approx_kl | 0.046848606 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 192370 | -| policy_gradient_loss | 0.0245 | -| std | 0.00822 | -| value_loss | 2.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19239 | -| time_elapsed | 104036 | -| total_timesteps | 2462592 | -| train/ | | -| approx_kl | 0.023665734 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 192380 | -| policy_gradient_loss | 0.0146 | -| std | 0.00822 | -| value_loss | 5.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19240 | -| time_elapsed | 104041 | -| total_timesteps | 2462720 | -| train/ | | -| approx_kl | 0.004595154 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00778 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 192390 | -| policy_gradient_loss | 0.00507 | -| std | 0.00822 | -| value_loss | 1.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19241 | -| time_elapsed | 104046 | -| total_timesteps | 2462848 | -| train/ | | -| approx_kl | 0.05741418 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00457 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 192400 | -| policy_gradient_loss | 0.0276 | -| std | 0.00822 | -| value_loss | 2.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19242 | -| time_elapsed | 104051 | -| total_timesteps | 2462976 | -| train/ | | -| approx_kl | 0.15320773 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.0027 | -| n_updates | 192410 | -| policy_gradient_loss | 0.00692 | -| std | 0.00822 | -| value_loss | 3.96e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19243 | -| time_elapsed | 104057 | -| total_timesteps | 2463104 | -| train/ | | -| approx_kl | 0.01445366 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | 0.00228 | -| n_updates | 192420 | -| policy_gradient_loss | 0.0158 | -| std | 0.00822 | -| value_loss | 1.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19244 | -| time_elapsed | 104068 | -| total_timesteps | 2463232 | -| train/ | | -| approx_kl | 0.03917111 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.856 | -| learning_rate | 0.0003 | -| loss | -0.00796 | -| n_updates | 192430 | -| policy_gradient_loss | 0.0142 | -| std | 0.00823 | -| value_loss | 0.00325 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19245 | -| time_elapsed | 104072 | -| total_timesteps | 2463360 | -| train/ | | -| approx_kl | 0.13652125 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.33 | -| learning_rate | 0.0003 | -| loss | 0.0587 | -| n_updates | 192440 | -| policy_gradient_loss | 0.0304 | -| std | 0.00822 | -| value_loss | 3.02e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19246 | -| time_elapsed | 104076 | -| total_timesteps | 2463488 | -| train/ | | -| approx_kl | 0.042092368 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0011 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 192450 | -| policy_gradient_loss | 0.0688 | -| std | 0.00822 | -| value_loss | 1.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19247 | -| time_elapsed | 104082 | -| total_timesteps | 2463616 | -| train/ | | -| approx_kl | 0.18700032 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.074 | -| n_updates | 192460 | -| policy_gradient_loss | 0.0293 | -| std | 0.00823 | -| value_loss | 9.89e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19248 | -| time_elapsed | 104087 | -| total_timesteps | 2463744 | -| train/ | | -| approx_kl | 0.0378273 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 192470 | -| policy_gradient_loss | 0.0354 | -| std | 0.00823 | -| value_loss | 7.17e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19249 | -| time_elapsed | 104092 | -| total_timesteps | 2463872 | -| train/ | | -| approx_kl | 0.017187243 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | -0.00517 | -| n_updates | 192480 | -| policy_gradient_loss | 0.0141 | -| std | 0.00823 | -| value_loss | 4.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19250 | -| time_elapsed | 104096 | -| total_timesteps | 2464000 | -| train/ | | -| approx_kl | 0.01979973 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.00105 | -| n_updates | 192490 | -| policy_gradient_loss | 0.0307 | -| std | 0.00823 | -| value_loss | 2.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19251 | -| time_elapsed | 104100 | -| total_timesteps | 2464128 | -| train/ | | -| approx_kl | 0.12190637 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.005 | -| learning_rate | 0.0003 | -| loss | 0.0725 | -| n_updates | 192500 | -| policy_gradient_loss | 0.0402 | -| std | 0.00823 | -| value_loss | 1.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19252 | -| time_elapsed | 104111 | -| total_timesteps | 2464256 | -| train/ | | -| approx_kl | 0.03098308 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | 0.003 | -| n_updates | 192510 | -| policy_gradient_loss | 0.0382 | -| std | 0.00823 | -| value_loss | 0.00229 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19253 | -| time_elapsed | 104116 | -| total_timesteps | 2464384 | -| train/ | | -| approx_kl | 0.22541097 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0971 | -| n_updates | 192520 | -| policy_gradient_loss | 0.0334 | -| std | 0.00822 | -| value_loss | 8.7e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19254 | -| time_elapsed | 104121 | -| total_timesteps | 2464512 | -| train/ | | -| approx_kl | 0.00024358649 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00965 | -| learning_rate | 0.0003 | -| loss | -0.000437 | -| n_updates | 192530 | -| policy_gradient_loss | 0.00655 | -| std | 0.00822 | -| value_loss | 1.04e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19255 | -| time_elapsed | 104127 | -| total_timesteps | 2464640 | -| train/ | | -| approx_kl | 5.2420422e-05 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0759 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 192540 | -| policy_gradient_loss | -0.00192 | -| std | 0.00822 | -| value_loss | 2.02e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19256 | -| time_elapsed | 104132 | -| total_timesteps | 2464768 | -| train/ | | -| approx_kl | 0.00011930475 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00653 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 192550 | -| policy_gradient_loss | 0.00289 | -| std | 0.00822 | -| value_loss | 4.69e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 19257 | -| time_elapsed | 104138 | -| total_timesteps | 2464896 | -| train/ | | -| approx_kl | 9.697117e-05 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | -0.000631 | -| n_updates | 192560 | -| policy_gradient_loss | 0.00342 | -| std | 0.00822 | -| value_loss | 3.12e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19258 | -| time_elapsed | 104142 | -| total_timesteps | 2465024 | -| train/ | | -| approx_kl | 9.2872884e-05 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | -0.00282 | -| n_updates | 192570 | -| policy_gradient_loss | -0.00696 | -| std | 0.00822 | -| value_loss | 2.49e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19259 | -| time_elapsed | 104153 | -| total_timesteps | 2465152 | -| train/ | | -| approx_kl | 0.2037757 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0432 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 192580 | -| policy_gradient_loss | -0.0111 | -| std | 0.00822 | -| value_loss | 0.00215 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19260 | -| time_elapsed | 104157 | -| total_timesteps | 2465280 | -| train/ | | -| approx_kl | 0.103743285 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.513 | -| learning_rate | 0.0003 | -| loss | 0.056 | -| n_updates | 192590 | -| policy_gradient_loss | 0.0086 | -| std | 0.00822 | -| value_loss | 4.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19261 | -| time_elapsed | 104160 | -| total_timesteps | 2465408 | -| train/ | | -| approx_kl | 0.036810894 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 192600 | -| policy_gradient_loss | 0.0177 | -| std | 0.00823 | -| value_loss | 1.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19262 | -| time_elapsed | 104165 | -| total_timesteps | 2465536 | -| train/ | | -| approx_kl | 0.074628755 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.742 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 192610 | -| policy_gradient_loss | 0.0106 | -| std | 0.00823 | -| value_loss | 6.1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19263 | -| time_elapsed | 104170 | -| total_timesteps | 2465664 | -| train/ | | -| approx_kl | 0.00038628 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 192620 | -| policy_gradient_loss | 0.0147 | -| std | 0.00823 | -| value_loss | 1.05e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19264 | -| time_elapsed | 104176 | -| total_timesteps | 2465792 | -| train/ | | -| approx_kl | 0.113525465 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 192630 | -| policy_gradient_loss | 0.0151 | -| std | 0.00823 | -| value_loss | 3.52e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 19265 | -| time_elapsed | 104180 | -| total_timesteps | 2465920 | -| train/ | | -| approx_kl | 0.13599661 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0901 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 192640 | -| policy_gradient_loss | 0.0131 | -| std | 0.00823 | -| value_loss | 1.85e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19266 | -| time_elapsed | 104185 | -| total_timesteps | 2466048 | -| train/ | | -| approx_kl | 0.06159832 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00883 | -| learning_rate | 0.0003 | -| loss | 0.00907 | -| n_updates | 192650 | -| policy_gradient_loss | 0.0102 | -| std | 0.00823 | -| value_loss | 4.21e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19267 | -| time_elapsed | 104197 | -| total_timesteps | 2466176 | -| train/ | | -| approx_kl | 0.026076807 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -2.43 | -| learning_rate | 0.0003 | -| loss | -0.0249 | -| n_updates | 192660 | -| policy_gradient_loss | -0.00062 | -| std | 0.00823 | -| value_loss | 0.00348 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19268 | -| time_elapsed | 104202 | -| total_timesteps | 2466304 | -| train/ | | -| approx_kl | 0.38255483 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.0786 | -| n_updates | 192670 | -| policy_gradient_loss | 0.0433 | -| std | 0.00823 | -| value_loss | 8.14e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19269 | -| time_elapsed | 104207 | -| total_timesteps | 2466432 | -| train/ | | -| approx_kl | 0.028828468 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00249 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 192680 | -| policy_gradient_loss | 0.0075 | -| std | 0.00824 | -| value_loss | 8.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19270 | -| time_elapsed | 104211 | -| total_timesteps | 2466560 | -| train/ | | -| approx_kl | 0.032248974 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 192690 | -| policy_gradient_loss | 0.00753 | -| std | 0.00825 | -| value_loss | 1.16e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19271 | -| time_elapsed | 104214 | -| total_timesteps | 2466688 | -| train/ | | -| approx_kl | 6.0320366e-05 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 192700 | -| policy_gradient_loss | -0.00357 | -| std | 0.00825 | -| value_loss | 9.21e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19272 | -| time_elapsed | 104219 | -| total_timesteps | 2466816 | -| train/ | | -| approx_kl | 0.12106896 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0636 | -| n_updates | 192710 | -| policy_gradient_loss | 0.0402 | -| std | 0.00828 | -| value_loss | 0.000215 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19273 | -| time_elapsed | 104223 | -| total_timesteps | 2466944 | -| train/ | | -| approx_kl | 0.064291105 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 192720 | -| policy_gradient_loss | 0.00485 | -| std | 0.00829 | -| value_loss | 9.74e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19274 | -| time_elapsed | 104227 | -| total_timesteps | 2467072 | -| train/ | | -| approx_kl | 0.011648089 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.00699 | -| learning_rate | 0.0003 | -| loss | 0.00273 | -| n_updates | 192730 | -| policy_gradient_loss | 0.00474 | -| std | 0.0083 | -| value_loss | 2.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19275 | -| time_elapsed | 104237 | -| total_timesteps | 2467200 | -| train/ | | -| approx_kl | 0.011057094 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -5.38 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 192740 | -| policy_gradient_loss | -0.017 | -| std | 0.0083 | -| value_loss | 0.00419 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19276 | -| time_elapsed | 104241 | -| total_timesteps | 2467328 | -| train/ | | -| approx_kl | 0.00073133316 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.00144 | -| n_updates | 192750 | -| policy_gradient_loss | 0.0192 | -| std | 0.0083 | -| value_loss | 7.08e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19277 | -| time_elapsed | 104246 | -| total_timesteps | 2467456 | -| train/ | | -| approx_kl | 0.05612448 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | 0.00192 | -| n_updates | 192760 | -| policy_gradient_loss | 0.00925 | -| std | 0.0083 | -| value_loss | 8.66e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19278 | -| time_elapsed | 104252 | -| total_timesteps | 2467584 | -| train/ | | -| approx_kl | 0.10053651 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 192770 | -| policy_gradient_loss | 0.0148 | -| std | 0.0083 | -| value_loss | 3.21e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19279 | -| time_elapsed | 104256 | -| total_timesteps | 2467712 | -| train/ | | -| approx_kl | 0.00019982224 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 0.000125 | -| n_updates | 192780 | -| policy_gradient_loss | 0.0236 | -| std | 0.00829 | -| value_loss | 4.66e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19280 | -| time_elapsed | 104259 | -| total_timesteps | 2467840 | -| train/ | | -| approx_kl | 0.045021895 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 192790 | -| policy_gradient_loss | 0.0304 | -| std | 0.00829 | -| value_loss | 1.45e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19281 | -| time_elapsed | 104263 | -| total_timesteps | 2467968 | -| train/ | | -| approx_kl | 0.20760038 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00215 | -| learning_rate | 0.0003 | -| loss | 0.0891 | -| n_updates | 192800 | -| policy_gradient_loss | 0.0842 | -| std | 0.00829 | -| value_loss | 2.81e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19282 | -| time_elapsed | 104267 | -| total_timesteps | 2468096 | -| train/ | | -| approx_kl | 0.11824919 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.0851 | -| n_updates | 192810 | -| policy_gradient_loss | 0.131 | -| std | 0.00829 | -| value_loss | 6.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19283 | -| time_elapsed | 104274 | -| total_timesteps | 2468224 | -| train/ | | -| approx_kl | 0.08447351 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 192820 | -| policy_gradient_loss | -0.00661 | -| std | 0.00829 | -| value_loss | 0.000483 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19284 | -| time_elapsed | 104278 | -| total_timesteps | 2468352 | -| train/ | | -| approx_kl | 0.7915028 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.272 | -| n_updates | 192830 | -| policy_gradient_loss | 0.186 | -| std | 0.00829 | -| value_loss | 1.33e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19285 | -| time_elapsed | 104282 | -| total_timesteps | 2468480 | -| train/ | | -| approx_kl | 0.0009896406 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.485 | -| learning_rate | 0.0003 | -| loss | -0.000545 | -| n_updates | 192840 | -| policy_gradient_loss | 0.0143 | -| std | 0.00828 | -| value_loss | 1.23e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19286 | -| time_elapsed | 104286 | -| total_timesteps | 2468608 | -| train/ | | -| approx_kl | 0.11545005 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0511 | -| n_updates | 192850 | -| policy_gradient_loss | 0.0128 | -| std | 0.00829 | -| value_loss | 8.44e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19287 | -| time_elapsed | 104291 | -| total_timesteps | 2468736 | -| train/ | | -| approx_kl | 0.014608886 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 192860 | -| policy_gradient_loss | 0.0175 | -| std | 0.00829 | -| value_loss | 1.77e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19288 | -| time_elapsed | 104296 | -| total_timesteps | 2468864 | -| train/ | | -| approx_kl | 0.06211815 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 192870 | -| policy_gradient_loss | 0.00765 | -| std | 0.00829 | -| value_loss | 1.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19289 | -| time_elapsed | 104303 | -| total_timesteps | 2468992 | -| train/ | | -| approx_kl | 0.004029131 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.000666 | -| n_updates | 192880 | -| policy_gradient_loss | 0.00334 | -| std | 0.00829 | -| value_loss | 1.21e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19290 | -| time_elapsed | 104308 | -| total_timesteps | 2469120 | -| train/ | | -| approx_kl | 0.16036974 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0863 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 192890 | -| policy_gradient_loss | 0.116 | -| std | 0.0083 | -| value_loss | 9.4e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19291 | -| time_elapsed | 104321 | -| total_timesteps | 2469248 | -| train/ | | -| approx_kl | 0.006774004 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.00748 | -| n_updates | 192900 | -| policy_gradient_loss | 0.00688 | -| std | 0.0083 | -| value_loss | 0.000151 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19292 | -| time_elapsed | 104326 | -| total_timesteps | 2469376 | -| train/ | | -| approx_kl | 0.031735577 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.00919 | -| n_updates | 192910 | -| policy_gradient_loss | 0.00303 | -| std | 0.00829 | -| value_loss | 4.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19293 | -| time_elapsed | 104332 | -| total_timesteps | 2469504 | -| train/ | | -| approx_kl | 0.24786152 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.00413 | -| learning_rate | 0.0003 | -| loss | 0.0691 | -| n_updates | 192920 | -| policy_gradient_loss | 0.0201 | -| std | 0.00828 | -| value_loss | 1.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19294 | -| time_elapsed | 104337 | -| total_timesteps | 2469632 | -| train/ | | -| approx_kl | 0.10287088 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.37 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | 0.0762 | -| n_updates | 192930 | -| policy_gradient_loss | 0.0285 | -| std | 0.00828 | -| value_loss | 2.11e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19295 | -| time_elapsed | 104342 | -| total_timesteps | 2469760 | -| train/ | | -| approx_kl | 0.10502514 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0452 | -| n_updates | 192940 | -| policy_gradient_loss | 0.00953 | -| std | 0.00826 | -| value_loss | 1.65e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19296 | -| time_elapsed | 104347 | -| total_timesteps | 2469888 | -| train/ | | -| approx_kl | 0.0017667594 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.443 | -| learning_rate | 0.0003 | -| loss | 0.00331 | -| n_updates | 192950 | -| policy_gradient_loss | 0.0121 | -| std | 0.00826 | -| value_loss | 4.9e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19297 | -| time_elapsed | 104352 | -| total_timesteps | 2470016 | -| train/ | | -| approx_kl | 0.24271706 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 192960 | -| policy_gradient_loss | 0.0937 | -| std | 0.00826 | -| value_loss | 1.15e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19298 | -| time_elapsed | 104363 | -| total_timesteps | 2470144 | -| train/ | | -| approx_kl | 0.1628241 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | 0.0748 | -| n_updates | 192970 | -| policy_gradient_loss | 0.0603 | -| std | 0.00826 | -| value_loss | 0.000112 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19299 | -| time_elapsed | 104367 | -| total_timesteps | 2470272 | -| train/ | | -| approx_kl | 0.1530388 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.0983 | -| n_updates | 192980 | -| policy_gradient_loss | 0.0976 | -| std | 0.00826 | -| value_loss | 5.05e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19300 | -| time_elapsed | 104372 | -| total_timesteps | 2470400 | -| train/ | | -| approx_kl | 0.110460475 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.481 | -| learning_rate | 0.0003 | -| loss | 0.0933 | -| n_updates | 192990 | -| policy_gradient_loss | 0.106 | -| std | 0.00826 | -| value_loss | 4.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19301 | -| time_elapsed | 104378 | -| total_timesteps | 2470528 | -| train/ | | -| approx_kl | 0.023321439 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00922 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 193000 | -| policy_gradient_loss | 0.0184 | -| std | 0.00826 | -| value_loss | 1.38e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19302 | -| time_elapsed | 104381 | -| total_timesteps | 2470656 | -| train/ | | -| approx_kl | 0.122599065 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.00936 | -| learning_rate | 0.0003 | -| loss | 0.0492 | -| n_updates | 193010 | -| policy_gradient_loss | 0.0126 | -| std | 0.00826 | -| value_loss | 5.85e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19303 | -| time_elapsed | 104386 | -| total_timesteps | 2470784 | -| train/ | | -| approx_kl | 0.012826236 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 193020 | -| policy_gradient_loss | 0.0164 | -| std | 0.00826 | -| value_loss | 2.76e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19304 | -| time_elapsed | 104390 | -| total_timesteps | 2470912 | -| train/ | | -| approx_kl | 0.16195843 | -| clip_fraction | 0.624 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 193030 | -| policy_gradient_loss | 0.0847 | -| std | 0.00826 | -| value_loss | 1.99e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19305 | -| time_elapsed | 104394 | -| total_timesteps | 2471040 | -| train/ | | -| approx_kl | 0.112804845 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0773 | -| learning_rate | 0.0003 | -| loss | 0.0935 | -| n_updates | 193040 | -| policy_gradient_loss | 0.109 | -| std | 0.00826 | -| value_loss | 9.43e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19306 | -| time_elapsed | 104403 | -| total_timesteps | 2471168 | -| train/ | | -| approx_kl | 0.14704211 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | 0.097 | -| n_updates | 193050 | -| policy_gradient_loss | 0.0819 | -| std | 0.00826 | -| value_loss | 0.00229 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19307 | -| time_elapsed | 104407 | -| total_timesteps | 2471296 | -| train/ | | -| approx_kl | 0.025295839 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.51 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 193060 | -| policy_gradient_loss | 0.00628 | -| std | 0.00826 | -| value_loss | 2.25e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19308 | -| time_elapsed | 104412 | -| total_timesteps | 2471424 | -| train/ | | -| approx_kl | 0.3419732 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00913 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 193070 | -| policy_gradient_loss | 0.0371 | -| std | 0.00826 | -| value_loss | 2.32e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19309 | -| time_elapsed | 104417 | -| total_timesteps | 2471552 | -| train/ | | -| approx_kl | 0.028133001 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 193080 | -| policy_gradient_loss | 0.00163 | -| std | 0.00826 | -| value_loss | 1.61e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19310 | -| time_elapsed | 104421 | -| total_timesteps | 2471680 | -| train/ | | -| approx_kl | 0.03455759 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 193090 | -| policy_gradient_loss | 0.00946 | -| std | 0.00826 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19311 | -| time_elapsed | 104425 | -| total_timesteps | 2471808 | -| train/ | | -| approx_kl | 0.029247966 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 193100 | -| policy_gradient_loss | 0.00623 | -| std | 0.00826 | -| value_loss | 1.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19312 | -| time_elapsed | 104430 | -| total_timesteps | 2471936 | -| train/ | | -| approx_kl | 0.028496811 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 193110 | -| policy_gradient_loss | 0.0047 | -| std | 0.00826 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19313 | -| time_elapsed | 104434 | -| total_timesteps | 2472064 | -| train/ | | -| approx_kl | 0.026803624 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.00393 | -| n_updates | 193120 | -| policy_gradient_loss | 0.00181 | -| std | 0.00826 | -| value_loss | 3.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19314 | -| time_elapsed | 104441 | -| total_timesteps | 2472192 | -| train/ | | -| approx_kl | 0.03526097 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 193130 | -| policy_gradient_loss | -0.011 | -| std | 0.00826 | -| value_loss | 0.00192 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19315 | -| time_elapsed | 104445 | -| total_timesteps | 2472320 | -| train/ | | -| approx_kl | 0.04466971 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 193140 | -| policy_gradient_loss | 0.0238 | -| std | 0.00827 | -| value_loss | 2.71e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19316 | -| time_elapsed | 104450 | -| total_timesteps | 2472448 | -| train/ | | -| approx_kl | 0.21326701 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00423 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 193150 | -| policy_gradient_loss | 0.0984 | -| std | 0.00827 | -| value_loss | 3.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19317 | -| time_elapsed | 104455 | -| total_timesteps | 2472576 | -| train/ | | -| approx_kl | 0.037225667 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.00737 | -| n_updates | 193160 | -| policy_gradient_loss | 0.0155 | -| std | 0.00827 | -| value_loss | 1.98e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19318 | -| time_elapsed | 104461 | -| total_timesteps | 2472704 | -| train/ | | -| approx_kl | 0.10667845 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0605 | -| n_updates | 193170 | -| policy_gradient_loss | 0.0149 | -| std | 0.00826 | -| value_loss | 1.2e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19319 | -| time_elapsed | 104466 | -| total_timesteps | 2472832 | -| train/ | | -| approx_kl | 0.0072862944 | -| clip_fraction | 0.0523 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | -0.00222 | -| n_updates | 193180 | -| policy_gradient_loss | -0.00129 | -| std | 0.00826 | -| value_loss | 7.49e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19320 | -| time_elapsed | 104471 | -| total_timesteps | 2472960 | -| train/ | | -| approx_kl | 0.0088308435 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 193190 | -| policy_gradient_loss | -0.00129 | -| std | 0.00826 | -| value_loss | 4.49e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19321 | -| time_elapsed | 104476 | -| total_timesteps | 2473088 | -| train/ | | -| approx_kl | 0.012987129 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | -0.00903 | -| n_updates | 193200 | -| policy_gradient_loss | 0.00971 | -| std | 0.00826 | -| value_loss | 3.16e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19322 | -| time_elapsed | 104486 | -| total_timesteps | 2473216 | -| train/ | | -| approx_kl | 0.2066751 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | 0.0562 | -| n_updates | 193210 | -| policy_gradient_loss | 0.0488 | -| std | 0.00826 | -| value_loss | 0.00185 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19323 | -| time_elapsed | 104492 | -| total_timesteps | 2473344 | -| train/ | | -| approx_kl | 0.06407462 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 193220 | -| policy_gradient_loss | 0.0195 | -| std | 0.00825 | -| value_loss | 7.19e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19324 | -| time_elapsed | 104496 | -| total_timesteps | 2473472 | -| train/ | | -| approx_kl | 0.0036418536 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | 0.00565 | -| n_updates | 193230 | -| policy_gradient_loss | 0.00864 | -| std | 0.00825 | -| value_loss | 1.09e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19325 | -| time_elapsed | 104501 | -| total_timesteps | 2473600 | -| train/ | | -| approx_kl | 0.03284088 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 193240 | -| policy_gradient_loss | 0.0129 | -| std | 0.00825 | -| value_loss | 7.78e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19326 | -| time_elapsed | 104507 | -| total_timesteps | 2473728 | -| train/ | | -| approx_kl | 0.00029198965 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0808 | -| learning_rate | 0.0003 | -| loss | 0.000461 | -| n_updates | 193250 | -| policy_gradient_loss | 0.0227 | -| std | 0.00825 | -| value_loss | 3.24e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19327 | -| time_elapsed | 104510 | -| total_timesteps | 2473856 | -| train/ | | -| approx_kl | 0.1279061 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.0621 | -| n_updates | 193260 | -| policy_gradient_loss | 0.0145 | -| std | 0.00825 | -| value_loss | 2.79e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19328 | -| time_elapsed | 104515 | -| total_timesteps | 2473984 | -| train/ | | -| approx_kl | 0.13271192 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 193270 | -| policy_gradient_loss | 0.00337 | -| std | 0.00825 | -| value_loss | 7.25e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19329 | -| time_elapsed | 104519 | -| total_timesteps | 2474112 | -| train/ | | -| approx_kl | 0.040863745 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.324 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 193280 | -| policy_gradient_loss | 0.0222 | -| std | 0.00825 | -| value_loss | 8.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19330 | -| time_elapsed | 104527 | -| total_timesteps | 2474240 | -| train/ | | -| approx_kl | 0.02169606 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 193290 | -| policy_gradient_loss | -0.014 | -| std | 0.00825 | -| value_loss | 6.58e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19331 | -| time_elapsed | 104531 | -| total_timesteps | 2474368 | -| train/ | | -| approx_kl | 0.03281322 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.0018 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 193300 | -| policy_gradient_loss | 0.00529 | -| std | 0.00825 | -| value_loss | 4.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19332 | -| time_elapsed | 104535 | -| total_timesteps | 2474496 | -| train/ | | -| approx_kl | 0.034754977 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.00928 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 193310 | -| policy_gradient_loss | 0.0104 | -| std | 0.00824 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19333 | -| time_elapsed | 104538 | -| total_timesteps | 2474624 | -| train/ | | -| approx_kl | 0.005346896 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 193320 | -| policy_gradient_loss | 0.00356 | -| std | 0.00824 | -| value_loss | 7.01e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19334 | -| time_elapsed | 104542 | -| total_timesteps | 2474752 | -| train/ | | -| approx_kl | 0.052926548 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 193330 | -| policy_gradient_loss | 0.00436 | -| std | 0.00823 | -| value_loss | 5.74e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19335 | -| time_elapsed | 104546 | -| total_timesteps | 2474880 | -| train/ | | -| approx_kl | 0.026579788 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 193340 | -| policy_gradient_loss | -0.00714 | -| std | 0.00823 | -| value_loss | 3.42e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19336 | -| time_elapsed | 104550 | -| total_timesteps | 2475008 | -| train/ | | -| approx_kl | 0.0042943824 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 193350 | -| policy_gradient_loss | 0.00403 | -| std | 0.00823 | -| value_loss | 2.26e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19337 | -| time_elapsed | 104561 | -| total_timesteps | 2475136 | -| train/ | | -| approx_kl | 0.006628808 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.9 | -| learning_rate | 0.0003 | -| loss | -0.000592 | -| n_updates | 193360 | -| policy_gradient_loss | -0.00862 | -| std | 0.00822 | -| value_loss | 0.00142 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19338 | -| time_elapsed | 104566 | -| total_timesteps | 2475264 | -| train/ | | -| approx_kl | 0.03400311 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.499 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 193370 | -| policy_gradient_loss | 0.00476 | -| std | 0.00822 | -| value_loss | 4.58e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19339 | -| time_elapsed | 104569 | -| total_timesteps | 2475392 | -| train/ | | -| approx_kl | 0.012891163 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 193380 | -| policy_gradient_loss | 0.000632 | -| std | 0.00822 | -| value_loss | 2.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19340 | -| time_elapsed | 104573 | -| total_timesteps | 2475520 | -| train/ | | -| approx_kl | 0.0005107047 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | 0.000842 | -| n_updates | 193390 | -| policy_gradient_loss | 0.00381 | -| std | 0.00821 | -| value_loss | 2.97e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19341 | -| time_elapsed | 104577 | -| total_timesteps | 2475648 | -| train/ | | -| approx_kl | 0.048279382 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 193400 | -| policy_gradient_loss | 0.00782 | -| std | 0.00821 | -| value_loss | 4.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19342 | -| time_elapsed | 104582 | -| total_timesteps | 2475776 | -| train/ | | -| approx_kl | 0.089540236 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0821 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 193410 | -| policy_gradient_loss | 0.0503 | -| std | 0.00821 | -| value_loss | 1.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19343 | -| time_elapsed | 104587 | -| total_timesteps | 2475904 | -| train/ | | -| approx_kl | 0.15279067 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 193420 | -| policy_gradient_loss | 0.0296 | -| std | 0.0082 | -| value_loss | 1.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19344 | -| time_elapsed | 104592 | -| total_timesteps | 2476032 | -| train/ | | -| approx_kl | 0.080905676 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 193430 | -| policy_gradient_loss | 0.0113 | -| std | 0.0082 | -| value_loss | 5.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19345 | -| time_elapsed | 104603 | -| total_timesteps | 2476160 | -| train/ | | -| approx_kl | 0.028857999 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | 0.761 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 193440 | -| policy_gradient_loss | -0.00894 | -| std | 0.0082 | -| value_loss | 0.00641 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19346 | -| time_elapsed | 104608 | -| total_timesteps | 2476288 | -| train/ | | -| approx_kl | 0.00616791 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0859 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 193450 | -| policy_gradient_loss | 0.0148 | -| std | 0.0082 | -| value_loss | 1.07e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19347 | -| time_elapsed | 104613 | -| total_timesteps | 2476416 | -| train/ | | -| approx_kl | 0.05484552 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.00981 | -| n_updates | 193460 | -| policy_gradient_loss | 0.0147 | -| std | 0.0082 | -| value_loss | 4.27e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19348 | -| time_elapsed | 104616 | -| total_timesteps | 2476544 | -| train/ | | -| approx_kl | 0.08502385 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.38 | -| explained_variance | -0.406 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 193470 | -| policy_gradient_loss | 0.0186 | -| std | 0.0082 | -| value_loss | 1.97e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19349 | -| time_elapsed | 104620 | -| total_timesteps | 2476672 | -| train/ | | -| approx_kl | 0.00030711573 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | -0.000216 | -| n_updates | 193480 | -| policy_gradient_loss | 0.0193 | -| std | 0.00819 | -| value_loss | 1.22e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19350 | -| time_elapsed | 104623 | -| total_timesteps | 2476800 | -| train/ | | -| approx_kl | 0.16983151 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 193490 | -| policy_gradient_loss | 0.136 | -| std | 0.00816 | -| value_loss | 0.00328 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19351 | -| time_elapsed | 104627 | -| total_timesteps | 2476928 | -| train/ | | -| approx_kl | 0.02957793 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.000896 | -| n_updates | 193500 | -| policy_gradient_loss | 0.0117 | -| std | 0.00815 | -| value_loss | 0.000347 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19352 | -| time_elapsed | 104631 | -| total_timesteps | 2477056 | -| train/ | | -| approx_kl | 0.1225502 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.00177 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 193510 | -| policy_gradient_loss | 0.00879 | -| std | 0.00814 | -| value_loss | 0.000107 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19353 | -| time_elapsed | 104641 | -| total_timesteps | 2477184 | -| train/ | | -| approx_kl | 0.118348144 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | 0.00958 | -| n_updates | 193520 | -| policy_gradient_loss | 0.00091 | -| std | 0.00814 | -| value_loss | 0.00393 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19354 | -| time_elapsed | 104646 | -| total_timesteps | 2477312 | -| train/ | | -| approx_kl | 0.049557343 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 193530 | -| policy_gradient_loss | 0.0283 | -| std | 0.00814 | -| value_loss | 2.13e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19355 | -| time_elapsed | 104651 | -| total_timesteps | 2477440 | -| train/ | | -| approx_kl | 0.09693752 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.0524 | -| n_updates | 193540 | -| policy_gradient_loss | 0.022 | -| std | 0.00814 | -| value_loss | 1.76e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19356 | -| time_elapsed | 104654 | -| total_timesteps | 2477568 | -| train/ | | -| approx_kl | 0.023425417 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 193550 | -| policy_gradient_loss | -8.6e-05 | -| std | 0.00814 | -| value_loss | 9.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19357 | -| time_elapsed | 104660 | -| total_timesteps | 2477696 | -| train/ | | -| approx_kl | 0.38086668 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 193560 | -| policy_gradient_loss | 0.0493 | -| std | 0.00813 | -| value_loss | 8.93e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19358 | -| time_elapsed | 104665 | -| total_timesteps | 2477824 | -| train/ | | -| approx_kl | 0.03771842 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.00627 | -| n_updates | 193570 | -| policy_gradient_loss | 0.00214 | -| std | 0.00813 | -| value_loss | 5.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19359 | -| time_elapsed | 104669 | -| total_timesteps | 2477952 | -| train/ | | -| approx_kl | 0.023225086 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.00453 | -| n_updates | 193580 | -| policy_gradient_loss | 0.00244 | -| std | 0.00813 | -| value_loss | 3.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19360 | -| time_elapsed | 104673 | -| total_timesteps | 2478080 | -| train/ | | -| approx_kl | 0.030850645 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.000612 | -| n_updates | 193590 | -| policy_gradient_loss | -0.000245 | -| std | 0.00813 | -| value_loss | 2.24e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19361 | -| time_elapsed | 104681 | -| total_timesteps | 2478208 | -| train/ | | -| approx_kl | 0.0061292867 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 193600 | -| policy_gradient_loss | 0.00181 | -| std | 0.00813 | -| value_loss | 0.000108 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19362 | -| time_elapsed | 104686 | -| total_timesteps | 2478336 | -| train/ | | -| approx_kl | 0.0010425742 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0771 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 193610 | -| policy_gradient_loss | 0.0266 | -| std | 0.00813 | -| value_loss | 9.11e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19363 | -| time_elapsed | 104691 | -| total_timesteps | 2478464 | -| train/ | | -| approx_kl | 0.0016373196 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | -0.00982 | -| n_updates | 193620 | -| policy_gradient_loss | 0.0247 | -| std | 0.00812 | -| value_loss | 6.97e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19364 | -| time_elapsed | 104696 | -| total_timesteps | 2478592 | -| train/ | | -| approx_kl | 0.0029919897 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.39 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 193630 | -| policy_gradient_loss | 0.0251 | -| std | 0.00812 | -| value_loss | 1.05e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19365 | -| time_elapsed | 104701 | -| total_timesteps | 2478720 | -| train/ | | -| approx_kl | 0.16640736 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 193640 | -| policy_gradient_loss | 0.00461 | -| std | 0.00811 | -| value_loss | 1.22e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19366 | -| time_elapsed | 104706 | -| total_timesteps | 2478848 | -| train/ | | -| approx_kl | 0.13285907 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00944 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 193650 | -| policy_gradient_loss | 0.0154 | -| std | 0.00811 | -| value_loss | 1.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 19367 | -| time_elapsed | 104710 | -| total_timesteps | 2478976 | -| train/ | | -| approx_kl | 0.012017364 | -| clip_fraction | 0.0758 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | 0.00719 | -| n_updates | 193660 | -| policy_gradient_loss | 0.000863 | -| std | 0.00807 | -| value_loss | 7.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19368 | -| time_elapsed | 104715 | -| total_timesteps | 2479104 | -| train/ | | -| approx_kl | 0.020491056 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.956 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 193670 | -| policy_gradient_loss | 0.00787 | -| std | 0.00805 | -| value_loss | 5.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19369 | -| time_elapsed | 104727 | -| total_timesteps | 2479232 | -| train/ | | -| approx_kl | 0.30394718 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0658 | -| learning_rate | 0.0003 | -| loss | 0.00692 | -| n_updates | 193680 | -| policy_gradient_loss | 0.0106 | -| std | 0.00805 | -| value_loss | 0.00184 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19370 | -| time_elapsed | 104732 | -| total_timesteps | 2479360 | -| train/ | | -| approx_kl | 0.22459126 | -| clip_fraction | 0.694 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00155 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 193690 | -| policy_gradient_loss | 0.157 | -| std | 0.00804 | -| value_loss | 2.85e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19371 | -| time_elapsed | 104737 | -| total_timesteps | 2479488 | -| train/ | | -| approx_kl | 0.15152974 | -| clip_fraction | 0.656 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.0698 | -| n_updates | 193700 | -| policy_gradient_loss | 0.0955 | -| std | 0.00806 | -| value_loss | 4.35e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19372 | -| time_elapsed | 104742 | -| total_timesteps | 2479616 | -| train/ | | -| approx_kl | 0.1305309 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -10.3 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 193710 | -| policy_gradient_loss | -0.0053 | -| std | 0.00806 | -| value_loss | 2.06e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19373 | -| time_elapsed | 104746 | -| total_timesteps | 2479744 | -| train/ | | -| approx_kl | 0.019891333 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -6.04 | -| learning_rate | 0.0003 | -| loss | 0.00012 | -| n_updates | 193720 | -| policy_gradient_loss | 0.0178 | -| std | 0.00805 | -| value_loss | 5.14e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 19374 | -| time_elapsed | 104749 | -| total_timesteps | 2479872 | -| train/ | | -| approx_kl | 0.6202385 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.283 | -| n_updates | 193730 | -| policy_gradient_loss | 0.142 | -| std | 0.00805 | -| value_loss | 7.49e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19375 | -| time_elapsed | 104753 | -| total_timesteps | 2480000 | -| train/ | | -| approx_kl | 0.0058784494 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 193740 | -| policy_gradient_loss | 0.0154 | -| std | 0.00805 | -| value_loss | 6.88e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19376 | -| time_elapsed | 104757 | -| total_timesteps | 2480128 | -| train/ | | -| approx_kl | 0.11393914 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.00347 | -| learning_rate | 0.0003 | -| loss | 0.0681 | -| n_updates | 193750 | -| policy_gradient_loss | 0.0172 | -| std | 0.00805 | -| value_loss | 5.04e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19377 | -| time_elapsed | 104771 | -| total_timesteps | 2480256 | -| train/ | | -| approx_kl | 0.25954655 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.713 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 193760 | -| policy_gradient_loss | 0.00681 | -| std | 0.00805 | -| value_loss | 0.000965 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19378 | -| time_elapsed | 104776 | -| total_timesteps | 2480384 | -| train/ | | -| approx_kl | 0.017242644 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 193770 | -| policy_gradient_loss | -0.00139 | -| std | 0.00806 | -| value_loss | 4.97e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19379 | -| time_elapsed | 104781 | -| total_timesteps | 2480512 | -| train/ | | -| approx_kl | 0.0712296 | -| clip_fraction | 0.636 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 193780 | -| policy_gradient_loss | 0.0856 | -| std | 0.00806 | -| value_loss | 3.41e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19380 | -| time_elapsed | 104784 | -| total_timesteps | 2480640 | -| train/ | | -| approx_kl | 0.088554755 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0707 | -| n_updates | 193790 | -| policy_gradient_loss | 0.0994 | -| std | 0.00806 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19381 | -| time_elapsed | 104789 | -| total_timesteps | 2480768 | -| train/ | | -| approx_kl | 0.08320321 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 193800 | -| policy_gradient_loss | 0.0981 | -| std | 0.00806 | -| value_loss | 9.67e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19382 | -| time_elapsed | 104793 | -| total_timesteps | 2480896 | -| train/ | | -| approx_kl | 0.020480951 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 193810 | -| policy_gradient_loss | 0.0178 | -| std | 0.00806 | -| value_loss | 8.85e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19383 | -| time_elapsed | 104798 | -| total_timesteps | 2481024 | -| train/ | | -| approx_kl | 0.42798054 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.22 | -| n_updates | 193820 | -| policy_gradient_loss | 0.0586 | -| std | 0.00806 | -| value_loss | 5.15e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19384 | -| time_elapsed | 104808 | -| total_timesteps | 2481152 | -| train/ | | -| approx_kl | 0.13136527 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 193830 | -| policy_gradient_loss | -0.0127 | -| std | 0.00806 | -| value_loss | 0.000188 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19385 | -| time_elapsed | 104813 | -| total_timesteps | 2481280 | -| train/ | | -| approx_kl | 0.010218117 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.4 | -| explained_variance | -0.427 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 193840 | -| policy_gradient_loss | 0.00351 | -| std | 0.00801 | -| value_loss | 3.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19386 | -| time_elapsed | 104818 | -| total_timesteps | 2481408 | -| train/ | | -| approx_kl | 0.17312045 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | 0.0617 | -| n_updates | 193850 | -| policy_gradient_loss | 0.00459 | -| std | 0.00798 | -| value_loss | 2.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19387 | -| time_elapsed | 104822 | -| total_timesteps | 2481536 | -| train/ | | -| approx_kl | 0.010693286 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.0072 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 193860 | -| policy_gradient_loss | 0.0223 | -| std | 0.00796 | -| value_loss | 2.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19388 | -| time_elapsed | 104828 | -| total_timesteps | 2481664 | -| train/ | | -| approx_kl | 0.03584758 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -5.97 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 193870 | -| policy_gradient_loss | 0.0032 | -| std | 0.00796 | -| value_loss | 9.76e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19389 | -| time_elapsed | 104832 | -| total_timesteps | 2481792 | -| train/ | | -| approx_kl | 0.010813432 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00931 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 193880 | -| policy_gradient_loss | -0.00345 | -| std | 0.00796 | -| value_loss | 5.52e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19390 | -| time_elapsed | 104836 | -| total_timesteps | 2481920 | -| train/ | | -| approx_kl | 0.07106654 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 193890 | -| policy_gradient_loss | 0.0364 | -| std | 0.00795 | -| value_loss | 3.88e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19391 | -| time_elapsed | 104841 | -| total_timesteps | 2482048 | -| train/ | | -| approx_kl | 0.25307074 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 193900 | -| policy_gradient_loss | 0.117 | -| std | 0.00795 | -| value_loss | 2.88e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19392 | -| time_elapsed | 104848 | -| total_timesteps | 2482176 | -| train/ | | -| approx_kl | 0.08621323 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | 0.0417 | -| n_updates | 193910 | -| policy_gradient_loss | 0.0424 | -| std | 0.00795 | -| value_loss | 0.000398 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19393 | -| time_elapsed | 104852 | -| total_timesteps | 2482304 | -| train/ | | -| approx_kl | 0.009792246 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0847 | -| learning_rate | 0.0003 | -| loss | 0.000711 | -| n_updates | 193920 | -| policy_gradient_loss | 0.0178 | -| std | 0.00795 | -| value_loss | 8.47e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19394 | -| time_elapsed | 104855 | -| total_timesteps | 2482432 | -| train/ | | -| approx_kl | 0.48657972 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00814 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 193930 | -| policy_gradient_loss | 0.0547 | -| std | 0.00795 | -| value_loss | 9.91e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19395 | -| time_elapsed | 104860 | -| total_timesteps | 2482560 | -| train/ | | -| approx_kl | 0.0312604 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 193940 | -| policy_gradient_loss | 0.00584 | -| std | 0.00795 | -| value_loss | 6.89e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19396 | -| time_elapsed | 104864 | -| total_timesteps | 2482688 | -| train/ | | -| approx_kl | 0.005783303 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | -0.000439 | -| n_updates | 193950 | -| policy_gradient_loss | 0.00417 | -| std | 0.00795 | -| value_loss | 4.87e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19397 | -| time_elapsed | 104869 | -| total_timesteps | 2482816 | -| train/ | | -| approx_kl | 0.0028013238 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0882 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 193960 | -| policy_gradient_loss | 0.00834 | -| std | 0.00795 | -| value_loss | 2.75e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19398 | -| time_elapsed | 104874 | -| total_timesteps | 2482944 | -| train/ | | -| approx_kl | 0.026789824 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0724 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 193970 | -| policy_gradient_loss | 0.111 | -| std | 0.00794 | -| value_loss | 1.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19399 | -| time_elapsed | 104878 | -| total_timesteps | 2483072 | -| train/ | | -| approx_kl | 0.067167975 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 193980 | -| policy_gradient_loss | 0.0992 | -| std | 0.00794 | -| value_loss | 4.96e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19400 | -| time_elapsed | 104887 | -| total_timesteps | 2483200 | -| train/ | | -| approx_kl | 0.018678145 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.757 | -| learning_rate | 0.0003 | -| loss | 0.0011 | -| n_updates | 193990 | -| policy_gradient_loss | 0.0228 | -| std | 0.00794 | -| value_loss | 0.00419 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19401 | -| time_elapsed | 104894 | -| total_timesteps | 2483328 | -| train/ | | -| approx_kl | 0.111316316 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | 0.0604 | -| n_updates | 194000 | -| policy_gradient_loss | 0.0144 | -| std | 0.00794 | -| value_loss | 4.76e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19402 | -| time_elapsed | 104899 | -| total_timesteps | 2483456 | -| train/ | | -| approx_kl | 0.0110247 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | 0.00862 | -| n_updates | 194010 | -| policy_gradient_loss | 0.00356 | -| std | 0.00794 | -| value_loss | 4.48e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19403 | -| time_elapsed | 104902 | -| total_timesteps | 2483584 | -| train/ | | -| approx_kl | 0.16108866 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0711 | -| learning_rate | 0.0003 | -| loss | 0.0822 | -| n_updates | 194020 | -| policy_gradient_loss | 0.0215 | -| std | 0.00796 | -| value_loss | 0.000598 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19404 | -| time_elapsed | 104907 | -| total_timesteps | 2483712 | -| train/ | | -| approx_kl | 0.19502535 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 194030 | -| policy_gradient_loss | 0.0323 | -| std | 0.00797 | -| value_loss | 0.0238 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19405 | -| time_elapsed | 104912 | -| total_timesteps | 2483840 | -| train/ | | -| approx_kl | 0.046643045 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.0381 | -| n_updates | 194040 | -| policy_gradient_loss | 0.0619 | -| std | 0.00798 | -| value_loss | 0.00487 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19406 | -| time_elapsed | 104918 | -| total_timesteps | 2483968 | -| train/ | | -| approx_kl | 0.012287634 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | -0.000804 | -| n_updates | 194050 | -| policy_gradient_loss | 0.0116 | -| std | 0.00798 | -| value_loss | 0.0025 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19407 | -| time_elapsed | 104921 | -| total_timesteps | 2484096 | -| train/ | | -| approx_kl | 0.024652904 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00478 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 194060 | -| policy_gradient_loss | 0.0307 | -| std | 0.00798 | -| value_loss | 0.00145 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19408 | -| time_elapsed | 104933 | -| total_timesteps | 2484224 | -| train/ | | -| approx_kl | 0.009358339 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.573 | -| learning_rate | 0.0003 | -| loss | 0.00679 | -| n_updates | 194070 | -| policy_gradient_loss | 0.00594 | -| std | 0.00799 | -| value_loss | 0.00917 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19409 | -| time_elapsed | 104939 | -| total_timesteps | 2484352 | -| train/ | | -| approx_kl | 0.013813428 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 194080 | -| policy_gradient_loss | 0.00376 | -| std | 0.00799 | -| value_loss | 0.00042 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19410 | -| time_elapsed | 104944 | -| total_timesteps | 2484480 | -| train/ | | -| approx_kl | 0.0025757016 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 194090 | -| policy_gradient_loss | 0.000449 | -| std | 0.00799 | -| value_loss | 0.000446 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19411 | -| time_elapsed | 104949 | -| total_timesteps | 2484608 | -| train/ | | -| approx_kl | 1.7591752e-05 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0005 | -| n_updates | 194100 | -| policy_gradient_loss | 0.00153 | -| std | 0.00799 | -| value_loss | 0.000417 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19412 | -| time_elapsed | 104953 | -| total_timesteps | 2484736 | -| train/ | | -| approx_kl | 0.00023997249 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 194110 | -| policy_gradient_loss | 0.00656 | -| std | 0.00799 | -| value_loss | 0.00037 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19413 | -| time_elapsed | 104958 | -| total_timesteps | 2484864 | -| train/ | | -| approx_kl | 0.054953694 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 194120 | -| policy_gradient_loss | 0.0578 | -| std | 0.00799 | -| value_loss | 0.000353 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19414 | -| time_elapsed | 104961 | -| total_timesteps | 2484992 | -| train/ | | -| approx_kl | 0.1697247 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.00958 | -| learning_rate | 0.0003 | -| loss | 0.0919 | -| n_updates | 194130 | -| policy_gradient_loss | 0.0334 | -| std | 0.00799 | -| value_loss | 0.00034 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19415 | -| time_elapsed | 104966 | -| total_timesteps | 2485120 | -| train/ | | -| approx_kl | 0.0007917085 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0077 | -| learning_rate | 0.0003 | -| loss | -0.00157 | -| n_updates | 194140 | -| policy_gradient_loss | 0.0118 | -| std | 0.008 | -| value_loss | 0.000256 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19416 | -| time_elapsed | 104978 | -| total_timesteps | 2485248 | -| train/ | | -| approx_kl | 0.033736702 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -1.29 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 194150 | -| policy_gradient_loss | 0.0257 | -| std | 0.008 | -| value_loss | 0.00296 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19417 | -| time_elapsed | 104982 | -| total_timesteps | 2485376 | -| train/ | | -| approx_kl | 0.04242139 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 194160 | -| policy_gradient_loss | 0.0193 | -| std | 0.008 | -| value_loss | 9.77e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19418 | -| time_elapsed | 104988 | -| total_timesteps | 2485504 | -| train/ | | -| approx_kl | 0.05338399 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0844 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 194170 | -| policy_gradient_loss | 0.0418 | -| std | 0.008 | -| value_loss | 5.71e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19419 | -| time_elapsed | 104992 | -| total_timesteps | 2485632 | -| train/ | | -| approx_kl | 0.0010025841 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 194180 | -| policy_gradient_loss | 0.0747 | -| std | 0.008 | -| value_loss | 4.99e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19420 | -| time_elapsed | 104997 | -| total_timesteps | 2485760 | -| train/ | | -| approx_kl | 0.10216987 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.0997 | -| n_updates | 194190 | -| policy_gradient_loss | 0.195 | -| std | 0.008 | -| value_loss | 3e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 19421 | -| time_elapsed | 105002 | -| total_timesteps | 2485888 | -| train/ | | -| approx_kl | 0.05971791 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 194200 | -| policy_gradient_loss | 0.0341 | -| std | 0.008 | -| value_loss | 2.89e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19422 | -| time_elapsed | 105007 | -| total_timesteps | 2486016 | -| train/ | | -| approx_kl | 0.08512666 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0556 | -| n_updates | 194210 | -| policy_gradient_loss | 0.0237 | -| std | 0.008 | -| value_loss | 2.1e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19423 | -| time_elapsed | 105017 | -| total_timesteps | 2486144 | -| train/ | | -| approx_kl | 0.16243549 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.765 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 194220 | -| policy_gradient_loss | -0.0156 | -| std | 0.00799 | -| value_loss | 0.00436 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19424 | -| time_elapsed | 105022 | -| total_timesteps | 2486272 | -| train/ | | -| approx_kl | 0.014252216 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00686 | -| learning_rate | 0.0003 | -| loss | 0.00809 | -| n_updates | 194230 | -| policy_gradient_loss | 0.0181 | -| std | 0.00799 | -| value_loss | 1.33e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19425 | -| time_elapsed | 105026 | -| total_timesteps | 2486400 | -| train/ | | -| approx_kl | 0.0013737702 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 194240 | -| policy_gradient_loss | 0.0181 | -| std | 0.00797 | -| value_loss | 3.13e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19426 | -| time_elapsed | 105029 | -| total_timesteps | 2486528 | -| train/ | | -| approx_kl | 0.0059868093 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.00739 | -| n_updates | 194250 | -| policy_gradient_loss | 0.0144 | -| std | 0.00796 | -| value_loss | 0.000118 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19427 | -| time_elapsed | 105032 | -| total_timesteps | 2486656 | -| train/ | | -| approx_kl | 0.0018439009 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.41 | -| explained_variance | 0.00263 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 194260 | -| policy_gradient_loss | 0.0181 | -| std | 0.00795 | -| value_loss | 2.4e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19428 | -| time_elapsed | 105036 | -| total_timesteps | 2486784 | -| train/ | | -| approx_kl | 0.053609986 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 194270 | -| policy_gradient_loss | 0.0178 | -| std | 0.00795 | -| value_loss | 1.08e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 19429 | -| time_elapsed | 105040 | -| total_timesteps | 2486912 | -| train/ | | -| approx_kl | 0.1913726 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 194280 | -| policy_gradient_loss | 0.0906 | -| std | 0.00795 | -| value_loss | 1.19e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19430 | -| time_elapsed | 105045 | -| total_timesteps | 2487040 | -| train/ | | -| approx_kl | 0.11865662 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0767 | -| n_updates | 194290 | -| policy_gradient_loss | 0.103 | -| std | 0.00795 | -| value_loss | 7.02e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19431 | -| time_elapsed | 105056 | -| total_timesteps | 2487168 | -| train/ | | -| approx_kl | 0.04608505 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -2.62 | -| learning_rate | 0.0003 | -| loss | 0.00718 | -| n_updates | 194300 | -| policy_gradient_loss | 0.0126 | -| std | 0.00795 | -| value_loss | 0.00244 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19432 | -| time_elapsed | 105061 | -| total_timesteps | 2487296 | -| train/ | | -| approx_kl | 0.0048980154 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.535 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 194310 | -| policy_gradient_loss | 0.015 | -| std | 0.00795 | -| value_loss | 3.11e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19433 | -| time_elapsed | 105067 | -| total_timesteps | 2487424 | -| train/ | | -| approx_kl | 0.1514569 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 194320 | -| policy_gradient_loss | 0.0475 | -| std | 0.00795 | -| value_loss | 2.74e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19434 | -| time_elapsed | 105071 | -| total_timesteps | 2487552 | -| train/ | | -| approx_kl | 0.06262574 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | 0.0374 | -| n_updates | 194330 | -| policy_gradient_loss | 0.0123 | -| std | 0.00795 | -| value_loss | 2.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19435 | -| time_elapsed | 105075 | -| total_timesteps | 2487680 | -| train/ | | -| approx_kl | 0.02873692 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 194340 | -| policy_gradient_loss | 0.0102 | -| std | 0.00795 | -| value_loss | 1.67e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19436 | -| time_elapsed | 105080 | -| total_timesteps | 2487808 | -| train/ | | -| approx_kl | 0.03700068 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 194350 | -| policy_gradient_loss | 0.0109 | -| std | 0.00795 | -| value_loss | 1.36e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19437 | -| time_elapsed | 105084 | -| total_timesteps | 2487936 | -| train/ | | -| approx_kl | 0.03589451 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 194360 | -| policy_gradient_loss | 0.00967 | -| std | 0.00795 | -| value_loss | 1.25e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19438 | -| time_elapsed | 105090 | -| total_timesteps | 2488064 | -| train/ | | -| approx_kl | 0.030628126 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | -0.000802 | -| n_updates | 194370 | -| policy_gradient_loss | -0.000614 | -| std | 0.00795 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19439 | -| time_elapsed | 105101 | -| total_timesteps | 2488192 | -| train/ | | -| approx_kl | 0.0068110516 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 194380 | -| policy_gradient_loss | -0.0109 | -| std | 0.00795 | -| value_loss | 0.000223 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19440 | -| time_elapsed | 105106 | -| total_timesteps | 2488320 | -| train/ | | -| approx_kl | 0.036978014 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00981 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 194390 | -| policy_gradient_loss | 0.00242 | -| std | 0.00795 | -| value_loss | 4.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19441 | -| time_elapsed | 105110 | -| total_timesteps | 2488448 | -| train/ | | -| approx_kl | 0.034044996 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00792 | -| learning_rate | 0.0003 | -| loss | 0.0257 | -| n_updates | 194400 | -| policy_gradient_loss | 0.0134 | -| std | 0.00795 | -| value_loss | 1.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19442 | -| time_elapsed | 105115 | -| total_timesteps | 2488576 | -| train/ | | -| approx_kl | 0.02936196 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00494 | -| n_updates | 194410 | -| policy_gradient_loss | 0.00193 | -| std | 0.00795 | -| value_loss | 1.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19443 | -| time_elapsed | 105120 | -| total_timesteps | 2488704 | -| train/ | | -| approx_kl | 0.006944667 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | -4.52e-05 | -| n_updates | 194420 | -| policy_gradient_loss | 0.00439 | -| std | 0.00794 | -| value_loss | 8.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19444 | -| time_elapsed | 105125 | -| total_timesteps | 2488832 | -| train/ | | -| approx_kl | 0.043278255 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 194430 | -| policy_gradient_loss | 0.0123 | -| std | 0.00794 | -| value_loss | 5.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19445 | -| time_elapsed | 105130 | -| total_timesteps | 2488960 | -| train/ | | -| approx_kl | 0.008146657 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.00187 | -| n_updates | 194440 | -| policy_gradient_loss | 0.00407 | -| std | 0.00793 | -| value_loss | 3.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19446 | -| time_elapsed | 105135 | -| total_timesteps | 2489088 | -| train/ | | -| approx_kl | 0.0018046079 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.556 | -| learning_rate | 0.0003 | -| loss | -0.000462 | -| n_updates | 194450 | -| policy_gradient_loss | 0.00371 | -| std | 0.00793 | -| value_loss | 1.07e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19447 | -| time_elapsed | 105143 | -| total_timesteps | 2489216 | -| train/ | | -| approx_kl | 0.0141953565 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 194460 | -| policy_gradient_loss | 0.00801 | -| std | 0.00792 | -| value_loss | 0.00517 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19448 | -| time_elapsed | 105148 | -| total_timesteps | 2489344 | -| train/ | | -| approx_kl | 0.0034824177 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 194470 | -| policy_gradient_loss | 0.0202 | -| std | 0.00792 | -| value_loss | 1.55e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19449 | -| time_elapsed | 105154 | -| total_timesteps | 2489472 | -| train/ | | -| approx_kl | 0.51901114 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00707 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 194480 | -| policy_gradient_loss | 0.0503 | -| std | 0.00792 | -| value_loss | 1.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19450 | -| time_elapsed | 105159 | -| total_timesteps | 2489600 | -| train/ | | -| approx_kl | 0.025125813 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | 0.00872 | -| n_updates | 194490 | -| policy_gradient_loss | 0.00499 | -| std | 0.00792 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19451 | -| time_elapsed | 105164 | -| total_timesteps | 2489728 | -| train/ | | -| approx_kl | 0.035204466 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 194500 | -| policy_gradient_loss | 0.00945 | -| std | 0.00792 | -| value_loss | 8.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19452 | -| time_elapsed | 105170 | -| total_timesteps | 2489856 | -| train/ | | -| approx_kl | 0.003793364 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 4.28e-05 | -| n_updates | 194510 | -| policy_gradient_loss | 0.00384 | -| std | 0.00792 | -| value_loss | 4.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19453 | -| time_elapsed | 105175 | -| total_timesteps | 2489984 | -| train/ | | -| approx_kl | 0.19313134 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 194520 | -| policy_gradient_loss | 0.0576 | -| std | 0.00792 | -| value_loss | 0.000194 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19454 | -| time_elapsed | 105181 | -| total_timesteps | 2490112 | -| train/ | | -| approx_kl | 0.004823518 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.625 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 194530 | -| policy_gradient_loss | 0.0597 | -| std | 0.00792 | -| value_loss | 3.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19455 | -| time_elapsed | 105192 | -| total_timesteps | 2490240 | -| train/ | | -| approx_kl | 0.037433874 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.695 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 194540 | -| policy_gradient_loss | -0.0049 | -| std | 0.00791 | -| value_loss | 0.0086 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19456 | -| time_elapsed | 105196 | -| total_timesteps | 2490368 | -| train/ | | -| approx_kl | 0.25718695 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -236 | -| learning_rate | 0.0003 | -| loss | 0.0501 | -| n_updates | 194550 | -| policy_gradient_loss | 0.0159 | -| std | 0.00791 | -| value_loss | 3.11e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19457 | -| time_elapsed | 105200 | -| total_timesteps | 2490496 | -| train/ | | -| approx_kl | 0.037602246 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.00562 | -| n_updates | 194560 | -| policy_gradient_loss | 0.0426 | -| std | 0.0079 | -| value_loss | 4.71e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19458 | -| time_elapsed | 105205 | -| total_timesteps | 2490624 | -| train/ | | -| approx_kl | 0.14376959 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | 0.0634 | -| n_updates | 194570 | -| policy_gradient_loss | 0.0237 | -| std | 0.0079 | -| value_loss | 5.15e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19459 | -| time_elapsed | 105209 | -| total_timesteps | 2490752 | -| train/ | | -| approx_kl | 0.04067959 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.00726 | -| n_updates | 194580 | -| policy_gradient_loss | 0.0485 | -| std | 0.0079 | -| value_loss | 4.85e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 19460 | -| time_elapsed | 105214 | -| total_timesteps | 2490880 | -| train/ | | -| approx_kl | 0.2097386 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 194590 | -| policy_gradient_loss | 0.0286 | -| std | 0.0079 | -| value_loss | 4.61e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19461 | -| time_elapsed | 105217 | -| total_timesteps | 2491008 | -| train/ | | -| approx_kl | 0.00076631736 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00359 | -| n_updates | 194600 | -| policy_gradient_loss | -0.00065 | -| std | 0.0079 | -| value_loss | 3.9e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19462 | -| time_elapsed | 105227 | -| total_timesteps | 2491136 | -| train/ | | -| approx_kl | 0.0014994736 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | -0.00924 | -| n_updates | 194610 | -| policy_gradient_loss | 0.019 | -| std | 0.0079 | -| value_loss | 0.00518 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19463 | -| time_elapsed | 105232 | -| total_timesteps | 2491264 | -| train/ | | -| approx_kl | 0.010855834 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.384 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 194620 | -| policy_gradient_loss | 0.00944 | -| std | 0.0079 | -| value_loss | 1.1e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19464 | -| time_elapsed | 105236 | -| total_timesteps | 2491392 | -| train/ | | -| approx_kl | 0.31635776 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00749 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 194630 | -| policy_gradient_loss | 0.117 | -| std | 0.0079 | -| value_loss | 1.99e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19465 | -| time_elapsed | 105241 | -| total_timesteps | 2491520 | -| train/ | | -| approx_kl | 0.06133855 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00628 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 194640 | -| policy_gradient_loss | 0.0236 | -| std | 0.0079 | -| value_loss | 1.31e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19466 | -| time_elapsed | 105245 | -| total_timesteps | 2491648 | -| train/ | | -| approx_kl | 0.44950974 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 194650 | -| policy_gradient_loss | 0.0432 | -| std | 0.0079 | -| value_loss | 1.08e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19467 | -| time_elapsed | 105250 | -| total_timesteps | 2491776 | -| train/ | | -| approx_kl | 0.009936256 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0112 | -| learning_rate | 0.0003 | -| loss | -3.86e-06 | -| n_updates | 194660 | -| policy_gradient_loss | 0.00344 | -| std | 0.0079 | -| value_loss | 7.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19468 | -| time_elapsed | 105253 | -| total_timesteps | 2491904 | -| train/ | | -| approx_kl | 0.044476878 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.00757 | -| n_updates | 194670 | -| policy_gradient_loss | 0.0184 | -| std | 0.0079 | -| value_loss | 4.87e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19469 | -| time_elapsed | 105257 | -| total_timesteps | 2492032 | -| train/ | | -| approx_kl | 0.49880674 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 194680 | -| policy_gradient_loss | 0.0948 | -| std | 0.00791 | -| value_loss | 3.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19470 | -| time_elapsed | 105267 | -| total_timesteps | 2492160 | -| train/ | | -| approx_kl | 0.21927415 | -| clip_fraction | 0.46 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 194690 | -| policy_gradient_loss | 0.000762 | -| std | 0.00791 | -| value_loss | 0.000159 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19471 | -| time_elapsed | 105271 | -| total_timesteps | 2492288 | -| train/ | | -| approx_kl | 0.021022439 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.00877 | -| n_updates | 194700 | -| policy_gradient_loss | 0.0293 | -| std | 0.00791 | -| value_loss | 1.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19472 | -| time_elapsed | 105275 | -| total_timesteps | 2492416 | -| train/ | | -| approx_kl | 0.079647824 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 194710 | -| policy_gradient_loss | 0.0418 | -| std | 0.00791 | -| value_loss | 1.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19473 | -| time_elapsed | 105279 | -| total_timesteps | 2492544 | -| train/ | | -| approx_kl | 0.12035884 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0799 | -| n_updates | 194720 | -| policy_gradient_loss | 0.0213 | -| std | 0.0079 | -| value_loss | 1.01e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19474 | -| time_elapsed | 105285 | -| total_timesteps | 2492672 | -| train/ | | -| approx_kl | 0.11958751 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0528 | -| n_updates | 194730 | -| policy_gradient_loss | 0.0141 | -| std | 0.0079 | -| value_loss | 7.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19475 | -| time_elapsed | 105291 | -| total_timesteps | 2492800 | -| train/ | | -| approx_kl | 0.02116294 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 194740 | -| policy_gradient_loss | 0.0221 | -| std | 0.0079 | -| value_loss | 7.02e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19476 | -| time_elapsed | 105296 | -| total_timesteps | 2492928 | -| train/ | | -| approx_kl | 0.2011365 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 194750 | -| policy_gradient_loss | 0.118 | -| std | 0.00789 | -| value_loss | 2.7e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19477 | -| time_elapsed | 105301 | -| total_timesteps | 2493056 | -| train/ | | -| approx_kl | 0.031667605 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 194760 | -| policy_gradient_loss | 0.00936 | -| std | 0.00788 | -| value_loss | 2.2e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19478 | -| time_elapsed | 105309 | -| total_timesteps | 2493184 | -| train/ | | -| approx_kl | 0.06913903 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.541 | -| learning_rate | 0.0003 | -| loss | -0.000581 | -| n_updates | 194770 | -| policy_gradient_loss | -0.00335 | -| std | 0.00788 | -| value_loss | 0.000961 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19479 | -| time_elapsed | 105313 | -| total_timesteps | 2493312 | -| train/ | | -| approx_kl | 0.010445558 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.36 | -| learning_rate | 0.0003 | -| loss | 0.00195 | -| n_updates | 194780 | -| policy_gradient_loss | 0.0602 | -| std | 0.00788 | -| value_loss | 3.98e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19480 | -| time_elapsed | 105316 | -| total_timesteps | 2493440 | -| train/ | | -| approx_kl | 0.0066464534 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.000902 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 194790 | -| policy_gradient_loss | 0.0132 | -| std | 0.00788 | -| value_loss | 8.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19481 | -| time_elapsed | 105321 | -| total_timesteps | 2493568 | -| train/ | | -| approx_kl | 0.052171517 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 194800 | -| policy_gradient_loss | 0.0163 | -| std | 0.00789 | -| value_loss | 1.55e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19482 | -| time_elapsed | 105325 | -| total_timesteps | 2493696 | -| train/ | | -| approx_kl | 0.091967106 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0855 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 194810 | -| policy_gradient_loss | 0.0142 | -| std | 0.00789 | -| value_loss | 1.44e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19483 | -| time_elapsed | 105331 | -| total_timesteps | 2493824 | -| train/ | | -| approx_kl | 0.257551 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 194820 | -| policy_gradient_loss | 0.092 | -| std | 0.00789 | -| value_loss | 1.14e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19484 | -| time_elapsed | 105337 | -| total_timesteps | 2493952 | -| train/ | | -| approx_kl | 0.15432723 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 194830 | -| policy_gradient_loss | 0.0909 | -| std | 0.00789 | -| value_loss | 5.7e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19485 | -| time_elapsed | 105341 | -| total_timesteps | 2494080 | -| train/ | | -| approx_kl | 0.12795901 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.0861 | -| n_updates | 194840 | -| policy_gradient_loss | 0.101 | -| std | 0.0079 | -| value_loss | 4.44e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19486 | -| time_elapsed | 105351 | -| total_timesteps | 2494208 | -| train/ | | -| approx_kl | 0.029346835 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.000621 | -| n_updates | 194850 | -| policy_gradient_loss | 0.0232 | -| std | 0.0079 | -| value_loss | 0.000759 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19487 | -| time_elapsed | 105355 | -| total_timesteps | 2494336 | -| train/ | | -| approx_kl | 0.19721232 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.463 | -| learning_rate | 0.0003 | -| loss | 0.0725 | -| n_updates | 194860 | -| policy_gradient_loss | 0.0245 | -| std | 0.0079 | -| value_loss | 1.02e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19488 | -| time_elapsed | 105361 | -| total_timesteps | 2494464 | -| train/ | | -| approx_kl | 0.00028277142 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.00577 | -| n_updates | 194870 | -| policy_gradient_loss | -0.00993 | -| std | 0.0079 | -| value_loss | 3.03e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19489 | -| time_elapsed | 105365 | -| total_timesteps | 2494592 | -| train/ | | -| approx_kl | 0.047707498 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.0057 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 194880 | -| policy_gradient_loss | 0.0464 | -| std | 0.0079 | -| value_loss | 1.88e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19490 | -| time_elapsed | 105370 | -| total_timesteps | 2494720 | -| train/ | | -| approx_kl | 2.3789238e-05 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.00346 | -| learning_rate | 0.0003 | -| loss | -0.000201 | -| n_updates | 194890 | -| policy_gradient_loss | 0.0778 | -| std | 0.00789 | -| value_loss | 6.86e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19491 | -| time_elapsed | 105374 | -| total_timesteps | 2494848 | -| train/ | | -| approx_kl | 0.10074487 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0925 | -| learning_rate | 0.0003 | -| loss | 0.0723 | -| n_updates | 194900 | -| policy_gradient_loss | 0.148 | -| std | 0.00788 | -| value_loss | 1.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19492 | -| time_elapsed | 105379 | -| total_timesteps | 2494976 | -| train/ | | -| approx_kl | 0.051103827 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | 0.00141 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 194910 | -| policy_gradient_loss | 0.0204 | -| std | 0.00787 | -| value_loss | 7.28e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19493 | -| time_elapsed | 105383 | -| total_timesteps | 2495104 | -| train/ | | -| approx_kl | 0.09226626 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 194920 | -| policy_gradient_loss | 0.0221 | -| std | 0.00787 | -| value_loss | 6.43e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19494 | -| time_elapsed | 105395 | -| total_timesteps | 2495232 | -| train/ | | -| approx_kl | 0.43365425 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.32 | -| learning_rate | 0.0003 | -| loss | 0.068 | -| n_updates | 194930 | -| policy_gradient_loss | 0.0309 | -| std | 0.00787 | -| value_loss | 0.00121 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19495 | -| time_elapsed | 105401 | -| total_timesteps | 2495360 | -| train/ | | -| approx_kl | 0.20197582 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 194940 | -| policy_gradient_loss | 0.1 | -| std | 0.00787 | -| value_loss | 9.41e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19496 | -| time_elapsed | 105407 | -| total_timesteps | 2495488 | -| train/ | | -| approx_kl | 0.02472836 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0924 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 194950 | -| policy_gradient_loss | 0.013 | -| std | 0.00788 | -| value_loss | 9.26e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19497 | -| time_elapsed | 105411 | -| total_timesteps | 2495616 | -| train/ | | -| approx_kl | 0.03768255 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.42 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | -0.00675 | -| n_updates | 194960 | -| policy_gradient_loss | 0.00952 | -| std | 0.00787 | -| value_loss | 6.1e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19498 | -| time_elapsed | 105416 | -| total_timesteps | 2495744 | -| train/ | | -| approx_kl | 0.36906323 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 194970 | -| policy_gradient_loss | 0.028 | -| std | 0.00787 | -| value_loss | 1.31e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19499 | -| time_elapsed | 105422 | -| total_timesteps | 2495872 | -| train/ | | -| approx_kl | 0.02183604 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 194980 | -| policy_gradient_loss | -0.000921 | -| std | 0.00787 | -| value_loss | 1.99e-12 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19500 | -| time_elapsed | 105426 | -| total_timesteps | 2496000 | -| train/ | | -| approx_kl | 0.03507777 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00317 | -| learning_rate | 0.0003 | -| loss | 0.00832 | -| n_updates | 194990 | -| policy_gradient_loss | 0.00306 | -| std | 0.00787 | -| value_loss | 1.83e-12 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19501 | -| time_elapsed | 105431 | -| total_timesteps | 2496128 | -| train/ | | -| approx_kl | 0.005600667 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00538 | -| learning_rate | 0.0003 | -| loss | -0.00492 | -| n_updates | 195000 | -| policy_gradient_loss | 0.00338 | -| std | 0.00787 | -| value_loss | 1.15e-11 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19502 | -| time_elapsed | 105443 | -| total_timesteps | 2496256 | -| train/ | | -| approx_kl | 0.0449591 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | 0.000137 | -| n_updates | 195010 | -| policy_gradient_loss | -0.00677 | -| std | 0.00787 | -| value_loss | 0.00086 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19503 | -| time_elapsed | 105448 | -| total_timesteps | 2496384 | -| train/ | | -| approx_kl | 0.011271769 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 195020 | -| policy_gradient_loss | 0.0137 | -| std | 0.00787 | -| value_loss | 3.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19504 | -| time_elapsed | 105453 | -| total_timesteps | 2496512 | -| train/ | | -| approx_kl | 0.06262532 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00801 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 195030 | -| policy_gradient_loss | 0.0111 | -| std | 0.00787 | -| value_loss | 9.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19505 | -| time_elapsed | 105459 | -| total_timesteps | 2496640 | -| train/ | | -| approx_kl | 0.11180173 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | 0.0638 | -| n_updates | 195040 | -| policy_gradient_loss | 0.0187 | -| std | 0.00786 | -| value_loss | 4.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19506 | -| time_elapsed | 105464 | -| total_timesteps | 2496768 | -| train/ | | -| approx_kl | 0.022352716 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.000463 | -| n_updates | 195050 | -| policy_gradient_loss | 0.0215 | -| std | 0.00786 | -| value_loss | 3.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19507 | -| time_elapsed | 105468 | -| total_timesteps | 2496896 | -| train/ | | -| approx_kl | 0.09223119 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 195060 | -| policy_gradient_loss | 0.0183 | -| std | 0.00787 | -| value_loss | 3.51e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19508 | -| time_elapsed | 105473 | -| total_timesteps | 2497024 | -| train/ | | -| approx_kl | 0.00010270253 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.000107 | -| n_updates | 195070 | -| policy_gradient_loss | 0.0158 | -| std | 0.00786 | -| value_loss | 1.52e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19509 | -| time_elapsed | 105482 | -| total_timesteps | 2497152 | -| train/ | | -| approx_kl | 0.15085146 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.923 | -| learning_rate | 0.0003 | -| loss | 0.00712 | -| n_updates | 195080 | -| policy_gradient_loss | -0.00705 | -| std | 0.00786 | -| value_loss | 0.000806 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19510 | -| time_elapsed | 105488 | -| total_timesteps | 2497280 | -| train/ | | -| approx_kl | 0.006283313 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.000473 | -| n_updates | 195090 | -| policy_gradient_loss | 0.0189 | -| std | 0.00786 | -| value_loss | 3.5e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19511 | -| time_elapsed | 105493 | -| total_timesteps | 2497408 | -| train/ | | -| approx_kl | 0.17933474 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00521 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 195100 | -| policy_gradient_loss | 0.114 | -| std | 0.00786 | -| value_loss | 5.2e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19512 | -| time_elapsed | 105498 | -| total_timesteps | 2497536 | -| train/ | | -| approx_kl | 0.11348341 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0489 | -| learning_rate | 0.0003 | -| loss | 0.0769 | -| n_updates | 195110 | -| policy_gradient_loss | 0.0924 | -| std | 0.00785 | -| value_loss | 5.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19513 | -| time_elapsed | 105503 | -| total_timesteps | 2497664 | -| train/ | | -| approx_kl | 0.019459466 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.000153 | -| n_updates | 195120 | -| policy_gradient_loss | 0.0147 | -| std | 0.00785 | -| value_loss | 5.27e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19514 | -| time_elapsed | 105507 | -| total_timesteps | 2497792 | -| train/ | | -| approx_kl | 0.3818578 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 195130 | -| policy_gradient_loss | 0.0474 | -| std | 0.00785 | -| value_loss | 4.58e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 19515 | -| time_elapsed | 105512 | -| total_timesteps | 2497920 | -| train/ | | -| approx_kl | 0.008217212 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | -0.00711 | -| n_updates | 195140 | -| policy_gradient_loss | 0.0026 | -| std | 0.00785 | -| value_loss | 3.92e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19516 | -| time_elapsed | 105518 | -| total_timesteps | 2498048 | -| train/ | | -| approx_kl | 0.037192963 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 195150 | -| policy_gradient_loss | 0.00375 | -| std | 0.00785 | -| value_loss | 2.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19517 | -| time_elapsed | 105528 | -| total_timesteps | 2498176 | -| train/ | | -| approx_kl | 0.08069995 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 195160 | -| policy_gradient_loss | 0.00467 | -| std | 0.00785 | -| value_loss | 0.000316 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19518 | -| time_elapsed | 105534 | -| total_timesteps | 2498304 | -| train/ | | -| approx_kl | 0.062382475 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.0049 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 195170 | -| policy_gradient_loss | 0.00741 | -| std | 0.00784 | -| value_loss | 1.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19519 | -| time_elapsed | 105540 | -| total_timesteps | 2498432 | -| train/ | | -| approx_kl | 0.13911182 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00891 | -| learning_rate | 0.0003 | -| loss | 0.0856 | -| n_updates | 195180 | -| policy_gradient_loss | 0.0141 | -| std | 0.00784 | -| value_loss | 5.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19520 | -| time_elapsed | 105544 | -| total_timesteps | 2498560 | -| train/ | | -| approx_kl | 0.089496665 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0375 | -| n_updates | 195190 | -| policy_gradient_loss | 0.0247 | -| std | 0.00784 | -| value_loss | 3.34e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19521 | -| time_elapsed | 105549 | -| total_timesteps | 2498688 | -| train/ | | -| approx_kl | 0.11722114 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 195200 | -| policy_gradient_loss | 0.015 | -| std | 0.00784 | -| value_loss | 2.41e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19522 | -| time_elapsed | 105554 | -| total_timesteps | 2498816 | -| train/ | | -| approx_kl | 0.0012912247 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 195210 | -| policy_gradient_loss | 0.0175 | -| std | 0.00784 | -| value_loss | 2.31e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19523 | -| time_elapsed | 105559 | -| total_timesteps | 2498944 | -| train/ | | -| approx_kl | 0.11190187 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0749 | -| n_updates | 195220 | -| policy_gradient_loss | 0.0174 | -| std | 0.00784 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19524 | -| time_elapsed | 105564 | -| total_timesteps | 2499072 | -| train/ | | -| approx_kl | 0.013388742 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.000155 | -| n_updates | 195230 | -| policy_gradient_loss | -0.000134 | -| std | 0.00784 | -| value_loss | 9.31e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19525 | -| time_elapsed | 105574 | -| total_timesteps | 2499200 | -| train/ | | -| approx_kl | 0.0075602266 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.762 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 195240 | -| policy_gradient_loss | -0.00889 | -| std | 0.00784 | -| value_loss | 0.000647 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19526 | -| time_elapsed | 105579 | -| total_timesteps | 2499328 | -| train/ | | -| approx_kl | 0.11927638 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.765 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 195250 | -| policy_gradient_loss | 0.0653 | -| std | 0.00784 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19527 | -| time_elapsed | 105585 | -| total_timesteps | 2499456 | -| train/ | | -| approx_kl | 0.019280383 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.302 | -| learning_rate | 0.0003 | -| loss | 0.000962 | -| n_updates | 195260 | -| policy_gradient_loss | 0.0151 | -| std | 0.00784 | -| value_loss | 1.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19528 | -| time_elapsed | 105590 | -| total_timesteps | 2499584 | -| train/ | | -| approx_kl | 0.10756919 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.0029 | -| learning_rate | 0.0003 | -| loss | 0.0581 | -| n_updates | 195270 | -| policy_gradient_loss | 0.0136 | -| std | 0.00784 | -| value_loss | 3.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19529 | -| time_elapsed | 105595 | -| total_timesteps | 2499712 | -| train/ | | -| approx_kl | 0.016162857 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 195280 | -| policy_gradient_loss | 0.00784 | -| std | 0.00785 | -| value_loss | 2.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19530 | -| time_elapsed | 105600 | -| total_timesteps | 2499840 | -| train/ | | -| approx_kl | 0.08098079 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0438 | -| n_updates | 195290 | -| policy_gradient_loss | 0.0223 | -| std | 0.00785 | -| value_loss | 1.62e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19531 | -| time_elapsed | 105605 | -| total_timesteps | 2499968 | -| train/ | | -| approx_kl | 0.4740881 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 195300 | -| policy_gradient_loss | 0.0413 | -| std | 0.00785 | -| value_loss | 1.3e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19532 | -| time_elapsed | 105611 | -| total_timesteps | 2500096 | -| train/ | | -| approx_kl | 0.024587916 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.00758 | -| n_updates | 195310 | -| policy_gradient_loss | 0.00482 | -| std | 0.00785 | -| value_loss | 6.87e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19533 | -| time_elapsed | 105622 | -| total_timesteps | 2500224 | -| train/ | | -| approx_kl | 0.066995405 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | -0.00892 | -| n_updates | 195320 | -| policy_gradient_loss | -0.0112 | -| std | 0.00785 | -| value_loss | 0.00193 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19534 | -| time_elapsed | 105626 | -| total_timesteps | 2500352 | -| train/ | | -| approx_kl | 0.05763811 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 195330 | -| policy_gradient_loss | 0.00243 | -| std | 0.00785 | -| value_loss | 1.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19535 | -| time_elapsed | 105632 | -| total_timesteps | 2500480 | -| train/ | | -| approx_kl | 0.023882452 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.527 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 195340 | -| policy_gradient_loss | -0.00337 | -| std | 0.00785 | -| value_loss | 5.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19536 | -| time_elapsed | 105636 | -| total_timesteps | 2500608 | -| train/ | | -| approx_kl | 0.036883887 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 195350 | -| policy_gradient_loss | -0.0059 | -| std | 0.00785 | -| value_loss | 2.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19537 | -| time_elapsed | 105642 | -| total_timesteps | 2500736 | -| train/ | | -| approx_kl | 0.033058386 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 195360 | -| policy_gradient_loss | 0.00666 | -| std | 0.00785 | -| value_loss | 2e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19538 | -| time_elapsed | 105647 | -| total_timesteps | 2500864 | -| train/ | | -| approx_kl | 0.04196624 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 195370 | -| policy_gradient_loss | 0.0105 | -| std | 0.00785 | -| value_loss | 1.34e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19539 | -| time_elapsed | 105651 | -| total_timesteps | 2500992 | -| train/ | | -| approx_kl | 0.030513091 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 195380 | -| policy_gradient_loss | 0.00896 | -| std | 0.00785 | -| value_loss | 7.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19540 | -| time_elapsed | 105656 | -| total_timesteps | 2501120 | -| train/ | | -| approx_kl | 0.005287596 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0691 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 195390 | -| policy_gradient_loss | 0.00179 | -| std | 0.00786 | -| value_loss | 5.36e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19541 | -| time_elapsed | 105669 | -| total_timesteps | 2501248 | -| train/ | | -| approx_kl | 0.0033239485 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 195400 | -| policy_gradient_loss | -0.00942 | -| std | 0.00786 | -| value_loss | 0.000716 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19542 | -| time_elapsed | 105676 | -| total_timesteps | 2501376 | -| train/ | | -| approx_kl | 0.07159426 | -| clip_fraction | 0.619 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.291 | -| learning_rate | 0.0003 | -| loss | 0.0941 | -| n_updates | 195410 | -| policy_gradient_loss | 0.0817 | -| std | 0.00785 | -| value_loss | 2.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19543 | -| time_elapsed | 105681 | -| total_timesteps | 2501504 | -| train/ | | -| approx_kl | 0.016369458 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 195420 | -| policy_gradient_loss | 0.014 | -| std | 0.00785 | -| value_loss | 6.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19544 | -| time_elapsed | 105686 | -| total_timesteps | 2501632 | -| train/ | | -| approx_kl | 0.35349283 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00121 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 195430 | -| policy_gradient_loss | 0.0403 | -| std | 0.00785 | -| value_loss | 1.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19545 | -| time_elapsed | 105689 | -| total_timesteps | 2501760 | -| train/ | | -| approx_kl | 0.031216543 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 195440 | -| policy_gradient_loss | 0.00564 | -| std | 0.00785 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19546 | -| time_elapsed | 105692 | -| total_timesteps | 2501888 | -| train/ | | -| approx_kl | 0.007291171 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 195450 | -| policy_gradient_loss | 0.00617 | -| std | 0.00785 | -| value_loss | 1.04e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19547 | -| time_elapsed | 105696 | -| total_timesteps | 2502016 | -| train/ | | -| approx_kl | 0.00060600834 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.000708 | -| n_updates | 195460 | -| policy_gradient_loss | 0.00464 | -| std | 0.00785 | -| value_loss | 6.57e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19548 | -| time_elapsed | 105707 | -| total_timesteps | 2502144 | -| train/ | | -| approx_kl | 0.017380787 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.582 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 195470 | -| policy_gradient_loss | -0.00678 | -| std | 0.00785 | -| value_loss | 0.00088 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19549 | -| time_elapsed | 105712 | -| total_timesteps | 2502272 | -| train/ | | -| approx_kl | 0.0028200834 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.0966 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 195480 | -| policy_gradient_loss | 0.0451 | -| std | 0.00786 | -| value_loss | 6.07e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19550 | -| time_elapsed | 105716 | -| total_timesteps | 2502400 | -| train/ | | -| approx_kl | 0.10236494 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0997 | -| n_updates | 195490 | -| policy_gradient_loss | 0.145 | -| std | 0.00786 | -| value_loss | 9.94e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19551 | -| time_elapsed | 105720 | -| total_timesteps | 2502528 | -| train/ | | -| approx_kl | 0.06673531 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 195500 | -| policy_gradient_loss | 0.02 | -| std | 0.00786 | -| value_loss | 6.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19552 | -| time_elapsed | 105724 | -| total_timesteps | 2502656 | -| train/ | | -| approx_kl | 0.117603295 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 195510 | -| policy_gradient_loss | 0.0408 | -| std | 0.00786 | -| value_loss | 5.75e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19553 | -| time_elapsed | 105727 | -| total_timesteps | 2502784 | -| train/ | | -| approx_kl | 0.00012561819 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.000112 | -| n_updates | 195520 | -| policy_gradient_loss | 0.0163 | -| std | 0.00786 | -| value_loss | 3.09e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19554 | -| time_elapsed | 105731 | -| total_timesteps | 2502912 | -| train/ | | -| approx_kl | 0.056487422 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 195530 | -| policy_gradient_loss | 0.0156 | -| std | 0.00787 | -| value_loss | 3.55e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19555 | -| time_elapsed | 105735 | -| total_timesteps | 2503040 | -| train/ | | -| approx_kl | 0.2714116 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 195540 | -| policy_gradient_loss | 0.154 | -| std | 0.00787 | -| value_loss | 3.15e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19556 | -| time_elapsed | 105744 | -| total_timesteps | 2503168 | -| train/ | | -| approx_kl | 0.05074634 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.811 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 195550 | -| policy_gradient_loss | -0.0136 | -| std | 0.00787 | -| value_loss | 0.00182 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19557 | -| time_elapsed | 105748 | -| total_timesteps | 2503296 | -| train/ | | -| approx_kl | 0.02896388 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.00879 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 195560 | -| policy_gradient_loss | 0.009 | -| std | 0.00786 | -| value_loss | 4.07e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19558 | -| time_elapsed | 105752 | -| total_timesteps | 2503424 | -| train/ | | -| approx_kl | 0.03810132 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 195570 | -| policy_gradient_loss | 0.0136 | -| std | 0.00785 | -| value_loss | 1.09e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19559 | -| time_elapsed | 105755 | -| total_timesteps | 2503552 | -| train/ | | -| approx_kl | 0.00019680662 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.484 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 195580 | -| policy_gradient_loss | 9.83e-05 | -| std | 0.00785 | -| value_loss | 3e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19560 | -| time_elapsed | 105759 | -| total_timesteps | 2503680 | -| train/ | | -| approx_kl | 0.00925119 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 195590 | -| policy_gradient_loss | 0.00626 | -| std | 0.00785 | -| value_loss | 4.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19561 | -| time_elapsed | 105764 | -| total_timesteps | 2503808 | -| train/ | | -| approx_kl | 0.050602686 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 195600 | -| policy_gradient_loss | 0.00892 | -| std | 0.00785 | -| value_loss | 1.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19562 | -| time_elapsed | 105769 | -| total_timesteps | 2503936 | -| train/ | | -| approx_kl | 0.030956829 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 195610 | -| policy_gradient_loss | 0.0108 | -| std | 0.00785 | -| value_loss | 2.77e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19563 | -| time_elapsed | 105774 | -| total_timesteps | 2504064 | -| train/ | | -| approx_kl | 0.04358032 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.00543 | -| n_updates | 195620 | -| policy_gradient_loss | 0.00218 | -| std | 0.00785 | -| value_loss | 2.65e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19564 | -| time_elapsed | 105782 | -| total_timesteps | 2504192 | -| train/ | | -| approx_kl | 0.04626787 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0211 | -| n_updates | 195630 | -| policy_gradient_loss | -0.0152 | -| std | 0.00784 | -| value_loss | 0.000106 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19565 | -| time_elapsed | 105787 | -| total_timesteps | 2504320 | -| train/ | | -| approx_kl | 9.561796e-05 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.436 | -| learning_rate | 0.0003 | -| loss | -0.000441 | -| n_updates | 195640 | -| policy_gradient_loss | 0.00628 | -| std | 0.00783 | -| value_loss | 2.68e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19566 | -| time_elapsed | 105793 | -| total_timesteps | 2504448 | -| train/ | | -| approx_kl | 0.027571779 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -13.7 | -| learning_rate | 0.0003 | -| loss | 0.00569 | -| n_updates | 195650 | -| policy_gradient_loss | 0.0154 | -| std | 0.00781 | -| value_loss | 5.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19567 | -| time_elapsed | 105798 | -| total_timesteps | 2504576 | -| train/ | | -| approx_kl | 0.055805266 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.365 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 195660 | -| policy_gradient_loss | 0.0884 | -| std | 0.0078 | -| value_loss | 1.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19568 | -| time_elapsed | 105802 | -| total_timesteps | 2504704 | -| train/ | | -| approx_kl | 0.08253839 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | 0.0968 | -| n_updates | 195670 | -| policy_gradient_loss | 0.0779 | -| std | 0.0078 | -| value_loss | 1.54e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19569 | -| time_elapsed | 105807 | -| total_timesteps | 2504832 | -| train/ | | -| approx_kl | 0.10147676 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 195680 | -| policy_gradient_loss | 0.129 | -| std | 0.0078 | -| value_loss | 1.37e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 19570 | -| time_elapsed | 105812 | -| total_timesteps | 2504960 | -| train/ | | -| approx_kl | 0.016599692 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | 0.00231 | -| n_updates | 195690 | -| policy_gradient_loss | 0.0114 | -| std | 0.0078 | -| value_loss | 7.94e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19571 | -| time_elapsed | 105815 | -| total_timesteps | 2505088 | -| train/ | | -| approx_kl | 0.4897169 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.193 | -| n_updates | 195700 | -| policy_gradient_loss | 0.0593 | -| std | 0.00781 | -| value_loss | 5.8e-10 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19572 | -| time_elapsed | 105824 | -| total_timesteps | 2505216 | -| train/ | | -| approx_kl | 0.0155748185 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.769 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 195710 | -| policy_gradient_loss | -0.00963 | -| std | 0.00781 | -| value_loss | 0.00436 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19573 | -| time_elapsed | 105828 | -| total_timesteps | 2505344 | -| train/ | | -| approx_kl | 0.014390359 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 195720 | -| policy_gradient_loss | 0.0112 | -| std | 0.00781 | -| value_loss | 3.58e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19574 | -| time_elapsed | 105832 | -| total_timesteps | 2505472 | -| train/ | | -| approx_kl | 0.060418304 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00718 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 195730 | -| policy_gradient_loss | 0.0321 | -| std | 0.00779 | -| value_loss | 1.29e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19575 | -| time_elapsed | 105836 | -| total_timesteps | 2505600 | -| train/ | | -| approx_kl | 2.6559923e-05 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -5.29 | -| learning_rate | 0.0003 | -| loss | 0.000872 | -| n_updates | 195740 | -| policy_gradient_loss | -0.00286 | -| std | 0.00777 | -| value_loss | 0.000181 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19576 | -| time_elapsed | 105840 | -| total_timesteps | 2505728 | -| train/ | | -| approx_kl | 9.287894e-05 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.404 | -| learning_rate | 0.0003 | -| loss | -0.00013 | -| n_updates | 195750 | -| policy_gradient_loss | 0.00618 | -| std | 0.00778 | -| value_loss | 9.16e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19577 | -| time_elapsed | 105845 | -| total_timesteps | 2505856 | -| train/ | | -| approx_kl | 0.040571027 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0981 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 195760 | -| policy_gradient_loss | 0.045 | -| std | 0.0078 | -| value_loss | 0.000178 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 19578 | -| time_elapsed | 105848 | -| total_timesteps | 2505984 | -| train/ | | -| approx_kl | 0.16054872 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | 0.0783 | -| n_updates | 195770 | -| policy_gradient_loss | 0.0248 | -| std | 0.00781 | -| value_loss | 1.74e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19579 | -| time_elapsed | 105852 | -| total_timesteps | 2506112 | -| train/ | | -| approx_kl | 0.00097631663 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.0104 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 195780 | -| policy_gradient_loss | 0.00758 | -| std | 0.00781 | -| value_loss | 1.99e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19580 | -| time_elapsed | 105863 | -| total_timesteps | 2506240 | -| train/ | | -| approx_kl | 0.09873178 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.766 | -| learning_rate | 0.0003 | -| loss | 0.00527 | -| n_updates | 195790 | -| policy_gradient_loss | -0.00617 | -| std | 0.00781 | -| value_loss | 0.00458 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19581 | -| time_elapsed | 105869 | -| total_timesteps | 2506368 | -| train/ | | -| approx_kl | 0.479321 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.0075 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 195800 | -| policy_gradient_loss | 0.0471 | -| std | 0.00781 | -| value_loss | 2.43e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19582 | -| time_elapsed | 105874 | -| total_timesteps | 2506496 | -| train/ | | -| approx_kl | 0.030147124 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | 0.00471 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 195810 | -| policy_gradient_loss | 0.00942 | -| std | 0.0078 | -| value_loss | 8.51e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19583 | -| time_elapsed | 105880 | -| total_timesteps | 2506624 | -| train/ | | -| approx_kl | 0.0064195036 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 195820 | -| policy_gradient_loss | 0.00312 | -| std | 0.0078 | -| value_loss | 4.64e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19584 | -| time_elapsed | 105885 | -| total_timesteps | 2506752 | -| train/ | | -| approx_kl | 0.00017332472 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.43 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.000515 | -| n_updates | 195830 | -| policy_gradient_loss | 0.0267 | -| std | 0.0078 | -| value_loss | 2.99e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19585 | -| time_elapsed | 105889 | -| total_timesteps | 2506880 | -| train/ | | -| approx_kl | 0.14054675 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.0921 | -| n_updates | 195840 | -| policy_gradient_loss | 0.0506 | -| std | 0.00779 | -| value_loss | 1.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19586 | -| time_elapsed | 105894 | -| total_timesteps | 2507008 | -| train/ | | -| approx_kl | 0.07920826 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 195850 | -| policy_gradient_loss | 0.00977 | -| std | 0.00779 | -| value_loss | 1.58e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19587 | -| time_elapsed | 105906 | -| total_timesteps | 2507136 | -| train/ | | -| approx_kl | 0.008423115 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 195860 | -| policy_gradient_loss | -0.00975 | -| std | 0.00777 | -| value_loss | 0.00127 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19588 | -| time_elapsed | 105909 | -| total_timesteps | 2507264 | -| train/ | | -| approx_kl | 0.13509887 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.1 | -| learning_rate | 0.0003 | -| loss | 0.0835 | -| n_updates | 195870 | -| policy_gradient_loss | 0.0192 | -| std | 0.00777 | -| value_loss | 0.000305 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19589 | -| time_elapsed | 105912 | -| total_timesteps | 2507392 | -| train/ | | -| approx_kl | 0.00034726132 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00802 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 195880 | -| policy_gradient_loss | 0.0224 | -| std | 0.00776 | -| value_loss | 8.48e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19590 | -| time_elapsed | 105916 | -| total_timesteps | 2507520 | -| train/ | | -| approx_kl | 0.15410286 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00585 | -| learning_rate | 0.0003 | -| loss | 0.0927 | -| n_updates | 195890 | -| policy_gradient_loss | 0.0226 | -| std | 0.00776 | -| value_loss | 2.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19591 | -| time_elapsed | 105920 | -| total_timesteps | 2507648 | -| train/ | | -| approx_kl | 0.017101295 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 195900 | -| policy_gradient_loss | 0.0189 | -| std | 0.00776 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19592 | -| time_elapsed | 105924 | -| total_timesteps | 2507776 | -| train/ | | -| approx_kl | 0.09165564 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 195910 | -| policy_gradient_loss | 0.023 | -| std | 0.00776 | -| value_loss | 8.35e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19593 | -| time_elapsed | 105928 | -| total_timesteps | 2507904 | -| train/ | | -| approx_kl | 9.500887e-05 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 195920 | -| policy_gradient_loss | 0.0218 | -| std | 0.00776 | -| value_loss | 7.61e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19594 | -| time_elapsed | 105933 | -| total_timesteps | 2508032 | -| train/ | | -| approx_kl | 0.5690585 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.251 | -| n_updates | 195930 | -| policy_gradient_loss | 0.0657 | -| std | 0.00776 | -| value_loss | 6.55e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19595 | -| time_elapsed | 105945 | -| total_timesteps | 2508160 | -| train/ | | -| approx_kl | 0.08280692 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 195940 | -| policy_gradient_loss | -0.00622 | -| std | 0.00776 | -| value_loss | 0.000177 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19596 | -| time_elapsed | 105950 | -| total_timesteps | 2508288 | -| train/ | | -| approx_kl | 0.009732613 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.073 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 195950 | -| policy_gradient_loss | 0.0659 | -| std | 0.00776 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19597 | -| time_elapsed | 105955 | -| total_timesteps | 2508416 | -| train/ | | -| approx_kl | 0.008955276 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -0.00721 | -| n_updates | 195960 | -| policy_gradient_loss | 0.013 | -| std | 0.00776 | -| value_loss | 1.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19598 | -| time_elapsed | 105961 | -| total_timesteps | 2508544 | -| train/ | | -| approx_kl | 0.08795056 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 195970 | -| policy_gradient_loss | 0.00765 | -| std | 0.00776 | -| value_loss | 9.3e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19599 | -| time_elapsed | 105964 | -| total_timesteps | 2508672 | -| train/ | | -| approx_kl | 0.04108814 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 195980 | -| policy_gradient_loss | 0.0142 | -| std | 0.00776 | -| value_loss | 8.36e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19600 | -| time_elapsed | 105969 | -| total_timesteps | 2508800 | -| train/ | | -| approx_kl | 0.09871989 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 195990 | -| policy_gradient_loss | 0.016 | -| std | 0.00775 | -| value_loss | 7.95e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19601 | -| time_elapsed | 105974 | -| total_timesteps | 2508928 | -| train/ | | -| approx_kl | 0.09627395 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 196000 | -| policy_gradient_loss | 0.0155 | -| std | 0.00776 | -| value_loss | 6.52e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19602 | -| time_elapsed | 105978 | -| total_timesteps | 2509056 | -| train/ | | -| approx_kl | 0.021978963 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -260 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 196010 | -| policy_gradient_loss | -0.000441 | -| std | 0.00776 | -| value_loss | 6.43e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19603 | -| time_elapsed | 105989 | -| total_timesteps | 2509184 | -| train/ | | -| approx_kl | 0.00064067636 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.867 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 196020 | -| policy_gradient_loss | 0.00377 | -| std | 0.00776 | -| value_loss | 0.0018 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19604 | -| time_elapsed | 105993 | -| total_timesteps | 2509312 | -| train/ | | -| approx_kl | 0.0074101784 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 196030 | -| policy_gradient_loss | 0.00341 | -| std | 0.00776 | -| value_loss | 1.79e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19605 | -| time_elapsed | 105999 | -| total_timesteps | 2509440 | -| train/ | | -| approx_kl | 0.056732774 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00513 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 196040 | -| policy_gradient_loss | -0.000762 | -| std | 0.00776 | -| value_loss | 5.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19606 | -| time_elapsed | 106004 | -| total_timesteps | 2509568 | -| train/ | | -| approx_kl | 0.009513624 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 196050 | -| policy_gradient_loss | 0.00364 | -| std | 0.00776 | -| value_loss | 3.89e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19607 | -| time_elapsed | 106008 | -| total_timesteps | 2509696 | -| train/ | | -| approx_kl | 0.06108198 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 196060 | -| policy_gradient_loss | 0.0125 | -| std | 0.00776 | -| value_loss | 2.55e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19608 | -| time_elapsed | 106013 | -| total_timesteps | 2509824 | -| train/ | | -| approx_kl | 0.032253318 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 196070 | -| policy_gradient_loss | 0.00711 | -| std | 0.00776 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 19609 | -| time_elapsed | 106019 | -| total_timesteps | 2509952 | -| train/ | | -| approx_kl | 0.0049463534 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | -0.00729 | -| n_updates | 196080 | -| policy_gradient_loss | 0.00221 | -| std | 0.00776 | -| value_loss | 1.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19610 | -| time_elapsed | 106025 | -| total_timesteps | 2510080 | -| train/ | | -| approx_kl | 0.063150086 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0452 | -| n_updates | 196090 | -| policy_gradient_loss | 0.0108 | -| std | 0.00776 | -| value_loss | 6.5e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19611 | -| time_elapsed | 106034 | -| total_timesteps | 2510208 | -| train/ | | -| approx_kl | 0.00059634075 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.685 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 196100 | -| policy_gradient_loss | -0.00479 | -| std | 0.00776 | -| value_loss | 0.00941 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19612 | -| time_elapsed | 106040 | -| total_timesteps | 2510336 | -| train/ | | -| approx_kl | 0.00912297 | -| clip_fraction | 0.0672 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 196110 | -| policy_gradient_loss | -0.00233 | -| std | 0.00776 | -| value_loss | 4.62e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19613 | -| time_elapsed | 106044 | -| total_timesteps | 2510464 | -| train/ | | -| approx_kl | 0.007530086 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00527 | -| learning_rate | 0.0003 | -| loss | 0.001 | -| n_updates | 196120 | -| policy_gradient_loss | 0.00059 | -| std | 0.00776 | -| value_loss | 5.88e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19614 | -| time_elapsed | 106048 | -| total_timesteps | 2510592 | -| train/ | | -| approx_kl | 0.010593091 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0899 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 196130 | -| policy_gradient_loss | -0.00096 | -| std | 0.00776 | -| value_loss | 4.68e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19615 | -| time_elapsed | 106053 | -| total_timesteps | 2510720 | -| train/ | | -| approx_kl | 0.008990021 | -| clip_fraction | 0.0633 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 196140 | -| policy_gradient_loss | -0.00641 | -| std | 0.00776 | -| value_loss | 2.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19616 | -| time_elapsed | 106057 | -| total_timesteps | 2510848 | -| train/ | | -| approx_kl | 0.021282148 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.00644 | -| n_updates | 196150 | -| policy_gradient_loss | 0.0255 | -| std | 0.00776 | -| value_loss | 2.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 19617 | -| time_elapsed | 106061 | -| total_timesteps | 2510976 | -| train/ | | -| approx_kl | 0.08934949 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | -0.00735 | -| n_updates | 196160 | -| policy_gradient_loss | 0.00456 | -| std | 0.00776 | -| value_loss | 2.19e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19618 | -| time_elapsed | 106065 | -| total_timesteps | 2511104 | -| train/ | | -| approx_kl | 0.0046973363 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 196170 | -| policy_gradient_loss | 0.00679 | -| std | 0.00777 | -| value_loss | 1.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19619 | -| time_elapsed | 106076 | -| total_timesteps | 2511232 | -| train/ | | -| approx_kl | 0.021538477 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 196180 | -| policy_gradient_loss | -0.0119 | -| std | 0.00777 | -| value_loss | 0.000123 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19620 | -| time_elapsed | 106079 | -| total_timesteps | 2511360 | -| train/ | | -| approx_kl | 0.008181798 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.00783 | -| n_updates | 196190 | -| policy_gradient_loss | 0.0012 | -| std | 0.00777 | -| value_loss | 8.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19621 | -| time_elapsed | 106083 | -| total_timesteps | 2511488 | -| train/ | | -| approx_kl | 0.044626333 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0192 | -| n_updates | 196200 | -| policy_gradient_loss | 0.00737 | -| std | 0.00776 | -| value_loss | 5.24e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19622 | -| time_elapsed | 106088 | -| total_timesteps | 2511616 | -| train/ | | -| approx_kl | 0.0072740247 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.00443 | -| n_updates | 196210 | -| policy_gradient_loss | 0.00277 | -| std | 0.00776 | -| value_loss | 3.68e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19623 | -| time_elapsed | 106092 | -| total_timesteps | 2511744 | -| train/ | | -| approx_kl | 0.05997341 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.041 | -| n_updates | 196220 | -| policy_gradient_loss | 0.0164 | -| std | 0.00776 | -| value_loss | 2.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19624 | -| time_elapsed | 106098 | -| total_timesteps | 2511872 | -| train/ | | -| approx_kl | 0.033368785 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 196230 | -| policy_gradient_loss | 0.00738 | -| std | 0.00776 | -| value_loss | 1.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19625 | -| time_elapsed | 106102 | -| total_timesteps | 2512000 | -| train/ | | -| approx_kl | 0.005674143 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -0.000192 | -| n_updates | 196240 | -| policy_gradient_loss | 0.00512 | -| std | 0.00776 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19626 | -| time_elapsed | 106106 | -| total_timesteps | 2512128 | -| train/ | | -| approx_kl | 0.061358243 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00596 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 196250 | -| policy_gradient_loss | 0.00503 | -| std | 0.00776 | -| value_loss | 7.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19627 | -| time_elapsed | 106117 | -| total_timesteps | 2512256 | -| train/ | | -| approx_kl | 0.25847977 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.785 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 196260 | -| policy_gradient_loss | 0.0148 | -| std | 0.00776 | -| value_loss | 0.00458 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19628 | -| time_elapsed | 106121 | -| total_timesteps | 2512384 | -| train/ | | -| approx_kl | 0.008008069 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.00231 | -| n_updates | 196270 | -| policy_gradient_loss | 0.00507 | -| std | 0.00776 | -| value_loss | 1.31e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19629 | -| time_elapsed | 106126 | -| total_timesteps | 2512512 | -| train/ | | -| approx_kl | 0.000559764 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00847 | -| learning_rate | 0.0003 | -| loss | 0.0047 | -| n_updates | 196280 | -| policy_gradient_loss | -0.00113 | -| std | 0.00776 | -| value_loss | 1.2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19630 | -| time_elapsed | 106130 | -| total_timesteps | 2512640 | -| train/ | | -| approx_kl | 0.048853304 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -21.6 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 196290 | -| policy_gradient_loss | -0.00619 | -| std | 0.00776 | -| value_loss | 2.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19631 | -| time_elapsed | 106136 | -| total_timesteps | 2512768 | -| train/ | | -| approx_kl | 0.015480936 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.439 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 196300 | -| policy_gradient_loss | 0.000671 | -| std | 0.00775 | -| value_loss | 3.25e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19632 | -| time_elapsed | 106141 | -| total_timesteps | 2512896 | -| train/ | | -| approx_kl | 0.33953598 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -26.2 | -| learning_rate | 0.0003 | -| loss | 0.0756 | -| n_updates | 196310 | -| policy_gradient_loss | 0.0281 | -| std | 0.00774 | -| value_loss | 1.77e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19633 | -| time_elapsed | 106146 | -| total_timesteps | 2513024 | -| train/ | | -| approx_kl | 0.05414802 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | 0.041 | -| n_updates | 196320 | -| policy_gradient_loss | 0.0174 | -| std | 0.00773 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19634 | -| time_elapsed | 106158 | -| total_timesteps | 2513152 | -| train/ | | -| approx_kl | 0.014445022 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 196330 | -| policy_gradient_loss | -0.012 | -| std | 0.00773 | -| value_loss | 0.000257 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19635 | -| time_elapsed | 106163 | -| total_timesteps | 2513280 | -| train/ | | -| approx_kl | 0.1423998 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0302 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 196340 | -| policy_gradient_loss | 0.00702 | -| std | 0.00772 | -| value_loss | 7.46e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19636 | -| time_elapsed | 106168 | -| total_timesteps | 2513408 | -| train/ | | -| approx_kl | 0.014418112 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00529 | -| learning_rate | 0.0003 | -| loss | 0.00236 | -| n_updates | 196350 | -| policy_gradient_loss | 0.017 | -| std | 0.00772 | -| value_loss | 3.03e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19637 | -| time_elapsed | 106173 | -| total_timesteps | 2513536 | -| train/ | | -| approx_kl | 0.09753059 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 196360 | -| policy_gradient_loss | 0.0187 | -| std | 0.00772 | -| value_loss | 2.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19638 | -| time_elapsed | 106177 | -| total_timesteps | 2513664 | -| train/ | | -| approx_kl | 0.41256472 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 196370 | -| policy_gradient_loss | 0.0412 | -| std | 0.00772 | -| value_loss | 2.48e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19639 | -| time_elapsed | 106182 | -| total_timesteps | 2513792 | -| train/ | | -| approx_kl | 0.009646246 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 196380 | -| policy_gradient_loss | 0.00412 | -| std | 0.00772 | -| value_loss | 1.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19640 | -| time_elapsed | 106187 | -| total_timesteps | 2513920 | -| train/ | | -| approx_kl | 0.051765513 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 196390 | -| policy_gradient_loss | 0.012 | -| std | 0.00772 | -| value_loss | 8.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19641 | -| time_elapsed | 106192 | -| total_timesteps | 2514048 | -| train/ | | -| approx_kl | 0.010159277 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | -0.0071 | -| n_updates | 196400 | -| policy_gradient_loss | 0.00382 | -| std | 0.00772 | -| value_loss | 7.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19642 | -| time_elapsed | 106200 | -| total_timesteps | 2514176 | -| train/ | | -| approx_kl | 0.008980088 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 196410 | -| policy_gradient_loss | -0.0147 | -| std | 0.00772 | -| value_loss | 0.00789 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19643 | -| time_elapsed | 106206 | -| total_timesteps | 2514304 | -| train/ | | -| approx_kl | 0.17008476 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0989 | -| learning_rate | 0.0003 | -| loss | 0.0602 | -| n_updates | 196420 | -| policy_gradient_loss | 0.0325 | -| std | 0.00772 | -| value_loss | 0.000551 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19644 | -| time_elapsed | 106211 | -| total_timesteps | 2514432 | -| train/ | | -| approx_kl | 0.037158556 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 196430 | -| policy_gradient_loss | 0.0571 | -| std | 0.00772 | -| value_loss | 0.0001 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19645 | -| time_elapsed | 106214 | -| total_timesteps | 2514560 | -| train/ | | -| approx_kl | 0.014649145 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00784 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 196440 | -| policy_gradient_loss | 0.0188 | -| std | 0.00772 | -| value_loss | 4.33e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19646 | -| time_elapsed | 106218 | -| total_timesteps | 2514688 | -| train/ | | -| approx_kl | 0.02391702 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.00323 | -| n_updates | 196450 | -| policy_gradient_loss | 0.0385 | -| std | 0.00771 | -| value_loss | 4.8e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19647 | -| time_elapsed | 106223 | -| total_timesteps | 2514816 | -| train/ | | -| approx_kl | 0.17141433 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.388 | -| learning_rate | 0.0003 | -| loss | 0.0937 | -| n_updates | 196460 | -| policy_gradient_loss | 0.0521 | -| std | 0.00771 | -| value_loss | 4.68e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19648 | -| time_elapsed | 106229 | -| total_timesteps | 2514944 | -| train/ | | -| approx_kl | 0.038908295 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 196470 | -| policy_gradient_loss | 0.0805 | -| std | 0.00771 | -| value_loss | 3.26e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19649 | -| time_elapsed | 106233 | -| total_timesteps | 2515072 | -| train/ | | -| approx_kl | 0.20243196 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 196480 | -| policy_gradient_loss | 0.039 | -| std | 0.0077 | -| value_loss | 5.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19650 | -| time_elapsed | 106242 | -| total_timesteps | 2515200 | -| train/ | | -| approx_kl | 0.006670813 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.625 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 196490 | -| policy_gradient_loss | 0.0544 | -| std | 0.0077 | -| value_loss | 0.0157 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19651 | -| time_elapsed | 106247 | -| total_timesteps | 2515328 | -| train/ | | -| approx_kl | 0.16944785 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 196500 | -| policy_gradient_loss | 0.134 | -| std | 0.0077 | -| value_loss | 0.00012 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19652 | -| time_elapsed | 106252 | -| total_timesteps | 2515456 | -| train/ | | -| approx_kl | 0.07585597 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00849 | -| learning_rate | 0.0003 | -| loss | 0.0534 | -| n_updates | 196510 | -| policy_gradient_loss | 0.0222 | -| std | 0.00772 | -| value_loss | 0.000116 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19653 | -| time_elapsed | 106256 | -| total_timesteps | 2515584 | -| train/ | | -| approx_kl | 0.015239548 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0031 | -| learning_rate | 0.0003 | -| loss | -0.00173 | -| n_updates | 196520 | -| policy_gradient_loss | -0.0025 | -| std | 0.00774 | -| value_loss | 7.08e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19654 | -| time_elapsed | 106260 | -| total_timesteps | 2515712 | -| train/ | | -| approx_kl | 0.015186479 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 196530 | -| policy_gradient_loss | 0.0103 | -| std | 0.00774 | -| value_loss | 2.14e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19655 | -| time_elapsed | 106265 | -| total_timesteps | 2515840 | -| train/ | | -| approx_kl | 0.098028705 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.0629 | -| n_updates | 196540 | -| policy_gradient_loss | 0.0297 | -| std | 0.00774 | -| value_loss | 3.25e-05 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 19656 | -| time_elapsed | 106270 | -| total_timesteps | 2515968 | -| train/ | | -| approx_kl | 0.000114238355 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.000563 | -| n_updates | 196550 | -| policy_gradient_loss | 0.0203 | -| std | 0.00774 | -| value_loss | 0.000221 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19657 | -| time_elapsed | 106275 | -| total_timesteps | 2516096 | -| train/ | | -| approx_kl | 0.42452443 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00883 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 196560 | -| policy_gradient_loss | 0.046 | -| std | 0.00774 | -| value_loss | 1.9e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19658 | -| time_elapsed | 106285 | -| total_timesteps | 2516224 | -| train/ | | -| approx_kl | 0.03915054 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 196570 | -| policy_gradient_loss | -0.00859 | -| std | 0.00774 | -| value_loss | 0.000533 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19659 | -| time_elapsed | 106290 | -| total_timesteps | 2516352 | -| train/ | | -| approx_kl | 0.0045297565 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0853 | -| learning_rate | 0.0003 | -| loss | -0.00262 | -| n_updates | 196580 | -| policy_gradient_loss | 0.0202 | -| std | 0.00774 | -| value_loss | 7.67e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19660 | -| time_elapsed | 106295 | -| total_timesteps | 2516480 | -| train/ | | -| approx_kl | 0.12802798 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 196590 | -| policy_gradient_loss | 0.0512 | -| std | 0.00774 | -| value_loss | 8.47e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19661 | -| time_elapsed | 106300 | -| total_timesteps | 2516608 | -| train/ | | -| approx_kl | 0.035970554 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 196600 | -| policy_gradient_loss | 0.0313 | -| std | 0.00773 | -| value_loss | 5.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19662 | -| time_elapsed | 106305 | -| total_timesteps | 2516736 | -| train/ | | -| approx_kl | 0.08972558 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.069 | -| n_updates | 196610 | -| policy_gradient_loss | 0.0429 | -| std | 0.00773 | -| value_loss | 3.49e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19663 | -| time_elapsed | 106310 | -| total_timesteps | 2516864 | -| train/ | | -| approx_kl | 0.15007234 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 196620 | -| policy_gradient_loss | 0.026 | -| std | 0.00773 | -| value_loss | 3.05e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 19664 | -| time_elapsed | 106314 | -| total_timesteps | 2516992 | -| train/ | | -| approx_kl | 0.5023625 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.194 | -| n_updates | 196630 | -| policy_gradient_loss | 0.054 | -| std | 0.00773 | -| value_loss | 1.66e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19665 | -| time_elapsed | 106318 | -| total_timesteps | 2517120 | -| train/ | | -| approx_kl | 0.034299646 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 196640 | -| policy_gradient_loss | 0.0123 | -| std | 0.00773 | -| value_loss | 1.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19666 | -| time_elapsed | 106330 | -| total_timesteps | 2517248 | -| train/ | | -| approx_kl | 0.10123906 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.747 | -| learning_rate | 0.0003 | -| loss | -0.00968 | -| n_updates | 196650 | -| policy_gradient_loss | -0.00613 | -| std | 0.00773 | -| value_loss | 0.000854 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19667 | -| time_elapsed | 106334 | -| total_timesteps | 2517376 | -| train/ | | -| approx_kl | 0.016470049 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.474 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 196660 | -| policy_gradient_loss | 0.0532 | -| std | 0.00773 | -| value_loss | 7.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19668 | -| time_elapsed | 106338 | -| total_timesteps | 2517504 | -| train/ | | -| approx_kl | 0.011772713 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.233 | -| learning_rate | 0.0003 | -| loss | -0.00549 | -| n_updates | 196670 | -| policy_gradient_loss | 0.0118 | -| std | 0.00773 | -| value_loss | 4.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19669 | -| time_elapsed | 106343 | -| total_timesteps | 2517632 | -| train/ | | -| approx_kl | 0.023348067 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00947 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 196680 | -| policy_gradient_loss | 0.0419 | -| std | 0.00773 | -| value_loss | 2.55e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19670 | -| time_elapsed | 106346 | -| total_timesteps | 2517760 | -| train/ | | -| approx_kl | 0.12885582 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.0466 | -| n_updates | 196690 | -| policy_gradient_loss | 0.0298 | -| std | 0.00773 | -| value_loss | 2.09e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 19671 | -| time_elapsed | 106350 | -| total_timesteps | 2517888 | -| train/ | | -| approx_kl | 0.0030465582 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.0068 | -| n_updates | 196700 | -| policy_gradient_loss | 0.00288 | -| std | 0.00773 | -| value_loss | 1.57e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19672 | -| time_elapsed | 106354 | -| total_timesteps | 2518016 | -| train/ | | -| approx_kl | 3.8815197e-05 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.000841 | -| n_updates | 196710 | -| policy_gradient_loss | 0.00184 | -| std | 0.00773 | -| value_loss | 1.28e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19673 | -| time_elapsed | 106366 | -| total_timesteps | 2518144 | -| train/ | | -| approx_kl | 0.012340901 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.0081 | -| n_updates | 196720 | -| policy_gradient_loss | 0.0361 | -| std | 0.00773 | -| value_loss | 0.000126 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19674 | -| time_elapsed | 106372 | -| total_timesteps | 2518272 | -| train/ | | -| approx_kl | 0.06869178 | -| clip_fraction | 0.586 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0789 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 196730 | -| policy_gradient_loss | 0.0456 | -| std | 0.00772 | -| value_loss | 9.65e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19675 | -| time_elapsed | 106376 | -| total_timesteps | 2518400 | -| train/ | | -| approx_kl | 0.00011426117 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | -0.000253 | -| n_updates | 196740 | -| policy_gradient_loss | 0.0764 | -| std | 0.00772 | -| value_loss | 1.11e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19676 | -| time_elapsed | 106381 | -| total_timesteps | 2518528 | -| train/ | | -| approx_kl | 0.018571239 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 196750 | -| policy_gradient_loss | 0.039 | -| std | 0.00772 | -| value_loss | 4.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19677 | -| time_elapsed | 106385 | -| total_timesteps | 2518656 | -| train/ | | -| approx_kl | 0.079199664 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0478 | -| n_updates | 196760 | -| policy_gradient_loss | 0.0234 | -| std | 0.00772 | -| value_loss | 5.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19678 | -| time_elapsed | 106389 | -| total_timesteps | 2518784 | -| train/ | | -| approx_kl | 0.084550925 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.01 | -| learning_rate | 0.0003 | -| loss | 0.0393 | -| n_updates | 196770 | -| policy_gradient_loss | 0.0154 | -| std | 0.00772 | -| value_loss | 2.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19679 | -| time_elapsed | 106395 | -| total_timesteps | 2518912 | -| train/ | | -| approx_kl | 0.011026251 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00168 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 196780 | -| policy_gradient_loss | -0.00492 | -| std | 0.00773 | -| value_loss | 3.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19680 | -| time_elapsed | 106399 | -| total_timesteps | 2519040 | -| train/ | | -| approx_kl | 0.00985736 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 196790 | -| policy_gradient_loss | -0.00664 | -| std | 0.00773 | -| value_loss | 2.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19681 | -| time_elapsed | 106409 | -| total_timesteps | 2519168 | -| train/ | | -| approx_kl | 0.011078135 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 196800 | -| policy_gradient_loss | 0.00126 | -| std | 0.00773 | -| value_loss | 0.00213 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19682 | -| time_elapsed | 106414 | -| total_timesteps | 2519296 | -| train/ | | -| approx_kl | 0.003382911 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 196810 | -| policy_gradient_loss | 0.0297 | -| std | 0.00773 | -| value_loss | 1.32e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19683 | -| time_elapsed | 106418 | -| total_timesteps | 2519424 | -| train/ | | -| approx_kl | 0.3158437 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00615 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 196820 | -| policy_gradient_loss | 0.0426 | -| std | 0.00773 | -| value_loss | 9.69e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19684 | -| time_elapsed | 106422 | -| total_timesteps | 2519552 | -| train/ | | -| approx_kl | 1.3167039e-05 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | 0.000386 | -| n_updates | 196830 | -| policy_gradient_loss | 0.00466 | -| std | 0.00773 | -| value_loss | 1.16e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19685 | -| time_elapsed | 106427 | -| total_timesteps | 2519680 | -| train/ | | -| approx_kl | 0.006149824 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 196840 | -| policy_gradient_loss | 0.00216 | -| std | 0.00773 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19686 | -| time_elapsed | 106434 | -| total_timesteps | 2519808 | -| train/ | | -| approx_kl | 0.024078663 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.4 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 196850 | -| policy_gradient_loss | 0.0452 | -| std | 0.00773 | -| value_loss | 2.15e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19687 | -| time_elapsed | 106439 | -| total_timesteps | 2519936 | -| train/ | | -| approx_kl | 0.0598356 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0085 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 196860 | -| policy_gradient_loss | 0.0686 | -| std | 0.00773 | -| value_loss | 1.17e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19688 | -| time_elapsed | 106443 | -| total_timesteps | 2520064 | -| train/ | | -| approx_kl | 0.012273296 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 196870 | -| policy_gradient_loss | 0.012 | -| std | 0.00773 | -| value_loss | 9.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19689 | -| time_elapsed | 106452 | -| total_timesteps | 2520192 | -| train/ | | -| approx_kl | 0.008917648 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.0264 | -| n_updates | 196880 | -| policy_gradient_loss | -0.0207 | -| std | 0.00773 | -| value_loss | 0.000677 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19690 | -| time_elapsed | 106459 | -| total_timesteps | 2520320 | -| train/ | | -| approx_kl | 0.009144658 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.00109 | -| n_updates | 196890 | -| policy_gradient_loss | 0.0748 | -| std | 0.00772 | -| value_loss | 3.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19691 | -| time_elapsed | 106464 | -| total_timesteps | 2520448 | -| train/ | | -| approx_kl | 0.010042849 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 196900 | -| policy_gradient_loss | 0.0116 | -| std | 0.00772 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19692 | -| time_elapsed | 106469 | -| total_timesteps | 2520576 | -| train/ | | -| approx_kl | 0.033924032 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 196910 | -| policy_gradient_loss | 0.0553 | -| std | 0.00773 | -| value_loss | 3.64e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19693 | -| time_elapsed | 106472 | -| total_timesteps | 2520704 | -| train/ | | -| approx_kl | 0.0032983813 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 196920 | -| policy_gradient_loss | 0.0579 | -| std | 0.00773 | -| value_loss | 8.14e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19694 | -| time_elapsed | 106475 | -| total_timesteps | 2520832 | -| train/ | | -| approx_kl | 0.020243866 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.000412 | -| n_updates | 196930 | -| policy_gradient_loss | 0.0169 | -| std | 0.00773 | -| value_loss | 6.61e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 19695 | -| time_elapsed | 106478 | -| total_timesteps | 2520960 | -| train/ | | -| approx_kl | 0.033779006 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0558 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 196940 | -| policy_gradient_loss | 0.0314 | -| std | 0.00774 | -| value_loss | 3.47e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19696 | -| time_elapsed | 106482 | -| total_timesteps | 2521088 | -| train/ | | -| approx_kl | 0.21264865 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 196950 | -| policy_gradient_loss | 0.114 | -| std | 0.00774 | -| value_loss | 2.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19697 | -| time_elapsed | 106492 | -| total_timesteps | 2521216 | -| train/ | | -| approx_kl | 0.007101618 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.722 | -| learning_rate | 0.0003 | -| loss | -0.0044 | -| n_updates | 196960 | -| policy_gradient_loss | 0.0569 | -| std | 0.00774 | -| value_loss | 0.00802 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19698 | -| time_elapsed | 106497 | -| total_timesteps | 2521344 | -| train/ | | -| approx_kl | 0.0035540233 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 196970 | -| policy_gradient_loss | 0.0244 | -| std | 0.00774 | -| value_loss | 3.08e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19699 | -| time_elapsed | 106502 | -| total_timesteps | 2521472 | -| train/ | | -| approx_kl | 0.022259846 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 196980 | -| policy_gradient_loss | 0.028 | -| std | 0.00774 | -| value_loss | 2.05e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19700 | -| time_elapsed | 106507 | -| total_timesteps | 2521600 | -| train/ | | -| approx_kl | 0.14466125 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.966 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 196990 | -| policy_gradient_loss | 0.0303 | -| std | 0.00774 | -| value_loss | 5.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19701 | -| time_elapsed | 106511 | -| total_timesteps | 2521728 | -| train/ | | -| approx_kl | 0.002974955 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00127 | -| n_updates | 197000 | -| policy_gradient_loss | 0.0133 | -| std | 0.00774 | -| value_loss | 2.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19702 | -| time_elapsed | 106515 | -| total_timesteps | 2521856 | -| train/ | | -| approx_kl | 0.058009427 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 197010 | -| policy_gradient_loss | 0.0521 | -| std | 0.00773 | -| value_loss | 1.5e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19703 | -| time_elapsed | 106519 | -| total_timesteps | 2521984 | -| train/ | | -| approx_kl | 5.665375e-05 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | -0.000132 | -| n_updates | 197020 | -| policy_gradient_loss | 0.0696 | -| std | 0.00774 | -| value_loss | 1.18e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19704 | -| time_elapsed | 106523 | -| total_timesteps | 2522112 | -| train/ | | -| approx_kl | 0.018678704 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 197030 | -| policy_gradient_loss | 0.0277 | -| std | 0.00774 | -| value_loss | 1.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19705 | -| time_elapsed | 106535 | -| total_timesteps | 2522240 | -| train/ | | -| approx_kl | 0.18883944 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 197040 | -| policy_gradient_loss | 0.0318 | -| std | 0.00774 | -| value_loss | 0.000418 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19706 | -| time_elapsed | 106540 | -| total_timesteps | 2522368 | -| train/ | | -| approx_kl | 0.12552075 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0845 | -| learning_rate | 0.0003 | -| loss | 0.0844 | -| n_updates | 197050 | -| policy_gradient_loss | 0.0857 | -| std | 0.00774 | -| value_loss | 4.51e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19707 | -| time_elapsed | 106545 | -| total_timesteps | 2522496 | -| train/ | | -| approx_kl | 0.021046115 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00443 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 197060 | -| policy_gradient_loss | 0.0114 | -| std | 0.00774 | -| value_loss | 1.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19708 | -| time_elapsed | 106550 | -| total_timesteps | 2522624 | -| train/ | | -| approx_kl | 0.12302846 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00741 | -| learning_rate | 0.0003 | -| loss | 0.0638 | -| n_updates | 197070 | -| policy_gradient_loss | 0.0165 | -| std | 0.00775 | -| value_loss | 3.94e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19709 | -| time_elapsed | 106555 | -| total_timesteps | 2522752 | -| train/ | | -| approx_kl | 0.016516421 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | -0.00578 | -| n_updates | 197080 | -| policy_gradient_loss | 0.014 | -| std | 0.00775 | -| value_loss | 3.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19710 | -| time_elapsed | 106560 | -| total_timesteps | 2522880 | -| train/ | | -| approx_kl | 0.24964663 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 197090 | -| policy_gradient_loss | 0.143 | -| std | 0.00774 | -| value_loss | 1.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19711 | -| time_elapsed | 106567 | -| total_timesteps | 2523008 | -| train/ | | -| approx_kl | 0.038439464 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0704 | -| learning_rate | 0.0003 | -| loss | 0.029 | -| n_updates | 197100 | -| policy_gradient_loss | 0.0219 | -| std | 0.00774 | -| value_loss | 1.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19712 | -| time_elapsed | 106580 | -| total_timesteps | 2523136 | -| train/ | | -| approx_kl | 0.014237021 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.844 | -| learning_rate | 0.0003 | -| loss | -0.0285 | -| n_updates | 197110 | -| policy_gradient_loss | -0.0152 | -| std | 0.00774 | -| value_loss | 0.00344 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19713 | -| time_elapsed | 106585 | -| total_timesteps | 2523264 | -| train/ | | -| approx_kl | 0.0071284226 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0541 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 197120 | -| policy_gradient_loss | 0.00708 | -| std | 0.00774 | -| value_loss | 0.00559 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19714 | -| time_elapsed | 106590 | -| total_timesteps | 2523392 | -| train/ | | -| approx_kl | 0.41834685 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 197130 | -| policy_gradient_loss | 0.0365 | -| std | 0.00774 | -| value_loss | 6.81e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19715 | -| time_elapsed | 106594 | -| total_timesteps | 2523520 | -| train/ | | -| approx_kl | 0.010023699 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00867 | -| learning_rate | 0.0003 | -| loss | -0.00823 | -| n_updates | 197140 | -| policy_gradient_loss | 0.00144 | -| std | 0.00774 | -| value_loss | 1.39e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19716 | -| time_elapsed | 106599 | -| total_timesteps | 2523648 | -| train/ | | -| approx_kl | 0.0025161942 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 197150 | -| policy_gradient_loss | 0.00659 | -| std | 0.00774 | -| value_loss | 5.59e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19717 | -| time_elapsed | 106604 | -| total_timesteps | 2523776 | -| train/ | | -| approx_kl | 0.06575397 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0641 | -| learning_rate | 0.0003 | -| loss | 0.0351 | -| n_updates | 197160 | -| policy_gradient_loss | 0.00816 | -| std | 0.00774 | -| value_loss | 4.87e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 19718 | -| time_elapsed | 106608 | -| total_timesteps | 2523904 | -| train/ | | -| approx_kl | 0.027643884 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.0041 | -| n_updates | 197170 | -| policy_gradient_loss | 0.0234 | -| std | 0.00774 | -| value_loss | 3.57e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19719 | -| time_elapsed | 106613 | -| total_timesteps | 2524032 | -| train/ | | -| approx_kl | 0.46908644 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 197180 | -| policy_gradient_loss | 0.127 | -| std | 0.00774 | -| value_loss | 2.86e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19720 | -| time_elapsed | 106625 | -| total_timesteps | 2524160 | -| train/ | | -| approx_kl | 0.013272919 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.0251 | -| n_updates | 197190 | -| policy_gradient_loss | -0.00921 | -| std | 0.00774 | -| value_loss | 0.000142 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19721 | -| time_elapsed | 106629 | -| total_timesteps | 2524288 | -| train/ | | -| approx_kl | 0.4536418 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0838 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 197200 | -| policy_gradient_loss | 0.0606 | -| std | 0.00773 | -| value_loss | 8.3e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19722 | -| time_elapsed | 106632 | -| total_timesteps | 2524416 | -| train/ | | -| approx_kl | 8.407049e-06 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0609 | -| learning_rate | 0.0003 | -| loss | 0.000336 | -| n_updates | 197210 | -| policy_gradient_loss | 0.00322 | -| std | 0.00773 | -| value_loss | 6.44e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19723 | -| time_elapsed | 106636 | -| total_timesteps | 2524544 | -| train/ | | -| approx_kl | 0.034598242 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 197220 | -| policy_gradient_loss | 0.0103 | -| std | 0.00772 | -| value_loss | 3.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19724 | -| time_elapsed | 106641 | -| total_timesteps | 2524672 | -| train/ | | -| approx_kl | 0.005690506 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | -0.00655 | -| n_updates | 197230 | -| policy_gradient_loss | 0.00278 | -| std | 0.00771 | -| value_loss | 2.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19725 | -| time_elapsed | 106645 | -| total_timesteps | 2524800 | -| train/ | | -| approx_kl | 0.024216386 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 197240 | -| policy_gradient_loss | 0.0785 | -| std | 0.00771 | -| value_loss | 4.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 19726 | -| time_elapsed | 106649 | -| total_timesteps | 2524928 | -| train/ | | -| approx_kl | 0.07012257 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0524 | -| n_updates | 197250 | -| policy_gradient_loss | 0.0896 | -| std | 0.00771 | -| value_loss | 1.65e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19727 | -| time_elapsed | 106653 | -| total_timesteps | 2525056 | -| train/ | | -| approx_kl | 0.017193178 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | -0.00711 | -| n_updates | 197260 | -| policy_gradient_loss | 0.0166 | -| std | 0.00771 | -| value_loss | 1.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19728 | -| time_elapsed | 106662 | -| total_timesteps | 2525184 | -| train/ | | -| approx_kl | 0.055282325 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.00899 | -| n_updates | 197270 | -| policy_gradient_loss | 0.00529 | -| std | 0.00771 | -| value_loss | 0.00543 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19729 | -| time_elapsed | 106668 | -| total_timesteps | 2525312 | -| train/ | | -| approx_kl | 0.000923553 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0776 | -| learning_rate | 0.0003 | -| loss | 0.000215 | -| n_updates | 197280 | -| policy_gradient_loss | 0.00497 | -| std | 0.00771 | -| value_loss | 3.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19730 | -| time_elapsed | 106672 | -| total_timesteps | 2525440 | -| train/ | | -| approx_kl | 0.046138715 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 197290 | -| policy_gradient_loss | 0.00651 | -| std | 0.00771 | -| value_loss | 1.61e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19731 | -| time_elapsed | 106677 | -| total_timesteps | 2525568 | -| train/ | | -| approx_kl | 0.6654974 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.331 | -| learning_rate | 0.0003 | -| loss | 0.216 | -| n_updates | 197300 | -| policy_gradient_loss | 0.129 | -| std | 0.00771 | -| value_loss | 2.28e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19732 | -| time_elapsed | 106681 | -| total_timesteps | 2525696 | -| train/ | | -| approx_kl | 0.017757077 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 197310 | -| policy_gradient_loss | 0.0133 | -| std | 0.00771 | -| value_loss | 1.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19733 | -| time_elapsed | 106686 | -| total_timesteps | 2525824 | -| train/ | | -| approx_kl | 0.18354338 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 197320 | -| policy_gradient_loss | 0.145 | -| std | 0.00771 | -| value_loss | 1.26e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 19734 | -| time_elapsed | 106691 | -| total_timesteps | 2525952 | -| train/ | | -| approx_kl | 0.03478125 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 197330 | -| policy_gradient_loss | 0.0247 | -| std | 0.00771 | -| value_loss | 1.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19735 | -| time_elapsed | 106695 | -| total_timesteps | 2526080 | -| train/ | | -| approx_kl | 0.57542694 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 197340 | -| policy_gradient_loss | 0.061 | -| std | 0.00771 | -| value_loss | 7.35e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19736 | -| time_elapsed | 106706 | -| total_timesteps | 2526208 | -| train/ | | -| approx_kl | 0.01668778 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 197350 | -| policy_gradient_loss | 0.00348 | -| std | 0.00771 | -| value_loss | 0.00443 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19737 | -| time_elapsed | 106710 | -| total_timesteps | 2526336 | -| train/ | | -| approx_kl | 0.0010950691 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 197360 | -| policy_gradient_loss | 0.0244 | -| std | 0.00771 | -| value_loss | 3.1e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19738 | -| time_elapsed | 106714 | -| total_timesteps | 2526464 | -| train/ | | -| approx_kl | 0.37835544 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00218 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 197370 | -| policy_gradient_loss | 0.0493 | -| std | 0.00771 | -| value_loss | 4.59e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19739 | -| time_elapsed | 106719 | -| total_timesteps | 2526592 | -| train/ | | -| approx_kl | 4.1350722e-07 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.000103 | -| n_updates | 197380 | -| policy_gradient_loss | 0.000422 | -| std | 0.00771 | -| value_loss | 2.44e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19740 | -| time_elapsed | 106724 | -| total_timesteps | 2526720 | -| train/ | | -| approx_kl | 0.03839768 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0606 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 197390 | -| policy_gradient_loss | -0.00419 | -| std | 0.00771 | -| value_loss | 1.95e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19741 | -| time_elapsed | 106727 | -| total_timesteps | 2526848 | -| train/ | | -| approx_kl | 0.043541107 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 197400 | -| policy_gradient_loss | 0.0145 | -| std | 0.00771 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19742 | -| time_elapsed | 106732 | -| total_timesteps | 2526976 | -| train/ | | -| approx_kl | 0.034503777 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 197410 | -| policy_gradient_loss | 0.0089 | -| std | 0.0077 | -| value_loss | 7.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19743 | -| time_elapsed | 106737 | -| total_timesteps | 2527104 | -| train/ | | -| approx_kl | 0.034123056 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 197420 | -| policy_gradient_loss | 0.00527 | -| std | 0.0077 | -| value_loss | 5.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19744 | -| time_elapsed | 106750 | -| total_timesteps | 2527232 | -| train/ | | -| approx_kl | 0.02424484 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 197430 | -| policy_gradient_loss | -0.0108 | -| std | 0.0077 | -| value_loss | 0.000298 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19745 | -| time_elapsed | 106756 | -| total_timesteps | 2527360 | -| train/ | | -| approx_kl | 0.6946544 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.376 | -| learning_rate | 0.0003 | -| loss | 0.197 | -| n_updates | 197440 | -| policy_gradient_loss | 0.143 | -| std | 0.0077 | -| value_loss | 5.64e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19746 | -| time_elapsed | 106762 | -| total_timesteps | 2527488 | -| train/ | | -| approx_kl | 0.015121749 | -| clip_fraction | 0.0883 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.457 | -| learning_rate | 0.0003 | -| loss | -0.00272 | -| n_updates | 197450 | -| policy_gradient_loss | -0.00226 | -| std | 0.00769 | -| value_loss | 3.31e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19747 | -| time_elapsed | 106767 | -| total_timesteps | 2527616 | -| train/ | | -| approx_kl | 0.016862558 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0732 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 197460 | -| policy_gradient_loss | 0.012 | -| std | 0.00769 | -| value_loss | 2.42e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19748 | -| time_elapsed | 106773 | -| total_timesteps | 2527744 | -| train/ | | -| approx_kl | 0.07236563 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00176 | -| learning_rate | 0.0003 | -| loss | 0.0363 | -| n_updates | 197470 | -| policy_gradient_loss | 0.0189 | -| std | 0.00769 | -| value_loss | 8.94e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 19749 | -| time_elapsed | 106779 | -| total_timesteps | 2527872 | -| train/ | | -| approx_kl | 0.00016751094 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.000293 | -| n_updates | 197480 | -| policy_gradient_loss | 0.0236 | -| std | 0.00769 | -| value_loss | 5e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19750 | -| time_elapsed | 106784 | -| total_timesteps | 2528000 | -| train/ | | -| approx_kl | 0.00047683623 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 197490 | -| policy_gradient_loss | 0.001 | -| std | 0.00768 | -| value_loss | 4.59e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19751 | -| time_elapsed | 106789 | -| total_timesteps | 2528128 | -| train/ | | -| approx_kl | 0.17327671 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00503 | -| learning_rate | 0.0003 | -| loss | 0.0754 | -| n_updates | 197500 | -| policy_gradient_loss | 0.0969 | -| std | 0.00769 | -| value_loss | 1.7e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19752 | -| time_elapsed | 106799 | -| total_timesteps | 2528256 | -| train/ | | -| approx_kl | 0.042726837 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.683 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 197510 | -| policy_gradient_loss | -0.00208 | -| std | 0.00769 | -| value_loss | 0.00114 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19753 | -| time_elapsed | 106803 | -| total_timesteps | 2528384 | -| train/ | | -| approx_kl | 0.06910005 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 0.0499 | -| n_updates | 197520 | -| policy_gradient_loss | 0.0497 | -| std | 0.00769 | -| value_loss | 1.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19754 | -| time_elapsed | 106806 | -| total_timesteps | 2528512 | -| train/ | | -| approx_kl | 0.26955637 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | 0.0607 | -| n_updates | 197530 | -| policy_gradient_loss | 0.00492 | -| std | 0.00769 | -| value_loss | 3.66e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19755 | -| time_elapsed | 106809 | -| total_timesteps | 2528640 | -| train/ | | -| approx_kl | 0.030983876 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.426 | -| learning_rate | 0.0003 | -| loss | 0.00902 | -| n_updates | 197540 | -| policy_gradient_loss | -0.000414 | -| std | 0.00769 | -| value_loss | 7.76e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19756 | -| time_elapsed | 106813 | -| total_timesteps | 2528768 | -| train/ | | -| approx_kl | 0.012725718 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00107 | -| n_updates | 197550 | -| policy_gradient_loss | 0.0178 | -| std | 0.00769 | -| value_loss | 7.2e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 19757 | -| time_elapsed | 106818 | -| total_timesteps | 2528896 | -| train/ | | -| approx_kl | 0.2032744 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 197560 | -| policy_gradient_loss | 0.0997 | -| std | 0.0077 | -| value_loss | 4.3e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19758 | -| time_elapsed | 106823 | -| total_timesteps | 2529024 | -| train/ | | -| approx_kl | 0.13395056 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.0785 | -| n_updates | 197570 | -| policy_gradient_loss | 0.0896 | -| std | 0.0077 | -| value_loss | 2.42e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19759 | -| time_elapsed | 106833 | -| total_timesteps | 2529152 | -| train/ | | -| approx_kl | 0.022416173 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 197580 | -| policy_gradient_loss | -0.00846 | -| std | 0.0077 | -| value_loss | 0.00247 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19760 | -| time_elapsed | 106838 | -| total_timesteps | 2529280 | -| train/ | | -| approx_kl | 0.03756065 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.00321 | -| n_updates | 197590 | -| policy_gradient_loss | 0.0178 | -| std | 0.00771 | -| value_loss | 1.88e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19761 | -| time_elapsed | 106844 | -| total_timesteps | 2529408 | -| train/ | | -| approx_kl | 0.09735895 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00457 | -| learning_rate | 0.0003 | -| loss | 0.078 | -| n_updates | 197600 | -| policy_gradient_loss | 0.0471 | -| std | 0.00771 | -| value_loss | 2.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19762 | -| time_elapsed | 106848 | -| total_timesteps | 2529536 | -| train/ | | -| approx_kl | 0.029742897 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 197610 | -| policy_gradient_loss | 0.0374 | -| std | 0.00771 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19763 | -| time_elapsed | 106852 | -| total_timesteps | 2529664 | -| train/ | | -| approx_kl | 0.11899872 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0869 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 197620 | -| policy_gradient_loss | 0.0513 | -| std | 0.00771 | -| value_loss | 7.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19764 | -| time_elapsed | 106858 | -| total_timesteps | 2529792 | -| train/ | | -| approx_kl | 0.027244363 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 197630 | -| policy_gradient_loss | 0.0158 | -| std | 0.00771 | -| value_loss | 6.07e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19765 | -| time_elapsed | 106864 | -| total_timesteps | 2529920 | -| train/ | | -| approx_kl | 0.11103257 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.0775 | -| n_updates | 197640 | -| policy_gradient_loss | 0.0464 | -| std | 0.00771 | -| value_loss | 3.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19766 | -| time_elapsed | 106870 | -| total_timesteps | 2530048 | -| train/ | | -| approx_kl | 0.004987354 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 197650 | -| policy_gradient_loss | 0.00476 | -| std | 0.00771 | -| value_loss | 3.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19767 | -| time_elapsed | 106881 | -| total_timesteps | 2530176 | -| train/ | | -| approx_kl | 0.10900815 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 197660 | -| policy_gradient_loss | -0.00853 | -| std | 0.00771 | -| value_loss | 0.000695 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19768 | -| time_elapsed | 106886 | -| total_timesteps | 2530304 | -| train/ | | -| approx_kl | 0.010224469 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00372 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 197670 | -| policy_gradient_loss | 0.0322 | -| std | 0.00771 | -| value_loss | 1.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19769 | -| time_elapsed | 106891 | -| total_timesteps | 2530432 | -| train/ | | -| approx_kl | 0.18062925 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0068 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 197680 | -| policy_gradient_loss | 0.0997 | -| std | 0.00771 | -| value_loss | 4.19e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19770 | -| time_elapsed | 106897 | -| total_timesteps | 2530560 | -| train/ | | -| approx_kl | 0.11848512 | -| clip_fraction | 0.656 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 197690 | -| policy_gradient_loss | 0.104 | -| std | 0.00771 | -| value_loss | 2.48e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19771 | -| time_elapsed | 106903 | -| total_timesteps | 2530688 | -| train/ | | -| approx_kl | 0.021701783 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 197700 | -| policy_gradient_loss | 0.0149 | -| std | 0.00771 | -| value_loss | 2.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19772 | -| time_elapsed | 106908 | -| total_timesteps | 2530816 | -| train/ | | -| approx_kl | 0.39243424 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 197710 | -| policy_gradient_loss | 0.0286 | -| std | 0.00771 | -| value_loss | 1.02e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 19773 | -| time_elapsed | 106913 | -| total_timesteps | 2530944 | -| train/ | | -| approx_kl | 0.0070125614 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.073 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 197720 | -| policy_gradient_loss | 0.0048 | -| std | 0.00772 | -| value_loss | 7.93e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19774 | -| time_elapsed | 106917 | -| total_timesteps | 2531072 | -| train/ | | -| approx_kl | 0.0017185989 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 197730 | -| policy_gradient_loss | 0.00607 | -| std | 0.00771 | -| value_loss | 5.06e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19775 | -| time_elapsed | 106925 | -| total_timesteps | 2531200 | -| train/ | | -| approx_kl | 0.17276089 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.43 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 197740 | -| policy_gradient_loss | -0.00338 | -| std | 0.00771 | -| value_loss | 0.00153 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19776 | -| time_elapsed | 106930 | -| total_timesteps | 2531328 | -| train/ | | -| approx_kl | 0.03090333 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -1.61 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 197750 | -| policy_gradient_loss | 0.0267 | -| std | 0.00771 | -| value_loss | 5.23e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19777 | -| time_elapsed | 106935 | -| total_timesteps | 2531456 | -| train/ | | -| approx_kl | 0.1076421 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0717 | -| n_updates | 197760 | -| policy_gradient_loss | 0.0487 | -| std | 0.0077 | -| value_loss | 1.48e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19778 | -| time_elapsed | 106939 | -| total_timesteps | 2531584 | -| train/ | | -| approx_kl | 0.0043115593 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.0086 | -| n_updates | 197770 | -| policy_gradient_loss | 0.00485 | -| std | 0.0077 | -| value_loss | 1.45e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19779 | -| time_elapsed | 106944 | -| total_timesteps | 2531712 | -| train/ | | -| approx_kl | 0.02292448 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.000616 | -| learning_rate | 0.0003 | -| loss | 0.00259 | -| n_updates | 197780 | -| policy_gradient_loss | 0.0289 | -| std | 0.00769 | -| value_loss | 7.42e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19780 | -| time_elapsed | 106948 | -| total_timesteps | 2531840 | -| train/ | | -| approx_kl | 0.113149956 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00967 | -| learning_rate | 0.0003 | -| loss | 0.0903 | -| n_updates | 197790 | -| policy_gradient_loss | 0.0527 | -| std | 0.00768 | -| value_loss | 2.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19781 | -| time_elapsed | 106952 | -| total_timesteps | 2531968 | -| train/ | | -| approx_kl | 0.02810064 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 197800 | -| policy_gradient_loss | 0.0234 | -| std | 0.00768 | -| value_loss | 1.31e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19782 | -| time_elapsed | 106955 | -| total_timesteps | 2532096 | -| train/ | | -| approx_kl | 0.67091227 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.286 | -| n_updates | 197810 | -| policy_gradient_loss | 0.148 | -| std | 0.00768 | -| value_loss | 1.01e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19783 | -| time_elapsed | 106964 | -| total_timesteps | 2532224 | -| train/ | | -| approx_kl | 0.020603586 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 197820 | -| policy_gradient_loss | -0.00245 | -| std | 0.00769 | -| value_loss | 0.00186 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19784 | -| time_elapsed | 106969 | -| total_timesteps | 2532352 | -| train/ | | -| approx_kl | 0.11227082 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.0784 | -| n_updates | 197830 | -| policy_gradient_loss | 0.0547 | -| std | 0.00769 | -| value_loss | 9.02e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19785 | -| time_elapsed | 106973 | -| total_timesteps | 2532480 | -| train/ | | -| approx_kl | 0.27131563 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00822 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 197840 | -| policy_gradient_loss | 0.101 | -| std | 0.00769 | -| value_loss | 8.35e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19786 | -| time_elapsed | 106978 | -| total_timesteps | 2532608 | -| train/ | | -| approx_kl | 0.0574124 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 197850 | -| policy_gradient_loss | 0.023 | -| std | 0.0077 | -| value_loss | 4.99e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19787 | -| time_elapsed | 106982 | -| total_timesteps | 2532736 | -| train/ | | -| approx_kl | 0.3758233 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 197860 | -| policy_gradient_loss | 0.0474 | -| std | 0.0077 | -| value_loss | 3.86e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19788 | -| time_elapsed | 106988 | -| total_timesteps | 2532864 | -| train/ | | -| approx_kl | 0.010317557 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00333 | -| n_updates | 197870 | -| policy_gradient_loss | 0.00283 | -| std | 0.0077 | -| value_loss | 2.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19789 | -| time_elapsed | 106993 | -| total_timesteps | 2532992 | -| train/ | | -| approx_kl | 0.04571389 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.00385 | -| n_updates | 197880 | -| policy_gradient_loss | -0.00461 | -| std | 0.0077 | -| value_loss | 1.39e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19790 | -| time_elapsed | 106996 | -| total_timesteps | 2533120 | -| train/ | | -| approx_kl | 0.03569147 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 197890 | -| policy_gradient_loss | 0.0171 | -| std | 0.0077 | -| value_loss | 8.52e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19791 | -| time_elapsed | 107011 | -| total_timesteps | 2533248 | -| train/ | | -| approx_kl | 0.0006557 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 197900 | -| policy_gradient_loss | -0.00123 | -| std | 0.0077 | -| value_loss | 0.00139 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19792 | -| time_elapsed | 107016 | -| total_timesteps | 2533376 | -| train/ | | -| approx_kl | 5.8544334e-05 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.000327 | -| n_updates | 197910 | -| policy_gradient_loss | 0.0274 | -| std | 0.00769 | -| value_loss | 1.03e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19793 | -| time_elapsed | 107021 | -| total_timesteps | 2533504 | -| train/ | | -| approx_kl | 0.0063723368 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | 0.008 | -| n_updates | 197920 | -| policy_gradient_loss | 0.0174 | -| std | 0.00768 | -| value_loss | 1.43e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19794 | -| time_elapsed | 107026 | -| total_timesteps | 2533632 | -| train/ | | -| approx_kl | 0.053930953 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 197930 | -| policy_gradient_loss | 0.00735 | -| std | 0.00767 | -| value_loss | 5.52e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19795 | -| time_elapsed | 107031 | -| total_timesteps | 2533760 | -| train/ | | -| approx_kl | 0.21742254 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0887 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 197940 | -| policy_gradient_loss | 0.0374 | -| std | 0.00768 | -| value_loss | 1.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 19796 | -| time_elapsed | 107037 | -| total_timesteps | 2533888 | -| train/ | | -| approx_kl | 0.04658775 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.272 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 197950 | -| policy_gradient_loss | 0.0509 | -| std | 0.00768 | -| value_loss | 1.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19797 | -| time_elapsed | 107042 | -| total_timesteps | 2534016 | -| train/ | | -| approx_kl | 0.022913601 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 197960 | -| policy_gradient_loss | 0.00974 | -| std | 0.00768 | -| value_loss | 5.84e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19798 | -| time_elapsed | 107055 | -| total_timesteps | 2534144 | -| train/ | | -| approx_kl | 0.01330398 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.861 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 197970 | -| policy_gradient_loss | -0.00785 | -| std | 0.00767 | -| value_loss | 0.00278 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19799 | -| time_elapsed | 107059 | -| total_timesteps | 2534272 | -| train/ | | -| approx_kl | 0.011207692 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.485 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 197980 | -| policy_gradient_loss | 0.00349 | -| std | 0.00767 | -| value_loss | 4.23e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19800 | -| time_elapsed | 107065 | -| total_timesteps | 2534400 | -| train/ | | -| approx_kl | 0.04143464 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 197990 | -| policy_gradient_loss | 0.00766 | -| std | 0.00767 | -| value_loss | 1.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19801 | -| time_elapsed | 107069 | -| total_timesteps | 2534528 | -| train/ | | -| approx_kl | 0.009083862 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 198000 | -| policy_gradient_loss | 0.000727 | -| std | 0.00767 | -| value_loss | 9.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19802 | -| time_elapsed | 107074 | -| total_timesteps | 2534656 | -| train/ | | -| approx_kl | 0.02927984 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 198010 | -| policy_gradient_loss | 0.144 | -| std | 0.00767 | -| value_loss | 7.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19803 | -| time_elapsed | 107078 | -| total_timesteps | 2534784 | -| train/ | | -| approx_kl | 0.080564655 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | 0.0632 | -| n_updates | 198020 | -| policy_gradient_loss | 0.115 | -| std | 0.00767 | -| value_loss | 2.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 19804 | -| time_elapsed | 107082 | -| total_timesteps | 2534912 | -| train/ | | -| approx_kl | 0.094345994 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0786 | -| n_updates | 198030 | -| policy_gradient_loss | 0.0908 | -| std | 0.00767 | -| value_loss | 1.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19805 | -| time_elapsed | 107085 | -| total_timesteps | 2535040 | -| train/ | | -| approx_kl | 0.018628178 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 198040 | -| policy_gradient_loss | 0.0212 | -| std | 0.00768 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19806 | -| time_elapsed | 107095 | -| total_timesteps | 2535168 | -| train/ | | -| approx_kl | 0.042213526 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.7 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 198050 | -| policy_gradient_loss | -0.0152 | -| std | 0.00768 | -| value_loss | 0.00286 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19807 | -| time_elapsed | 107099 | -| total_timesteps | 2535296 | -| train/ | | -| approx_kl | 0.12634465 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 198060 | -| policy_gradient_loss | 0.0146 | -| std | 0.00768 | -| value_loss | 2.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19808 | -| time_elapsed | 107104 | -| total_timesteps | 2535424 | -| train/ | | -| approx_kl | 0.027258268 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.765 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 198070 | -| policy_gradient_loss | 0.0642 | -| std | 0.00768 | -| value_loss | 6.6e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19809 | -| time_elapsed | 107109 | -| total_timesteps | 2535552 | -| train/ | | -| approx_kl | 0.00081376266 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | -0.000446 | -| n_updates | 198080 | -| policy_gradient_loss | 0.00941 | -| std | 0.00766 | -| value_loss | 4.31e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19810 | -| time_elapsed | 107114 | -| total_timesteps | 2535680 | -| train/ | | -| approx_kl | 0.0008368287 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 198090 | -| policy_gradient_loss | 0.0218 | -| std | 0.00763 | -| value_loss | 5.31e-08 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19811 | -| time_elapsed | 107119 | -| total_timesteps | 2535808 | -| train/ | | -| approx_kl | 0.635558 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0023 | -| learning_rate | 0.0003 | -| loss | 0.263 | -| n_updates | 198100 | -| policy_gradient_loss | 0.113 | -| std | 0.00763 | -| value_loss | 2.14e-09 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 19812 | -| time_elapsed | 107124 | -| total_timesteps | 2535936 | -| train/ | | -| approx_kl | 0.008775173 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | -0.000994 | -| n_updates | 198110 | -| policy_gradient_loss | 0.0256 | -| std | 0.00762 | -| value_loss | 1.53e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19813 | -| time_elapsed | 107129 | -| total_timesteps | 2536064 | -| train/ | | -| approx_kl | 0.2609821 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 198120 | -| policy_gradient_loss | 0.12 | -| std | 0.00762 | -| value_loss | 1.07e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19814 | -| time_elapsed | 107139 | -| total_timesteps | 2536192 | -| train/ | | -| approx_kl | 0.1807683 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 198130 | -| policy_gradient_loss | 0.0206 | -| std | 0.00762 | -| value_loss | 0.00288 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19815 | -| time_elapsed | 107146 | -| total_timesteps | 2536320 | -| train/ | | -| approx_kl | 0.048871715 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.254 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 198140 | -| policy_gradient_loss | 0.0116 | -| std | 0.00762 | -| value_loss | 6.68e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19816 | -| time_elapsed | 107150 | -| total_timesteps | 2536448 | -| train/ | | -| approx_kl | 0.0027679014 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.00174 | -| n_updates | 198150 | -| policy_gradient_loss | 0.00491 | -| std | 0.00763 | -| value_loss | 7.28e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19817 | -| time_elapsed | 107155 | -| total_timesteps | 2536576 | -| train/ | | -| approx_kl | 0.15741274 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 198160 | -| policy_gradient_loss | 0.11 | -| std | 0.00763 | -| value_loss | 6.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19818 | -| time_elapsed | 107161 | -| total_timesteps | 2536704 | -| train/ | | -| approx_kl | 0.11692028 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.0624 | -| n_updates | 198170 | -| policy_gradient_loss | 0.086 | -| std | 0.00763 | -| value_loss | 2.67e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19819 | -| time_elapsed | 107165 | -| total_timesteps | 2536832 | -| train/ | | -| approx_kl | 0.016997471 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 198180 | -| policy_gradient_loss | 0.00653 | -| std | 0.00764 | -| value_loss | 1.6e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 19820 | -| time_elapsed | 107169 | -| total_timesteps | 2536960 | -| train/ | | -| approx_kl | 0.00048930524 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0478 | -| learning_rate | 0.0003 | -| loss | 0.00247 | -| n_updates | 198190 | -| policy_gradient_loss | 0.000996 | -| std | 0.00765 | -| value_loss | 7.16e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19821 | -| time_elapsed | 107173 | -| total_timesteps | 2537088 | -| train/ | | -| approx_kl | 0.12887056 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.505 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 198200 | -| policy_gradient_loss | 0.118 | -| std | 0.00765 | -| value_loss | 3.4e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19822 | -| time_elapsed | 107182 | -| total_timesteps | 2537216 | -| train/ | | -| approx_kl | 0.21290797 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -4.12 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 198210 | -| policy_gradient_loss | 0.0364 | -| std | 0.00765 | -| value_loss | 0.00382 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19823 | -| time_elapsed | 107187 | -| total_timesteps | 2537344 | -| train/ | | -| approx_kl | 0.03567738 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 198220 | -| policy_gradient_loss | 0.0196 | -| std | 0.00765 | -| value_loss | 2.09e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19824 | -| time_elapsed | 107192 | -| total_timesteps | 2537472 | -| train/ | | -| approx_kl | 0.3761871 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 6.17e-05 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 198230 | -| policy_gradient_loss | 0.0483 | -| std | 0.00765 | -| value_loss | 3.94e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19825 | -| time_elapsed | 107196 | -| total_timesteps | 2537600 | -| train/ | | -| approx_kl | 0.024809035 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.00364 | -| n_updates | 198240 | -| policy_gradient_loss | 0.00222 | -| std | 0.00765 | -| value_loss | 2.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19826 | -| time_elapsed | 107200 | -| total_timesteps | 2537728 | -| train/ | | -| approx_kl | 0.038775463 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 198250 | -| policy_gradient_loss | 0.00907 | -| std | 0.00765 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19827 | -| time_elapsed | 107204 | -| total_timesteps | 2537856 | -| train/ | | -| approx_kl | 0.027251871 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | 0.00415 | -| n_updates | 198260 | -| policy_gradient_loss | 0.00193 | -| std | 0.00766 | -| value_loss | 8.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 19828 | -| time_elapsed | 107211 | -| total_timesteps | 2537984 | -| train/ | | -| approx_kl | 0.00632258 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | -0.00767 | -| n_updates | 198270 | -| policy_gradient_loss | 0.00425 | -| std | 0.00766 | -| value_loss | 7.69e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19829 | -| time_elapsed | 107217 | -| total_timesteps | 2538112 | -| train/ | | -| approx_kl | 0.058535453 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 198280 | -| policy_gradient_loss | 0.00556 | -| std | 0.00766 | -| value_loss | 3.52e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19830 | -| time_elapsed | 107227 | -| total_timesteps | 2538240 | -| train/ | | -| approx_kl | 0.0076658046 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.549 | -| learning_rate | 0.0003 | -| loss | -0.0245 | -| n_updates | 198290 | -| policy_gradient_loss | -0.0121 | -| std | 0.00766 | -| value_loss | 0.00125 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19831 | -| time_elapsed | 107232 | -| total_timesteps | 2538368 | -| train/ | | -| approx_kl | 0.08747695 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0442 | -| n_updates | 198300 | -| policy_gradient_loss | 0.0502 | -| std | 0.00766 | -| value_loss | 2.42e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19832 | -| time_elapsed | 107237 | -| total_timesteps | 2538496 | -| train/ | | -| approx_kl | 0.14384167 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00023 | -| learning_rate | 0.0003 | -| loss | 0.0614 | -| n_updates | 198310 | -| policy_gradient_loss | 0.0249 | -| std | 0.00766 | -| value_loss | 2.41e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19833 | -| time_elapsed | 107242 | -| total_timesteps | 2538624 | -| train/ | | -| approx_kl | 0.0020918488 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | -0.00141 | -| n_updates | 198320 | -| policy_gradient_loss | 0.0106 | -| std | 0.00766 | -| value_loss | 1.57e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19834 | -| time_elapsed | 107247 | -| total_timesteps | 2538752 | -| train/ | | -| approx_kl | 3.1795353e-06 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | 0.000272 | -| n_updates | 198330 | -| policy_gradient_loss | 0.00139 | -| std | 0.00767 | -| value_loss | 1.52e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19835 | -| time_elapsed | 107252 | -| total_timesteps | 2538880 | -| train/ | | -| approx_kl | 0.048620958 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.000987 | -| n_updates | 198340 | -| policy_gradient_loss | 0.04 | -| std | 0.00767 | -| value_loss | 8.68e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19836 | -| time_elapsed | 107256 | -| total_timesteps | 2539008 | -| train/ | | -| approx_kl | 0.108103916 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.00422 | -| n_updates | 198350 | -| policy_gradient_loss | -0.00634 | -| std | 0.00767 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19837 | -| time_elapsed | 107270 | -| total_timesteps | 2539136 | -| train/ | | -| approx_kl | 0.009650892 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.00988 | -| n_updates | 198360 | -| policy_gradient_loss | 0.0179 | -| std | 0.00767 | -| value_loss | 3.42e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19838 | -| time_elapsed | 107275 | -| total_timesteps | 2539264 | -| train/ | | -| approx_kl | 0.001227743 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.569 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 198370 | -| policy_gradient_loss | 0.0534 | -| std | 0.00767 | -| value_loss | 4.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19839 | -| time_elapsed | 107280 | -| total_timesteps | 2539392 | -| train/ | | -| approx_kl | 0.019823126 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 198380 | -| policy_gradient_loss | 0.03 | -| std | 0.00767 | -| value_loss | 9.61e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19840 | -| time_elapsed | 107284 | -| total_timesteps | 2539520 | -| train/ | | -| approx_kl | 0.1818262 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00322 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 198390 | -| policy_gradient_loss | 0.0943 | -| std | 0.00767 | -| value_loss | 1.22e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19841 | -| time_elapsed | 107289 | -| total_timesteps | 2539648 | -| train/ | | -| approx_kl | 0.13819173 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.0911 | -| n_updates | 198400 | -| policy_gradient_loss | 0.101 | -| std | 0.00768 | -| value_loss | 7.11e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19842 | -| time_elapsed | 107294 | -| total_timesteps | 2539776 | -| train/ | | -| approx_kl | 0.09314222 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -3.43 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 198410 | -| policy_gradient_loss | 0.0578 | -| std | 0.00768 | -| value_loss | 3.59e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19843 | -| time_elapsed | 107298 | -| total_timesteps | 2539904 | -| train/ | | -| approx_kl | 0.11018586 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00875 | -| learning_rate | 0.0003 | -| loss | 0.0873 | -| n_updates | 198420 | -| policy_gradient_loss | 0.131 | -| std | 0.00768 | -| value_loss | 2.78e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19844 | -| time_elapsed | 107302 | -| total_timesteps | 2540032 | -| train/ | | -| approx_kl | 0.020594617 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 198430 | -| policy_gradient_loss | 0.0138 | -| std | 0.00768 | -| value_loss | 2.49e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19845 | -| time_elapsed | 107311 | -| total_timesteps | 2540160 | -| train/ | | -| approx_kl | 0.025911989 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.755 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 198440 | -| policy_gradient_loss | -0.0158 | -| std | 0.00768 | -| value_loss | 0.000816 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19846 | -| time_elapsed | 107315 | -| total_timesteps | 2540288 | -| train/ | | -| approx_kl | 0.010650177 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.028 | -| learning_rate | 0.0003 | -| loss | 0.000367 | -| n_updates | 198450 | -| policy_gradient_loss | 0.0224 | -| std | 0.00768 | -| value_loss | 9.12e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19847 | -| time_elapsed | 107320 | -| total_timesteps | 2540416 | -| train/ | | -| approx_kl | 0.07676673 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 198460 | -| policy_gradient_loss | 0.0171 | -| std | 0.00768 | -| value_loss | 1.32e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19848 | -| time_elapsed | 107324 | -| total_timesteps | 2540544 | -| train/ | | -| approx_kl | 0.09167989 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 198470 | -| policy_gradient_loss | 0.0132 | -| std | 0.00768 | -| value_loss | 7.06e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19849 | -| time_elapsed | 107326 | -| total_timesteps | 2540672 | -| train/ | | -| approx_kl | 0.15841277 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 198480 | -| policy_gradient_loss | 0.00769 | -| std | 0.00768 | -| value_loss | 4.29e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19850 | -| time_elapsed | 107329 | -| total_timesteps | 2540800 | -| train/ | | -| approx_kl | 0.03549929 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.0063 | -| n_updates | 198490 | -| policy_gradient_loss | 0.0162 | -| std | 0.00768 | -| value_loss | 3.07e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 19851 | -| time_elapsed | 107333 | -| total_timesteps | 2540928 | -| train/ | | -| approx_kl | 0.076697186 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 198500 | -| policy_gradient_loss | -0.0065 | -| std | 0.00768 | -| value_loss | 2.14e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19852 | -| time_elapsed | 107337 | -| total_timesteps | 2541056 | -| train/ | | -| approx_kl | 0.12387839 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.0657 | -| n_updates | 198510 | -| policy_gradient_loss | 0.0259 | -| std | 0.00769 | -| value_loss | 1.28e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19853 | -| time_elapsed | 107345 | -| total_timesteps | 2541184 | -| train/ | | -| approx_kl | 0.028601674 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 198520 | -| policy_gradient_loss | -0.00329 | -| std | 0.00769 | -| value_loss | 0.000256 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19854 | -| time_elapsed | 107349 | -| total_timesteps | 2541312 | -| train/ | | -| approx_kl | 0.023758776 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.00619 | -| n_updates | 198530 | -| policy_gradient_loss | 0.0212 | -| std | 0.00769 | -| value_loss | 6.97e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19855 | -| time_elapsed | 107355 | -| total_timesteps | 2541440 | -| train/ | | -| approx_kl | 0.07987651 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.34 | -| learning_rate | 0.0003 | -| loss | 0.0614 | -| n_updates | 198540 | -| policy_gradient_loss | 0.0283 | -| std | 0.00768 | -| value_loss | 2.87e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19856 | -| time_elapsed | 107360 | -| total_timesteps | 2541568 | -| train/ | | -| approx_kl | 0.2155729 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 198550 | -| policy_gradient_loss | 0.00894 | -| std | 0.00767 | -| value_loss | 1.06e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19857 | -| time_elapsed | 107366 | -| total_timesteps | 2541696 | -| train/ | | -| approx_kl | 0.041859396 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0796 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 198560 | -| policy_gradient_loss | 0.00183 | -| std | 0.00767 | -| value_loss | 2.19e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19858 | -| time_elapsed | 107370 | -| total_timesteps | 2541824 | -| train/ | | -| approx_kl | 0.21443023 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00846 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 198570 | -| policy_gradient_loss | 0.103 | -| std | 0.00767 | -| value_loss | 6.97e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19859 | -| time_elapsed | 107375 | -| total_timesteps | 2541952 | -| train/ | | -| approx_kl | 0.04221559 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 198580 | -| policy_gradient_loss | 0.0197 | -| std | 0.00767 | -| value_loss | 4.55e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19860 | -| time_elapsed | 107379 | -| total_timesteps | 2542080 | -| train/ | | -| approx_kl | 0.45861208 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0437 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 198590 | -| policy_gradient_loss | 0.0328 | -| std | 0.00767 | -| value_loss | 3.25e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19861 | -| time_elapsed | 107389 | -| total_timesteps | 2542208 | -| train/ | | -| approx_kl | 0.014189379 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 198600 | -| policy_gradient_loss | -0.00379 | -| std | 0.00767 | -| value_loss | 7.3e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19862 | -| time_elapsed | 107393 | -| total_timesteps | 2542336 | -| train/ | | -| approx_kl | 0.0022390136 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 198610 | -| policy_gradient_loss | -0.00308 | -| std | 0.00767 | -| value_loss | 4.47e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19863 | -| time_elapsed | 107397 | -| total_timesteps | 2542464 | -| train/ | | -| approx_kl | 0.0028331182 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0064 | -| learning_rate | 0.0003 | -| loss | 0.00537 | -| n_updates | 198620 | -| policy_gradient_loss | 0.00417 | -| std | 0.00767 | -| value_loss | 1.94e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19864 | -| time_elapsed | 107402 | -| total_timesteps | 2542592 | -| train/ | | -| approx_kl | 0.0017314046 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.00716 | -| n_updates | 198630 | -| policy_gradient_loss | -0.00119 | -| std | 0.00766 | -| value_loss | 1.96e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19865 | -| time_elapsed | 107406 | -| total_timesteps | 2542720 | -| train/ | | -| approx_kl | 0.01976895 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.00845 | -| n_updates | 198640 | -| policy_gradient_loss | 0.0324 | -| std | 0.00766 | -| value_loss | 8.27e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19866 | -| time_elapsed | 107410 | -| total_timesteps | 2542848 | -| train/ | | -| approx_kl | 0.12781785 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | 0.0764 | -| n_updates | 198650 | -| policy_gradient_loss | 0.0417 | -| std | 0.00766 | -| value_loss | 7.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19867 | -| time_elapsed | 107415 | -| total_timesteps | 2542976 | -| train/ | | -| approx_kl | 0.027818153 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.00833 | -| n_updates | 198660 | -| policy_gradient_loss | 0.0285 | -| std | 0.00765 | -| value_loss | 2.48e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19868 | -| time_elapsed | 107419 | -| total_timesteps | 2543104 | -| train/ | | -| approx_kl | 0.5725866 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | 0.276 | -| n_updates | 198670 | -| policy_gradient_loss | 0.12 | -| std | 0.00766 | -| value_loss | 1.97e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19869 | -| time_elapsed | 107429 | -| total_timesteps | 2543232 | -| train/ | | -| approx_kl | 0.010657551 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 198680 | -| policy_gradient_loss | -0.00255 | -| std | 0.00765 | -| value_loss | 0.00396 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19870 | -| time_elapsed | 107433 | -| total_timesteps | 2543360 | -| train/ | | -| approx_kl | 0.11490421 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0747 | -| n_updates | 198690 | -| policy_gradient_loss | 0.0302 | -| std | 0.00765 | -| value_loss | 1.27e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19871 | -| time_elapsed | 107438 | -| total_timesteps | 2543488 | -| train/ | | -| approx_kl | 0.037458476 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00826 | -| learning_rate | 0.0003 | -| loss | -0.00731 | -| n_updates | 198700 | -| policy_gradient_loss | -0.0127 | -| std | 0.00764 | -| value_loss | 5.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19872 | -| time_elapsed | 107444 | -| total_timesteps | 2543616 | -| train/ | | -| approx_kl | 0.009652983 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00902 | -| learning_rate | 0.0003 | -| loss | -0.00993 | -| n_updates | 198710 | -| policy_gradient_loss | 0.0136 | -| std | 0.00763 | -| value_loss | 0.000384 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19873 | -| time_elapsed | 107448 | -| total_timesteps | 2543744 | -| train/ | | -| approx_kl | 0.1966352 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 198720 | -| policy_gradient_loss | 0.119 | -| std | 0.00763 | -| value_loss | 1.48e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 19874 | -| time_elapsed | 107452 | -| total_timesteps | 2543872 | -| train/ | | -| approx_kl | 0.121683866 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.0687 | -| n_updates | 198730 | -| policy_gradient_loss | 0.094 | -| std | 0.00764 | -| value_loss | 6.33e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19875 | -| time_elapsed | 107457 | -| total_timesteps | 2544000 | -| train/ | | -| approx_kl | 0.13732898 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.533 | -| learning_rate | 0.0003 | -| loss | 0.0992 | -| n_updates | 198740 | -| policy_gradient_loss | 0.0869 | -| std | 0.00764 | -| value_loss | 2.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19876 | -| time_elapsed | 107463 | -| total_timesteps | 2544128 | -| train/ | | -| approx_kl | 0.042456597 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0072 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 198750 | -| policy_gradient_loss | 0.00399 | -| std | 0.00768 | -| value_loss | 4.64e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19877 | -| time_elapsed | 107474 | -| total_timesteps | 2544256 | -| train/ | | -| approx_kl | 0.08902801 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 198760 | -| policy_gradient_loss | -0.01 | -| std | 0.00771 | -| value_loss | 0.000273 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19878 | -| time_elapsed | 107479 | -| total_timesteps | 2544384 | -| train/ | | -| approx_kl | 0.24462901 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 198770 | -| policy_gradient_loss | 0.118 | -| std | 0.00772 | -| value_loss | 3.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19879 | -| time_elapsed | 107484 | -| total_timesteps | 2544512 | -| train/ | | -| approx_kl | 0.12513876 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.324 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 198780 | -| policy_gradient_loss | 0.0753 | -| std | 0.00772 | -| value_loss | 6.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19880 | -| time_elapsed | 107487 | -| total_timesteps | 2544640 | -| train/ | | -| approx_kl | 0.025383694 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 198790 | -| policy_gradient_loss | 0.0124 | -| std | 0.00773 | -| value_loss | 4.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19881 | -| time_elapsed | 107492 | -| total_timesteps | 2544768 | -| train/ | | -| approx_kl | 0.12472138 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | 0.06 | -| n_updates | 198800 | -| policy_gradient_loss | 0.0154 | -| std | 0.00773 | -| value_loss | 2.67e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 19882 | -| time_elapsed | 107497 | -| total_timesteps | 2544896 | -| train/ | | -| approx_kl | 0.015099194 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | -0.00633 | -| n_updates | 198810 | -| policy_gradient_loss | 0.0139 | -| std | 0.00773 | -| value_loss | 1.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19883 | -| time_elapsed | 107502 | -| total_timesteps | 2545024 | -| train/ | | -| approx_kl | 0.087019406 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.0461 | -| n_updates | 198820 | -| policy_gradient_loss | 0.0225 | -| std | 0.00773 | -| value_loss | 1.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19884 | -| time_elapsed | 107510 | -| total_timesteps | 2545152 | -| train/ | | -| approx_kl | 0.089733064 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | 0.00891 | -| n_updates | 198830 | -| policy_gradient_loss | 4.03e-05 | -| std | 0.00773 | -| value_loss | 0.00104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19885 | -| time_elapsed | 107515 | -| total_timesteps | 2545280 | -| train/ | | -| approx_kl | 0.016073568 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.465 | -| learning_rate | 0.0003 | -| loss | -0.00236 | -| n_updates | 198840 | -| policy_gradient_loss | 0.0406 | -| std | 0.00773 | -| value_loss | 4.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19886 | -| time_elapsed | 107521 | -| total_timesteps | 2545408 | -| train/ | | -| approx_kl | 0.22330792 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00908 | -| learning_rate | 0.0003 | -| loss | 0.0869 | -| n_updates | 198850 | -| policy_gradient_loss | 0.0312 | -| std | 0.00773 | -| value_loss | 6.33e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19887 | -| time_elapsed | 107525 | -| total_timesteps | 2545536 | -| train/ | | -| approx_kl | 0.00046477607 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | -0.000267 | -| n_updates | 198860 | -| policy_gradient_loss | 0.00672 | -| std | 0.00773 | -| value_loss | 4.87e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19888 | -| time_elapsed | 107530 | -| total_timesteps | 2545664 | -| train/ | | -| approx_kl | 0.051945783 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.000275 | -| n_updates | 198870 | -| policy_gradient_loss | 0.0456 | -| std | 0.00773 | -| value_loss | 2.9e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19889 | -| time_elapsed | 107535 | -| total_timesteps | 2545792 | -| train/ | | -| approx_kl | 0.02682875 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 198880 | -| policy_gradient_loss | 0.0189 | -| std | 0.00772 | -| value_loss | 1.09e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 19890 | -| time_elapsed | 107538 | -| total_timesteps | 2545920 | -| train/ | | -| approx_kl | 0.15465698 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | 0.0767 | -| n_updates | 198890 | -| policy_gradient_loss | 0.0284 | -| std | 0.00772 | -| value_loss | 4.59e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19891 | -| time_elapsed | 107542 | -| total_timesteps | 2546048 | -| train/ | | -| approx_kl | 0.0374981 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 198900 | -| policy_gradient_loss | 0.0545 | -| std | 0.00772 | -| value_loss | 1.7e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19892 | -| time_elapsed | 107551 | -| total_timesteps | 2546176 | -| train/ | | -| approx_kl | 0.019924887 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | -0.0245 | -| n_updates | 198910 | -| policy_gradient_loss | -0.0165 | -| std | 0.00773 | -| value_loss | 0.00296 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19893 | -| time_elapsed | 107557 | -| total_timesteps | 2546304 | -| train/ | | -| approx_kl | 0.02674473 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 198920 | -| policy_gradient_loss | -0.00691 | -| std | 0.00773 | -| value_loss | 4.66e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19894 | -| time_elapsed | 107561 | -| total_timesteps | 2546432 | -| train/ | | -| approx_kl | 0.0674389 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -18.8 | -| learning_rate | 0.0003 | -| loss | -0.00988 | -| n_updates | 198930 | -| policy_gradient_loss | 0.00152 | -| std | 0.00773 | -| value_loss | 2.56e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19895 | -| time_elapsed | 107566 | -| total_timesteps | 2546560 | -| train/ | | -| approx_kl | 0.7245006 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -1.35 | -| learning_rate | 0.0003 | -| loss | 0.27 | -| n_updates | 198940 | -| policy_gradient_loss | 0.104 | -| std | 0.00773 | -| value_loss | 3.21e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19896 | -| time_elapsed | 107571 | -| total_timesteps | 2546688 | -| train/ | | -| approx_kl | 0.004035961 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.366 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 198950 | -| policy_gradient_loss | 0.0166 | -| std | 0.00773 | -| value_loss | 1.78e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19897 | -| time_elapsed | 107577 | -| total_timesteps | 2546816 | -| train/ | | -| approx_kl | 0.3539102 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 198960 | -| policy_gradient_loss | 0.0367 | -| std | 0.00773 | -| value_loss | 1.3e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 19898 | -| time_elapsed | 107581 | -| total_timesteps | 2546944 | -| train/ | | -| approx_kl | 0.008297947 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0574 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 198970 | -| policy_gradient_loss | 0.00327 | -| std | 0.00773 | -| value_loss | 7.85e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19899 | -| time_elapsed | 107587 | -| total_timesteps | 2547072 | -| train/ | | -| approx_kl | 0.042599693 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 198980 | -| policy_gradient_loss | -0.00815 | -| std | 0.00773 | -| value_loss | 5.36e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19900 | -| time_elapsed | 107594 | -| total_timesteps | 2547200 | -| train/ | | -| approx_kl | 0.006679786 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.748 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 198990 | -| policy_gradient_loss | -0.00555 | -| std | 0.00773 | -| value_loss | 0.00686 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19901 | -| time_elapsed | 107599 | -| total_timesteps | 2547328 | -| train/ | | -| approx_kl | 0.08244876 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 199000 | -| policy_gradient_loss | -0.00049 | -| std | 0.00773 | -| value_loss | 3.53e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19902 | -| time_elapsed | 107604 | -| total_timesteps | 2547456 | -| train/ | | -| approx_kl | 0.0115664145 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0063 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 199010 | -| policy_gradient_loss | 0.000285 | -| std | 0.00772 | -| value_loss | 3.85e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19903 | -| time_elapsed | 107609 | -| total_timesteps | 2547584 | -| train/ | | -| approx_kl | 0.0027972679 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | -9.41e-05 | -| n_updates | 199020 | -| policy_gradient_loss | 0.00423 | -| std | 0.00771 | -| value_loss | 1.85e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19904 | -| time_elapsed | 107614 | -| total_timesteps | 2547712 | -| train/ | | -| approx_kl | 0.05696385 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 199030 | -| policy_gradient_loss | 0.0129 | -| std | 0.0077 | -| value_loss | 0.000102 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19905 | -| time_elapsed | 107618 | -| total_timesteps | 2547840 | -| train/ | | -| approx_kl | 0.02840514 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00223 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 199040 | -| policy_gradient_loss | 0.000956 | -| std | 0.0077 | -| value_loss | 4.31e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 19906 | -| time_elapsed | 107622 | -| total_timesteps | 2547968 | -| train/ | | -| approx_kl | 0.0052541746 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 199050 | -| policy_gradient_loss | 0.00258 | -| std | 0.00769 | -| value_loss | 1.72e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19907 | -| time_elapsed | 107627 | -| total_timesteps | 2548096 | -| train/ | | -| approx_kl | 0.06050945 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.055 | -| learning_rate | 0.0003 | -| loss | 0.0438 | -| n_updates | 199060 | -| policy_gradient_loss | 0.0109 | -| std | 0.00769 | -| value_loss | 2.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19908 | -| time_elapsed | 107638 | -| total_timesteps | 2548224 | -| train/ | | -| approx_kl | 0.028144903 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 199070 | -| policy_gradient_loss | -0.00596 | -| std | 0.00769 | -| value_loss | 4.94e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19909 | -| time_elapsed | 107643 | -| total_timesteps | 2548352 | -| train/ | | -| approx_kl | 0.0012387657 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | -0.000748 | -| n_updates | 199080 | -| policy_gradient_loss | 0.00759 | -| std | 0.00767 | -| value_loss | 6.38e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19910 | -| time_elapsed | 107646 | -| total_timesteps | 2548480 | -| train/ | | -| approx_kl | 0.028185915 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0595 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 199090 | -| policy_gradient_loss | 0.073 | -| std | 0.00765 | -| value_loss | 8.9e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19911 | -| time_elapsed | 107650 | -| total_timesteps | 2548608 | -| train/ | | -| approx_kl | 0.08282842 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00719 | -| learning_rate | 0.0003 | -| loss | 0.0681 | -| n_updates | 199100 | -| policy_gradient_loss | 0.117 | -| std | 0.00764 | -| value_loss | 3.82e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19912 | -| time_elapsed | 107655 | -| total_timesteps | 2548736 | -| train/ | | -| approx_kl | 0.014216478 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 199110 | -| policy_gradient_loss | 0.0168 | -| std | 0.00764 | -| value_loss | 2.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19913 | -| time_elapsed | 107658 | -| total_timesteps | 2548864 | -| train/ | | -| approx_kl | 0.45788395 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0652 | -| learning_rate | 0.0003 | -| loss | 0.228 | -| n_updates | 199120 | -| policy_gradient_loss | 0.0633 | -| std | 0.00764 | -| value_loss | 1.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 19914 | -| time_elapsed | 107662 | -| total_timesteps | 2548992 | -| train/ | | -| approx_kl | 0.027493542 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0542 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 199130 | -| policy_gradient_loss | 0.00685 | -| std | 0.00764 | -| value_loss | 8.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19915 | -| time_elapsed | 107667 | -| total_timesteps | 2549120 | -| train/ | | -| approx_kl | 0.029783448 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 199140 | -| policy_gradient_loss | 0.00956 | -| std | 0.00764 | -| value_loss | 5.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19916 | -| time_elapsed | 107679 | -| total_timesteps | 2549248 | -| train/ | | -| approx_kl | 0.012253026 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -4.46 | -| learning_rate | 0.0003 | -| loss | -0.03 | -| n_updates | 199150 | -| policy_gradient_loss | -0.0206 | -| std | 0.00764 | -| value_loss | 0.00346 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19917 | -| time_elapsed | 107682 | -| total_timesteps | 2549376 | -| train/ | | -| approx_kl | 0.0476856 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | 0.00728 | -| n_updates | 199160 | -| policy_gradient_loss | 0.018 | -| std | 0.00763 | -| value_loss | 6.29e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19918 | -| time_elapsed | 107687 | -| total_timesteps | 2549504 | -| train/ | | -| approx_kl | 0.09165725 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -125 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 199170 | -| policy_gradient_loss | 0.0244 | -| std | 0.00763 | -| value_loss | 3.83e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19919 | -| time_elapsed | 107691 | -| total_timesteps | 2549632 | -| train/ | | -| approx_kl | 0.034094226 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -40.9 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 199180 | -| policy_gradient_loss | 0.00933 | -| std | 0.00763 | -| value_loss | 1.73e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19920 | -| time_elapsed | 107696 | -| total_timesteps | 2549760 | -| train/ | | -| approx_kl | 0.10583764 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -5.35 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 199190 | -| policy_gradient_loss | 0.032 | -| std | 0.00763 | -| value_loss | 2.2e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 19921 | -| time_elapsed | 107699 | -| total_timesteps | 2549888 | -| train/ | | -| approx_kl | 0.028516153 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.708 | -| learning_rate | 0.0003 | -| loss | 0.00819 | -| n_updates | 199200 | -| policy_gradient_loss | 0.0293 | -| std | 0.00762 | -| value_loss | 6.04e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19922 | -| time_elapsed | 107703 | -| total_timesteps | 2550016 | -| train/ | | -| approx_kl | 0.097959235 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.098 | -| n_updates | 199210 | -| policy_gradient_loss | 0.0505 | -| std | 0.00762 | -| value_loss | 4.63e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19923 | -| time_elapsed | 107714 | -| total_timesteps | 2550144 | -| train/ | | -| approx_kl | 0.015030127 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 199220 | -| policy_gradient_loss | -0.0126 | -| std | 0.00762 | -| value_loss | 0.000401 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19924 | -| time_elapsed | 107718 | -| total_timesteps | 2550272 | -| train/ | | -| approx_kl | 0.49321103 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.375 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 199230 | -| policy_gradient_loss | 0.0131 | -| std | 0.00763 | -| value_loss | 1.86e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19925 | -| time_elapsed | 107725 | -| total_timesteps | 2550400 | -| train/ | | -| approx_kl | 0.010557214 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 199240 | -| policy_gradient_loss | 0.00218 | -| std | 0.00763 | -| value_loss | 6.95e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19926 | -| time_elapsed | 107730 | -| total_timesteps | 2550528 | -| train/ | | -| approx_kl | 0.0031874836 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 199250 | -| policy_gradient_loss | 0.00452 | -| std | 0.00763 | -| value_loss | 6.67e-09 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19927 | -| time_elapsed | 107736 | -| total_timesteps | 2550656 | -| train/ | | -| approx_kl | 0.059845 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0722 | -| learning_rate | 0.0003 | -| loss | 0.0485 | -| n_updates | 199260 | -| policy_gradient_loss | 0.0116 | -| std | 0.00763 | -| value_loss | 7.63e-09 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19928 | -| time_elapsed | 107740 | -| total_timesteps | 2550784 | -| train/ | | -| approx_kl | 0.10014457 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00643 | -| n_updates | 199270 | -| policy_gradient_loss | -0.00716 | -| std | 0.00763 | -| value_loss | 3.91e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 19929 | -| time_elapsed | 107745 | -| total_timesteps | 2550912 | -| train/ | | -| approx_kl | 0.011384951 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.00276 | -| n_updates | 199280 | -| policy_gradient_loss | 0.00556 | -| std | 0.00762 | -| value_loss | 2.6e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19930 | -| time_elapsed | 107751 | -| total_timesteps | 2551040 | -| train/ | | -| approx_kl | 0.0001963363 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.00132 | -| n_updates | 199290 | -| policy_gradient_loss | 0.000798 | -| std | 0.00763 | -| value_loss | 1.72e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19931 | -| time_elapsed | 107760 | -| total_timesteps | 2551168 | -| train/ | | -| approx_kl | 0.025087126 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0088 | -| n_updates | 199300 | -| policy_gradient_loss | -0.00268 | -| std | 0.00762 | -| value_loss | 0.000156 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19932 | -| time_elapsed | 107765 | -| total_timesteps | 2551296 | -| train/ | | -| approx_kl | 0.010001603 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 199310 | -| policy_gradient_loss | 0.00301 | -| std | 0.00762 | -| value_loss | 6.62e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19933 | -| time_elapsed | 107771 | -| total_timesteps | 2551424 | -| train/ | | -| approx_kl | 0.0026410427 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00951 | -| learning_rate | 0.0003 | -| loss | -0.000919 | -| n_updates | 199320 | -| policy_gradient_loss | 0.00561 | -| std | 0.00762 | -| value_loss | 4.78e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19934 | -| time_elapsed | 107775 | -| total_timesteps | 2551552 | -| train/ | | -| approx_kl | 0.025781488 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.073 | -| learning_rate | 0.0003 | -| loss | 0.029 | -| n_updates | 199330 | -| policy_gradient_loss | 0.102 | -| std | 0.00761 | -| value_loss | 9.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19935 | -| time_elapsed | 107780 | -| total_timesteps | 2551680 | -| train/ | | -| approx_kl | 0.00752319 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00125 | -| learning_rate | 0.0003 | -| loss | -0.00837 | -| n_updates | 199340 | -| policy_gradient_loss | 0.0165 | -| std | 0.00761 | -| value_loss | 3.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19936 | -| time_elapsed | 107786 | -| total_timesteps | 2551808 | -| train/ | | -| approx_kl | 0.48305297 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 199350 | -| policy_gradient_loss | 0.0543 | -| std | 0.00761 | -| value_loss | 1.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 19937 | -| time_elapsed | 107792 | -| total_timesteps | 2551936 | -| train/ | | -| approx_kl | 0.006919734 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 199360 | -| policy_gradient_loss | 0.00328 | -| std | 0.0076 | -| value_loss | 9.04e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19938 | -| time_elapsed | 107797 | -| total_timesteps | 2552064 | -| train/ | | -| approx_kl | 0.00056384783 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.00238 | -| n_updates | 199370 | -| policy_gradient_loss | 0.00144 | -| std | 0.0076 | -| value_loss | 7.22e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19939 | -| time_elapsed | 107806 | -| total_timesteps | 2552192 | -| train/ | | -| approx_kl | 0.01225112 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.153 | -| learning_rate | 0.0003 | -| loss | -0.00842 | -| n_updates | 199380 | -| policy_gradient_loss | -0.00821 | -| std | 0.0076 | -| value_loss | 0.00136 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19940 | -| time_elapsed | 107811 | -| total_timesteps | 2552320 | -| train/ | | -| approx_kl | 0.025282182 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.367 | -| learning_rate | 0.0003 | -| loss | 0.00176 | -| n_updates | 199390 | -| policy_gradient_loss | -0.00216 | -| std | 0.0076 | -| value_loss | 5.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19941 | -| time_elapsed | 107817 | -| total_timesteps | 2552448 | -| train/ | | -| approx_kl | 0.012803037 | -| clip_fraction | 0.093 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.00419 | -| n_updates | 199400 | -| policy_gradient_loss | 0.00146 | -| std | 0.00759 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19942 | -| time_elapsed | 107822 | -| total_timesteps | 2552576 | -| train/ | | -| approx_kl | 0.019051973 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0857 | -| learning_rate | 0.0003 | -| loss | 0.00664 | -| n_updates | 199410 | -| policy_gradient_loss | 0.025 | -| std | 0.00759 | -| value_loss | 1.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19943 | -| time_elapsed | 107827 | -| total_timesteps | 2552704 | -| train/ | | -| approx_kl | 0.23449056 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 199420 | -| policy_gradient_loss | 0.0704 | -| std | 0.00759 | -| value_loss | 5.64e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19944 | -| time_elapsed | 107832 | -| total_timesteps | 2552832 | -| train/ | | -| approx_kl | 0.15209594 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0943 | -| n_updates | 199430 | -| policy_gradient_loss | 0.082 | -| std | 0.00759 | -| value_loss | 3.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.883 | -| time/ | | -| fps | 23 | -| iterations | 19945 | -| time_elapsed | 107838 | -| total_timesteps | 2552960 | -| train/ | | -| approx_kl | 0.025578618 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.0159 | -| n_updates | 199440 | -| policy_gradient_loss | 0.0163 | -| std | 0.00759 | -| value_loss | 3.36e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19946 | -| time_elapsed | 107843 | -| total_timesteps | 2553088 | -| train/ | | -| approx_kl | 0.5001687 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 199450 | -| policy_gradient_loss | 0.0427 | -| std | 0.0076 | -| value_loss | 2.1e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19947 | -| time_elapsed | 107855 | -| total_timesteps | 2553216 | -| train/ | | -| approx_kl | 0.018153217 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.98 | -| learning_rate | 0.0003 | -| loss | -0.0283 | -| n_updates | 199460 | -| policy_gradient_loss | -0.0155 | -| std | 0.0076 | -| value_loss | 0.000157 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19948 | -| time_elapsed | 107860 | -| total_timesteps | 2553344 | -| train/ | | -| approx_kl | 0.15009911 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 199470 | -| policy_gradient_loss | 0.0209 | -| std | 0.0076 | -| value_loss | 6.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19949 | -| time_elapsed | 107864 | -| total_timesteps | 2553472 | -| train/ | | -| approx_kl | 0.028498717 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -49.3 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 199480 | -| policy_gradient_loss | -0.00821 | -| std | 0.00761 | -| value_loss | 3.78e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19950 | -| time_elapsed | 107869 | -| total_timesteps | 2553600 | -| train/ | | -| approx_kl | 0.08636026 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | 0.0987 | -| n_updates | 199490 | -| policy_gradient_loss | 0.1 | -| std | 0.00761 | -| value_loss | 9.02e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19951 | -| time_elapsed | 107872 | -| total_timesteps | 2553728 | -| train/ | | -| approx_kl | 0.007829556 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 4.64e-05 | -| learning_rate | 0.0003 | -| loss | 0.000406 | -| n_updates | 199500 | -| policy_gradient_loss | 0.0207 | -| std | 0.00765 | -| value_loss | 3.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19952 | -| time_elapsed | 107877 | -| total_timesteps | 2553856 | -| train/ | | -| approx_kl | 0.06257302 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 199510 | -| policy_gradient_loss | 0.0238 | -| std | 0.00765 | -| value_loss | 5.31e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19953 | -| time_elapsed | 107883 | -| total_timesteps | 2553984 | -| train/ | | -| approx_kl | 5.220622e-05 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00348 | -| learning_rate | 0.0003 | -| loss | -0.000399 | -| n_updates | 199520 | -| policy_gradient_loss | 0.0187 | -| std | 0.00765 | -| value_loss | 6.39e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19954 | -| time_elapsed | 107887 | -| total_timesteps | 2554112 | -| train/ | | -| approx_kl | 0.41990614 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 199530 | -| policy_gradient_loss | 0.0656 | -| std | 0.00765 | -| value_loss | 7.78e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19955 | -| time_elapsed | 107898 | -| total_timesteps | 2554240 | -| train/ | | -| approx_kl | 0.0292283 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 199540 | -| policy_gradient_loss | -0.00981 | -| std | 0.00765 | -| value_loss | 0.00164 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19956 | -| time_elapsed | 107902 | -| total_timesteps | 2554368 | -| train/ | | -| approx_kl | 0.1232869 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 199550 | -| policy_gradient_loss | 0.0483 | -| std | 0.00765 | -| value_loss | 3.35e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19957 | -| time_elapsed | 107907 | -| total_timesteps | 2554496 | -| train/ | | -| approx_kl | 0.03153624 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00166 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 199560 | -| policy_gradient_loss | 0.0285 | -| std | 0.00765 | -| value_loss | 1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19958 | -| time_elapsed | 107912 | -| total_timesteps | 2554624 | -| train/ | | -| approx_kl | 0.83864444 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 199570 | -| policy_gradient_loss | 0.12 | -| std | 0.00765 | -| value_loss | 4.97e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19959 | -| time_elapsed | 107915 | -| total_timesteps | 2554752 | -| train/ | | -| approx_kl | 0.15086752 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.0602 | -| n_updates | 199580 | -| policy_gradient_loss | 0.0219 | -| std | 0.00765 | -| value_loss | 3.11e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 19960 | -| time_elapsed | 107919 | -| total_timesteps | 2554880 | -| train/ | | -| approx_kl | 0.05695685 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 199590 | -| policy_gradient_loss | 0.0425 | -| std | 0.00764 | -| value_loss | 7.2e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19961 | -| time_elapsed | 107923 | -| total_timesteps | 2555008 | -| train/ | | -| approx_kl | 0.10057692 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.0574 | -| n_updates | 199600 | -| policy_gradient_loss | 0.0267 | -| std | 0.00764 | -| value_loss | 2.96e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19962 | -| time_elapsed | 107936 | -| total_timesteps | 2555136 | -| train/ | | -| approx_kl | 0.005414834 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -2.43 | -| learning_rate | 0.0003 | -| loss | -0.0237 | -| n_updates | 199610 | -| policy_gradient_loss | -0.00436 | -| std | 0.00764 | -| value_loss | 0.00232 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19963 | -| time_elapsed | 107941 | -| total_timesteps | 2555264 | -| train/ | | -| approx_kl | 0.00089170225 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.32 | -| learning_rate | 0.0003 | -| loss | 0.00398 | -| n_updates | 199620 | -| policy_gradient_loss | 0.000564 | -| std | 0.00764 | -| value_loss | 1.19e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19964 | -| time_elapsed | 107944 | -| total_timesteps | 2555392 | -| train/ | | -| approx_kl | 0.0003770478 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 199630 | -| policy_gradient_loss | 0.00426 | -| std | 0.00764 | -| value_loss | 1.57e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19965 | -| time_elapsed | 107947 | -| total_timesteps | 2555520 | -| train/ | | -| approx_kl | 3.8941856e-05 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -6.72e-05 | -| n_updates | 199640 | -| policy_gradient_loss | 0.00638 | -| std | 0.00765 | -| value_loss | 4.83e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19966 | -| time_elapsed | 107950 | -| total_timesteps | 2555648 | -| train/ | | -| approx_kl | 0.00012676092 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 199650 | -| policy_gradient_loss | -0.00338 | -| std | 0.00766 | -| value_loss | 3.64e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19967 | -| time_elapsed | 107955 | -| total_timesteps | 2555776 | -| train/ | | -| approx_kl | 0.05934778 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -87.9 | -| learning_rate | 0.0003 | -| loss | -0.00832 | -| n_updates | 199660 | -| policy_gradient_loss | 0.0257 | -| std | 0.00766 | -| value_loss | 5.7e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 19968 | -| time_elapsed | 107960 | -| total_timesteps | 2555904 | -| train/ | | -| approx_kl | 0.1843609 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.0754 | -| n_updates | 199670 | -| policy_gradient_loss | 0.0341 | -| std | 0.00766 | -| value_loss | 1.46e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19969 | -| time_elapsed | 107963 | -| total_timesteps | 2556032 | -| train/ | | -| approx_kl | 0.04712946 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 199680 | -| policy_gradient_loss | 0.0565 | -| std | 0.00766 | -| value_loss | 1.35e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19970 | -| time_elapsed | 107973 | -| total_timesteps | 2556160 | -| train/ | | -| approx_kl | 0.00423908 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 199690 | -| policy_gradient_loss | 0.00557 | -| std | 0.00766 | -| value_loss | 0.0016 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19971 | -| time_elapsed | 107977 | -| total_timesteps | 2556288 | -| train/ | | -| approx_kl | 0.13509984 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.0564 | -| n_updates | 199700 | -| policy_gradient_loss | 0.0361 | -| std | 0.00766 | -| value_loss | 6.73e-06 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19972 | -| time_elapsed | 107983 | -| total_timesteps | 2556416 | -| train/ | | -| approx_kl | 0.275323 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0083 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 199710 | -| policy_gradient_loss | 0.114 | -| std | 0.00766 | -| value_loss | 1.16e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19973 | -| time_elapsed | 107987 | -| total_timesteps | 2556544 | -| train/ | | -| approx_kl | 0.049419895 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 199720 | -| policy_gradient_loss | 0.0191 | -| std | 0.00766 | -| value_loss | 7.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19974 | -| time_elapsed | 107992 | -| total_timesteps | 2556672 | -| train/ | | -| approx_kl | 0.47650093 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 199730 | -| policy_gradient_loss | 0.0434 | -| std | 0.00766 | -| value_loss | 5.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19975 | -| time_elapsed | 107997 | -| total_timesteps | 2556800 | -| train/ | | -| approx_kl | 0.030982614 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.000235 | -| n_updates | 199740 | -| policy_gradient_loss | 0.00119 | -| std | 0.00766 | -| value_loss | 4.25e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 19976 | -| time_elapsed | 108002 | -| total_timesteps | 2556928 | -| train/ | | -| approx_kl | 0.0055131773 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.000464 | -| n_updates | 199750 | -| policy_gradient_loss | 0.00615 | -| std | 0.00765 | -| value_loss | 2.23e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19977 | -| time_elapsed | 108007 | -| total_timesteps | 2557056 | -| train/ | | -| approx_kl | 0.056885198 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 199760 | -| policy_gradient_loss | 0.0132 | -| std | 0.00764 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19978 | -| time_elapsed | 108016 | -| total_timesteps | 2557184 | -| train/ | | -| approx_kl | 0.002243178 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.706 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 199770 | -| policy_gradient_loss | -0.0148 | -| std | 0.00762 | -| value_loss | 0.0069 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19979 | -| time_elapsed | 108021 | -| total_timesteps | 2557312 | -| train/ | | -| approx_kl | 0.45136955 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 199780 | -| policy_gradient_loss | 0.0531 | -| std | 0.00761 | -| value_loss | 0.000186 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19980 | -| time_elapsed | 108026 | -| total_timesteps | 2557440 | -| train/ | | -| approx_kl | 0.0352267 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0968 | -| learning_rate | 0.0003 | -| loss | 0.0294 | -| n_updates | 199790 | -| policy_gradient_loss | 0.014 | -| std | 0.0076 | -| value_loss | 0.00289 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19981 | -| time_elapsed | 108031 | -| total_timesteps | 2557568 | -| train/ | | -| approx_kl | 0.038429964 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0039 | -| learning_rate | 0.0003 | -| loss | 0.00643 | -| n_updates | 199800 | -| policy_gradient_loss | 0.00264 | -| std | 0.00759 | -| value_loss | 0.000195 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19982 | -| time_elapsed | 108038 | -| total_timesteps | 2557696 | -| train/ | | -| approx_kl | 0.0064524957 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 199810 | -| policy_gradient_loss | 0.00221 | -| std | 0.00759 | -| value_loss | 3.01e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19983 | -| time_elapsed | 108042 | -| total_timesteps | 2557824 | -| train/ | | -| approx_kl | 0.045323543 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 199820 | -| policy_gradient_loss | -0.0075 | -| std | 0.00759 | -| value_loss | 3.77e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 19984 | -| time_elapsed | 108047 | -| total_timesteps | 2557952 | -| train/ | | -| approx_kl | 0.0062871524 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.000586 | -| n_updates | 199830 | -| policy_gradient_loss | 0.00638 | -| std | 0.00761 | -| value_loss | 0.000353 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19985 | -| time_elapsed | 108052 | -| total_timesteps | 2558080 | -| train/ | | -| approx_kl | 0.060661778 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -9.7 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 199840 | -| policy_gradient_loss | -0.00679 | -| std | 0.00762 | -| value_loss | 1.41e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19986 | -| time_elapsed | 108059 | -| total_timesteps | 2558208 | -| train/ | | -| approx_kl | 0.05077416 | -| clip_fraction | 0.539 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | -0.00798 | -| n_updates | 199850 | -| policy_gradient_loss | -0.00394 | -| std | 0.00762 | -| value_loss | 0.000554 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19987 | -| time_elapsed | 108063 | -| total_timesteps | 2558336 | -| train/ | | -| approx_kl | 0.022264443 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.444 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 199860 | -| policy_gradient_loss | 0.0832 | -| std | 0.00762 | -| value_loss | 4.37e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19988 | -| time_elapsed | 108067 | -| total_timesteps | 2558464 | -| train/ | | -| approx_kl | 0.15076901 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -4.96 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 199870 | -| policy_gradient_loss | 0.000719 | -| std | 0.00762 | -| value_loss | 3.77e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19989 | -| time_elapsed | 108071 | -| total_timesteps | 2558592 | -| train/ | | -| approx_kl | 0.020474643 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.931 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 199880 | -| policy_gradient_loss | 0.00139 | -| std | 0.00762 | -| value_loss | 1.99e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19990 | -| time_elapsed | 108076 | -| total_timesteps | 2558720 | -| train/ | | -| approx_kl | 0.115137175 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.0846 | -| n_updates | 199890 | -| policy_gradient_loss | 0.0611 | -| std | 0.00762 | -| value_loss | 6.89e-11 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19991 | -| time_elapsed | 108081 | -| total_timesteps | 2558848 | -| train/ | | -| approx_kl | 0.0302817 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.00525 | -| n_updates | 199900 | -| policy_gradient_loss | 0.0228 | -| std | 0.00762 | -| value_loss | 5.1e-11 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 19992 | -| time_elapsed | 108087 | -| total_timesteps | 2558976 | -| train/ | | -| approx_kl | 0.73245835 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | 0.224 | -| n_updates | 199910 | -| policy_gradient_loss | 0.159 | -| std | 0.00762 | -| value_loss | 3.98e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19993 | -| time_elapsed | 108091 | -| total_timesteps | 2559104 | -| train/ | | -| approx_kl | 0.02269701 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.00461 | -| n_updates | 199920 | -| policy_gradient_loss | -0.000681 | -| std | 0.00762 | -| value_loss | 3.04e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19994 | -| time_elapsed | 108102 | -| total_timesteps | 2559232 | -| train/ | | -| approx_kl | 0.15740453 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 199930 | -| policy_gradient_loss | -0.00497 | -| std | 0.00762 | -| value_loss | 0.00205 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19995 | -| time_elapsed | 108106 | -| total_timesteps | 2559360 | -| train/ | | -| approx_kl | 0.036780678 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.00837 | -| n_updates | 199940 | -| policy_gradient_loss | 0.0436 | -| std | 0.00763 | -| value_loss | 2.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19996 | -| time_elapsed | 108110 | -| total_timesteps | 2559488 | -| train/ | | -| approx_kl | 0.17776078 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00415 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 199950 | -| policy_gradient_loss | 0.0153 | -| std | 0.00763 | -| value_loss | 5.69e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19997 | -| time_elapsed | 108115 | -| total_timesteps | 2559616 | -| train/ | | -| approx_kl | 0.0008585993 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 199960 | -| policy_gradient_loss | 0.0116 | -| std | 0.00763 | -| value_loss | 2.3e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19998 | -| time_elapsed | 108120 | -| total_timesteps | 2559744 | -| train/ | | -| approx_kl | 1.4522579e-05 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.000209 | -| n_updates | 199970 | -| policy_gradient_loss | 0.0093 | -| std | 0.00763 | -| value_loss | 1.47e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 19999 | -| time_elapsed | 108125 | -| total_timesteps | 2559872 | -| train/ | | -| approx_kl | 0.05456887 | -| clip_fraction | 0.551 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 199980 | -| policy_gradient_loss | 0.0481 | -| std | 0.00763 | -| value_loss | 1.24e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20000 | -| time_elapsed | 108130 | -| total_timesteps | 2560000 | -| train/ | | -| approx_kl | 0.01592654 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 199990 | -| policy_gradient_loss | 0.00975 | -| std | 0.00763 | -| value_loss | 9.38e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20001 | -| time_elapsed | 108135 | -| total_timesteps | 2560128 | -| train/ | | -| approx_kl | 0.01910226 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0038 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 200000 | -| policy_gradient_loss | 0.042 | -| std | 0.00762 | -| value_loss | 1.7e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20002 | -| time_elapsed | 108144 | -| total_timesteps | 2560256 | -| train/ | | -| approx_kl | 0.036512993 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 200010 | -| policy_gradient_loss | -0.00505 | -| std | 0.00761 | -| value_loss | 0.000112 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20003 | -| time_elapsed | 108148 | -| total_timesteps | 2560384 | -| train/ | | -| approx_kl | 0.026843656 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00932 | -| learning_rate | 0.0003 | -| loss | 0.0257 | -| n_updates | 200020 | -| policy_gradient_loss | 0.0806 | -| std | 0.00761 | -| value_loss | 1.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20004 | -| time_elapsed | 108154 | -| total_timesteps | 2560512 | -| train/ | | -| approx_kl | 0.09888287 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0884 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 200030 | -| policy_gradient_loss | 0.123 | -| std | 0.00761 | -| value_loss | 9.44e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20005 | -| time_elapsed | 108158 | -| total_timesteps | 2560640 | -| train/ | | -| approx_kl | 0.017768903 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | 0.00784 | -| n_updates | 200040 | -| policy_gradient_loss | 0.0188 | -| std | 0.00761 | -| value_loss | 9.59e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20006 | -| time_elapsed | 108162 | -| total_timesteps | 2560768 | -| train/ | | -| approx_kl | 0.3354156 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 200050 | -| policy_gradient_loss | 0.0326 | -| std | 0.00761 | -| value_loss | 2.91e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 20007 | -| time_elapsed | 108166 | -| total_timesteps | 2560896 | -| train/ | | -| approx_kl | 0.007244285 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0606 | -| learning_rate | 0.0003 | -| loss | -0.000683 | -| n_updates | 200060 | -| policy_gradient_loss | 0.00555 | -| std | 0.00761 | -| value_loss | 2e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20008 | -| time_elapsed | 108172 | -| total_timesteps | 2561024 | -| train/ | | -| approx_kl | 0.05280074 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 200070 | -| policy_gradient_loss | 0.0135 | -| std | 0.00761 | -| value_loss | 1.29e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20009 | -| time_elapsed | 108184 | -| total_timesteps | 2561152 | -| train/ | | -| approx_kl | 0.0002011694 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 200080 | -| policy_gradient_loss | -0.00513 | -| std | 0.00761 | -| value_loss | 0.00356 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20010 | -| time_elapsed | 108189 | -| total_timesteps | 2561280 | -| train/ | | -| approx_kl | 0.09030698 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.452 | -| learning_rate | 0.0003 | -| loss | 0.0609 | -| n_updates | 200090 | -| policy_gradient_loss | 0.0313 | -| std | 0.0076 | -| value_loss | 2.13e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20011 | -| time_elapsed | 108192 | -| total_timesteps | 2561408 | -| train/ | | -| approx_kl | 0.0044166436 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00644 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 200100 | -| policy_gradient_loss | 0.0134 | -| std | 0.0076 | -| value_loss | 3.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20012 | -| time_elapsed | 108197 | -| total_timesteps | 2561536 | -| train/ | | -| approx_kl | 0.033031434 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.000872 | -| n_updates | 200110 | -| policy_gradient_loss | 0.000431 | -| std | 0.00759 | -| value_loss | 3.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20013 | -| time_elapsed | 108200 | -| total_timesteps | 2561664 | -| train/ | | -| approx_kl | 0.013822192 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.343 | -| learning_rate | 0.0003 | -| loss | -0.000399 | -| n_updates | 200120 | -| policy_gradient_loss | 0.0521 | -| std | 0.00758 | -| value_loss | 3.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20014 | -| time_elapsed | 108203 | -| total_timesteps | 2561792 | -| train/ | | -| approx_kl | 0.010238041 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.999 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 200130 | -| policy_gradient_loss | 0.0173 | -| std | 0.00758 | -| value_loss | 1.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 20015 | -| time_elapsed | 108207 | -| total_timesteps | 2561920 | -| train/ | | -| approx_kl | 0.03455182 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 200140 | -| policy_gradient_loss | 0.0289 | -| std | 0.00758 | -| value_loss | 3.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20016 | -| time_elapsed | 108212 | -| total_timesteps | 2562048 | -| train/ | | -| approx_kl | 0.12113736 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0602 | -| n_updates | 200150 | -| policy_gradient_loss | 0.0338 | -| std | 0.00758 | -| value_loss | 2.31e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20017 | -| time_elapsed | 108222 | -| total_timesteps | 2562176 | -| train/ | | -| approx_kl | 0.00184213 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.00609 | -| n_updates | 200160 | -| policy_gradient_loss | -0.00497 | -| std | 0.00758 | -| value_loss | 0.000967 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20018 | -| time_elapsed | 108226 | -| total_timesteps | 2562304 | -| train/ | | -| approx_kl | 0.06182878 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | 0.0697 | -| n_updates | 200170 | -| policy_gradient_loss | 0.0212 | -| std | 0.00758 | -| value_loss | 3.88e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20019 | -| time_elapsed | 108231 | -| total_timesteps | 2562432 | -| train/ | | -| approx_kl | 0.0013586269 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00851 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 200180 | -| policy_gradient_loss | 0.0216 | -| std | 0.00758 | -| value_loss | 2.8e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20020 | -| time_elapsed | 108237 | -| total_timesteps | 2562560 | -| train/ | | -| approx_kl | 0.05282554 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0757 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 200190 | -| policy_gradient_loss | 0.017 | -| std | 0.00758 | -| value_loss | 2.94e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20021 | -| time_elapsed | 108242 | -| total_timesteps | 2562688 | -| train/ | | -| approx_kl | 0.26226288 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.228 | -| n_updates | 200200 | -| policy_gradient_loss | 0.135 | -| std | 0.00758 | -| value_loss | 2.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20022 | -| time_elapsed | 108247 | -| total_timesteps | 2562816 | -| train/ | | -| approx_kl | 0.039985724 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 200210 | -| policy_gradient_loss | 0.0198 | -| std | 0.00758 | -| value_loss | 1.42e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 20023 | -| time_elapsed | 108252 | -| total_timesteps | 2562944 | -| train/ | | -| approx_kl | 0.1198698 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 200220 | -| policy_gradient_loss | 0.0145 | -| std | 0.00758 | -| value_loss | 1.04e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20024 | -| time_elapsed | 108257 | -| total_timesteps | 2563072 | -| train/ | | -| approx_kl | 0.009283456 | -| clip_fraction | 0.0641 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 200230 | -| policy_gradient_loss | -0.00175 | -| std | 0.00758 | -| value_loss | 5.96e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20025 | -| time_elapsed | 108265 | -| total_timesteps | 2563200 | -| train/ | | -| approx_kl | 0.0683967 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.971 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 200240 | -| policy_gradient_loss | 0.00807 | -| std | 0.00758 | -| value_loss | 0.000238 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20026 | -| time_elapsed | 108269 | -| total_timesteps | 2563328 | -| train/ | | -| approx_kl | 0.56548333 | -| clip_fraction | 0.634 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0051 | -| learning_rate | 0.0003 | -| loss | 0.224 | -| n_updates | 200250 | -| policy_gradient_loss | 0.129 | -| std | 0.00759 | -| value_loss | 1.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20027 | -| time_elapsed | 108274 | -| total_timesteps | 2563456 | -| train/ | | -| approx_kl | 0.24705058 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | 0.205 | -| n_updates | 200260 | -| policy_gradient_loss | 0.111 | -| std | 0.0076 | -| value_loss | 6.83e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20028 | -| time_elapsed | 108278 | -| total_timesteps | 2563584 | -| train/ | | -| approx_kl | 0.18521744 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0076 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 200270 | -| policy_gradient_loss | 0.132 | -| std | 0.00761 | -| value_loss | 2.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20029 | -| time_elapsed | 108282 | -| total_timesteps | 2563712 | -| train/ | | -| approx_kl | 0.027501848 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00177 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 200280 | -| policy_gradient_loss | 0.0209 | -| std | 0.00761 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20030 | -| time_elapsed | 108287 | -| total_timesteps | 2563840 | -| train/ | | -| approx_kl | 0.11433329 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 200290 | -| policy_gradient_loss | 0.0123 | -| std | 0.00761 | -| value_loss | 7.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20031 | -| time_elapsed | 108290 | -| total_timesteps | 2563968 | -| train/ | | -| approx_kl | 0.014834231 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 200300 | -| policy_gradient_loss | 0.0163 | -| std | 0.00761 | -| value_loss | 8.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20032 | -| time_elapsed | 108295 | -| total_timesteps | 2564096 | -| train/ | | -| approx_kl | 0.09338859 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 200310 | -| policy_gradient_loss | 0.02 | -| std | 0.00761 | -| value_loss | 2.15e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20033 | -| time_elapsed | 108305 | -| total_timesteps | 2564224 | -| train/ | | -| approx_kl | 0.087489694 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | -0.00981 | -| n_updates | 200320 | -| policy_gradient_loss | -0.0103 | -| std | 0.00761 | -| value_loss | 0.0022 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20034 | -| time_elapsed | 108311 | -| total_timesteps | 2564352 | -| train/ | | -| approx_kl | 0.06457852 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -10.6 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 200330 | -| policy_gradient_loss | 0.0141 | -| std | 0.00763 | -| value_loss | 1.37e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20035 | -| time_elapsed | 108316 | -| total_timesteps | 2564480 | -| train/ | | -| approx_kl | 0.22906458 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | 0.0869 | -| n_updates | 200340 | -| policy_gradient_loss | 0.0334 | -| std | 0.00764 | -| value_loss | 1.61e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20036 | -| time_elapsed | 108320 | -| total_timesteps | 2564608 | -| train/ | | -| approx_kl | 0.0009553204 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 200350 | -| policy_gradient_loss | -0.00328 | -| std | 0.00765 | -| value_loss | 6.96e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20037 | -| time_elapsed | 108324 | -| total_timesteps | 2564736 | -| train/ | | -| approx_kl | 1.128763e-06 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 200360 | -| policy_gradient_loss | 0.000806 | -| std | 0.00765 | -| value_loss | 5.21e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20038 | -| time_elapsed | 108329 | -| total_timesteps | 2564864 | -| train/ | | -| approx_kl | 0.046454687 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 200370 | -| policy_gradient_loss | 0.0477 | -| std | 0.00765 | -| value_loss | 3.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20039 | -| time_elapsed | 108334 | -| total_timesteps | 2564992 | -| train/ | | -| approx_kl | 0.17678143 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.0746 | -| n_updates | 200380 | -| policy_gradient_loss | 0.0344 | -| std | 0.00765 | -| value_loss | 3.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20040 | -| time_elapsed | 108339 | -| total_timesteps | 2565120 | -| train/ | | -| approx_kl | 0.035717502 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 200390 | -| policy_gradient_loss | 0.034 | -| std | 0.00765 | -| value_loss | 1.93e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20041 | -| time_elapsed | 108351 | -| total_timesteps | 2565248 | -| train/ | | -| approx_kl | 0.19053723 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.479 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 200400 | -| policy_gradient_loss | 0.00273 | -| std | 0.00766 | -| value_loss | 0.000993 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20042 | -| time_elapsed | 108357 | -| total_timesteps | 2565376 | -| train/ | | -| approx_kl | 0.112061456 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00659 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 200410 | -| policy_gradient_loss | 0.0333 | -| std | 0.00766 | -| value_loss | 1.13e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20043 | -| time_elapsed | 108362 | -| total_timesteps | 2565504 | -| train/ | | -| approx_kl | 0.032369617 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 200420 | -| policy_gradient_loss | 0.0807 | -| std | 0.00766 | -| value_loss | 4.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20044 | -| time_elapsed | 108368 | -| total_timesteps | 2565632 | -| train/ | | -| approx_kl | 0.015404096 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 200430 | -| policy_gradient_loss | -0.000149 | -| std | 0.00766 | -| value_loss | 3.78e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20045 | -| time_elapsed | 108373 | -| total_timesteps | 2565760 | -| train/ | | -| approx_kl | 0.13169861 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.0829 | -| n_updates | 200440 | -| policy_gradient_loss | 0.014 | -| std | 0.00766 | -| value_loss | 1.96e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20046 | -| time_elapsed | 108378 | -| total_timesteps | 2565888 | -| train/ | | -| approx_kl | 0.003216919 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 200450 | -| policy_gradient_loss | 0.0145 | -| std | 0.00766 | -| value_loss | 3.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20047 | -| time_elapsed | 108383 | -| total_timesteps | 2566016 | -| train/ | | -| approx_kl | 0.09558291 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 200460 | -| policy_gradient_loss | 0.0345 | -| std | 0.00766 | -| value_loss | 4.57e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20048 | -| time_elapsed | 108393 | -| total_timesteps | 2566144 | -| train/ | | -| approx_kl | 0.14611153 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | 0.00143 | -| n_updates | 200470 | -| policy_gradient_loss | -0.00214 | -| std | 0.00765 | -| value_loss | 0.000257 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20049 | -| time_elapsed | 108399 | -| total_timesteps | 2566272 | -| train/ | | -| approx_kl | 0.27399394 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0271 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 200480 | -| policy_gradient_loss | 0.0781 | -| std | 0.00765 | -| value_loss | 0.000189 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20050 | -| time_elapsed | 108404 | -| total_timesteps | 2566400 | -| train/ | | -| approx_kl | 0.050344747 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 200490 | -| policy_gradient_loss | 0.0197 | -| std | 0.00765 | -| value_loss | 1.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20051 | -| time_elapsed | 108408 | -| total_timesteps | 2566528 | -| train/ | | -| approx_kl | 0.41442016 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 200500 | -| policy_gradient_loss | 0.0409 | -| std | 0.00765 | -| value_loss | 2.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20052 | -| time_elapsed | 108413 | -| total_timesteps | 2566656 | -| train/ | | -| approx_kl | 0.026553802 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 200510 | -| policy_gradient_loss | 0.00241 | -| std | 0.00765 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20053 | -| time_elapsed | 108418 | -| total_timesteps | 2566784 | -| train/ | | -| approx_kl | 0.04218248 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.00926 | -| n_updates | 200520 | -| policy_gradient_loss | 0.00392 | -| std | 0.00765 | -| value_loss | 1.02e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20054 | -| time_elapsed | 108422 | -| total_timesteps | 2566912 | -| train/ | | -| approx_kl | 0.007824719 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 200530 | -| policy_gradient_loss | 0.00513 | -| std | 0.00766 | -| value_loss | 7.68e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20055 | -| time_elapsed | 108427 | -| total_timesteps | 2567040 | -| train/ | | -| approx_kl | 0.04827345 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 200540 | -| policy_gradient_loss | 0.0255 | -| std | 0.00766 | -| value_loss | 5.43e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20056 | -| time_elapsed | 108437 | -| total_timesteps | 2567168 | -| train/ | | -| approx_kl | 0.03735192 | -| clip_fraction | 0.583 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 200550 | -| policy_gradient_loss | 0.0256 | -| std | 0.00766 | -| value_loss | 0.00266 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20057 | -| time_elapsed | 108441 | -| total_timesteps | 2567296 | -| train/ | | -| approx_kl | 0.034136303 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 200560 | -| policy_gradient_loss | 0.00821 | -| std | 0.00764 | -| value_loss | 2.41e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20058 | -| time_elapsed | 108445 | -| total_timesteps | 2567424 | -| train/ | | -| approx_kl | 4.2797066e-05 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.000832 | -| n_updates | 200570 | -| policy_gradient_loss | 0.0161 | -| std | 0.00763 | -| value_loss | 8.35e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20059 | -| time_elapsed | 108450 | -| total_timesteps | 2567552 | -| train/ | | -| approx_kl | 0.35432172 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.203 | -| n_updates | 200580 | -| policy_gradient_loss | 0.135 | -| std | 0.00762 | -| value_loss | 2.23e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20060 | -| time_elapsed | 108455 | -| total_timesteps | 2567680 | -| train/ | | -| approx_kl | 0.14710285 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 200590 | -| policy_gradient_loss | 0.103 | -| std | 0.00762 | -| value_loss | 2.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20061 | -| time_elapsed | 108460 | -| total_timesteps | 2567808 | -| train/ | | -| approx_kl | 0.033882745 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.00945 | -| n_updates | 200600 | -| policy_gradient_loss | 0.0194 | -| std | 0.00763 | -| value_loss | 1.41e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20062 | -| time_elapsed | 108465 | -| total_timesteps | 2567936 | -| train/ | | -| approx_kl | 0.14861998 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0533 | -| n_updates | 200610 | -| policy_gradient_loss | 0.0161 | -| std | 0.00762 | -| value_loss | 1.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20063 | -| time_elapsed | 108469 | -| total_timesteps | 2568064 | -| train/ | | -| approx_kl | 0.016099809 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.00765 | -| n_updates | 200620 | -| policy_gradient_loss | 0.0223 | -| std | 0.00761 | -| value_loss | 1.23e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20064 | -| time_elapsed | 108478 | -| total_timesteps | 2568192 | -| train/ | | -| approx_kl | 0.0021455935 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.027 | -| n_updates | 200630 | -| policy_gradient_loss | -0.00847 | -| std | 0.00761 | -| value_loss | 0.000201 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20065 | -| time_elapsed | 108482 | -| total_timesteps | 2568320 | -| train/ | | -| approx_kl | 0.014264932 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 200640 | -| policy_gradient_loss | 0.0168 | -| std | 0.0076 | -| value_loss | 7.58e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20066 | -| time_elapsed | 108487 | -| total_timesteps | 2568448 | -| train/ | | -| approx_kl | 0.14849907 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.00983 | -| learning_rate | 0.0003 | -| loss | 0.0999 | -| n_updates | 200650 | -| policy_gradient_loss | 0.0171 | -| std | 0.0076 | -| value_loss | 5.93e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20067 | -| time_elapsed | 108492 | -| total_timesteps | 2568576 | -| train/ | | -| approx_kl | 0.03594349 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0732 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 200660 | -| policy_gradient_loss | 0.0191 | -| std | 0.0076 | -| value_loss | 1.99e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20068 | -| time_elapsed | 108497 | -| total_timesteps | 2568704 | -| train/ | | -| approx_kl | 0.11126875 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 200670 | -| policy_gradient_loss | 0.0143 | -| std | 0.0076 | -| value_loss | 4.2e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20069 | -| time_elapsed | 108502 | -| total_timesteps | 2568832 | -| train/ | | -| approx_kl | 0.0068969335 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | 0.00849 | -| n_updates | 200680 | -| policy_gradient_loss | 0.00924 | -| std | 0.0076 | -| value_loss | 2.48e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.858 | -| time/ | | -| fps | 23 | -| iterations | 20070 | -| time_elapsed | 108506 | -| total_timesteps | 2568960 | -| train/ | | -| approx_kl | 0.15206134 | -| clip_fraction | 0.694 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.0957 | -| n_updates | 200690 | -| policy_gradient_loss | 0.0955 | -| std | 0.0076 | -| value_loss | 1.16e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20071 | -| time_elapsed | 108511 | -| total_timesteps | 2569088 | -| train/ | | -| approx_kl | 0.13773112 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 200700 | -| policy_gradient_loss | 0.12 | -| std | 0.0076 | -| value_loss | 9.98e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20072 | -| time_elapsed | 108520 | -| total_timesteps | 2569216 | -| train/ | | -| approx_kl | 0.2953629 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 200710 | -| policy_gradient_loss | 0.0621 | -| std | 0.0076 | -| value_loss | 0.00681 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20073 | -| time_elapsed | 108524 | -| total_timesteps | 2569344 | -| train/ | | -| approx_kl | 0.29470205 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 200720 | -| policy_gradient_loss | 0.148 | -| std | 0.0076 | -| value_loss | 5.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20074 | -| time_elapsed | 108529 | -| total_timesteps | 2569472 | -| train/ | | -| approx_kl | 0.118856445 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00971 | -| learning_rate | 0.0003 | -| loss | 0.0855 | -| n_updates | 200730 | -| policy_gradient_loss | 0.108 | -| std | 0.0076 | -| value_loss | 1.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20075 | -| time_elapsed | 108534 | -| total_timesteps | 2569600 | -| train/ | | -| approx_kl | 0.11109411 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0057 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 200740 | -| policy_gradient_loss | 0.0983 | -| std | 0.0076 | -| value_loss | 1.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20076 | -| time_elapsed | 108540 | -| total_timesteps | 2569728 | -| train/ | | -| approx_kl | 0.021133184 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00735 | -| n_updates | 200750 | -| policy_gradient_loss | 0.0184 | -| std | 0.00761 | -| value_loss | 5.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20077 | -| time_elapsed | 108544 | -| total_timesteps | 2569856 | -| train/ | | -| approx_kl | 0.12872803 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0689 | -| n_updates | 200760 | -| policy_gradient_loss | 0.0189 | -| std | 0.00761 | -| value_loss | 3.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20078 | -| time_elapsed | 108549 | -| total_timesteps | 2569984 | -| train/ | | -| approx_kl | 0.011414776 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.000466 | -| n_updates | 200770 | -| policy_gradient_loss | -0.000617 | -| std | 0.00761 | -| value_loss | 2.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20079 | -| time_elapsed | 108554 | -| total_timesteps | 2570112 | -| train/ | | -| approx_kl | 0.008574389 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 200780 | -| policy_gradient_loss | -0.00378 | -| std | 0.00761 | -| value_loss | 1.49e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20080 | -| time_elapsed | 108564 | -| total_timesteps | 2570240 | -| train/ | | -| approx_kl | 0.12110388 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 200790 | -| policy_gradient_loss | 0.0231 | -| std | 0.00761 | -| value_loss | 0.0017 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20081 | -| time_elapsed | 108569 | -| total_timesteps | 2570368 | -| train/ | | -| approx_kl | 0.0642848 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0564 | -| learning_rate | 0.0003 | -| loss | 0.00281 | -| n_updates | 200800 | -| policy_gradient_loss | 0.0348 | -| std | 0.00761 | -| value_loss | 1.18e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20082 | -| time_elapsed | 108573 | -| total_timesteps | 2570496 | -| train/ | | -| approx_kl | 0.08966601 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 200810 | -| policy_gradient_loss | 0.0385 | -| std | 0.00761 | -| value_loss | 3.67e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20083 | -| time_elapsed | 108578 | -| total_timesteps | 2570624 | -| train/ | | -| approx_kl | 0.122611254 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.00628 | -| learning_rate | 0.0003 | -| loss | 0.0976 | -| n_updates | 200820 | -| policy_gradient_loss | 0.0236 | -| std | 0.00761 | -| value_loss | 1.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20084 | -| time_elapsed | 108583 | -| total_timesteps | 2570752 | -| train/ | | -| approx_kl | 0.47529775 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0945 | -| n_updates | 200830 | -| policy_gradient_loss | 0.0402 | -| std | 0.00761 | -| value_loss | 1.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20085 | -| time_elapsed | 108588 | -| total_timesteps | 2570880 | -| train/ | | -| approx_kl | 0.042088035 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.00567 | -| n_updates | 200840 | -| policy_gradient_loss | 0.00431 | -| std | 0.00761 | -| value_loss | 1.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20086 | -| time_elapsed | 108592 | -| total_timesteps | 2571008 | -| train/ | | -| approx_kl | 0.03716123 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 200850 | -| policy_gradient_loss | 0.00921 | -| std | 0.00761 | -| value_loss | 6.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20087 | -| time_elapsed | 108605 | -| total_timesteps | 2571136 | -| train/ | | -| approx_kl | 0.015200317 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 200860 | -| policy_gradient_loss | -0.0118 | -| std | 0.00761 | -| value_loss | 7.68e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20088 | -| time_elapsed | 108609 | -| total_timesteps | 2571264 | -| train/ | | -| approx_kl | 0.47316667 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.483 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 200870 | -| policy_gradient_loss | 0.0526 | -| std | 0.00761 | -| value_loss | 4.39e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20089 | -| time_elapsed | 108614 | -| total_timesteps | 2571392 | -| train/ | | -| approx_kl | 0.0076951333 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | -0.00785 | -| n_updates | 200880 | -| policy_gradient_loss | 0.00308 | -| std | 0.0076 | -| value_loss | 1.96e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20090 | -| time_elapsed | 108618 | -| total_timesteps | 2571520 | -| train/ | | -| approx_kl | 0.024749193 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 200890 | -| policy_gradient_loss | 0.0761 | -| std | 0.0076 | -| value_loss | 6.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20091 | -| time_elapsed | 108621 | -| total_timesteps | 2571648 | -| train/ | | -| approx_kl | 0.008225321 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.00098 | -| n_updates | 200900 | -| policy_gradient_loss | 0.0181 | -| std | 0.00759 | -| value_loss | 4.34e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20092 | -| time_elapsed | 108625 | -| total_timesteps | 2571776 | -| train/ | | -| approx_kl | 3.6768615e-06 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | -0.000224 | -| n_updates | 200910 | -| policy_gradient_loss | 0.0256 | -| std | 0.00758 | -| value_loss | 6.29e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 20093 | -| time_elapsed | 108630 | -| total_timesteps | 2571904 | -| train/ | | -| approx_kl | 0.014581562 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 200920 | -| policy_gradient_loss | 0.00312 | -| std | 0.00757 | -| value_loss | 1.41e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20094 | -| time_elapsed | 108635 | -| total_timesteps | 2572032 | -| train/ | | -| approx_kl | 0.0709211 | -| clip_fraction | 0.603 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0683 | -| n_updates | 200930 | -| policy_gradient_loss | 0.171 | -| std | 0.00757 | -| value_loss | 3.59e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20095 | -| time_elapsed | 108643 | -| total_timesteps | 2572160 | -| train/ | | -| approx_kl | 0.13126372 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | 0.058 | -| n_updates | 200940 | -| policy_gradient_loss | 0.0546 | -| std | 0.00757 | -| value_loss | 5.1e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20096 | -| time_elapsed | 108647 | -| total_timesteps | 2572288 | -| train/ | | -| approx_kl | 0.10501937 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 200950 | -| policy_gradient_loss | 0.119 | -| std | 0.00757 | -| value_loss | 2.56e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20097 | -| time_elapsed | 108652 | -| total_timesteps | 2572416 | -| train/ | | -| approx_kl | 0.10204988 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.00611 | -| learning_rate | 0.0003 | -| loss | 0.0818 | -| n_updates | 200960 | -| policy_gradient_loss | 0.104 | -| std | 0.00757 | -| value_loss | 1.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20098 | -| time_elapsed | 108656 | -| total_timesteps | 2572544 | -| train/ | | -| approx_kl | 0.020324517 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.009 | -| learning_rate | 0.0003 | -| loss | 0.00386 | -| n_updates | 200970 | -| policy_gradient_loss | 0.0191 | -| std | 0.00757 | -| value_loss | 6.74e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20099 | -| time_elapsed | 108659 | -| total_timesteps | 2572672 | -| train/ | | -| approx_kl | 0.13742265 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 200980 | -| policy_gradient_loss | 0.0157 | -| std | 0.00756 | -| value_loss | 4.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20100 | -| time_elapsed | 108663 | -| total_timesteps | 2572800 | -| train/ | | -| approx_kl | 0.013203685 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 200990 | -| policy_gradient_loss | -0.00163 | -| std | 0.00756 | -| value_loss | 2.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 20101 | -| time_elapsed | 108667 | -| total_timesteps | 2572928 | -| train/ | | -| approx_kl | 0.010200771 | -| clip_fraction | 0.0695 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 201000 | -| policy_gradient_loss | -0.00228 | -| std | 0.00755 | -| value_loss | 1.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20102 | -| time_elapsed | 108671 | -| total_timesteps | 2573056 | -| train/ | | -| approx_kl | 0.024843378 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 201010 | -| policy_gradient_loss | 0.0335 | -| std | 0.00755 | -| value_loss | 1.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20103 | -| time_elapsed | 108679 | -| total_timesteps | 2573184 | -| train/ | | -| approx_kl | 0.006149377 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 201020 | -| policy_gradient_loss | -0.0109 | -| std | 0.00755 | -| value_loss | 0.000473 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20104 | -| time_elapsed | 108683 | -| total_timesteps | 2573312 | -| train/ | | -| approx_kl | 0.004018801 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.849 | -| learning_rate | 0.0003 | -| loss | -0.00541 | -| n_updates | 201030 | -| policy_gradient_loss | 0.000559 | -| std | 0.00756 | -| value_loss | 8.95e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20105 | -| time_elapsed | 108688 | -| total_timesteps | 2573440 | -| train/ | | -| approx_kl | 0.023356117 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.099 | -| learning_rate | 0.0003 | -| loss | -0.00779 | -| n_updates | 201040 | -| policy_gradient_loss | 0.0235 | -| std | 0.00756 | -| value_loss | 1.05e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20106 | -| time_elapsed | 108694 | -| total_timesteps | 2573568 | -| train/ | | -| approx_kl | 0.61344683 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 201050 | -| policy_gradient_loss | 0.163 | -| std | 0.00755 | -| value_loss | 1.84e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20107 | -| time_elapsed | 108700 | -| total_timesteps | 2573696 | -| train/ | | -| approx_kl | 0.10513325 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0846 | -| learning_rate | 0.0003 | -| loss | 0.0487 | -| n_updates | 201060 | -| policy_gradient_loss | 0.039 | -| std | 0.00758 | -| value_loss | 6.08e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20108 | -| time_elapsed | 108706 | -| total_timesteps | 2573824 | -| train/ | | -| approx_kl | 0.0044116164 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.01 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 201070 | -| policy_gradient_loss | -0.00197 | -| std | 0.00759 | -| value_loss | 7.83e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.861 | -| time/ | | -| fps | 23 | -| iterations | 20109 | -| time_elapsed | 108710 | -| total_timesteps | 2573952 | -| train/ | | -| approx_kl | 0.021399662 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00735 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 201080 | -| policy_gradient_loss | 0.0155 | -| std | 0.0076 | -| value_loss | 4.98e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20110 | -| time_elapsed | 108715 | -| total_timesteps | 2574080 | -| train/ | | -| approx_kl | 0.60282236 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0821 | -| learning_rate | 0.0003 | -| loss | 0.446 | -| n_updates | 201090 | -| policy_gradient_loss | 0.205 | -| std | 0.0076 | -| value_loss | 3.06e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20111 | -| time_elapsed | 108724 | -| total_timesteps | 2574208 | -| train/ | | -| approx_kl | 0.0141943 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -3.03 | -| learning_rate | 0.0003 | -| loss | -0.0263 | -| n_updates | 201100 | -| policy_gradient_loss | -0.00606 | -| std | 0.0076 | -| value_loss | 0.00247 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20112 | -| time_elapsed | 108728 | -| total_timesteps | 2574336 | -| train/ | | -| approx_kl | 0.008339912 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0933 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 201110 | -| policy_gradient_loss | 0.00699 | -| std | 0.00761 | -| value_loss | 6.01e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20113 | -| time_elapsed | 108732 | -| total_timesteps | 2574464 | -| train/ | | -| approx_kl | 0.0013750992 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00525 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 201120 | -| policy_gradient_loss | -0.0118 | -| std | 0.00761 | -| value_loss | 1.94e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20114 | -| time_elapsed | 108737 | -| total_timesteps | 2574592 | -| train/ | | -| approx_kl | 0.042114392 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 201130 | -| policy_gradient_loss | 0.00621 | -| std | 0.00763 | -| value_loss | 0.000235 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20115 | -| time_elapsed | 108742 | -| total_timesteps | 2574720 | -| train/ | | -| approx_kl | 0.10338469 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 201140 | -| policy_gradient_loss | 0.0149 | -| std | 0.00763 | -| value_loss | 2.03e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20116 | -| time_elapsed | 108746 | -| total_timesteps | 2574848 | -| train/ | | -| approx_kl | 0.006390394 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 201150 | -| policy_gradient_loss | 0.00906 | -| std | 0.00764 | -| value_loss | 7.88e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.854 | -| time/ | | -| fps | 23 | -| iterations | 20117 | -| time_elapsed | 108751 | -| total_timesteps | 2574976 | -| train/ | | -| approx_kl | 0.17838094 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 201160 | -| policy_gradient_loss | 0.105 | -| std | 0.00764 | -| value_loss | 4.32e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20118 | -| time_elapsed | 108756 | -| total_timesteps | 2575104 | -| train/ | | -| approx_kl | 0.031951513 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.00718 | -| n_updates | 201170 | -| policy_gradient_loss | 0.0117 | -| std | 0.00764 | -| value_loss | 3.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20119 | -| time_elapsed | 108768 | -| total_timesteps | 2575232 | -| train/ | | -| approx_kl | 0.009336609 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 201180 | -| policy_gradient_loss | 0.00221 | -| std | 0.00764 | -| value_loss | 0.000359 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20120 | -| time_elapsed | 108774 | -| total_timesteps | 2575360 | -| train/ | | -| approx_kl | 0.0037870924 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 201190 | -| policy_gradient_loss | 0.00828 | -| std | 0.00764 | -| value_loss | 1.92e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20121 | -| time_elapsed | 108778 | -| total_timesteps | 2575488 | -| train/ | | -| approx_kl | 0.0011652652 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.00489 | -| n_updates | 201200 | -| policy_gradient_loss | 0.00299 | -| std | 0.00765 | -| value_loss | 4.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20122 | -| time_elapsed | 108784 | -| total_timesteps | 2575616 | -| train/ | | -| approx_kl | 0.039179478 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | 0.00995 | -| n_updates | 201210 | -| policy_gradient_loss | 0.00322 | -| std | 0.00765 | -| value_loss | 3.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20123 | -| time_elapsed | 108787 | -| total_timesteps | 2575744 | -| train/ | | -| approx_kl | 0.006152761 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 201220 | -| policy_gradient_loss | 0.00346 | -| std | 0.00765 | -| value_loss | 2.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 20124 | -| time_elapsed | 108792 | -| total_timesteps | 2575872 | -| train/ | | -| approx_kl | 0.05636686 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | 0.000325 | -| n_updates | 201230 | -| policy_gradient_loss | 0.0139 | -| std | 0.00765 | -| value_loss | 1.71e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20125 | -| time_elapsed | 108796 | -| total_timesteps | 2576000 | -| train/ | | -| approx_kl | 0.0768366 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 201240 | -| policy_gradient_loss | 0.0477 | -| std | 0.00765 | -| value_loss | 1.31e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20126 | -| time_elapsed | 108804 | -| total_timesteps | 2576128 | -| train/ | | -| approx_kl | 0.027843816 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00298 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 201250 | -| policy_gradient_loss | 0.0374 | -| std | 0.00765 | -| value_loss | 6.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20127 | -| time_elapsed | 108815 | -| total_timesteps | 2576256 | -| train/ | | -| approx_kl | 0.43203223 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.743 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 201260 | -| policy_gradient_loss | 0.0541 | -| std | 0.00765 | -| value_loss | 0.00569 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20128 | -| time_elapsed | 108819 | -| total_timesteps | 2576384 | -| train/ | | -| approx_kl | 0.02120525 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.317 | -| learning_rate | 0.0003 | -| loss | 0.00396 | -| n_updates | 201270 | -| policy_gradient_loss | 0.000121 | -| std | 0.00765 | -| value_loss | 7.78e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20129 | -| time_elapsed | 108824 | -| total_timesteps | 2576512 | -| train/ | | -| approx_kl | 0.01694266 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00773 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 201280 | -| policy_gradient_loss | 0.0257 | -| std | 0.00765 | -| value_loss | 4.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20130 | -| time_elapsed | 108828 | -| total_timesteps | 2576640 | -| train/ | | -| approx_kl | 0.090433426 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.0678 | -| n_updates | 201290 | -| policy_gradient_loss | 0.0333 | -| std | 0.00764 | -| value_loss | 4.02e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20131 | -| time_elapsed | 108832 | -| total_timesteps | 2576768 | -| train/ | | -| approx_kl | 0.4851044 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0902 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 201300 | -| policy_gradient_loss | 0.0341 | -| std | 0.00763 | -| value_loss | 2.37e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20132 | -| time_elapsed | 108837 | -| total_timesteps | 2576896 | -| train/ | | -| approx_kl | 0.029871482 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 201310 | -| policy_gradient_loss | 0.0102 | -| std | 0.00763 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20133 | -| time_elapsed | 108843 | -| total_timesteps | 2577024 | -| train/ | | -| approx_kl | 0.033548906 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0558 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 201320 | -| policy_gradient_loss | -0.00345 | -| std | 0.00763 | -| value_loss | 9.68e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20134 | -| time_elapsed | 108853 | -| total_timesteps | 2577152 | -| train/ | | -| approx_kl | 0.0027862992 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.738 | -| learning_rate | 0.0003 | -| loss | -0.0282 | -| n_updates | 201330 | -| policy_gradient_loss | -0.0174 | -| std | 0.00763 | -| value_loss | 0.00594 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20135 | -| time_elapsed | 108856 | -| total_timesteps | 2577280 | -| train/ | | -| approx_kl | 0.050062433 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 201340 | -| policy_gradient_loss | 0.00763 | -| std | 0.00763 | -| value_loss | 7.53e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20136 | -| time_elapsed | 108860 | -| total_timesteps | 2577408 | -| train/ | | -| approx_kl | 0.034827545 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00879 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 201350 | -| policy_gradient_loss | 0.0292 | -| std | 0.00763 | -| value_loss | 4.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20137 | -| time_elapsed | 108865 | -| total_timesteps | 2577536 | -| train/ | | -| approx_kl | 0.096475646 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | 0.0707 | -| n_updates | 201360 | -| policy_gradient_loss | 0.0534 | -| std | 0.00763 | -| value_loss | 2.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20138 | -| time_elapsed | 108870 | -| total_timesteps | 2577664 | -| train/ | | -| approx_kl | 0.026127849 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 201370 | -| policy_gradient_loss | 0.0292 | -| std | 0.00762 | -| value_loss | 2.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20139 | -| time_elapsed | 108874 | -| total_timesteps | 2577792 | -| train/ | | -| approx_kl | 0.74827945 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.308 | -| n_updates | 201380 | -| policy_gradient_loss | 0.169 | -| std | 0.00763 | -| value_loss | 1.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20140 | -| time_elapsed | 108878 | -| total_timesteps | 2577920 | -| train/ | | -| approx_kl | 0.026737383 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 201390 | -| policy_gradient_loss | -0.00595 | -| std | 0.00763 | -| value_loss | 9.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20141 | -| time_elapsed | 108882 | -| total_timesteps | 2578048 | -| train/ | | -| approx_kl | 0.013600623 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 201400 | -| policy_gradient_loss | -0.00366 | -| std | 0.00763 | -| value_loss | 6.81e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20142 | -| time_elapsed | 108892 | -| total_timesteps | 2578176 | -| train/ | | -| approx_kl | 0.06871903 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 201410 | -| policy_gradient_loss | 0.00112 | -| std | 0.00763 | -| value_loss | 0.000185 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20143 | -| time_elapsed | 108897 | -| total_timesteps | 2578304 | -| train/ | | -| approx_kl | 0.016420929 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00795 | -| learning_rate | 0.0003 | -| loss | 0.00652 | -| n_updates | 201420 | -| policy_gradient_loss | 0.0218 | -| std | 0.00763 | -| value_loss | 1.32e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20144 | -| time_elapsed | 108902 | -| total_timesteps | 2578432 | -| train/ | | -| approx_kl | 0.004126853 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.00689 | -| learning_rate | 0.0003 | -| loss | -0.000135 | -| n_updates | 201430 | -| policy_gradient_loss | 0.0206 | -| std | 0.00761 | -| value_loss | 5.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20145 | -| time_elapsed | 108908 | -| total_timesteps | 2578560 | -| train/ | | -| approx_kl | 0.032009825 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.000123 | -| n_updates | 201440 | -| policy_gradient_loss | 0.0305 | -| std | 0.0076 | -| value_loss | 9.41e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20146 | -| time_elapsed | 108913 | -| total_timesteps | 2578688 | -| train/ | | -| approx_kl | 0.0030492898 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.00134 | -| learning_rate | 0.0003 | -| loss | -0.00424 | -| n_updates | 201450 | -| policy_gradient_loss | 0.0811 | -| std | 0.00759 | -| value_loss | 3.9e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20147 | -| time_elapsed | 108917 | -| total_timesteps | 2578816 | -| train/ | | -| approx_kl | 0.027355658 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00852 | -| n_updates | 201460 | -| policy_gradient_loss | 0.0266 | -| std | 0.00759 | -| value_loss | 2.85e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20148 | -| time_elapsed | 108923 | -| total_timesteps | 2578944 | -| train/ | | -| approx_kl | 0.0005405876 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.00136 | -| n_updates | 201470 | -| policy_gradient_loss | 0.0248 | -| std | 0.00757 | -| value_loss | 4.75e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20149 | -| time_elapsed | 108927 | -| total_timesteps | 2579072 | -| train/ | | -| approx_kl | 0.44061276 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 201480 | -| policy_gradient_loss | 0.115 | -| std | 0.00756 | -| value_loss | 4.6e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20150 | -| time_elapsed | 108935 | -| total_timesteps | 2579200 | -| train/ | | -| approx_kl | 0.26405022 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.692 | -| learning_rate | 0.0003 | -| loss | 0.00234 | -| n_updates | 201490 | -| policy_gradient_loss | 0.0099 | -| std | 0.00756 | -| value_loss | 0.000742 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20151 | -| time_elapsed | 108940 | -| total_timesteps | 2579328 | -| train/ | | -| approx_kl | 0.18386196 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.65 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 201500 | -| policy_gradient_loss | 0.132 | -| std | 0.00756 | -| value_loss | 1.98e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20152 | -| time_elapsed | 108945 | -| total_timesteps | 2579456 | -| train/ | | -| approx_kl | 0.10994373 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.00167 | -| learning_rate | 0.0003 | -| loss | 0.0727 | -| n_updates | 201510 | -| policy_gradient_loss | 0.112 | -| std | 0.00756 | -| value_loss | 9.39e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20153 | -| time_elapsed | 108950 | -| total_timesteps | 2579584 | -| train/ | | -| approx_kl | 0.022369448 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | 0.00364 | -| n_updates | 201520 | -| policy_gradient_loss | 0.0166 | -| std | 0.00755 | -| value_loss | 6.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20154 | -| time_elapsed | 108955 | -| total_timesteps | 2579712 | -| train/ | | -| approx_kl | 0.46216634 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.00758 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 201530 | -| policy_gradient_loss | 0.0395 | -| std | 0.00755 | -| value_loss | 1.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20155 | -| time_elapsed | 108960 | -| total_timesteps | 2579840 | -| train/ | | -| approx_kl | 0.008503068 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 201540 | -| policy_gradient_loss | 0.00358 | -| std | 0.00755 | -| value_loss | 5.43e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20156 | -| time_elapsed | 108967 | -| total_timesteps | 2579968 | -| train/ | | -| approx_kl | 0.0006147651 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.00283 | -| n_updates | 201550 | -| policy_gradient_loss | 0.00393 | -| std | 0.00755 | -| value_loss | 3.41e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20157 | -| time_elapsed | 108972 | -| total_timesteps | 2580096 | -| train/ | | -| approx_kl | 6.295275e-06 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.000217 | -| n_updates | 201560 | -| policy_gradient_loss | 0.00325 | -| std | 0.00755 | -| value_loss | 2.1e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20158 | -| time_elapsed | 108982 | -| total_timesteps | 2580224 | -| train/ | | -| approx_kl | 0.0014412883 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.863 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 201570 | -| policy_gradient_loss | -0.00836 | -| std | 0.00755 | -| value_loss | 0.00185 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20159 | -| time_elapsed | 108987 | -| total_timesteps | 2580352 | -| train/ | | -| approx_kl | 0.39178884 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 201580 | -| policy_gradient_loss | 0.0371 | -| std | 0.00755 | -| value_loss | 0.000308 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20160 | -| time_elapsed | 108992 | -| total_timesteps | 2580480 | -| train/ | | -| approx_kl | 0.034594897 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.00729 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 201590 | -| policy_gradient_loss | 0.012 | -| std | 0.00755 | -| value_loss | 2.42e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20161 | -| time_elapsed | 108996 | -| total_timesteps | 2580608 | -| train/ | | -| approx_kl | 7.909397e-05 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | -0.00179 | -| n_updates | 201600 | -| policy_gradient_loss | -0.00263 | -| std | 0.00755 | -| value_loss | 1.46e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20162 | -| time_elapsed | 109001 | -| total_timesteps | 2580736 | -| train/ | | -| approx_kl | 0.03187881 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 201610 | -| policy_gradient_loss | 0.00864 | -| std | 0.00755 | -| value_loss | 8.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20163 | -| time_elapsed | 109005 | -| total_timesteps | 2580864 | -| train/ | | -| approx_kl | 0.006122127 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | -0.00434 | -| n_updates | 201620 | -| policy_gradient_loss | 0.00262 | -| std | 0.00755 | -| value_loss | 5.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20164 | -| time_elapsed | 109012 | -| total_timesteps | 2580992 | -| train/ | | -| approx_kl | 0.051706128 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | 0.029 | -| n_updates | 201630 | -| policy_gradient_loss | 0.00675 | -| std | 0.00756 | -| value_loss | 9.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20165 | -| time_elapsed | 109018 | -| total_timesteps | 2581120 | -| train/ | | -| approx_kl | 0.038407166 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 201640 | -| policy_gradient_loss | 0.0357 | -| std | 0.00757 | -| value_loss | 2.68e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20166 | -| time_elapsed | 109027 | -| total_timesteps | 2581248 | -| train/ | | -| approx_kl | 0.84944046 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 201650 | -| policy_gradient_loss | 0.0374 | -| std | 0.00757 | -| value_loss | 0.0025 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20167 | -| time_elapsed | 109031 | -| total_timesteps | 2581376 | -| train/ | | -| approx_kl | 0.00089169294 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | 0.000386 | -| n_updates | 201660 | -| policy_gradient_loss | 0.0114 | -| std | 0.00757 | -| value_loss | 1.89e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20168 | -| time_elapsed | 109036 | -| total_timesteps | 2581504 | -| train/ | | -| approx_kl | 0.017511236 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -5.19 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 201670 | -| policy_gradient_loss | -0.000784 | -| std | 0.00757 | -| value_loss | 7.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20169 | -| time_elapsed | 109039 | -| total_timesteps | 2581632 | -| train/ | | -| approx_kl | 0.075606965 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0638 | -| n_updates | 201680 | -| policy_gradient_loss | 0.11 | -| std | 0.00758 | -| value_loss | 1.26e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20170 | -| time_elapsed | 109045 | -| total_timesteps | 2581760 | -| train/ | | -| approx_kl | 0.06974015 | -| clip_fraction | 0.611 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.496 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 201690 | -| policy_gradient_loss | 0.0422 | -| std | 0.00758 | -| value_loss | 1.05e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20171 | -| time_elapsed | 109049 | -| total_timesteps | 2581888 | -| train/ | | -| approx_kl | 0.07568001 | -| clip_fraction | 0.606 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00909 | -| learning_rate | 0.0003 | -| loss | 0.0675 | -| n_updates | 201700 | -| policy_gradient_loss | 0.0651 | -| std | 0.00758 | -| value_loss | 2.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20172 | -| time_elapsed | 109053 | -| total_timesteps | 2582016 | -| train/ | | -| approx_kl | 0.022066748 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 201710 | -| policy_gradient_loss | 0.021 | -| std | 0.00758 | -| value_loss | 1.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20173 | -| time_elapsed | 109065 | -| total_timesteps | 2582144 | -| train/ | | -| approx_kl | 0.06518499 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 201720 | -| policy_gradient_loss | -0.0122 | -| std | 0.00759 | -| value_loss | 0.000382 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20174 | -| time_elapsed | 109069 | -| total_timesteps | 2582272 | -| train/ | | -| approx_kl | 0.060500827 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0499 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 201730 | -| policy_gradient_loss | 0.0232 | -| std | 0.00759 | -| value_loss | 6.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20175 | -| time_elapsed | 109072 | -| total_timesteps | 2582400 | -| train/ | | -| approx_kl | 0.09802581 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.0628 | -| n_updates | 201740 | -| policy_gradient_loss | 0.0275 | -| std | 0.00758 | -| value_loss | 1.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20176 | -| time_elapsed | 109076 | -| total_timesteps | 2582528 | -| train/ | | -| approx_kl | 0.008522317 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.00743 | -| n_updates | 201750 | -| policy_gradient_loss | 0.00854 | -| std | 0.00759 | -| value_loss | 8.6e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20177 | -| time_elapsed | 109080 | -| total_timesteps | 2582656 | -| train/ | | -| approx_kl | 0.18418646 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0632 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 201760 | -| policy_gradient_loss | 0.0961 | -| std | 0.00759 | -| value_loss | 4.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20178 | -| time_elapsed | 109084 | -| total_timesteps | 2582784 | -| train/ | | -| approx_kl | 0.022775404 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.0094 | -| n_updates | 201770 | -| policy_gradient_loss | 0.0123 | -| std | 0.00759 | -| value_loss | 5.17e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20179 | -| time_elapsed | 109088 | -| total_timesteps | 2582912 | -| train/ | | -| approx_kl | 0.00056682667 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.000345 | -| n_updates | 201780 | -| policy_gradient_loss | 0.027 | -| std | 0.00758 | -| value_loss | 2.23e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20180 | -| time_elapsed | 109093 | -| total_timesteps | 2583040 | -| train/ | | -| approx_kl | 0.41086176 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 201790 | -| policy_gradient_loss | 0.0511 | -| std | 0.00758 | -| value_loss | 1.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20181 | -| time_elapsed | 109102 | -| total_timesteps | 2583168 | -| train/ | | -| approx_kl | 0.010304958 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 201800 | -| policy_gradient_loss | -0.00902 | -| std | 0.00757 | -| value_loss | 0.0026 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20182 | -| time_elapsed | 109105 | -| total_timesteps | 2583296 | -| train/ | | -| approx_kl | 0.0002929829 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | 0.000117 | -| n_updates | 201810 | -| policy_gradient_loss | 0.0198 | -| std | 0.00756 | -| value_loss | 4.42e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20183 | -| time_elapsed | 109109 | -| total_timesteps | 2583424 | -| train/ | | -| approx_kl | 0.060018063 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.31 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 201820 | -| policy_gradient_loss | 0.0166 | -| std | 0.00756 | -| value_loss | 3.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20184 | -| time_elapsed | 109113 | -| total_timesteps | 2583552 | -| train/ | | -| approx_kl | 0.025284545 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 201830 | -| policy_gradient_loss | 0.0219 | -| std | 0.00756 | -| value_loss | 1.74e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20185 | -| time_elapsed | 109117 | -| total_timesteps | 2583680 | -| train/ | | -| approx_kl | 0.002593283 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 201840 | -| policy_gradient_loss | 0.0234 | -| std | 0.00756 | -| value_loss | 8.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20186 | -| time_elapsed | 109122 | -| total_timesteps | 2583808 | -| train/ | | -| approx_kl | 0.053724468 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 201850 | -| policy_gradient_loss | 0.022 | -| std | 0.00756 | -| value_loss | 6.36e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20187 | -| time_elapsed | 109125 | -| total_timesteps | 2583936 | -| train/ | | -| approx_kl | 0.2827842 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 201860 | -| policy_gradient_loss | 0.124 | -| std | 0.00756 | -| value_loss | 5.22e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20188 | -| time_elapsed | 109129 | -| total_timesteps | 2584064 | -| train/ | | -| approx_kl | 0.041094575 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 201870 | -| policy_gradient_loss | 0.0173 | -| std | 0.00756 | -| value_loss | 3.31e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20189 | -| time_elapsed | 109137 | -| total_timesteps | 2584192 | -| train/ | | -| approx_kl | 0.4330905 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 201880 | -| policy_gradient_loss | 0.0479 | -| std | 0.00756 | -| value_loss | 9.81e-05 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20190 | -| time_elapsed | 109142 | -| total_timesteps | 2584320 | -| train/ | | -| approx_kl | 8.1479084e-05 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.00068 | -| n_updates | 201890 | -| policy_gradient_loss | 0.00325 | -| std | 0.00756 | -| value_loss | 9.23e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20191 | -| time_elapsed | 109147 | -| total_timesteps | 2584448 | -| train/ | | -| approx_kl | 0.057122447 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 201900 | -| policy_gradient_loss | 0.0444 | -| std | 0.00758 | -| value_loss | 2.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20192 | -| time_elapsed | 109152 | -| total_timesteps | 2584576 | -| train/ | | -| approx_kl | 0.0003014831 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | -0.000285 | -| n_updates | 201910 | -| policy_gradient_loss | 0.0116 | -| std | 0.00759 | -| value_loss | 1.11e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20193 | -| time_elapsed | 109158 | -| total_timesteps | 2584704 | -| train/ | | -| approx_kl | 0.009651129 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.00551 | -| n_updates | 201920 | -| policy_gradient_loss | 0.00792 | -| std | 0.00759 | -| value_loss | 2.81e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20194 | -| time_elapsed | 109162 | -| total_timesteps | 2584832 | -| train/ | | -| approx_kl | 0.0016308292 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 201930 | -| policy_gradient_loss | 0.0053 | -| std | 0.00759 | -| value_loss | 9.23e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20195 | -| time_elapsed | 109167 | -| total_timesteps | 2584960 | -| train/ | | -| approx_kl | 0.031043714 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0373 | -| n_updates | 201940 | -| policy_gradient_loss | 0.0815 | -| std | 0.00759 | -| value_loss | 6.25e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20196 | -| time_elapsed | 109172 | -| total_timesteps | 2585088 | -| train/ | | -| approx_kl | 0.007862145 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 201950 | -| policy_gradient_loss | 0.0179 | -| std | 0.00759 | -| value_loss | 4.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20197 | -| time_elapsed | 109182 | -| total_timesteps | 2585216 | -| train/ | | -| approx_kl | 0.023114406 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -4.91 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 201960 | -| policy_gradient_loss | -0.00989 | -| std | 0.00759 | -| value_loss | 0.00313 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20198 | -| time_elapsed | 109186 | -| total_timesteps | 2585344 | -| train/ | | -| approx_kl | 0.0002753595 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.343 | -| learning_rate | 0.0003 | -| loss | -0.000244 | -| n_updates | 201970 | -| policy_gradient_loss | 0.00964 | -| std | 0.00759 | -| value_loss | 1.36e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20199 | -| time_elapsed | 109190 | -| total_timesteps | 2585472 | -| train/ | | -| approx_kl | 0.060300693 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.152 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 201980 | -| policy_gradient_loss | 0.0876 | -| std | 0.00759 | -| value_loss | 4.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20200 | -| time_elapsed | 109194 | -| total_timesteps | 2585600 | -| train/ | | -| approx_kl | 0.016425602 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 201990 | -| policy_gradient_loss | 0.00966 | -| std | 0.00759 | -| value_loss | 3.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20201 | -| time_elapsed | 109198 | -| total_timesteps | 2585728 | -| train/ | | -| approx_kl | 0.006986422 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 202000 | -| policy_gradient_loss | -0.00457 | -| std | 0.00761 | -| value_loss | 7.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20202 | -| time_elapsed | 109204 | -| total_timesteps | 2585856 | -| train/ | | -| approx_kl | 0.028712947 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.679 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 202010 | -| policy_gradient_loss | 0.0244 | -| std | 0.00762 | -| value_loss | 1.39e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20203 | -| time_elapsed | 109210 | -| total_timesteps | 2585984 | -| train/ | | -| approx_kl | 0.0007629045 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -2.64 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 202020 | -| policy_gradient_loss | 0.0451 | -| std | 0.00762 | -| value_loss | 9.51e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20204 | -| time_elapsed | 109215 | -| total_timesteps | 2586112 | -| train/ | | -| approx_kl | 0.022289524 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00911 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 202030 | -| policy_gradient_loss | 0.0205 | -| std | 0.00762 | -| value_loss | 6.75e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20205 | -| time_elapsed | 109227 | -| total_timesteps | 2586240 | -| train/ | | -| approx_kl | 0.045077153 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 202040 | -| policy_gradient_loss | 0.00755 | -| std | 0.00762 | -| value_loss | 0.00568 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20206 | -| time_elapsed | 109232 | -| total_timesteps | 2586368 | -| train/ | | -| approx_kl | 0.028432155 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 202050 | -| policy_gradient_loss | 0.0178 | -| std | 0.00762 | -| value_loss | 9.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20207 | -| time_elapsed | 109236 | -| total_timesteps | 2586496 | -| train/ | | -| approx_kl | 0.070852235 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 202060 | -| policy_gradient_loss | 0.0408 | -| std | 0.00762 | -| value_loss | 2.22e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20208 | -| time_elapsed | 109241 | -| total_timesteps | 2586624 | -| train/ | | -| approx_kl | 0.00065146666 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 202070 | -| policy_gradient_loss | 0.0887 | -| std | 0.00762 | -| value_loss | 1.91e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20209 | -| time_elapsed | 109247 | -| total_timesteps | 2586752 | -| train/ | | -| approx_kl | 0.10175798 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0918 | -| n_updates | 202080 | -| policy_gradient_loss | 0.168 | -| std | 0.00762 | -| value_loss | 1.41e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 20210 | -| time_elapsed | 109251 | -| total_timesteps | 2586880 | -| train/ | | -| approx_kl | 0.0077871876 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.0025 | -| n_updates | 202090 | -| policy_gradient_loss | 0.0149 | -| std | 0.00762 | -| value_loss | 2.54e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20211 | -| time_elapsed | 109257 | -| total_timesteps | 2587008 | -| train/ | | -| approx_kl | 0.0023089428 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | -0.0098 | -| n_updates | 202100 | -| policy_gradient_loss | 0.0107 | -| std | 0.00762 | -| value_loss | 2.97e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20212 | -| time_elapsed | 109267 | -| total_timesteps | 2587136 | -| train/ | | -| approx_kl | 0.04950585 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.00137 | -| n_updates | 202110 | -| policy_gradient_loss | 0.00564 | -| std | 0.00762 | -| value_loss | 6.93e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20213 | -| time_elapsed | 109271 | -| total_timesteps | 2587264 | -| train/ | | -| approx_kl | 0.19806914 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.649 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 202120 | -| policy_gradient_loss | 0.0642 | -| std | 0.00762 | -| value_loss | 2.74e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20214 | -| time_elapsed | 109277 | -| total_timesteps | 2587392 | -| train/ | | -| approx_kl | 0.1427559 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0944 | -| n_updates | 202130 | -| policy_gradient_loss | 0.107 | -| std | 0.00762 | -| value_loss | 2.24e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20215 | -| time_elapsed | 109280 | -| total_timesteps | 2587520 | -| train/ | | -| approx_kl | 0.025380664 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 202140 | -| policy_gradient_loss | 0.0185 | -| std | 0.00763 | -| value_loss | 1.77e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20216 | -| time_elapsed | 109284 | -| total_timesteps | 2587648 | -| train/ | | -| approx_kl | 0.5371774 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.241 | -| n_updates | 202150 | -| policy_gradient_loss | 0.0603 | -| std | 0.00762 | -| value_loss | 9.85e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20217 | -| time_elapsed | 109289 | -| total_timesteps | 2587776 | -| train/ | | -| approx_kl | 0.008073422 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 202160 | -| policy_gradient_loss | 0.00504 | -| std | 0.00762 | -| value_loss | 6.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 20218 | -| time_elapsed | 109294 | -| total_timesteps | 2587904 | -| train/ | | -| approx_kl | 0.049502477 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 202170 | -| policy_gradient_loss | 0.0233 | -| std | 0.00764 | -| value_loss | 3.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20219 | -| time_elapsed | 109299 | -| total_timesteps | 2588032 | -| train/ | | -| approx_kl | 0.61545205 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -4.12 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 202180 | -| policy_gradient_loss | 0.112 | -| std | 0.00765 | -| value_loss | 5.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20220 | -| time_elapsed | 109308 | -| total_timesteps | 2588160 | -| train/ | | -| approx_kl | 0.18233931 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.823 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 202190 | -| policy_gradient_loss | 0.000537 | -| std | 0.00766 | -| value_loss | 0.00336 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20221 | -| time_elapsed | 109313 | -| total_timesteps | 2588288 | -| train/ | | -| approx_kl | 0.050642103 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | 0.0051 | -| n_updates | 202200 | -| policy_gradient_loss | 0.0137 | -| std | 0.00766 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20222 | -| time_elapsed | 109318 | -| total_timesteps | 2588416 | -| train/ | | -| approx_kl | 0.24087541 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00808 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 202210 | -| policy_gradient_loss | 0.12 | -| std | 0.00766 | -| value_loss | 2.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20223 | -| time_elapsed | 109324 | -| total_timesteps | 2588544 | -| train/ | | -| approx_kl | 0.13868831 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | 0.0879 | -| n_updates | 202220 | -| policy_gradient_loss | 0.126 | -| std | 0.00766 | -| value_loss | 9.93e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20224 | -| time_elapsed | 109329 | -| total_timesteps | 2588672 | -| train/ | | -| approx_kl | 0.10993348 | -| clip_fraction | 0.661 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 202230 | -| policy_gradient_loss | 0.0842 | -| std | 0.00766 | -| value_loss | 8.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20225 | -| time_elapsed | 109333 | -| total_timesteps | 2588800 | -| train/ | | -| approx_kl | 0.089867845 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0903 | -| n_updates | 202240 | -| policy_gradient_loss | 0.0795 | -| std | 0.00766 | -| value_loss | 6.42e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20226 | -| time_elapsed | 109337 | -| total_timesteps | 2588928 | -| train/ | | -| approx_kl | 0.1034299 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0777 | -| n_updates | 202250 | -| policy_gradient_loss | 0.126 | -| std | 0.00766 | -| value_loss | 2.19e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20227 | -| time_elapsed | 109342 | -| total_timesteps | 2589056 | -| train/ | | -| approx_kl | 0.091511145 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.484 | -| learning_rate | 0.0003 | -| loss | 0.0593 | -| n_updates | 202260 | -| policy_gradient_loss | 0.0917 | -| std | 0.00765 | -| value_loss | 2.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20228 | -| time_elapsed | 109350 | -| total_timesteps | 2589184 | -| train/ | | -| approx_kl | 0.020592516 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 202270 | -| policy_gradient_loss | -0.00926 | -| std | 0.00765 | -| value_loss | 0.0039 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20229 | -| time_elapsed | 109355 | -| total_timesteps | 2589312 | -| train/ | | -| approx_kl | 0.008415951 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 202280 | -| policy_gradient_loss | 0.0263 | -| std | 0.00765 | -| value_loss | 5.73e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20230 | -| time_elapsed | 109359 | -| total_timesteps | 2589440 | -| train/ | | -| approx_kl | 0.13200268 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00975 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 202290 | -| policy_gradient_loss | 0.0392 | -| std | 0.00765 | -| value_loss | 5.47e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20231 | -| time_elapsed | 109364 | -| total_timesteps | 2589568 | -| train/ | | -| approx_kl | 0.03466201 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 202300 | -| policy_gradient_loss | 0.0359 | -| std | 0.00765 | -| value_loss | 7.15e-06 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20232 | -| time_elapsed | 109369 | -| total_timesteps | 2589696 | -| train/ | | -| approx_kl | 0.089543 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.0799 | -| n_updates | 202310 | -| policy_gradient_loss | 0.0436 | -| std | 0.00766 | -| value_loss | 1.74e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20233 | -| time_elapsed | 109375 | -| total_timesteps | 2589824 | -| train/ | | -| approx_kl | 0.022870516 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.00747 | -| n_updates | 202320 | -| policy_gradient_loss | 0.0252 | -| std | 0.00766 | -| value_loss | 1.04e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 20234 | -| time_elapsed | 109380 | -| total_timesteps | 2589952 | -| train/ | | -| approx_kl | 0.657347 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.247 | -| n_updates | 202330 | -| policy_gradient_loss | 0.134 | -| std | 0.00766 | -| value_loss | 7.44e-07 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20235 | -| time_elapsed | 109385 | -| total_timesteps | 2590080 | -| train/ | | -| approx_kl | 0.0055402745 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 202340 | -| policy_gradient_loss | 0.019 | -| std | 0.00766 | -| value_loss | 5.77e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20236 | -| time_elapsed | 109393 | -| total_timesteps | 2590208 | -| train/ | | -| approx_kl | 0.21139659 | -| clip_fraction | 0.66 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.948 | -| learning_rate | 0.0003 | -| loss | 0.0818 | -| n_updates | 202350 | -| policy_gradient_loss | 0.0644 | -| std | 0.00765 | -| value_loss | 0.000576 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20237 | -| time_elapsed | 109397 | -| total_timesteps | 2590336 | -| train/ | | -| approx_kl | 0.16396871 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.000704 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 202360 | -| policy_gradient_loss | 0.114 | -| std | 0.00765 | -| value_loss | 4.43e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20238 | -| time_elapsed | 109403 | -| total_timesteps | 2590464 | -| train/ | | -| approx_kl | 0.027009428 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.00363 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 202370 | -| policy_gradient_loss | 0.0123 | -| std | 0.00765 | -| value_loss | 1.68e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20239 | -| time_elapsed | 109409 | -| total_timesteps | 2590592 | -| train/ | | -| approx_kl | 0.0010508699 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | -0.000485 | -| n_updates | 202380 | -| policy_gradient_loss | 0.0245 | -| std | 0.00768 | -| value_loss | 6.5e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20240 | -| time_elapsed | 109414 | -| total_timesteps | 2590720 | -| train/ | | -| approx_kl | 0.45060802 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -42.3 | -| learning_rate | 0.0003 | -| loss | 0.265 | -| n_updates | 202390 | -| policy_gradient_loss | 0.0743 | -| std | 0.00769 | -| value_loss | 0.000113 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20241 | -| time_elapsed | 109420 | -| total_timesteps | 2590848 | -| train/ | | -| approx_kl | 0.013426825 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.00483 | -| n_updates | 202400 | -| policy_gradient_loss | 0.00156 | -| std | 0.00773 | -| value_loss | 7.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20242 | -| time_elapsed | 109424 | -| total_timesteps | 2590976 | -| train/ | | -| approx_kl | 0.011076331 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | -0.00202 | -| n_updates | 202410 | -| policy_gradient_loss | -0.00161 | -| std | 0.00775 | -| value_loss | 1.77e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20243 | -| time_elapsed | 109429 | -| total_timesteps | 2591104 | -| train/ | | -| approx_kl | 0.009174363 | -| clip_fraction | 0.0617 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00205 | -| n_updates | 202420 | -| policy_gradient_loss | -0.0011 | -| std | 0.00776 | -| value_loss | 1.82e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20244 | -| time_elapsed | 109442 | -| total_timesteps | 2591232 | -| train/ | | -| approx_kl | 0.08506404 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.601 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 202430 | -| policy_gradient_loss | -0.0136 | -| std | 0.00777 | -| value_loss | 0.00102 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20245 | -| time_elapsed | 109447 | -| total_timesteps | 2591360 | -| train/ | | -| approx_kl | 0.10032076 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.776 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 202440 | -| policy_gradient_loss | 0.0371 | -| std | 0.00776 | -| value_loss | 4.73e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20246 | -| time_elapsed | 109451 | -| total_timesteps | 2591488 | -| train/ | | -| approx_kl | 0.00016255071 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.000104 | -| n_updates | 202450 | -| policy_gradient_loss | 0.0174 | -| std | 0.00775 | -| value_loss | 2.76e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20247 | -| time_elapsed | 109457 | -| total_timesteps | 2591616 | -| train/ | | -| approx_kl | 0.00791227 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 202460 | -| policy_gradient_loss | 0.0132 | -| std | 0.00775 | -| value_loss | 2.13e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20248 | -| time_elapsed | 109462 | -| total_timesteps | 2591744 | -| train/ | | -| approx_kl | 0.012295729 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.00349 | -| n_updates | 202470 | -| policy_gradient_loss | 0.023 | -| std | 0.00774 | -| value_loss | 1.44e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20249 | -| time_elapsed | 109468 | -| total_timesteps | 2591872 | -| train/ | | -| approx_kl | 0.07047824 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 202480 | -| policy_gradient_loss | 0.0127 | -| std | 0.00774 | -| value_loss | 6.21e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20250 | -| time_elapsed | 109473 | -| total_timesteps | 2592000 | -| train/ | | -| approx_kl | 0.11364047 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0772 | -| learning_rate | 0.0003 | -| loss | 0.0487 | -| n_updates | 202490 | -| policy_gradient_loss | 0.014 | -| std | 0.00776 | -| value_loss | 3.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20251 | -| time_elapsed | 109476 | -| total_timesteps | 2592128 | -| train/ | | -| approx_kl | 0.018613609 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 202500 | -| policy_gradient_loss | 0.0159 | -| std | 0.00777 | -| value_loss | 1.82e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20252 | -| time_elapsed | 109487 | -| total_timesteps | 2592256 | -| train/ | | -| approx_kl | 0.00035727723 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | -0.00529 | -| n_updates | 202510 | -| policy_gradient_loss | 0.0045 | -| std | 0.00777 | -| value_loss | 0.00312 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20253 | -| time_elapsed | 109493 | -| total_timesteps | 2592384 | -| train/ | | -| approx_kl | 0.0006825919 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.00666 | -| n_updates | 202520 | -| policy_gradient_loss | 0.0148 | -| std | 0.00777 | -| value_loss | 1.07e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20254 | -| time_elapsed | 109497 | -| total_timesteps | 2592512 | -| train/ | | -| approx_kl | 0.00071644457 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 202530 | -| policy_gradient_loss | 0.022 | -| std | 0.00777 | -| value_loss | 2.48e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20255 | -| time_elapsed | 109502 | -| total_timesteps | 2592640 | -| train/ | | -| approx_kl | 0.15601401 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0717 | -| learning_rate | 0.0003 | -| loss | 0.078 | -| n_updates | 202540 | -| policy_gradient_loss | 0.0173 | -| std | 0.00777 | -| value_loss | 2.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20256 | -| time_elapsed | 109507 | -| total_timesteps | 2592768 | -| train/ | | -| approx_kl | 0.018460784 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 202550 | -| policy_gradient_loss | -0.00549 | -| std | 0.00777 | -| value_loss | 9.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20257 | -| time_elapsed | 109513 | -| total_timesteps | 2592896 | -| train/ | | -| approx_kl | 0.014530576 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.00426 | -| n_updates | 202560 | -| policy_gradient_loss | 0.0187 | -| std | 0.00777 | -| value_loss | 5.74e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20258 | -| time_elapsed | 109516 | -| total_timesteps | 2593024 | -| train/ | | -| approx_kl | 0.07372062 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.082 | -| learning_rate | 0.0003 | -| loss | 0.0296 | -| n_updates | 202570 | -| policy_gradient_loss | 0.0166 | -| std | 0.00777 | -| value_loss | 3.55e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20259 | -| time_elapsed | 109529 | -| total_timesteps | 2593152 | -| train/ | | -| approx_kl | 0.0044396673 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.117 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 202580 | -| policy_gradient_loss | -0.0118 | -| std | 0.00777 | -| value_loss | 0.00163 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20260 | -| time_elapsed | 109534 | -| total_timesteps | 2593280 | -| train/ | | -| approx_kl | 0.044510074 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 202590 | -| policy_gradient_loss | 0.0362 | -| std | 0.00777 | -| value_loss | 0.000322 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20261 | -| time_elapsed | 109539 | -| total_timesteps | 2593408 | -| train/ | | -| approx_kl | 0.17991787 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 0.0834 | -| n_updates | 202600 | -| policy_gradient_loss | 0.0388 | -| std | 0.00777 | -| value_loss | 1.25e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20262 | -| time_elapsed | 109543 | -| total_timesteps | 2593536 | -| train/ | | -| approx_kl | 0.03794002 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 202610 | -| policy_gradient_loss | 0.0704 | -| std | 0.00777 | -| value_loss | 4.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20263 | -| time_elapsed | 109547 | -| total_timesteps | 2593664 | -| train/ | | -| approx_kl | 0.20258008 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 202620 | -| policy_gradient_loss | 0.0282 | -| std | 0.00777 | -| value_loss | 3.92e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20264 | -| time_elapsed | 109552 | -| total_timesteps | 2593792 | -| train/ | | -| approx_kl | 0.00062739523 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | -0.004 | -| n_updates | 202630 | -| policy_gradient_loss | 0.00131 | -| std | 0.00777 | -| value_loss | 2.67e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20265 | -| time_elapsed | 109557 | -| total_timesteps | 2593920 | -| train/ | | -| approx_kl | 0.062158734 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 202640 | -| policy_gradient_loss | 0.0542 | -| std | 0.00777 | -| value_loss | 2.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20266 | -| time_elapsed | 109563 | -| total_timesteps | 2594048 | -| train/ | | -| approx_kl | 0.17420565 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.0598 | -| n_updates | 202650 | -| policy_gradient_loss | 0.0271 | -| std | 0.00777 | -| value_loss | 1.59e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20267 | -| time_elapsed | 109573 | -| total_timesteps | 2594176 | -| train/ | | -| approx_kl | 0.04928583 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 202660 | -| policy_gradient_loss | -0.00564 | -| std | 0.00776 | -| value_loss | 0.000101 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20268 | -| time_elapsed | 109578 | -| total_timesteps | 2594304 | -| train/ | | -| approx_kl | 0.1729994 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00895 | -| learning_rate | 0.0003 | -| loss | 0.0962 | -| n_updates | 202670 | -| policy_gradient_loss | 0.0353 | -| std | 0.00776 | -| value_loss | 6.69e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20269 | -| time_elapsed | 109583 | -| total_timesteps | 2594432 | -| train/ | | -| approx_kl | 0.03801069 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 202680 | -| policy_gradient_loss | 0.0522 | -| std | 0.00776 | -| value_loss | 5.33e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20270 | -| time_elapsed | 109587 | -| total_timesteps | 2594560 | -| train/ | | -| approx_kl | 0.15849128 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 202690 | -| policy_gradient_loss | 0.0263 | -| std | 0.00776 | -| value_loss | 4.3e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20271 | -| time_elapsed | 109593 | -| total_timesteps | 2594688 | -| train/ | | -| approx_kl | 0.048782382 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 202700 | -| policy_gradient_loss | 0.0602 | -| std | 0.00776 | -| value_loss | 2.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20272 | -| time_elapsed | 109597 | -| total_timesteps | 2594816 | -| train/ | | -| approx_kl | 0.030732311 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 202710 | -| policy_gradient_loss | 0.0206 | -| std | 0.00776 | -| value_loss | 2.67e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20273 | -| time_elapsed | 109602 | -| total_timesteps | 2594944 | -| train/ | | -| approx_kl | 0.13783771 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0821 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 202720 | -| policy_gradient_loss | 0.0275 | -| std | 0.00775 | -| value_loss | 8.39e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20274 | -| time_elapsed | 109606 | -| total_timesteps | 2595072 | -| train/ | | -| approx_kl | 0.03820867 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -3.07 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 202730 | -| policy_gradient_loss | 0.0434 | -| std | 0.00774 | -| value_loss | 6.54e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20275 | -| time_elapsed | 109615 | -| total_timesteps | 2595200 | -| train/ | | -| approx_kl | 0.092230186 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.818 | -| learning_rate | 0.0003 | -| loss | 0.00711 | -| n_updates | 202740 | -| policy_gradient_loss | 0.00695 | -| std | 0.00774 | -| value_loss | 0.00325 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20276 | -| time_elapsed | 109619 | -| total_timesteps | 2595328 | -| train/ | | -| approx_kl | 0.009256009 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | -0.00787 | -| n_updates | 202750 | -| policy_gradient_loss | 0.00752 | -| std | 0.00774 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20277 | -| time_elapsed | 109624 | -| total_timesteps | 2595456 | -| train/ | | -| approx_kl | 0.011417802 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00953 | -| learning_rate | 0.0003 | -| loss | -0.00693 | -| n_updates | 202760 | -| policy_gradient_loss | 0.0703 | -| std | 0.00774 | -| value_loss | 1.21e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20278 | -| time_elapsed | 109629 | -| total_timesteps | 2595584 | -| train/ | | -| approx_kl | 0.00863602 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 202770 | -| policy_gradient_loss | 0.00259 | -| std | 0.00774 | -| value_loss | 2.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20279 | -| time_elapsed | 109633 | -| total_timesteps | 2595712 | -| train/ | | -| approx_kl | 0.053479515 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00456 | -| n_updates | 202780 | -| policy_gradient_loss | 0.0128 | -| std | 0.00774 | -| value_loss | 2.13e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20280 | -| time_elapsed | 109637 | -| total_timesteps | 2595840 | -| train/ | | -| approx_kl | 0.0010615601 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 202790 | -| policy_gradient_loss | 0.0195 | -| std | 0.00774 | -| value_loss | 1.25e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20281 | -| time_elapsed | 109641 | -| total_timesteps | 2595968 | -| train/ | | -| approx_kl | 0.06170257 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 202800 | -| policy_gradient_loss | 0.0327 | -| std | 0.00775 | -| value_loss | 8.52e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20282 | -| time_elapsed | 109647 | -| total_timesteps | 2596096 | -| train/ | | -| approx_kl | 0.08676839 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 202810 | -| policy_gradient_loss | 0.0286 | -| std | 0.00775 | -| value_loss | 5.55e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20283 | -| time_elapsed | 109660 | -| total_timesteps | 2596224 | -| train/ | | -| approx_kl | 0.40414062 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | 0.0584 | -| n_updates | 202820 | -| policy_gradient_loss | 0.0184 | -| std | 0.00775 | -| value_loss | 0.00804 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20284 | -| time_elapsed | 109665 | -| total_timesteps | 2596352 | -| train/ | | -| approx_kl | 0.0064219604 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -4.27e-05 | -| n_updates | 202830 | -| policy_gradient_loss | 0.00217 | -| std | 0.00775 | -| value_loss | 3.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20285 | -| time_elapsed | 109669 | -| total_timesteps | 2596480 | -| train/ | | -| approx_kl | 0.056805376 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 202840 | -| policy_gradient_loss | 0.0305 | -| std | 0.00775 | -| value_loss | 8.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20286 | -| time_elapsed | 109674 | -| total_timesteps | 2596608 | -| train/ | | -| approx_kl | 0.07761742 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0614 | -| n_updates | 202850 | -| policy_gradient_loss | 0.044 | -| std | 0.00775 | -| value_loss | 3.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20287 | -| time_elapsed | 109678 | -| total_timesteps | 2596736 | -| train/ | | -| approx_kl | 0.003197275 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0746 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 202860 | -| policy_gradient_loss | -0.00192 | -| std | 0.00775 | -| value_loss | 2.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20288 | -| time_elapsed | 109683 | -| total_timesteps | 2596864 | -| train/ | | -| approx_kl | 0.01870713 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.000394 | -| n_updates | 202870 | -| policy_gradient_loss | 0.0291 | -| std | 0.00775 | -| value_loss | 1.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20289 | -| time_elapsed | 109689 | -| total_timesteps | 2596992 | -| train/ | | -| approx_kl | 0.11399109 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0892 | -| n_updates | 202880 | -| policy_gradient_loss | 0.0545 | -| std | 0.00774 | -| value_loss | 7.67e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20290 | -| time_elapsed | 109693 | -| total_timesteps | 2597120 | -| train/ | | -| approx_kl | 0.13767341 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.0912 | -| n_updates | 202890 | -| policy_gradient_loss | 0.0247 | -| std | 0.00774 | -| value_loss | 4.85e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20291 | -| time_elapsed | 109706 | -| total_timesteps | 2597248 | -| train/ | | -| approx_kl | 0.4617172 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 202900 | -| policy_gradient_loss | 0.00676 | -| std | 0.00774 | -| value_loss | 0.00418 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20292 | -| time_elapsed | 109712 | -| total_timesteps | 2597376 | -| train/ | | -| approx_kl | 0.016533371 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 202910 | -| policy_gradient_loss | 0.00423 | -| std | 0.00774 | -| value_loss | 1.18e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20293 | -| time_elapsed | 109717 | -| total_timesteps | 2597504 | -| train/ | | -| approx_kl | 0.045380928 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 202920 | -| policy_gradient_loss | -0.00698 | -| std | 0.00773 | -| value_loss | 1.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20294 | -| time_elapsed | 109722 | -| total_timesteps | 2597632 | -| train/ | | -| approx_kl | 0.007306891 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 202930 | -| policy_gradient_loss | 0.0042 | -| std | 0.00773 | -| value_loss | 1.21e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20295 | -| time_elapsed | 109725 | -| total_timesteps | 2597760 | -| train/ | | -| approx_kl | 0.00061471574 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.092 | -| learning_rate | 0.0003 | -| loss | 0.00714 | -| n_updates | 202940 | -| policy_gradient_loss | -0.0036 | -| std | 0.00773 | -| value_loss | 6.85e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 20296 | -| time_elapsed | 109728 | -| total_timesteps | 2597888 | -| train/ | | -| approx_kl | 0.005020233 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | -0.00147 | -| n_updates | 202950 | -| policy_gradient_loss | 0.00462 | -| std | 0.00774 | -| value_loss | 3.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20297 | -| time_elapsed | 109733 | -| total_timesteps | 2598016 | -| train/ | | -| approx_kl | 0.05931288 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 202960 | -| policy_gradient_loss | 0.00498 | -| std | 0.00774 | -| value_loss | 2.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20298 | -| time_elapsed | 109746 | -| total_timesteps | 2598144 | -| train/ | | -| approx_kl | 0.032534294 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 202970 | -| policy_gradient_loss | -0.00479 | -| std | 0.00774 | -| value_loss | 0.0044 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20299 | -| time_elapsed | 109751 | -| total_timesteps | 2598272 | -| train/ | | -| approx_kl | 0.69728416 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.321 | -| learning_rate | 0.0003 | -| loss | 0.349 | -| n_updates | 202980 | -| policy_gradient_loss | 0.151 | -| std | 0.00774 | -| value_loss | 1.92e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20300 | -| time_elapsed | 109755 | -| total_timesteps | 2598400 | -| train/ | | -| approx_kl | 0.0059191748 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.00931 | -| learning_rate | 0.0003 | -| loss | -0.00391 | -| n_updates | 202990 | -| policy_gradient_loss | 0.0189 | -| std | 0.00774 | -| value_loss | 4.92e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20301 | -| time_elapsed | 109759 | -| total_timesteps | 2598528 | -| train/ | | -| approx_kl | 0.19727403 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 203000 | -| policy_gradient_loss | 0.12 | -| std | 0.00774 | -| value_loss | 2.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20302 | -| time_elapsed | 109765 | -| total_timesteps | 2598656 | -| train/ | | -| approx_kl | 0.03966099 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 203010 | -| policy_gradient_loss | 0.023 | -| std | 0.00773 | -| value_loss | 2.08e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20303 | -| time_elapsed | 109769 | -| total_timesteps | 2598784 | -| train/ | | -| approx_kl | 0.12855875 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00473 | -| learning_rate | 0.0003 | -| loss | 0.0574 | -| n_updates | 203020 | -| policy_gradient_loss | 0.0158 | -| std | 0.00773 | -| value_loss | 4.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20304 | -| time_elapsed | 109773 | -| total_timesteps | 2598912 | -| train/ | | -| approx_kl | 0.012051113 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00811 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 203030 | -| policy_gradient_loss | 0.000648 | -| std | 0.00773 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20305 | -| time_elapsed | 109778 | -| total_timesteps | 2599040 | -| train/ | | -| approx_kl | 0.017352762 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 203040 | -| policy_gradient_loss | 0.0251 | -| std | 0.00772 | -| value_loss | 7.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20306 | -| time_elapsed | 109789 | -| total_timesteps | 2599168 | -| train/ | | -| approx_kl | 0.22644302 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 203050 | -| policy_gradient_loss | 0.0641 | -| std | 0.00772 | -| value_loss | 0.0014 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20307 | -| time_elapsed | 109794 | -| total_timesteps | 2599296 | -| train/ | | -| approx_kl | 0.15455435 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 203060 | -| policy_gradient_loss | 0.117 | -| std | 0.00772 | -| value_loss | 3.91e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20308 | -| time_elapsed | 109800 | -| total_timesteps | 2599424 | -| train/ | | -| approx_kl | 0.10602844 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0038 | -| learning_rate | 0.0003 | -| loss | 0.0773 | -| n_updates | 203070 | -| policy_gradient_loss | 0.114 | -| std | 0.00772 | -| value_loss | 7.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20309 | -| time_elapsed | 109805 | -| total_timesteps | 2599552 | -| train/ | | -| approx_kl | 0.117348686 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | 0.0884 | -| n_updates | 203080 | -| policy_gradient_loss | 0.11 | -| std | 0.00772 | -| value_loss | 5.42e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20310 | -| time_elapsed | 109810 | -| total_timesteps | 2599680 | -| train/ | | -| approx_kl | 0.0718018 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.0787 | -| n_updates | 203090 | -| policy_gradient_loss | 0.0778 | -| std | 0.00772 | -| value_loss | 4.6e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20311 | -| time_elapsed | 109814 | -| total_timesteps | 2599808 | -| train/ | | -| approx_kl | 0.119047984 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.0882 | -| n_updates | 203100 | -| policy_gradient_loss | 0.111 | -| std | 0.00772 | -| value_loss | 3.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20312 | -| time_elapsed | 109818 | -| total_timesteps | 2599936 | -| train/ | | -| approx_kl | 0.017073452 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 203110 | -| policy_gradient_loss | 0.0143 | -| std | 0.00772 | -| value_loss | 2.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20313 | -| time_elapsed | 109823 | -| total_timesteps | 2600064 | -| train/ | | -| approx_kl | 0.38479468 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 203120 | -| policy_gradient_loss | 0.0353 | -| std | 0.00772 | -| value_loss | 1.57e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20314 | -| time_elapsed | 109831 | -| total_timesteps | 2600192 | -| train/ | | -| approx_kl | 0.0077145775 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 203130 | -| policy_gradient_loss | 0.000114 | -| std | 0.00772 | -| value_loss | 0.00101 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20315 | -| time_elapsed | 109836 | -| total_timesteps | 2600320 | -| train/ | | -| approx_kl | 0.030868243 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.000943 | -| n_updates | 203140 | -| policy_gradient_loss | 0.0108 | -| std | 0.00772 | -| value_loss | 2.17e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20316 | -| time_elapsed | 109841 | -| total_timesteps | 2600448 | -| train/ | | -| approx_kl | 0.0056210146 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -3.72 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 203150 | -| policy_gradient_loss | 0.0159 | -| std | 0.00773 | -| value_loss | 0.000528 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20317 | -| time_elapsed | 109845 | -| total_timesteps | 2600576 | -| train/ | | -| approx_kl | 0.42593044 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.268 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 203160 | -| policy_gradient_loss | 0.0588 | -| std | 0.00774 | -| value_loss | 3.15e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20318 | -| time_elapsed | 109850 | -| total_timesteps | 2600704 | -| train/ | | -| approx_kl | 0.0062300987 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00554 | -| learning_rate | 0.0003 | -| loss | -0.00722 | -| n_updates | 203170 | -| policy_gradient_loss | 0.0026 | -| std | 0.00774 | -| value_loss | 1.17e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20319 | -| time_elapsed | 109855 | -| total_timesteps | 2600832 | -| train/ | | -| approx_kl | 0.0007109167 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 203180 | -| policy_gradient_loss | 0.00504 | -| std | 0.00774 | -| value_loss | 7.2e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20320 | -| time_elapsed | 109860 | -| total_timesteps | 2600960 | -| train/ | | -| approx_kl | 0.06090256 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | 0.00497 | -| n_updates | 203190 | -| policy_gradient_loss | 0.0196 | -| std | 0.00773 | -| value_loss | 4.89e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20321 | -| time_elapsed | 109865 | -| total_timesteps | 2601088 | -| train/ | | -| approx_kl | 0.60356176 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.23 | -| n_updates | 203200 | -| policy_gradient_loss | 0.128 | -| std | 0.00773 | -| value_loss | 2.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20322 | -| time_elapsed | 109875 | -| total_timesteps | 2601216 | -| train/ | | -| approx_kl | 0.012514977 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | 0.00855 | -| n_updates | 203210 | -| policy_gradient_loss | -0.00914 | -| std | 0.00773 | -| value_loss | 0.000428 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20323 | -| time_elapsed | 109881 | -| total_timesteps | 2601344 | -| train/ | | -| approx_kl | 0.0005162 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.00315 | -| learning_rate | 0.0003 | -| loss | 0.000336 | -| n_updates | 203220 | -| policy_gradient_loss | 0.0087 | -| std | 0.00772 | -| value_loss | 3.53e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20324 | -| time_elapsed | 109886 | -| total_timesteps | 2601472 | -| train/ | | -| approx_kl | 0.03604183 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | 0.00248 | -| n_updates | 203230 | -| policy_gradient_loss | 3.12e-05 | -| std | 0.00772 | -| value_loss | 1.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20325 | -| time_elapsed | 109892 | -| total_timesteps | 2601600 | -| train/ | | -| approx_kl | 0.006983417 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0992 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 203240 | -| policy_gradient_loss | 0.00278 | -| std | 0.00771 | -| value_loss | 6.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20326 | -| time_elapsed | 109897 | -| total_timesteps | 2601728 | -| train/ | | -| approx_kl | 0.029995926 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 203250 | -| policy_gradient_loss | 0.126 | -| std | 0.00771 | -| value_loss | 4.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20327 | -| time_elapsed | 109902 | -| total_timesteps | 2601856 | -| train/ | | -| approx_kl | 0.07461034 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.0772 | -| n_updates | 203260 | -| policy_gradient_loss | 0.0943 | -| std | 0.00771 | -| value_loss | 3.42e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20328 | -| time_elapsed | 109906 | -| total_timesteps | 2601984 | -| train/ | | -| approx_kl | 0.075139455 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 203270 | -| policy_gradient_loss | 0.0914 | -| std | 0.00771 | -| value_loss | 1.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20329 | -| time_elapsed | 109911 | -| total_timesteps | 2602112 | -| train/ | | -| approx_kl | 0.10323505 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.0807 | -| n_updates | 203280 | -| policy_gradient_loss | 0.108 | -| std | 0.00772 | -| value_loss | 1.55e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20330 | -| time_elapsed | 109923 | -| total_timesteps | 2602240 | -| train/ | | -| approx_kl | 0.11549063 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.0648 | -| n_updates | 203290 | -| policy_gradient_loss | 0.0636 | -| std | 0.00772 | -| value_loss | 8.71e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20331 | -| time_elapsed | 109927 | -| total_timesteps | 2602368 | -| train/ | | -| approx_kl | 0.03161414 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.00561 | -| n_updates | 203300 | -| policy_gradient_loss | 0.0165 | -| std | 0.00772 | -| value_loss | 5.33e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20332 | -| time_elapsed | 109932 | -| total_timesteps | 2602496 | -| train/ | | -| approx_kl | 0.0010270635 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.00128 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 203310 | -| policy_gradient_loss | 0.00472 | -| std | 0.00771 | -| value_loss | 1.64e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20333 | -| time_elapsed | 109936 | -| total_timesteps | 2602624 | -| train/ | | -| approx_kl | 0.10646173 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.0956 | -| n_updates | 203320 | -| policy_gradient_loss | 0.104 | -| std | 0.00771 | -| value_loss | 9.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20334 | -| time_elapsed | 109941 | -| total_timesteps | 2602752 | -| train/ | | -| approx_kl | 0.025487583 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 203330 | -| policy_gradient_loss | 0.0197 | -| std | 0.00771 | -| value_loss | 2.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.87 | -| time/ | | -| fps | 23 | -| iterations | 20335 | -| time_elapsed | 109945 | -| total_timesteps | 2602880 | -| train/ | | -| approx_kl | 0.11445488 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | 0.0692 | -| n_updates | 203340 | -| policy_gradient_loss | 0.0178 | -| std | 0.00771 | -| value_loss | 7.83e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20336 | -| time_elapsed | 109951 | -| total_timesteps | 2603008 | -| train/ | | -| approx_kl | 0.13812576 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | 0.0341 | -| n_updates | 203350 | -| policy_gradient_loss | 0.0149 | -| std | 0.00771 | -| value_loss | 6.85e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20337 | -| time_elapsed | 109962 | -| total_timesteps | 2603136 | -| train/ | | -| approx_kl | 0.07206033 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.954 | -| learning_rate | 0.0003 | -| loss | -0.00927 | -| n_updates | 203360 | -| policy_gradient_loss | 0.0101 | -| std | 0.00771 | -| value_loss | 0.00231 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20338 | -| time_elapsed | 109966 | -| total_timesteps | 2603264 | -| train/ | | -| approx_kl | 0.004353362 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.707 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 203370 | -| policy_gradient_loss | 0.00764 | -| std | 0.00771 | -| value_loss | 4.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20339 | -| time_elapsed | 109971 | -| total_timesteps | 2603392 | -| train/ | | -| approx_kl | 0.037424225 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | 0.00724 | -| n_updates | 203380 | -| policy_gradient_loss | 0.00401 | -| std | 0.00771 | -| value_loss | 6.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20340 | -| time_elapsed | 109976 | -| total_timesteps | 2603520 | -| train/ | | -| approx_kl | 0.016425874 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.000604 | -| n_updates | 203390 | -| policy_gradient_loss | 0.0414 | -| std | 0.00772 | -| value_loss | 2.87e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20341 | -| time_elapsed | 109981 | -| total_timesteps | 2603648 | -| train/ | | -| approx_kl | 0.19228913 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | 0.082 | -| n_updates | 203400 | -| policy_gradient_loss | 0.0247 | -| std | 0.00772 | -| value_loss | 1.8e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20342 | -| time_elapsed | 109985 | -| total_timesteps | 2603776 | -| train/ | | -| approx_kl | 0.00045359833 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 203410 | -| policy_gradient_loss | 0.00499 | -| std | 0.00773 | -| value_loss | 1.32e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20343 | -| time_elapsed | 109990 | -| total_timesteps | 2603904 | -| train/ | | -| approx_kl | 3.3063814e-05 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | -3.16e-05 | -| n_updates | 203420 | -| policy_gradient_loss | 0.0109 | -| std | 0.00773 | -| value_loss | 1.14e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20344 | -| time_elapsed | 109994 | -| total_timesteps | 2604032 | -| train/ | | -| approx_kl | 0.053594563 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 203430 | -| policy_gradient_loss | 0.0684 | -| std | 0.00774 | -| value_loss | 4.14e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20345 | -| time_elapsed | 110006 | -| total_timesteps | 2604160 | -| train/ | | -| approx_kl | 0.0008249893 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 203440 | -| policy_gradient_loss | -0.00427 | -| std | 0.00774 | -| value_loss | 0.00269 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20346 | -| time_elapsed | 110011 | -| total_timesteps | 2604288 | -| train/ | | -| approx_kl | 0.14355792 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.0711 | -| n_updates | 203450 | -| policy_gradient_loss | 0.0157 | -| std | 0.00774 | -| value_loss | 4.04e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20347 | -| time_elapsed | 110016 | -| total_timesteps | 2604416 | -| train/ | | -| approx_kl | 0.0143760545 | -| clip_fraction | 0.0891 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 203460 | -| policy_gradient_loss | -0.00254 | -| std | 0.00774 | -| value_loss | 1.7e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20348 | -| time_elapsed | 110022 | -| total_timesteps | 2604544 | -| train/ | | -| approx_kl | 0.12933803 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 203470 | -| policy_gradient_loss | 0.00466 | -| std | 0.00774 | -| value_loss | 1.19e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20349 | -| time_elapsed | 110026 | -| total_timesteps | 2604672 | -| train/ | | -| approx_kl | 0.016673993 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 203480 | -| policy_gradient_loss | 0.0186 | -| std | 0.00773 | -| value_loss | 1.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20350 | -| time_elapsed | 110031 | -| total_timesteps | 2604800 | -| train/ | | -| approx_kl | 0.086011715 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 203490 | -| policy_gradient_loss | 0.0518 | -| std | 0.00773 | -| value_loss | 2.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.875 | -| time/ | | -| fps | 23 | -| iterations | 20351 | -| time_elapsed | 110035 | -| total_timesteps | 2604928 | -| train/ | | -| approx_kl | 0.16255257 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 203500 | -| policy_gradient_loss | 0.0258 | -| std | 0.00773 | -| value_loss | 2.06e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20352 | -| time_elapsed | 110040 | -| total_timesteps | 2605056 | -| train/ | | -| approx_kl | 0.0012512696 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 203510 | -| policy_gradient_loss | 0.00676 | -| std | 0.00773 | -| value_loss | 1.24e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20353 | -| time_elapsed | 110051 | -| total_timesteps | 2605184 | -| train/ | | -| approx_kl | 0.03114061 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.57 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 203520 | -| policy_gradient_loss | 0.0529 | -| std | 0.00773 | -| value_loss | 0.0145 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20354 | -| time_elapsed | 110057 | -| total_timesteps | 2605312 | -| train/ | | -| approx_kl | 0.15971068 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 203530 | -| policy_gradient_loss | 0.0254 | -| std | 0.00773 | -| value_loss | 0.000161 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20355 | -| time_elapsed | 110061 | -| total_timesteps | 2605440 | -| train/ | | -| approx_kl | 0.00057516154 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.44 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | -0.000288 | -| n_updates | 203540 | -| policy_gradient_loss | 0.00877 | -| std | 0.00772 | -| value_loss | 2.04e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20356 | -| time_elapsed | 110066 | -| total_timesteps | 2605568 | -| train/ | | -| approx_kl | 3.434159e-05 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | -0.000477 | -| n_updates | 203550 | -| policy_gradient_loss | 0.00705 | -| std | 0.00771 | -| value_loss | 2.25e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20357 | -| time_elapsed | 110071 | -| total_timesteps | 2605696 | -| train/ | | -| approx_kl | 0.00012933975 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | -0.000953 | -| n_updates | 203560 | -| policy_gradient_loss | 0.00398 | -| std | 0.0077 | -| value_loss | 8.52e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20358 | -| time_elapsed | 110075 | -| total_timesteps | 2605824 | -| train/ | | -| approx_kl | 0.043866623 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | 0.00063 | -| n_updates | 203570 | -| policy_gradient_loss | 0.0384 | -| std | 0.00769 | -| value_loss | 6.88e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 20359 | -| time_elapsed | 110079 | -| total_timesteps | 2605952 | -| train/ | | -| approx_kl | 0.028083976 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 203580 | -| policy_gradient_loss | 0.0216 | -| std | 0.00768 | -| value_loss | 2.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20360 | -| time_elapsed | 110083 | -| total_timesteps | 2606080 | -| train/ | | -| approx_kl | 0.022281598 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 203590 | -| policy_gradient_loss | 0.0208 | -| std | 0.00767 | -| value_loss | 6.62e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20361 | -| time_elapsed | 110091 | -| total_timesteps | 2606208 | -| train/ | | -| approx_kl | 0.03267229 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | 0.751 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 203600 | -| policy_gradient_loss | -0.0151 | -| std | 0.00766 | -| value_loss | 0.0065 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20362 | -| time_elapsed | 110096 | -| total_timesteps | 2606336 | -| train/ | | -| approx_kl | 0.23095208 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.45 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.079 | -| n_updates | 203610 | -| policy_gradient_loss | 0.0126 | -| std | 0.00764 | -| value_loss | 1.12e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20363 | -| time_elapsed | 110100 | -| total_timesteps | 2606464 | -| train/ | | -| approx_kl | 0.008689303 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | -0.00617 | -| n_updates | 203620 | -| policy_gradient_loss | 0.0201 | -| std | 0.00763 | -| value_loss | 7.91e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20364 | -| time_elapsed | 110104 | -| total_timesteps | 2606592 | -| train/ | | -| approx_kl | 0.4232422 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.0702 | -| n_updates | 203630 | -| policy_gradient_loss | 0.0281 | -| std | 0.00763 | -| value_loss | 4.25e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20365 | -| time_elapsed | 110109 | -| total_timesteps | 2606720 | -| train/ | | -| approx_kl | 0.010398861 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00305 | -| n_updates | 203640 | -| policy_gradient_loss | 0.00346 | -| std | 0.00763 | -| value_loss | 2.85e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20366 | -| time_elapsed | 110113 | -| total_timesteps | 2606848 | -| train/ | | -| approx_kl | 0.0464143 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0924 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 203650 | -| policy_gradient_loss | 0.000366 | -| std | 0.00763 | -| value_loss | 1.88e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20367 | -| time_elapsed | 110117 | -| total_timesteps | 2606976 | -| train/ | | -| approx_kl | 0.033202145 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 203660 | -| policy_gradient_loss | 0.00714 | -| std | 0.00764 | -| value_loss | 1.25e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20368 | -| time_elapsed | 110122 | -| total_timesteps | 2607104 | -| train/ | | -| approx_kl | 0.03863521 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0933 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 203670 | -| policy_gradient_loss | 0.00958 | -| std | 0.00764 | -| value_loss | 1.86e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20369 | -| time_elapsed | 110130 | -| total_timesteps | 2607232 | -| train/ | | -| approx_kl | 0.014316853 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -3.4 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 203680 | -| policy_gradient_loss | -0.0123 | -| std | 0.00763 | -| value_loss | 0.00455 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20370 | -| time_elapsed | 110134 | -| total_timesteps | 2607360 | -| train/ | | -| approx_kl | 0.012786048 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 203690 | -| policy_gradient_loss | 0.0161 | -| std | 0.00763 | -| value_loss | 7.59e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20371 | -| time_elapsed | 110139 | -| total_timesteps | 2607488 | -| train/ | | -| approx_kl | 0.06348981 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 203700 | -| policy_gradient_loss | 0.0136 | -| std | 0.00763 | -| value_loss | 1.42e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20372 | -| time_elapsed | 110144 | -| total_timesteps | 2607616 | -| train/ | | -| approx_kl | 6.626127e-05 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.492 | -| learning_rate | 0.0003 | -| loss | -0.000219 | -| n_updates | 203710 | -| policy_gradient_loss | 0.0126 | -| std | 0.00764 | -| value_loss | 1.08e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20373 | -| time_elapsed | 110148 | -| total_timesteps | 2607744 | -| train/ | | -| approx_kl | 0.11227166 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0614 | -| n_updates | 203720 | -| policy_gradient_loss | 0.0143 | -| std | 0.00764 | -| value_loss | 2.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20374 | -| time_elapsed | 110153 | -| total_timesteps | 2607872 | -| train/ | | -| approx_kl | 0.015319036 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | 0.0016 | -| n_updates | 203730 | -| policy_gradient_loss | 0.0177 | -| std | 0.00763 | -| value_loss | 5.74e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20375 | -| time_elapsed | 110159 | -| total_timesteps | 2608000 | -| train/ | | -| approx_kl | 0.20313162 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 203740 | -| policy_gradient_loss | 0.122 | -| std | 0.00763 | -| value_loss | 3.99e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20376 | -| time_elapsed | 110164 | -| total_timesteps | 2608128 | -| train/ | | -| approx_kl | 0.11289885 | -| clip_fraction | 0.632 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00472 | -| learning_rate | 0.0003 | -| loss | 0.083 | -| n_updates | 203750 | -| policy_gradient_loss | 0.0862 | -| std | 0.00763 | -| value_loss | 2.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20377 | -| time_elapsed | 110175 | -| total_timesteps | 2608256 | -| train/ | | -| approx_kl | 0.018934198 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 203760 | -| policy_gradient_loss | -0.0109 | -| std | 0.00764 | -| value_loss | 0.000159 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20378 | -| time_elapsed | 110180 | -| total_timesteps | 2608384 | -| train/ | | -| approx_kl | 0.067468844 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.675 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 203770 | -| policy_gradient_loss | 0.0249 | -| std | 0.00764 | -| value_loss | 4.43e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20379 | -| time_elapsed | 110184 | -| total_timesteps | 2608512 | -| train/ | | -| approx_kl | 0.09266393 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -101 | -| learning_rate | 0.0003 | -| loss | 0.00386 | -| n_updates | 203780 | -| policy_gradient_loss | 0.00258 | -| std | 0.00764 | -| value_loss | 1.19e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20380 | -| time_elapsed | 110189 | -| total_timesteps | 2608640 | -| train/ | | -| approx_kl | 0.4624428 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -80.8 | -| learning_rate | 0.0003 | -| loss | 0.0592 | -| n_updates | 203790 | -| policy_gradient_loss | 0.0166 | -| std | 0.00763 | -| value_loss | 8.68e-11 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20381 | -| time_elapsed | 110193 | -| total_timesteps | 2608768 | -| train/ | | -| approx_kl | 0.02754819 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -81.9 | -| learning_rate | 0.0003 | -| loss | -0.0055 | -| n_updates | 203800 | -| policy_gradient_loss | -0.00141 | -| std | 0.00763 | -| value_loss | 1.07e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 20382 | -| time_elapsed | 110197 | -| total_timesteps | 2608896 | -| train/ | | -| approx_kl | 0.005734984 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -53 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 203810 | -| policy_gradient_loss | 0.00385 | -| std | 0.00763 | -| value_loss | 1.22e-12 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20383 | -| time_elapsed | 110202 | -| total_timesteps | 2609024 | -| train/ | | -| approx_kl | 0.0015593814 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -27.9 | -| learning_rate | 0.0003 | -| loss | -0.000637 | -| n_updates | 203820 | -| policy_gradient_loss | 0.00219 | -| std | 0.00762 | -| value_loss | 1.53e-13 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20384 | -| time_elapsed | 110211 | -| total_timesteps | 2609152 | -| train/ | | -| approx_kl | 0.018224714 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 203830 | -| policy_gradient_loss | -0.008 | -| std | 0.00761 | -| value_loss | 0.00163 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20385 | -| time_elapsed | 110217 | -| total_timesteps | 2609280 | -| train/ | | -| approx_kl | 0.0217481 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.424 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 203840 | -| policy_gradient_loss | 0.0272 | -| std | 0.0076 | -| value_loss | 2.47e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20386 | -| time_elapsed | 110221 | -| total_timesteps | 2609408 | -| train/ | | -| approx_kl | 0.1167915 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | 0.00424 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 203850 | -| policy_gradient_loss | 0.0339 | -| std | 0.0076 | -| value_loss | 1.68e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20387 | -| time_elapsed | 110226 | -| total_timesteps | 2609536 | -| train/ | | -| approx_kl | 0.0025059585 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 203860 | -| policy_gradient_loss | -0.00179 | -| std | 0.0076 | -| value_loss | 1.28e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20388 | -| time_elapsed | 110231 | -| total_timesteps | 2609664 | -| train/ | | -| approx_kl | 2.3080036e-05 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | 9.11e-05 | -| n_updates | 203870 | -| policy_gradient_loss | 0.00864 | -| std | 0.00759 | -| value_loss | 8.38e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20389 | -| time_elapsed | 110236 | -| total_timesteps | 2609792 | -| train/ | | -| approx_kl | 0.019666504 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.46 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 203880 | -| policy_gradient_loss | 0.0115 | -| std | 0.00755 | -| value_loss | 0.000401 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 20390 | -| time_elapsed | 110239 | -| total_timesteps | 2609920 | -| train/ | | -| approx_kl | 0.15418334 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.845 | -| learning_rate | 0.0003 | -| loss | 0.083 | -| n_updates | 203890 | -| policy_gradient_loss | 0.111 | -| std | 0.00753 | -| value_loss | 5.18e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20391 | -| time_elapsed | 110244 | -| total_timesteps | 2610048 | -| train/ | | -| approx_kl | 0.110971674 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -9.51 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 203900 | -| policy_gradient_loss | 0.0504 | -| std | 0.00752 | -| value_loss | 3.07e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20392 | -| time_elapsed | 110252 | -| total_timesteps | 2610176 | -| train/ | | -| approx_kl | 0.0042573586 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 203910 | -| policy_gradient_loss | 0.00642 | -| std | 0.00752 | -| value_loss | 0.0024 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20393 | -| time_elapsed | 110257 | -| total_timesteps | 2610304 | -| train/ | | -| approx_kl | 0.048608765 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | 0.0934 | -| n_updates | 203920 | -| policy_gradient_loss | 0.122 | -| std | 0.00752 | -| value_loss | 4.23e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20394 | -| time_elapsed | 110262 | -| total_timesteps | 2610432 | -| train/ | | -| approx_kl | 0.011690318 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.00715 | -| learning_rate | 0.0003 | -| loss | -0.000754 | -| n_updates | 203930 | -| policy_gradient_loss | 0.0152 | -| std | 0.00752 | -| value_loss | 1.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20395 | -| time_elapsed | 110267 | -| total_timesteps | 2610560 | -| train/ | | -| approx_kl | 2.56747e-05 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -2.98e-05 | -| n_updates | 203940 | -| policy_gradient_loss | 0.0305 | -| std | 0.00752 | -| value_loss | 3.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20396 | -| time_elapsed | 110272 | -| total_timesteps | 2610688 | -| train/ | | -| approx_kl | 0.14895885 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.317 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 203950 | -| policy_gradient_loss | 0.0106 | -| std | 0.00751 | -| value_loss | 1.69e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20397 | -| time_elapsed | 110276 | -| total_timesteps | 2610816 | -| train/ | | -| approx_kl | 0.10839466 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 203960 | -| policy_gradient_loss | 0.0132 | -| std | 0.00751 | -| value_loss | 6.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 20398 | -| time_elapsed | 110280 | -| total_timesteps | 2610944 | -| train/ | | -| approx_kl | 0.068519056 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 203970 | -| policy_gradient_loss | 0.0342 | -| std | 0.00751 | -| value_loss | 5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20399 | -| time_elapsed | 110285 | -| total_timesteps | 2611072 | -| train/ | | -| approx_kl | 0.28431594 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 203980 | -| policy_gradient_loss | 0.115 | -| std | 0.00751 | -| value_loss | 2.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20400 | -| time_elapsed | 110295 | -| total_timesteps | 2611200 | -| train/ | | -| approx_kl | 0.005011696 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.00925 | -| n_updates | 203990 | -| policy_gradient_loss | 0.00427 | -| std | 0.00751 | -| value_loss | 5.52e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20401 | -| time_elapsed | 110300 | -| total_timesteps | 2611328 | -| train/ | | -| approx_kl | 0.0028784126 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.595 | -| learning_rate | 0.0003 | -| loss | -0.000726 | -| n_updates | 204000 | -| policy_gradient_loss | 0.0247 | -| std | 0.00751 | -| value_loss | 4.85e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20402 | -| time_elapsed | 110305 | -| total_timesteps | 2611456 | -| train/ | | -| approx_kl | 0.009731192 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.586 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 204010 | -| policy_gradient_loss | -0.00543 | -| std | 0.00751 | -| value_loss | 4.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20403 | -| time_elapsed | 110310 | -| total_timesteps | 2611584 | -| train/ | | -| approx_kl | 0.02586394 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -4.78 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 204020 | -| policy_gradient_loss | 0.00593 | -| std | 0.0075 | -| value_loss | 4.33e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20404 | -| time_elapsed | 110315 | -| total_timesteps | 2611712 | -| train/ | | -| approx_kl | 0.12555124 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 204030 | -| policy_gradient_loss | 0.0636 | -| std | 0.0075 | -| value_loss | 9.93e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20405 | -| time_elapsed | 110320 | -| total_timesteps | 2611840 | -| train/ | | -| approx_kl | 0.07888174 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 204040 | -| policy_gradient_loss | 0.00345 | -| std | 0.0075 | -| value_loss | 8.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.868 | -| time/ | | -| fps | 23 | -| iterations | 20406 | -| time_elapsed | 110325 | -| total_timesteps | 2611968 | -| train/ | | -| approx_kl | 0.012571724 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 204050 | -| policy_gradient_loss | 0.00117 | -| std | 0.0075 | -| value_loss | 4.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20407 | -| time_elapsed | 110332 | -| total_timesteps | 2612096 | -| train/ | | -| approx_kl | 0.0032379688 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 204060 | -| policy_gradient_loss | 0.00501 | -| std | 0.0075 | -| value_loss | 2.92e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20408 | -| time_elapsed | 110342 | -| total_timesteps | 2612224 | -| train/ | | -| approx_kl | 0.0676284 | -| clip_fraction | 0.558 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -7.91 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 204070 | -| policy_gradient_loss | 0.0059 | -| std | 0.0075 | -| value_loss | 0.0049 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20409 | -| time_elapsed | 110347 | -| total_timesteps | 2612352 | -| train/ | | -| approx_kl | 0.23010896 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.554 | -| learning_rate | 0.0003 | -| loss | 0.0544 | -| n_updates | 204080 | -| policy_gradient_loss | 0.0232 | -| std | 0.0075 | -| value_loss | 6.74e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20410 | -| time_elapsed | 110352 | -| total_timesteps | 2612480 | -| train/ | | -| approx_kl | 0.00033163093 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.000129 | -| n_updates | 204090 | -| policy_gradient_loss | 0.00708 | -| std | 0.00751 | -| value_loss | 1.78e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20411 | -| time_elapsed | 110356 | -| total_timesteps | 2612608 | -| train/ | | -| approx_kl | 3.8458966e-05 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | -0.000534 | -| n_updates | 204100 | -| policy_gradient_loss | 0.00363 | -| std | 0.00751 | -| value_loss | 4.45e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20412 | -| time_elapsed | 110362 | -| total_timesteps | 2612736 | -| train/ | | -| approx_kl | 0.0470952 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.000197 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 204110 | -| policy_gradient_loss | 0.0681 | -| std | 0.0075 | -| value_loss | 6.17e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20413 | -| time_elapsed | 110367 | -| total_timesteps | 2612864 | -| train/ | | -| approx_kl | 0.016811578 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -9.59 | -| learning_rate | 0.0003 | -| loss | -0.00226 | -| n_updates | 204120 | -| policy_gradient_loss | 0.00874 | -| std | 0.0075 | -| value_loss | 3.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 20414 | -| time_elapsed | 110373 | -| total_timesteps | 2612992 | -| train/ | | -| approx_kl | 0.16064736 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.0734 | -| n_updates | 204130 | -| policy_gradient_loss | 0.0124 | -| std | 0.00749 | -| value_loss | 7.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20415 | -| time_elapsed | 110378 | -| total_timesteps | 2613120 | -| train/ | | -| approx_kl | 0.086815745 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.47 | -| explained_variance | -0.707 | -| learning_rate | 0.0003 | -| loss | 0.00499 | -| n_updates | 204140 | -| policy_gradient_loss | 0.00836 | -| std | 0.00749 | -| value_loss | 4.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20416 | -| time_elapsed | 110390 | -| total_timesteps | 2613248 | -| train/ | | -| approx_kl | 0.04278199 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -4.58 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 204150 | -| policy_gradient_loss | -0.0205 | -| std | 0.00749 | -| value_loss | 0.00412 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20417 | -| time_elapsed | 110395 | -| total_timesteps | 2613376 | -| train/ | | -| approx_kl | 0.080851965 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | 0.0551 | -| n_updates | 204160 | -| policy_gradient_loss | 0.0396 | -| std | 0.00749 | -| value_loss | 1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20418 | -| time_elapsed | 110399 | -| total_timesteps | 2613504 | -| train/ | | -| approx_kl | 0.02296703 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.336 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 204170 | -| policy_gradient_loss | 0.0124 | -| std | 0.00749 | -| value_loss | 3.53e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20419 | -| time_elapsed | 110404 | -| total_timesteps | 2613632 | -| train/ | | -| approx_kl | 0.016760759 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 204180 | -| policy_gradient_loss | 0.0323 | -| std | 0.00749 | -| value_loss | 1.68e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20420 | -| time_elapsed | 110409 | -| total_timesteps | 2613760 | -| train/ | | -| approx_kl | 0.00841102 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0838 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 204190 | -| policy_gradient_loss | 0.0238 | -| std | 0.00748 | -| value_loss | 9.19e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 20421 | -| time_elapsed | 110413 | -| total_timesteps | 2613888 | -| train/ | | -| approx_kl | 0.17610303 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0611 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 204200 | -| policy_gradient_loss | 0.0461 | -| std | 0.00747 | -| value_loss | 2.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20422 | -| time_elapsed | 110419 | -| total_timesteps | 2614016 | -| train/ | | -| approx_kl | 0.042585522 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.00265 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 204210 | -| policy_gradient_loss | 0.0619 | -| std | 0.00747 | -| value_loss | 1.05e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20423 | -| time_elapsed | 110431 | -| total_timesteps | 2614144 | -| train/ | | -| approx_kl | 0.139207 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 204220 | -| policy_gradient_loss | 0.00539 | -| std | 0.00746 | -| value_loss | 0.000312 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20424 | -| time_elapsed | 110435 | -| total_timesteps | 2614272 | -| train/ | | -| approx_kl | 0.07981776 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0088 | -| n_updates | 204230 | -| policy_gradient_loss | 0.00626 | -| std | 0.00746 | -| value_loss | 9.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20425 | -| time_elapsed | 110440 | -| total_timesteps | 2614400 | -| train/ | | -| approx_kl | 0.006810822 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | 0.0159 | -| n_updates | 204240 | -| policy_gradient_loss | 0.00761 | -| std | 0.00747 | -| value_loss | 5.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20426 | -| time_elapsed | 110444 | -| total_timesteps | 2614528 | -| train/ | | -| approx_kl | 0.052918896 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.00519 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 204250 | -| policy_gradient_loss | 0.0182 | -| std | 0.00747 | -| value_loss | 2.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20427 | -| time_elapsed | 110449 | -| total_timesteps | 2614656 | -| train/ | | -| approx_kl | 0.12864558 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | 0.0555 | -| n_updates | 204260 | -| policy_gradient_loss | 0.0164 | -| std | 0.00746 | -| value_loss | 1.45e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20428 | -| time_elapsed | 110454 | -| total_timesteps | 2614784 | -| train/ | | -| approx_kl | 0.014456731 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0032 | -| n_updates | 204270 | -| policy_gradient_loss | 0.0188 | -| std | 0.00746 | -| value_loss | 9.16e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 20429 | -| time_elapsed | 110459 | -| total_timesteps | 2614912 | -| train/ | | -| approx_kl | 0.19242276 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 204280 | -| policy_gradient_loss | 0.102 | -| std | 0.00746 | -| value_loss | 7.12e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20430 | -| time_elapsed | 110465 | -| total_timesteps | 2615040 | -| train/ | | -| approx_kl | 0.036383063 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 204290 | -| policy_gradient_loss | 0.0195 | -| std | 0.00746 | -| value_loss | 5.02e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20431 | -| time_elapsed | 110474 | -| total_timesteps | 2615168 | -| train/ | | -| approx_kl | 0.36416435 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 204300 | -| policy_gradient_loss | 0.0223 | -| std | 0.00746 | -| value_loss | 0.000722 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20432 | -| time_elapsed | 110479 | -| total_timesteps | 2615296 | -| train/ | | -| approx_kl | 0.005135252 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.469 | -| learning_rate | 0.0003 | -| loss | 0.00107 | -| n_updates | 204310 | -| policy_gradient_loss | 0.00464 | -| std | 0.00746 | -| value_loss | 6.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20433 | -| time_elapsed | 110484 | -| total_timesteps | 2615424 | -| train/ | | -| approx_kl | 0.054829024 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.342 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 204320 | -| policy_gradient_loss | 0.00263 | -| std | 0.00746 | -| value_loss | 1.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20434 | -| time_elapsed | 110488 | -| total_timesteps | 2615552 | -| train/ | | -| approx_kl | 0.029873688 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 204330 | -| policy_gradient_loss | 0.000372 | -| std | 0.00746 | -| value_loss | 9.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20435 | -| time_elapsed | 110493 | -| total_timesteps | 2615680 | -| train/ | | -| approx_kl | 0.040232465 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.0134 | -| n_updates | 204340 | -| policy_gradient_loss | 0.00598 | -| std | 0.00746 | -| value_loss | 5.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20436 | -| time_elapsed | 110497 | -| total_timesteps | 2615808 | -| train/ | | -| approx_kl | 0.006506548 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | -0.000398 | -| n_updates | 204350 | -| policy_gradient_loss | 0.00524 | -| std | 0.00746 | -| value_loss | 3.21e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.847 | -| time/ | | -| fps | 23 | -| iterations | 20437 | -| time_elapsed | 110502 | -| total_timesteps | 2615936 | -| train/ | | -| approx_kl | 0.0006096731 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0745 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 204360 | -| policy_gradient_loss | 0.00477 | -| std | 0.00746 | -| value_loss | 2.53e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20438 | -| time_elapsed | 110507 | -| total_timesteps | 2616064 | -| train/ | | -| approx_kl | 0.0055952044 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.000642 | -| n_updates | 204370 | -| policy_gradient_loss | 0.0079 | -| std | 0.00745 | -| value_loss | 1.54e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20439 | -| time_elapsed | 110514 | -| total_timesteps | 2616192 | -| train/ | | -| approx_kl | 0.01606843 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.00022 | -| n_updates | 204380 | -| policy_gradient_loss | 0.011 | -| std | 0.00744 | -| value_loss | 4.54e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20440 | -| time_elapsed | 110519 | -| total_timesteps | 2616320 | -| train/ | | -| approx_kl | 0.0023731305 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 204390 | -| policy_gradient_loss | 0.00983 | -| std | 0.00744 | -| value_loss | 1.86e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20441 | -| time_elapsed | 110524 | -| total_timesteps | 2616448 | -| train/ | | -| approx_kl | 0.0015879464 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 204400 | -| policy_gradient_loss | 0.00523 | -| std | 0.00744 | -| value_loss | 7.32e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20442 | -| time_elapsed | 110529 | -| total_timesteps | 2616576 | -| train/ | | -| approx_kl | 0.004541211 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | -0.0058 | -| n_updates | 204410 | -| policy_gradient_loss | 0.0057 | -| std | 0.00744 | -| value_loss | 6.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20443 | -| time_elapsed | 110533 | -| total_timesteps | 2616704 | -| train/ | | -| approx_kl | 0.072749175 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 204420 | -| policy_gradient_loss | 0.00847 | -| std | 0.00743 | -| value_loss | 3.79e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20444 | -| time_elapsed | 110537 | -| total_timesteps | 2616832 | -| train/ | | -| approx_kl | 0.00056770863 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.000102 | -| n_updates | 204430 | -| policy_gradient_loss | 0.00788 | -| std | 0.00742 | -| value_loss | 3.21e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 20445 | -| time_elapsed | 110543 | -| total_timesteps | 2616960 | -| train/ | | -| approx_kl | 0.036593795 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 204440 | -| policy_gradient_loss | 0.0348 | -| std | 0.00741 | -| value_loss | 5.74e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20446 | -| time_elapsed | 110548 | -| total_timesteps | 2617088 | -| train/ | | -| approx_kl | 0.0908112 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.004 | -| learning_rate | 0.0003 | -| loss | 0.0719 | -| n_updates | 204450 | -| policy_gradient_loss | 0.0466 | -| std | 0.00741 | -| value_loss | 1.79e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20447 | -| time_elapsed | 110559 | -| total_timesteps | 2617216 | -| train/ | | -| approx_kl | 0.053970907 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 204460 | -| policy_gradient_loss | 0.00937 | -| std | 0.00741 | -| value_loss | 0.000457 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20448 | -| time_elapsed | 110564 | -| total_timesteps | 2617344 | -| train/ | | -| approx_kl | 0.027151525 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 204470 | -| policy_gradient_loss | 0.0272 | -| std | 0.0074 | -| value_loss | 0.000205 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20449 | -| time_elapsed | 110568 | -| total_timesteps | 2617472 | -| train/ | | -| approx_kl | 0.6489657 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00634 | -| learning_rate | 0.0003 | -| loss | 0.317 | -| n_updates | 204480 | -| policy_gradient_loss | 0.144 | -| std | 0.0074 | -| value_loss | 1.04e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20450 | -| time_elapsed | 110574 | -| total_timesteps | 2617600 | -| train/ | | -| approx_kl | 0.14818017 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 204490 | -| policy_gradient_loss | 0.00226 | -| std | 0.0074 | -| value_loss | 9.06e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20451 | -| time_elapsed | 110578 | -| total_timesteps | 2617728 | -| train/ | | -| approx_kl | 0.0098449215 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.00532 | -| n_updates | 204500 | -| policy_gradient_loss | 0.0135 | -| std | 0.0074 | -| value_loss | 7.86e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20452 | -| time_elapsed | 110582 | -| total_timesteps | 2617856 | -| train/ | | -| approx_kl | 0.036735974 | -| clip_fraction | 0.147 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 204510 | -| policy_gradient_loss | 0.00473 | -| std | 0.0074 | -| value_loss | 5.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20453 | -| time_elapsed | 110585 | -| total_timesteps | 2617984 | -| train/ | | -| approx_kl | 0.061394773 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 204520 | -| policy_gradient_loss | 0.021 | -| std | 0.0074 | -| value_loss | 1.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20454 | -| time_elapsed | 110590 | -| total_timesteps | 2618112 | -| train/ | | -| approx_kl | 0.06659073 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 204530 | -| policy_gradient_loss | 0.0515 | -| std | 0.0074 | -| value_loss | 8.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20455 | -| time_elapsed | 110602 | -| total_timesteps | 2618240 | -| train/ | | -| approx_kl | 0.03813965 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.819 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 204540 | -| policy_gradient_loss | 0.000823 | -| std | 0.0074 | -| value_loss | 0.000725 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20456 | -| time_elapsed | 110606 | -| total_timesteps | 2618368 | -| train/ | | -| approx_kl | 0.011522201 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.00495 | -| n_updates | 204550 | -| policy_gradient_loss | 0.056 | -| std | 0.0074 | -| value_loss | 4.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20457 | -| time_elapsed | 110611 | -| total_timesteps | 2618496 | -| train/ | | -| approx_kl | 0.20079795 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 204560 | -| policy_gradient_loss | 0.0339 | -| std | 0.0074 | -| value_loss | 1.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20458 | -| time_elapsed | 110618 | -| total_timesteps | 2618624 | -| train/ | | -| approx_kl | 0.04685421 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.00492 | -| n_updates | 204570 | -| policy_gradient_loss | 0.0491 | -| std | 0.0074 | -| value_loss | 1.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20459 | -| time_elapsed | 110622 | -| total_timesteps | 2618752 | -| train/ | | -| approx_kl | 0.22255005 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0878 | -| n_updates | 204580 | -| policy_gradient_loss | 0.0338 | -| std | 0.0074 | -| value_loss | 7.89e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 20460 | -| time_elapsed | 110627 | -| total_timesteps | 2618880 | -| train/ | | -| approx_kl | 0.0013941661 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.0028 | -| n_updates | 204590 | -| policy_gradient_loss | 0.00703 | -| std | 0.0074 | -| value_loss | 5.71e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20461 | -| time_elapsed | 110634 | -| total_timesteps | 2619008 | -| train/ | | -| approx_kl | 5.398877e-06 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | -0.000486 | -| n_updates | 204600 | -| policy_gradient_loss | -0.000591 | -| std | 0.0074 | -| value_loss | 4.62e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20462 | -| time_elapsed | 110648 | -| total_timesteps | 2619136 | -| train/ | | -| approx_kl | 0.005453793 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.518 | -| learning_rate | 0.0003 | -| loss | -0.0253 | -| n_updates | 204610 | -| policy_gradient_loss | -0.0154 | -| std | 0.0074 | -| value_loss | 0.00243 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20463 | -| time_elapsed | 110652 | -| total_timesteps | 2619264 | -| train/ | | -| approx_kl | 0.051781952 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.746 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 204620 | -| policy_gradient_loss | 0.0477 | -| std | 0.00739 | -| value_loss | 5.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20464 | -| time_elapsed | 110656 | -| total_timesteps | 2619392 | -| train/ | | -| approx_kl | 0.19549872 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0817 | -| n_updates | 204630 | -| policy_gradient_loss | 0.0354 | -| std | 0.00739 | -| value_loss | 3.98e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20465 | -| time_elapsed | 110661 | -| total_timesteps | 2619520 | -| train/ | | -| approx_kl | 0.0012738123 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | -0.00761 | -| n_updates | 204640 | -| policy_gradient_loss | -0.00896 | -| std | 0.0074 | -| value_loss | 2.71e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20466 | -| time_elapsed | 110665 | -| total_timesteps | 2619648 | -| train/ | | -| approx_kl | 0.05347451 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.00857 | -| n_updates | 204650 | -| policy_gradient_loss | 0.0475 | -| std | 0.0074 | -| value_loss | 1.97e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20467 | -| time_elapsed | 110670 | -| total_timesteps | 2619776 | -| train/ | | -| approx_kl | 0.17011833 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.0396 | -| n_updates | 204660 | -| policy_gradient_loss | 0.0191 | -| std | 0.0074 | -| value_loss | 1.22e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 20468 | -| time_elapsed | 110675 | -| total_timesteps | 2619904 | -| train/ | | -| approx_kl | 0.0012253169 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 204670 | -| policy_gradient_loss | -0.00185 | -| std | 0.0074 | -| value_loss | 9.96e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20469 | -| time_elapsed | 110680 | -| total_timesteps | 2620032 | -| train/ | | -| approx_kl | 0.053624265 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 204680 | -| policy_gradient_loss | 0.0468 | -| std | 0.0074 | -| value_loss | 8.07e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20470 | -| time_elapsed | 110689 | -| total_timesteps | 2620160 | -| train/ | | -| approx_kl | 0.12970942 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 204690 | -| policy_gradient_loss | 0.0171 | -| std | 0.0074 | -| value_loss | 0.00959 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20471 | -| time_elapsed | 110694 | -| total_timesteps | 2620288 | -| train/ | | -| approx_kl | 0.0060091894 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.974 | -| learning_rate | 0.0003 | -| loss | -0.000948 | -| n_updates | 204700 | -| policy_gradient_loss | 0.0112 | -| std | 0.00741 | -| value_loss | 1.79e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20472 | -| time_elapsed | 110700 | -| total_timesteps | 2620416 | -| train/ | | -| approx_kl | 0.1130268 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0735 | -| n_updates | 204710 | -| policy_gradient_loss | 0.0436 | -| std | 0.00741 | -| value_loss | 8.2e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20473 | -| time_elapsed | 110705 | -| total_timesteps | 2620544 | -| train/ | | -| approx_kl | 0.00620453 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.654 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 204720 | -| policy_gradient_loss | 0.00189 | -| std | 0.00741 | -| value_loss | 3.69e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20474 | -| time_elapsed | 110710 | -| total_timesteps | 2620672 | -| train/ | | -| approx_kl | 0.00012931274 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0801 | -| learning_rate | 0.0003 | -| loss | 0.000177 | -| n_updates | 204730 | -| policy_gradient_loss | 0.0091 | -| std | 0.00741 | -| value_loss | 2.33e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20475 | -| time_elapsed | 110714 | -| total_timesteps | 2620800 | -| train/ | | -| approx_kl | 0.0003720494 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 204740 | -| policy_gradient_loss | 0.00984 | -| std | 0.0074 | -| value_loss | 1.83e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20476 | -| time_elapsed | 110719 | -| total_timesteps | 2620928 | -| train/ | | -| approx_kl | 0.054803155 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 204750 | -| policy_gradient_loss | 0.0615 | -| std | 0.00739 | -| value_loss | 9.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20477 | -| time_elapsed | 110724 | -| total_timesteps | 2621056 | -| train/ | | -| approx_kl | 0.019537337 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 204760 | -| policy_gradient_loss | 0.0022 | -| std | 0.00739 | -| value_loss | 8.99e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20478 | -| time_elapsed | 110734 | -| total_timesteps | 2621184 | -| train/ | | -| approx_kl | 0.018129282 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.788 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 204770 | -| policy_gradient_loss | -0.00177 | -| std | 0.00739 | -| value_loss | 0.00575 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20479 | -| time_elapsed | 110739 | -| total_timesteps | 2621312 | -| train/ | | -| approx_kl | 0.32385948 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 204780 | -| policy_gradient_loss | 0.106 | -| std | 0.00738 | -| value_loss | 0.000136 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20480 | -| time_elapsed | 110744 | -| total_timesteps | 2621440 | -| train/ | | -| approx_kl | 0.062456917 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -1.64 | -| learning_rate | 0.0003 | -| loss | 0.0339 | -| n_updates | 204790 | -| policy_gradient_loss | 0.0244 | -| std | 0.00737 | -| value_loss | 0.000415 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20481 | -| time_elapsed | 110747 | -| total_timesteps | 2621568 | -| train/ | | -| approx_kl | 0.0026775436 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0795 | -| learning_rate | 0.0003 | -| loss | 0.00763 | -| n_updates | 204800 | -| policy_gradient_loss | 0.00349 | -| std | 0.00736 | -| value_loss | 2.66e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20482 | -| time_elapsed | 110753 | -| total_timesteps | 2621696 | -| train/ | | -| approx_kl | 0.15157318 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 204810 | -| policy_gradient_loss | 0.154 | -| std | 0.00736 | -| value_loss | 1.19e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20483 | -| time_elapsed | 110758 | -| total_timesteps | 2621824 | -| train/ | | -| approx_kl | 0.109699465 | -| clip_fraction | 0.649 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 204820 | -| policy_gradient_loss | 0.121 | -| std | 0.00736 | -| value_loss | 1.12e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20484 | -| time_elapsed | 110762 | -| total_timesteps | 2621952 | -| train/ | | -| approx_kl | 0.13191047 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 204830 | -| policy_gradient_loss | 0.122 | -| std | 0.00736 | -| value_loss | 5.83e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20485 | -| time_elapsed | 110766 | -| total_timesteps | 2622080 | -| train/ | | -| approx_kl | 0.13957886 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 204840 | -| policy_gradient_loss | 0.00876 | -| std | 0.0074 | -| value_loss | 2.06e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20486 | -| time_elapsed | 110775 | -| total_timesteps | 2622208 | -| train/ | | -| approx_kl | 0.00054304395 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.847 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 204850 | -| policy_gradient_loss | 0.00606 | -| std | 0.00742 | -| value_loss | 0.00352 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20487 | -| time_elapsed | 110781 | -| total_timesteps | 2622336 | -| train/ | | -| approx_kl | 0.0208474 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -97.7 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 204860 | -| policy_gradient_loss | 0.00287 | -| std | 0.00743 | -| value_loss | 1.14e-05 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20488 | -| time_elapsed | 110785 | -| total_timesteps | 2622464 | -| train/ | | -| approx_kl | 0.157157 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 204870 | -| policy_gradient_loss | 0.033 | -| std | 0.00743 | -| value_loss | 1.53e-05 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20489 | -| time_elapsed | 110789 | -| total_timesteps | 2622592 | -| train/ | | -| approx_kl | 0.0023468565 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.646 | -| learning_rate | 0.0003 | -| loss | -0.000533 | -| n_updates | 204880 | -| policy_gradient_loss | 0.0129 | -| std | 0.00743 | -| value_loss | 2.01e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20490 | -| time_elapsed | 110794 | -| total_timesteps | 2622720 | -| train/ | | -| approx_kl | 7.0463866e-06 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | -9.68e-05 | -| n_updates | 204890 | -| policy_gradient_loss | 0.00485 | -| std | 0.00744 | -| value_loss | 2.26e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20491 | -| time_elapsed | 110798 | -| total_timesteps | 2622848 | -| train/ | | -| approx_kl | 0.03630042 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 204900 | -| policy_gradient_loss | 0.0527 | -| std | 0.00744 | -| value_loss | 6.84e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 20492 | -| time_elapsed | 110802 | -| total_timesteps | 2622976 | -| train/ | | -| approx_kl | 1.8817838e-05 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0999 | -| learning_rate | 0.0003 | -| loss | 0.00042 | -| n_updates | 204910 | -| policy_gradient_loss | 0.104 | -| std | 0.00744 | -| value_loss | 4.41e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20493 | -| time_elapsed | 110806 | -| total_timesteps | 2623104 | -| train/ | | -| approx_kl | 0.016378405 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.00885 | -| n_updates | 204920 | -| policy_gradient_loss | 0.0236 | -| std | 0.00744 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20494 | -| time_elapsed | 110818 | -| total_timesteps | 2623232 | -| train/ | | -| approx_kl | 0.014354356 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -4.87 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 204930 | -| policy_gradient_loss | 0.00624 | -| std | 0.00744 | -| value_loss | 0.00427 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20495 | -| time_elapsed | 110824 | -| total_timesteps | 2623360 | -| train/ | | -| approx_kl | 0.000103727914 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | -0.000197 | -| n_updates | 204940 | -| policy_gradient_loss | 0.00479 | -| std | 0.00745 | -| value_loss | 5.58e-07 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20496 | -| time_elapsed | 110829 | -| total_timesteps | 2623488 | -| train/ | | -| approx_kl | 0.050051555 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | 0.00774 | -| n_updates | 204950 | -| policy_gradient_loss | 0.0252 | -| std | 0.00745 | -| value_loss | 2.47e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20497 | -| time_elapsed | 110833 | -| total_timesteps | 2623616 | -| train/ | | -| approx_kl | 0.67259717 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.518 | -| learning_rate | 0.0003 | -| loss | 0.197 | -| n_updates | 204960 | -| policy_gradient_loss | 0.11 | -| std | 0.00745 | -| value_loss | 2.4e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20498 | -| time_elapsed | 110838 | -| total_timesteps | 2623744 | -| train/ | | -| approx_kl | 0.0060486393 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 204970 | -| policy_gradient_loss | 0.0161 | -| std | 0.00745 | -| value_loss | 1.7e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20499 | -| time_elapsed | 110843 | -| total_timesteps | 2623872 | -| train/ | | -| approx_kl | 0.48679638 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.0937 | -| n_updates | 204980 | -| policy_gradient_loss | 0.0321 | -| std | 0.00745 | -| value_loss | 1.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20500 | -| time_elapsed | 110847 | -| total_timesteps | 2624000 | -| train/ | | -| approx_kl | 0.033713266 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.00571 | -| n_updates | 204990 | -| policy_gradient_loss | 0.00361 | -| std | 0.00745 | -| value_loss | 7.98e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20501 | -| time_elapsed | 110853 | -| total_timesteps | 2624128 | -| train/ | | -| approx_kl | 0.00525014 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.00568 | -| learning_rate | 0.0003 | -| loss | -0.00927 | -| n_updates | 205000 | -| policy_gradient_loss | 0.00178 | -| std | 0.00745 | -| value_loss | 4.44e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20502 | -| time_elapsed | 110865 | -| total_timesteps | 2624256 | -| train/ | | -| approx_kl | 0.3499024 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | 0.00422 | -| n_updates | 205010 | -| policy_gradient_loss | 0.0222 | -| std | 0.00745 | -| value_loss | 0.000414 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20503 | -| time_elapsed | 110869 | -| total_timesteps | 2624384 | -| train/ | | -| approx_kl | 0.5782913 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -6.28 | -| learning_rate | 0.0003 | -| loss | 0.0562 | -| n_updates | 205020 | -| policy_gradient_loss | 0.0242 | -| std | 0.00746 | -| value_loss | 4.94e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20504 | -| time_elapsed | 110874 | -| total_timesteps | 2624512 | -| train/ | | -| approx_kl | 0.013287237 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -6.62 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 205030 | -| policy_gradient_loss | 0.0272 | -| std | 0.00746 | -| value_loss | 2e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20505 | -| time_elapsed | 110878 | -| total_timesteps | 2624640 | -| train/ | | -| approx_kl | 0.010055007 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | -0.00452 | -| n_updates | 205040 | -| policy_gradient_loss | 0.0202 | -| std | 0.00746 | -| value_loss | 6.96e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20506 | -| time_elapsed | 110883 | -| total_timesteps | 2624768 | -| train/ | | -| approx_kl | 0.03381349 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.271 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 205050 | -| policy_gradient_loss | 0.026 | -| std | 0.00746 | -| value_loss | 4.11e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.829 | -| time/ | | -| fps | 23 | -| iterations | 20507 | -| time_elapsed | 110888 | -| total_timesteps | 2624896 | -| train/ | | -| approx_kl | 0.01409043 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 205060 | -| policy_gradient_loss | 0.008 | -| std | 0.00746 | -| value_loss | 2.9e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20508 | -| time_elapsed | 110892 | -| total_timesteps | 2625024 | -| train/ | | -| approx_kl | 0.0017678314 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0804 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 205070 | -| policy_gradient_loss | 0.0721 | -| std | 0.00746 | -| value_loss | 1.47e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20509 | -| time_elapsed | 110903 | -| total_timesteps | 2625152 | -| train/ | | -| approx_kl | 0.01969752 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 205080 | -| policy_gradient_loss | 0.0189 | -| std | 0.00746 | -| value_loss | 0.00282 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20510 | -| time_elapsed | 110907 | -| total_timesteps | 2625280 | -| train/ | | -| approx_kl | 0.0020548091 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.00542 | -| n_updates | 205090 | -| policy_gradient_loss | 0.00552 | -| std | 0.00746 | -| value_loss | 0.000115 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20511 | -| time_elapsed | 110913 | -| total_timesteps | 2625408 | -| train/ | | -| approx_kl | 0.013368843 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.00595 | -| learning_rate | 0.0003 | -| loss | 0.000392 | -| n_updates | 205100 | -| policy_gradient_loss | -0.00152 | -| std | 0.00746 | -| value_loss | 3.87e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20512 | -| time_elapsed | 110918 | -| total_timesteps | 2625536 | -| train/ | | -| approx_kl | 0.016842406 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00224 | -| n_updates | 205110 | -| policy_gradient_loss | 0.0185 | -| std | 0.00746 | -| value_loss | 3.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20513 | -| time_elapsed | 110923 | -| total_timesteps | 2625664 | -| train/ | | -| approx_kl | 0.09590511 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 205120 | -| policy_gradient_loss | 0.0268 | -| std | 0.00746 | -| value_loss | 1.85e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20514 | -| time_elapsed | 110926 | -| total_timesteps | 2625792 | -| train/ | | -| approx_kl | 0.00016173813 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 205130 | -| policy_gradient_loss | 0.0205 | -| std | 0.00746 | -| value_loss | 1.81e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.828 | -| time/ | | -| fps | 23 | -| iterations | 20515 | -| time_elapsed | 110931 | -| total_timesteps | 2625920 | -| train/ | | -| approx_kl | 0.0007208213 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0028 | -| n_updates | 205140 | -| policy_gradient_loss | 0.00285 | -| std | 0.00744 | -| value_loss | 4.96e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20516 | -| time_elapsed | 110936 | -| total_timesteps | 2626048 | -| train/ | | -| approx_kl | 0.03679772 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.00436 | -| n_updates | 205150 | -| policy_gradient_loss | 0.00776 | -| std | 0.00744 | -| value_loss | 9.43e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20517 | -| time_elapsed | 110946 | -| total_timesteps | 2626176 | -| train/ | | -| approx_kl | 0.029029671 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.917 | -| learning_rate | 0.0003 | -| loss | -0.0246 | -| n_updates | 205160 | -| policy_gradient_loss | -0.0191 | -| std | 0.00744 | -| value_loss | 0.000413 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20518 | -| time_elapsed | 110951 | -| total_timesteps | 2626304 | -| train/ | | -| approx_kl | 0.012703119 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | 0.00457 | -| n_updates | 205170 | -| policy_gradient_loss | 0.0209 | -| std | 0.00744 | -| value_loss | 8.2e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20519 | -| time_elapsed | 110956 | -| total_timesteps | 2626432 | -| train/ | | -| approx_kl | 7.425435e-06 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.262 | -| learning_rate | 0.0003 | -| loss | 0.000161 | -| n_updates | 205180 | -| policy_gradient_loss | 0.0193 | -| std | 0.00744 | -| value_loss | 2.71e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20520 | -| time_elapsed | 110961 | -| total_timesteps | 2626560 | -| train/ | | -| approx_kl | 0.4183402 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 205190 | -| policy_gradient_loss | 0.044 | -| std | 0.00744 | -| value_loss | 9.49e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20521 | -| time_elapsed | 110967 | -| total_timesteps | 2626688 | -| train/ | | -| approx_kl | 0.005325581 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.00182 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 205200 | -| policy_gradient_loss | 0.00292 | -| std | 0.00744 | -| value_loss | 6.49e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20522 | -| time_elapsed | 110972 | -| total_timesteps | 2626816 | -| train/ | | -| approx_kl | 0.050049834 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 205210 | -| policy_gradient_loss | 0.00436 | -| std | 0.00745 | -| value_loss | 4.19e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.825 | -| time/ | | -| fps | 23 | -| iterations | 20523 | -| time_elapsed | 110977 | -| total_timesteps | 2626944 | -| train/ | | -| approx_kl | 0.0005303873 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00538 | -| n_updates | 205220 | -| policy_gradient_loss | -0.00372 | -| std | 0.00746 | -| value_loss | 7.03e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20524 | -| time_elapsed | 110983 | -| total_timesteps | 2627072 | -| train/ | | -| approx_kl | 0.0062809377 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 205230 | -| policy_gradient_loss | 0.00249 | -| std | 0.00746 | -| value_loss | 3.91e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20525 | -| time_elapsed | 110992 | -| total_timesteps | 2627200 | -| train/ | | -| approx_kl | 0.059944764 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.796 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 205240 | -| policy_gradient_loss | -0.000101 | -| std | 0.00746 | -| value_loss | 0.00567 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20526 | -| time_elapsed | 110997 | -| total_timesteps | 2627328 | -| train/ | | -| approx_kl | 0.032659084 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 205250 | -| policy_gradient_loss | 0.0116 | -| std | 0.00746 | -| value_loss | 1.89e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20527 | -| time_elapsed | 111002 | -| total_timesteps | 2627456 | -| train/ | | -| approx_kl | 3.2684766e-05 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.0084 | -| learning_rate | 0.0003 | -| loss | -0.00086 | -| n_updates | 205260 | -| policy_gradient_loss | 0.00115 | -| std | 0.00746 | -| value_loss | 1.25e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20528 | -| time_elapsed | 111007 | -| total_timesteps | 2627584 | -| train/ | | -| approx_kl | 0.04259464 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | 0.0192 | -| n_updates | 205270 | -| policy_gradient_loss | 0.00898 | -| std | 0.00746 | -| value_loss | 9.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20529 | -| time_elapsed | 111012 | -| total_timesteps | 2627712 | -| train/ | | -| approx_kl | 0.005815498 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | -0.00015 | -| n_updates | 205280 | -| policy_gradient_loss | 0.00376 | -| std | 0.00746 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20530 | -| time_elapsed | 111018 | -| total_timesteps | 2627840 | -| train/ | | -| approx_kl | 0.0007443945 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.00365 | -| n_updates | 205290 | -| policy_gradient_loss | 0.00134 | -| std | 0.00746 | -| value_loss | 5.01e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.815 | -| time/ | | -| fps | 23 | -| iterations | 20531 | -| time_elapsed | 111023 | -| total_timesteps | 2627968 | -| train/ | | -| approx_kl | 0.0491632 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 205300 | -| policy_gradient_loss | 0.0119 | -| std | 0.00746 | -| value_loss | 2.09e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20532 | -| time_elapsed | 111027 | -| total_timesteps | 2628096 | -| train/ | | -| approx_kl | 0.037796862 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 205310 | -| policy_gradient_loss | 0.0075 | -| std | 0.00745 | -| value_loss | 1.54e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20533 | -| time_elapsed | 111040 | -| total_timesteps | 2628224 | -| train/ | | -| approx_kl | 0.0449734 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 205320 | -| policy_gradient_loss | -0.0172 | -| std | 0.00745 | -| value_loss | 0.0023 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20534 | -| time_elapsed | 111045 | -| total_timesteps | 2628352 | -| train/ | | -| approx_kl | 0.02666287 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.779 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 205330 | -| policy_gradient_loss | 0.00549 | -| std | 0.00745 | -| value_loss | 6.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20535 | -| time_elapsed | 111049 | -| total_timesteps | 2628480 | -| train/ | | -| approx_kl | 0.032466874 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.0027 | -| n_updates | 205340 | -| policy_gradient_loss | 0.00107 | -| std | 0.00745 | -| value_loss | 6.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20536 | -| time_elapsed | 111053 | -| total_timesteps | 2628608 | -| train/ | | -| approx_kl | 0.006410316 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0005 | -| learning_rate | 0.0003 | -| loss | 0.000197 | -| n_updates | 205350 | -| policy_gradient_loss | 0.00747 | -| std | 0.00744 | -| value_loss | 3.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20537 | -| time_elapsed | 111058 | -| total_timesteps | 2628736 | -| train/ | | -| approx_kl | 0.06143525 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 205360 | -| policy_gradient_loss | 0.0314 | -| std | 0.00744 | -| value_loss | 2.94e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20538 | -| time_elapsed | 111064 | -| total_timesteps | 2628864 | -| train/ | | -| approx_kl | 0.7417774 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0931 | -| learning_rate | 0.0003 | -| loss | 0.329 | -| n_updates | 205370 | -| policy_gradient_loss | 0.247 | -| std | 0.00744 | -| value_loss | 1.28e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 20539 | -| time_elapsed | 111069 | -| total_timesteps | 2628992 | -| train/ | | -| approx_kl | 0.0052169156 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0893 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 205380 | -| policy_gradient_loss | 0.0235 | -| std | 0.00744 | -| value_loss | 2.2e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20540 | -| time_elapsed | 111074 | -| total_timesteps | 2629120 | -| train/ | | -| approx_kl | 0.14042217 | -| clip_fraction | 0.614 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 205390 | -| policy_gradient_loss | 0.0935 | -| std | 0.00744 | -| value_loss | 2.94e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20541 | -| time_elapsed | 111086 | -| total_timesteps | 2629248 | -| train/ | | -| approx_kl | 0.14413247 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.689 | -| learning_rate | 0.0003 | -| loss | 0.0727 | -| n_updates | 205400 | -| policy_gradient_loss | 0.1 | -| std | 0.00744 | -| value_loss | 0.00797 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20542 | -| time_elapsed | 111091 | -| total_timesteps | 2629376 | -| train/ | | -| approx_kl | 0.030466285 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.282 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 205410 | -| policy_gradient_loss | 0.02 | -| std | 0.00743 | -| value_loss | 1.46e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20543 | -| time_elapsed | 111096 | -| total_timesteps | 2629504 | -| train/ | | -| approx_kl | 0.35041597 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | 0.0883 | -| n_updates | 205420 | -| policy_gradient_loss | 0.0286 | -| std | 0.00743 | -| value_loss | 6.33e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20544 | -| time_elapsed | 111100 | -| total_timesteps | 2629632 | -| train/ | | -| approx_kl | 0.070570886 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.093 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 205430 | -| policy_gradient_loss | 0.0634 | -| std | 0.00743 | -| value_loss | 6.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20545 | -| time_elapsed | 111103 | -| total_timesteps | 2629760 | -| train/ | | -| approx_kl | 0.027485663 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | 0.000113 | -| n_updates | 205440 | -| policy_gradient_loss | 0.0253 | -| std | 0.00744 | -| value_loss | 1.53e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.822 | -| time/ | | -| fps | 23 | -| iterations | 20546 | -| time_elapsed | 111107 | -| total_timesteps | 2629888 | -| train/ | | -| approx_kl | 0.6234759 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | 0.303 | -| n_updates | 205450 | -| policy_gradient_loss | 0.13 | -| std | 0.00744 | -| value_loss | 1.21e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20547 | -| time_elapsed | 111112 | -| total_timesteps | 2630016 | -| train/ | | -| approx_kl | 0.0056530195 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 205460 | -| policy_gradient_loss | 0.0167 | -| std | 0.00744 | -| value_loss | 8.27e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20548 | -| time_elapsed | 111124 | -| total_timesteps | 2630144 | -| train/ | | -| approx_kl | 0.5015613 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 205470 | -| policy_gradient_loss | 0.0473 | -| std | 0.00744 | -| value_loss | 0.00215 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20549 | -| time_elapsed | 111129 | -| total_timesteps | 2630272 | -| train/ | | -| approx_kl | 0.21881062 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | 0.184 | -| n_updates | 205480 | -| policy_gradient_loss | 0.109 | -| std | 0.00744 | -| value_loss | 8.98e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20550 | -| time_elapsed | 111136 | -| total_timesteps | 2630400 | -| train/ | | -| approx_kl | 0.11932889 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.00723 | -| learning_rate | 0.0003 | -| loss | 0.0807 | -| n_updates | 205490 | -| policy_gradient_loss | 0.0963 | -| std | 0.00744 | -| value_loss | 3.54e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20551 | -| time_elapsed | 111141 | -| total_timesteps | 2630528 | -| train/ | | -| approx_kl | 0.03155646 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 205500 | -| policy_gradient_loss | 0.0224 | -| std | 0.00744 | -| value_loss | 1.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20552 | -| time_elapsed | 111146 | -| total_timesteps | 2630656 | -| train/ | | -| approx_kl | 0.38133132 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 205510 | -| policy_gradient_loss | 0.0437 | -| std | 0.00744 | -| value_loss | 8.62e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20553 | -| time_elapsed | 111151 | -| total_timesteps | 2630784 | -| train/ | | -| approx_kl | 0.04101669 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 205520 | -| policy_gradient_loss | 0.0125 | -| std | 0.00743 | -| value_loss | 6.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.833 | -| time/ | | -| fps | 23 | -| iterations | 20554 | -| time_elapsed | 111156 | -| total_timesteps | 2630912 | -| train/ | | -| approx_kl | 0.040585674 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 205530 | -| policy_gradient_loss | 0.0049 | -| std | 0.00743 | -| value_loss | 4.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20555 | -| time_elapsed | 111161 | -| total_timesteps | 2631040 | -| train/ | | -| approx_kl | 0.005600324 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 205540 | -| policy_gradient_loss | 0.00261 | -| std | 0.00743 | -| value_loss | 2.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20556 | -| time_elapsed | 111171 | -| total_timesteps | 2631168 | -| train/ | | -| approx_kl | 0.028138597 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | 0.796 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 205550 | -| policy_gradient_loss | -0.00547 | -| std | 0.00743 | -| value_loss | 0.000795 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20557 | -| time_elapsed | 111176 | -| total_timesteps | 2631296 | -| train/ | | -| approx_kl | 0.07276691 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -2.89 | -| learning_rate | 0.0003 | -| loss | 0.0647 | -| n_updates | 205560 | -| policy_gradient_loss | 0.0318 | -| std | 0.00743 | -| value_loss | 1.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20558 | -| time_elapsed | 111181 | -| total_timesteps | 2631424 | -| train/ | | -| approx_kl | 0.14841786 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | 0.0987 | -| n_updates | 205570 | -| policy_gradient_loss | 0.0225 | -| std | 0.00743 | -| value_loss | 2.24e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20559 | -| time_elapsed | 111185 | -| total_timesteps | 2631552 | -| train/ | | -| approx_kl | 0.5355686 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.656 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 205580 | -| policy_gradient_loss | 0.0589 | -| std | 0.00743 | -| value_loss | 1.08e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20560 | -| time_elapsed | 111189 | -| total_timesteps | 2631680 | -| train/ | | -| approx_kl | 0.009194424 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.000558 | -| n_updates | 205590 | -| policy_gradient_loss | 0.00689 | -| std | 0.00743 | -| value_loss | 6.52e-10 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20561 | -| time_elapsed | 111194 | -| total_timesteps | 2631808 | -| train/ | | -| approx_kl | 0.00045303395 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.00383 | -| n_updates | 205600 | -| policy_gradient_loss | 0.00144 | -| std | 0.00743 | -| value_loss | 4.79e-10 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 20562 | -| time_elapsed | 111198 | -| total_timesteps | 2631936 | -| train/ | | -| approx_kl | 0.0046143252 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 205610 | -| policy_gradient_loss | 0.00532 | -| std | 0.00742 | -| value_loss | 2.15e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20563 | -| time_elapsed | 111203 | -| total_timesteps | 2632064 | -| train/ | | -| approx_kl | 0.078097634 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.48 | -| explained_variance | -0.0922 | -| learning_rate | 0.0003 | -| loss | 0.0494 | -| n_updates | 205620 | -| policy_gradient_loss | 0.0123 | -| std | 0.00741 | -| value_loss | 2.47e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20564 | -| time_elapsed | 111210 | -| total_timesteps | 2632192 | -| train/ | | -| approx_kl | 0.048337247 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.691 | -| learning_rate | 0.0003 | -| loss | -0.00858 | -| n_updates | 205630 | -| policy_gradient_loss | 0.00393 | -| std | 0.0074 | -| value_loss | 0.00826 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20565 | -| time_elapsed | 111214 | -| total_timesteps | 2632320 | -| train/ | | -| approx_kl | 0.32280016 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.573 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 205640 | -| policy_gradient_loss | 0.161 | -| std | 0.00739 | -| value_loss | 0.000115 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20566 | -| time_elapsed | 111219 | -| total_timesteps | 2632448 | -| train/ | | -| approx_kl | 0.031318795 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00778 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 205650 | -| policy_gradient_loss | 0.0096 | -| std | 0.00739 | -| value_loss | 2.46e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20567 | -| time_elapsed | 111223 | -| total_timesteps | 2632576 | -| train/ | | -| approx_kl | 0.40683436 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00529 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 205660 | -| policy_gradient_loss | 0.0467 | -| std | 0.00739 | -| value_loss | 7.69e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20568 | -| time_elapsed | 111226 | -| total_timesteps | 2632704 | -| train/ | | -| approx_kl | 0.028017368 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | -0.00619 | -| n_updates | 205670 | -| policy_gradient_loss | -0.00153 | -| std | 0.00739 | -| value_loss | 5.78e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20569 | -| time_elapsed | 111230 | -| total_timesteps | 2632832 | -| train/ | | -| approx_kl | 0.034349166 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00984 | -| n_updates | 205680 | -| policy_gradient_loss | 0.00414 | -| std | 0.0074 | -| value_loss | 4.04e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 20570 | -| time_elapsed | 111235 | -| total_timesteps | 2632960 | -| train/ | | -| approx_kl | 0.0072701764 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 205690 | -| policy_gradient_loss | 0.00458 | -| std | 0.0074 | -| value_loss | 2.8e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20571 | -| time_elapsed | 111241 | -| total_timesteps | 2633088 | -| train/ | | -| approx_kl | 0.054041266 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 205700 | -| policy_gradient_loss | 0.00628 | -| std | 0.0074 | -| value_loss | 2.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20572 | -| time_elapsed | 111250 | -| total_timesteps | 2633216 | -| train/ | | -| approx_kl | 0.03648005 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.687 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 205710 | -| policy_gradient_loss | -0.0173 | -| std | 0.00739 | -| value_loss | 0.00255 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20573 | -| time_elapsed | 111254 | -| total_timesteps | 2633344 | -| train/ | | -| approx_kl | 0.010046092 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.295 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 205720 | -| policy_gradient_loss | 0.0161 | -| std | 0.00739 | -| value_loss | 2.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20574 | -| time_elapsed | 111258 | -| total_timesteps | 2633472 | -| train/ | | -| approx_kl | 0.028966421 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 205730 | -| policy_gradient_loss | 0.0441 | -| std | 0.00739 | -| value_loss | 5.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20575 | -| time_elapsed | 111261 | -| total_timesteps | 2633600 | -| train/ | | -| approx_kl | 0.13196887 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.0104 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 205740 | -| policy_gradient_loss | 0.0372 | -| std | 0.00738 | -| value_loss | 6.83e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20576 | -| time_elapsed | 111266 | -| total_timesteps | 2633728 | -| train/ | | -| approx_kl | 0.0023143026 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.0156 | -| learning_rate | 0.0003 | -| loss | -0.0046 | -| n_updates | 205750 | -| policy_gradient_loss | 0.0042 | -| std | 0.00739 | -| value_loss | 1.51e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20577 | -| time_elapsed | 111271 | -| total_timesteps | 2633856 | -| train/ | | -| approx_kl | 1.9743573e-05 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 1.63e-06 | -| n_updates | 205760 | -| policy_gradient_loss | 0.00966 | -| std | 0.00738 | -| value_loss | 1.49e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 20578 | -| time_elapsed | 111276 | -| total_timesteps | 2633984 | -| train/ | | -| approx_kl | 0.05675978 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 205770 | -| policy_gradient_loss | 0.0533 | -| std | 0.00738 | -| value_loss | 5.74e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20579 | -| time_elapsed | 111280 | -| total_timesteps | 2634112 | -| train/ | | -| approx_kl | 2.993038e-05 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | -6.26e-05 | -| n_updates | 205780 | -| policy_gradient_loss | 0.0714 | -| std | 0.00737 | -| value_loss | 4.78e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20580 | -| time_elapsed | 111292 | -| total_timesteps | 2634240 | -| train/ | | -| approx_kl | 0.08455567 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | 0.00558 | -| n_updates | 205790 | -| policy_gradient_loss | 0.0491 | -| std | 0.00737 | -| value_loss | 0.000775 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20581 | -| time_elapsed | 111297 | -| total_timesteps | 2634368 | -| train/ | | -| approx_kl | 0.012395583 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 205800 | -| policy_gradient_loss | 0.0159 | -| std | 0.00737 | -| value_loss | 3.55e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20582 | -| time_elapsed | 111302 | -| total_timesteps | 2634496 | -| train/ | | -| approx_kl | 0.11290465 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.694 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 205810 | -| policy_gradient_loss | 0.0198 | -| std | 0.00736 | -| value_loss | 2.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20583 | -| time_elapsed | 111306 | -| total_timesteps | 2634624 | -| train/ | | -| approx_kl | 0.102622256 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | 0.0452 | -| n_updates | 205820 | -| policy_gradient_loss | 0.00998 | -| std | 0.00736 | -| value_loss | 1.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20584 | -| time_elapsed | 111310 | -| total_timesteps | 2634752 | -| train/ | | -| approx_kl | 0.10550466 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00978 | -| n_updates | 205830 | -| policy_gradient_loss | 0.00868 | -| std | 0.00736 | -| value_loss | 6.18e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.836 | -| time/ | | -| fps | 23 | -| iterations | 20585 | -| time_elapsed | 111314 | -| total_timesteps | 2634880 | -| train/ | | -| approx_kl | 0.10970391 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.0576 | -| n_updates | 205840 | -| policy_gradient_loss | 0.0433 | -| std | 0.00736 | -| value_loss | 4.7e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20586 | -| time_elapsed | 111319 | -| total_timesteps | 2635008 | -| train/ | | -| approx_kl | 0.3587157 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 205850 | -| policy_gradient_loss | 0.138 | -| std | 0.00736 | -| value_loss | 3.55e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20587 | -| time_elapsed | 111330 | -| total_timesteps | 2635136 | -| train/ | | -| approx_kl | 0.048286095 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 205860 | -| policy_gradient_loss | 0.00547 | -| std | 0.00736 | -| value_loss | 0.00516 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20588 | -| time_elapsed | 111335 | -| total_timesteps | 2635264 | -| train/ | | -| approx_kl | 1.9049272e-05 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.0702 | -| learning_rate | 0.0003 | -| loss | 5.36e-06 | -| n_updates | 205870 | -| policy_gradient_loss | -0.00205 | -| std | 0.00735 | -| value_loss | 0.00132 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20589 | -| time_elapsed | 111339 | -| total_timesteps | 2635392 | -| train/ | | -| approx_kl | 0.03982987 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.00896 | -| n_updates | 205880 | -| policy_gradient_loss | 0.0212 | -| std | 0.00735 | -| value_loss | 3.03e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20590 | -| time_elapsed | 111344 | -| total_timesteps | 2635520 | -| train/ | | -| approx_kl | 0.0012497744 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00181 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 205890 | -| policy_gradient_loss | 0.031 | -| std | 0.00735 | -| value_loss | 2.33e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20591 | -| time_elapsed | 111350 | -| total_timesteps | 2635648 | -| train/ | | -| approx_kl | 0.4639743 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.496 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 205900 | -| policy_gradient_loss | 0.0523 | -| std | 0.00734 | -| value_loss | 1.61e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20592 | -| time_elapsed | 111354 | -| total_timesteps | 2635776 | -| train/ | | -| approx_kl | 0.005600395 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 205910 | -| policy_gradient_loss | 0.00407 | -| std | 0.00734 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 20593 | -| time_elapsed | 111359 | -| total_timesteps | 2635904 | -| train/ | | -| approx_kl | 0.001858823 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 205920 | -| policy_gradient_loss | 0.00655 | -| std | 0.00734 | -| value_loss | 5.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20594 | -| time_elapsed | 111363 | -| total_timesteps | 2636032 | -| train/ | | -| approx_kl | 0.038706165 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 205930 | -| policy_gradient_loss | 0.113 | -| std | 0.00734 | -| value_loss | 4.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20595 | -| time_elapsed | 111374 | -| total_timesteps | 2636160 | -| train/ | | -| approx_kl | 0.023632586 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | -0.0243 | -| n_updates | 205940 | -| policy_gradient_loss | -0.0172 | -| std | 0.00734 | -| value_loss | 0.00679 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20596 | -| time_elapsed | 111379 | -| total_timesteps | 2636288 | -| train/ | | -| approx_kl | 0.03447379 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 205950 | -| policy_gradient_loss | 0.0247 | -| std | 0.00734 | -| value_loss | 6.87e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20597 | -| time_elapsed | 111384 | -| total_timesteps | 2636416 | -| train/ | | -| approx_kl | 0.69938606 | -| clip_fraction | 0.722 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.000142 | -| learning_rate | 0.0003 | -| loss | 0.307 | -| n_updates | 205960 | -| policy_gradient_loss | 0.124 | -| std | 0.00734 | -| value_loss | 1.22e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20598 | -| time_elapsed | 111389 | -| total_timesteps | 2636544 | -| train/ | | -| approx_kl | 0.16842146 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.0559 | -| n_updates | 205970 | -| policy_gradient_loss | 0.0208 | -| std | 0.00734 | -| value_loss | 6.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20599 | -| time_elapsed | 111394 | -| total_timesteps | 2636672 | -| train/ | | -| approx_kl | 0.014800577 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 205980 | -| policy_gradient_loss | 0.0201 | -| std | 0.00734 | -| value_loss | 3.78e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20600 | -| time_elapsed | 111399 | -| total_timesteps | 2636800 | -| train/ | | -| approx_kl | 0.37275025 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 205990 | -| policy_gradient_loss | 0.127 | -| std | 0.00734 | -| value_loss | 2.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 20601 | -| time_elapsed | 111404 | -| total_timesteps | 2636928 | -| train/ | | -| approx_kl | 0.19193462 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0938 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 206000 | -| policy_gradient_loss | 0.102 | -| std | 0.00734 | -| value_loss | 1.45e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20602 | -| time_elapsed | 111409 | -| total_timesteps | 2637056 | -| train/ | | -| approx_kl | 0.14507799 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 206010 | -| policy_gradient_loss | 0.122 | -| std | 0.00734 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20603 | -| time_elapsed | 111417 | -| total_timesteps | 2637184 | -| train/ | | -| approx_kl | 0.10880788 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.246 | -| learning_rate | 0.0003 | -| loss | 0.0484 | -| n_updates | 206020 | -| policy_gradient_loss | 0.0133 | -| std | 0.00734 | -| value_loss | 0.00328 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20604 | -| time_elapsed | 111421 | -| total_timesteps | 2637312 | -| train/ | | -| approx_kl | 0.025277643 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 206030 | -| policy_gradient_loss | 0.0139 | -| std | 0.00734 | -| value_loss | 0.000142 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20605 | -| time_elapsed | 111427 | -| total_timesteps | 2637440 | -| train/ | | -| approx_kl | 0.0647682 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 206040 | -| policy_gradient_loss | 0.0201 | -| std | 0.00734 | -| value_loss | 1.6e-05 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20606 | -| time_elapsed | 111431 | -| total_timesteps | 2637568 | -| train/ | | -| approx_kl | 0.00018626126 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0777 | -| learning_rate | 0.0003 | -| loss | -0.00125 | -| n_updates | 206050 | -| policy_gradient_loss | 0.0218 | -| std | 0.00734 | -| value_loss | 1.31e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20607 | -| time_elapsed | 111436 | -| total_timesteps | 2637696 | -| train/ | | -| approx_kl | 0.00060395617 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.00647 | -| n_updates | 206060 | -| policy_gradient_loss | -0.00157 | -| std | 0.00734 | -| value_loss | 9.01e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20608 | -| time_elapsed | 111439 | -| total_timesteps | 2637824 | -| train/ | | -| approx_kl | 0.032513283 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 206070 | -| policy_gradient_loss | 0.0101 | -| std | 0.00734 | -| value_loss | 6.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.859 | -| time/ | | -| fps | 23 | -| iterations | 20609 | -| time_elapsed | 111444 | -| total_timesteps | 2637952 | -| train/ | | -| approx_kl | 0.41264665 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 206080 | -| policy_gradient_loss | 0.0457 | -| std | 0.00734 | -| value_loss | 4.71e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20610 | -| time_elapsed | 111449 | -| total_timesteps | 2638080 | -| train/ | | -| approx_kl | 0.01066627 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.000656 | -| n_updates | 206090 | -| policy_gradient_loss | 0.00557 | -| std | 0.00734 | -| value_loss | 3.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20611 | -| time_elapsed | 111460 | -| total_timesteps | 2638208 | -| train/ | | -| approx_kl | 0.05292622 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 206100 | -| policy_gradient_loss | 0.00348 | -| std | 0.00734 | -| value_loss | 0.000102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20612 | -| time_elapsed | 111465 | -| total_timesteps | 2638336 | -| train/ | | -| approx_kl | 0.042150732 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 206110 | -| policy_gradient_loss | 0.000154 | -| std | 0.00734 | -| value_loss | 2.8e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20613 | -| time_elapsed | 111468 | -| total_timesteps | 2638464 | -| train/ | | -| approx_kl | 0.0061238604 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 206120 | -| policy_gradient_loss | 0.00531 | -| std | 0.00734 | -| value_loss | 1.46e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20614 | -| time_elapsed | 111474 | -| total_timesteps | 2638592 | -| train/ | | -| approx_kl | 0.06086072 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00887 | -| n_updates | 206130 | -| policy_gradient_loss | 0.0126 | -| std | 0.00734 | -| value_loss | 8.17e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20615 | -| time_elapsed | 111479 | -| total_timesteps | 2638720 | -| train/ | | -| approx_kl | 0.09356629 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 206140 | -| policy_gradient_loss | 0.0508 | -| std | 0.00734 | -| value_loss | 5.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20616 | -| time_elapsed | 111484 | -| total_timesteps | 2638848 | -| train/ | | -| approx_kl | 0.030040849 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.00578 | -| n_updates | 206150 | -| policy_gradient_loss | 0.0298 | -| std | 0.00734 | -| value_loss | 4.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 20617 | -| time_elapsed | 111489 | -| total_timesteps | 2638976 | -| train/ | | -| approx_kl | 0.10087219 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | 0.0918 | -| n_updates | 206160 | -| policy_gradient_loss | 0.0395 | -| std | 0.00734 | -| value_loss | 3.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20618 | -| time_elapsed | 111494 | -| total_timesteps | 2639104 | -| train/ | | -| approx_kl | 0.032420225 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 206170 | -| policy_gradient_loss | 0.0394 | -| std | 0.00734 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20619 | -| time_elapsed | 111504 | -| total_timesteps | 2639232 | -| train/ | | -| approx_kl | 0.14261472 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 206180 | -| policy_gradient_loss | 0.00265 | -| std | 0.00734 | -| value_loss | 0.00042 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20620 | -| time_elapsed | 111509 | -| total_timesteps | 2639360 | -| train/ | | -| approx_kl | 0.038132977 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.00796 | -| n_updates | 206190 | -| policy_gradient_loss | 0.03 | -| std | 0.00734 | -| value_loss | 9.52e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20621 | -| time_elapsed | 111513 | -| total_timesteps | 2639488 | -| train/ | | -| approx_kl | 0.6436906 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.0139 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 206200 | -| policy_gradient_loss | 0.125 | -| std | 0.00734 | -| value_loss | 2.21e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20622 | -| time_elapsed | 111518 | -| total_timesteps | 2639616 | -| train/ | | -| approx_kl | 0.006594157 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 206210 | -| policy_gradient_loss | 0.0279 | -| std | 0.00734 | -| value_loss | 1.28e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20623 | -| time_elapsed | 111522 | -| total_timesteps | 2639744 | -| train/ | | -| approx_kl | 0.17588024 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 206220 | -| policy_gradient_loss | 0.0991 | -| std | 0.00734 | -| value_loss | 1.13e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 20624 | -| time_elapsed | 111526 | -| total_timesteps | 2639872 | -| train/ | | -| approx_kl | 0.037229106 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 206230 | -| policy_gradient_loss | 0.0186 | -| std | 0.00735 | -| value_loss | 8.87e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20625 | -| time_elapsed | 111530 | -| total_timesteps | 2640000 | -| train/ | | -| approx_kl | 0.12939003 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 206240 | -| policy_gradient_loss | 0.0172 | -| std | 0.00735 | -| value_loss | 5.57e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20626 | -| time_elapsed | 111535 | -| total_timesteps | 2640128 | -| train/ | | -| approx_kl | 0.012954781 | -| clip_fraction | 0.0906 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.00512 | -| learning_rate | 0.0003 | -| loss | -0.00407 | -| n_updates | 206250 | -| policy_gradient_loss | -0.00229 | -| std | 0.00735 | -| value_loss | 2.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20627 | -| time_elapsed | 111546 | -| total_timesteps | 2640256 | -| train/ | | -| approx_kl | 0.023003545 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.845 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 206260 | -| policy_gradient_loss | 0.00623 | -| std | 0.00735 | -| value_loss | 0.00338 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20628 | -| time_elapsed | 111551 | -| total_timesteps | 2640384 | -| train/ | | -| approx_kl | 0.2550337 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 206270 | -| policy_gradient_loss | 0.133 | -| std | 0.00735 | -| value_loss | 2.62e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20629 | -| time_elapsed | 111555 | -| total_timesteps | 2640512 | -| train/ | | -| approx_kl | 0.16852522 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00602 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 206280 | -| policy_gradient_loss | 0.0928 | -| std | 0.00736 | -| value_loss | 5.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20630 | -| time_elapsed | 111560 | -| total_timesteps | 2640640 | -| train/ | | -| approx_kl | 0.024927873 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00637 | -| learning_rate | 0.0003 | -| loss | 0.00841 | -| n_updates | 206290 | -| policy_gradient_loss | 0.0191 | -| std | 0.00735 | -| value_loss | 1.9e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20631 | -| time_elapsed | 111565 | -| total_timesteps | 2640768 | -| train/ | | -| approx_kl | 0.09752793 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0409 | -| learning_rate | 0.0003 | -| loss | 0.0532 | -| n_updates | 206300 | -| policy_gradient_loss | 0.0126 | -| std | 0.00735 | -| value_loss | 1.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 20632 | -| time_elapsed | 111570 | -| total_timesteps | 2640896 | -| train/ | | -| approx_kl | 0.011659451 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 206310 | -| policy_gradient_loss | -0.00178 | -| std | 0.00735 | -| value_loss | 7.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20633 | -| time_elapsed | 111574 | -| total_timesteps | 2641024 | -| train/ | | -| approx_kl | 0.018372204 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 206320 | -| policy_gradient_loss | 0.0135 | -| std | 0.00735 | -| value_loss | 4.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20634 | -| time_elapsed | 111586 | -| total_timesteps | 2641152 | -| train/ | | -| approx_kl | 0.07943806 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.679 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 206330 | -| policy_gradient_loss | 0.00994 | -| std | 0.00735 | -| value_loss | 0.00179 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20635 | -| time_elapsed | 111591 | -| total_timesteps | 2641280 | -| train/ | | -| approx_kl | 0.1193002 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00888 | -| learning_rate | 0.0003 | -| loss | 0.0453 | -| n_updates | 206340 | -| policy_gradient_loss | 0.0153 | -| std | 0.00735 | -| value_loss | 0.000153 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20636 | -| time_elapsed | 111595 | -| total_timesteps | 2641408 | -| train/ | | -| approx_kl | 0.00982306 | -| clip_fraction | 0.0789 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.00201 | -| n_updates | 206350 | -| policy_gradient_loss | 0.0011 | -| std | 0.00737 | -| value_loss | 2.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20637 | -| time_elapsed | 111600 | -| total_timesteps | 2641536 | -| train/ | | -| approx_kl | 0.010684829 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.000379 | -| n_updates | 206360 | -| policy_gradient_loss | -5.99e-05 | -| std | 0.00738 | -| value_loss | 4.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20638 | -| time_elapsed | 111604 | -| total_timesteps | 2641664 | -| train/ | | -| approx_kl | 0.007956172 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 206370 | -| policy_gradient_loss | -0.0035 | -| std | 0.00738 | -| value_loss | 1.84e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20639 | -| time_elapsed | 111609 | -| total_timesteps | 2641792 | -| train/ | | -| approx_kl | 0.0094627645 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0879 | -| learning_rate | 0.0003 | -| loss | 0.00408 | -| n_updates | 206380 | -| policy_gradient_loss | 0.00208 | -| std | 0.00738 | -| value_loss | 1.14e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.873 | -| time/ | | -| fps | 23 | -| iterations | 20640 | -| time_elapsed | 111614 | -| total_timesteps | 2641920 | -| train/ | | -| approx_kl | 0.008380972 | -| clip_fraction | 0.0437 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | 0.00263 | -| n_updates | 206390 | -| policy_gradient_loss | 0.00138 | -| std | 0.00737 | -| value_loss | 8.03e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20641 | -| time_elapsed | 111620 | -| total_timesteps | 2642048 | -| train/ | | -| approx_kl | 0.008923 | -| clip_fraction | 0.0648 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | -0.00524 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 206400 | -| policy_gradient_loss | -0.00145 | -| std | 0.00735 | -| value_loss | 2.05e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20642 | -| time_elapsed | 111628 | -| total_timesteps | 2642176 | -| train/ | | -| approx_kl | 0.018575998 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.49 | -| explained_variance | 0.619 | -| learning_rate | 0.0003 | -| loss | 0.00363 | -| n_updates | 206410 | -| policy_gradient_loss | 0.018 | -| std | 0.00734 | -| value_loss | 0.0155 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20643 | -| time_elapsed | 111634 | -| total_timesteps | 2642304 | -| train/ | | -| approx_kl | 0.21374771 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 206420 | -| policy_gradient_loss | 0.122 | -| std | 0.00734 | -| value_loss | 0.000145 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20644 | -| time_elapsed | 111639 | -| total_timesteps | 2642432 | -| train/ | | -| approx_kl | 0.028175937 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.00627 | -| learning_rate | 0.0003 | -| loss | 0.00669 | -| n_updates | 206430 | -| policy_gradient_loss | 0.013 | -| std | 0.00734 | -| value_loss | 2.41e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20645 | -| time_elapsed | 111643 | -| total_timesteps | 2642560 | -| train/ | | -| approx_kl | 0.5269326 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 206440 | -| policy_gradient_loss | 0.0488 | -| std | 0.00734 | -| value_loss | 1.16e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20646 | -| time_elapsed | 111646 | -| total_timesteps | 2642688 | -| train/ | | -| approx_kl | 0.031045731 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 5.98e-05 | -| n_updates | 206450 | -| policy_gradient_loss | 0.00116 | -| std | 0.00734 | -| value_loss | 7.5e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20647 | -| time_elapsed | 111650 | -| total_timesteps | 2642816 | -| train/ | | -| approx_kl | 0.0052158833 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | -0.000393 | -| n_updates | 206460 | -| policy_gradient_loss | 0.00443 | -| std | 0.00733 | -| value_loss | 1.09e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 20648 | -| time_elapsed | 111654 | -| total_timesteps | 2642944 | -| train/ | | -| approx_kl | 0.07183337 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 206470 | -| policy_gradient_loss | 0.00363 | -| std | 0.00733 | -| value_loss | 5.24e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20649 | -| time_elapsed | 111657 | -| total_timesteps | 2643072 | -| train/ | | -| approx_kl | 0.009214312 | -| clip_fraction | 0.161 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.00966 | -| learning_rate | 0.0003 | -| loss | 0.00164 | -| n_updates | 206480 | -| policy_gradient_loss | 0.00475 | -| std | 0.00733 | -| value_loss | 4.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20650 | -| time_elapsed | 111665 | -| total_timesteps | 2643200 | -| train/ | | -| approx_kl | 0.042116247 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.772 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 206490 | -| policy_gradient_loss | -0.00978 | -| std | 0.00732 | -| value_loss | 0.00659 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20651 | -| time_elapsed | 111669 | -| total_timesteps | 2643328 | -| train/ | | -| approx_kl | 0.03686681 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.0034 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 206500 | -| policy_gradient_loss | 0.00737 | -| std | 0.00732 | -| value_loss | 2.92e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20652 | -| time_elapsed | 111675 | -| total_timesteps | 2643456 | -| train/ | | -| approx_kl | 0.0069393907 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.00831 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 206510 | -| policy_gradient_loss | 0.00329 | -| std | 0.00732 | -| value_loss | 5.09e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20653 | -| time_elapsed | 111680 | -| total_timesteps | 2643584 | -| train/ | | -| approx_kl | 0.029534379 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | 0.0362 | -| n_updates | 206520 | -| policy_gradient_loss | 0.115 | -| std | 0.00731 | -| value_loss | 5.25e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20654 | -| time_elapsed | 111684 | -| total_timesteps | 2643712 | -| train/ | | -| approx_kl | 0.08917356 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.0781 | -| n_updates | 206530 | -| policy_gradient_loss | 0.105 | -| std | 0.00731 | -| value_loss | 1.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20655 | -| time_elapsed | 111688 | -| total_timesteps | 2643840 | -| train/ | | -| approx_kl | 0.014896695 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 206540 | -| policy_gradient_loss | 0.021 | -| std | 0.00731 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 20656 | -| time_elapsed | 111692 | -| total_timesteps | 2643968 | -| train/ | | -| approx_kl | 0.0020898622 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.000469 | -| n_updates | 206550 | -| policy_gradient_loss | 0.025 | -| std | 0.0073 | -| value_loss | 3.48e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20657 | -| time_elapsed | 111695 | -| total_timesteps | 2644096 | -| train/ | | -| approx_kl | 0.102649644 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0928 | -| learning_rate | 0.0003 | -| loss | 0.0655 | -| n_updates | 206560 | -| policy_gradient_loss | 0.0146 | -| std | 0.00728 | -| value_loss | 0.000239 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20658 | -| time_elapsed | 111706 | -| total_timesteps | 2644224 | -| train/ | | -| approx_kl | 0.09606665 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.778 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 206570 | -| policy_gradient_loss | 0.00609 | -| std | 0.00728 | -| value_loss | 0.00574 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20659 | -| time_elapsed | 111711 | -| total_timesteps | 2644352 | -| train/ | | -| approx_kl | 0.018403355 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.00486 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 206580 | -| policy_gradient_loss | 0.0188 | -| std | 0.00728 | -| value_loss | 5.72e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20660 | -| time_elapsed | 111716 | -| total_timesteps | 2644480 | -| train/ | | -| approx_kl | 0.3345196 | -| clip_fraction | 0.646 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 206590 | -| policy_gradient_loss | 0.105 | -| std | 0.00728 | -| value_loss | 8.58e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20661 | -| time_elapsed | 111719 | -| total_timesteps | 2644608 | -| train/ | | -| approx_kl | 0.23930329 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 206600 | -| policy_gradient_loss | 0.132 | -| std | 0.00728 | -| value_loss | 4.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20662 | -| time_elapsed | 111723 | -| total_timesteps | 2644736 | -| train/ | | -| approx_kl | 0.116081476 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 206610 | -| policy_gradient_loss | 0.121 | -| std | 0.00728 | -| value_loss | 3.94e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20663 | -| time_elapsed | 111729 | -| total_timesteps | 2644864 | -| train/ | | -| approx_kl | 0.095990285 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0787 | -| n_updates | 206620 | -| policy_gradient_loss | 0.0874 | -| std | 0.00728 | -| value_loss | 2.94e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 20664 | -| time_elapsed | 111733 | -| total_timesteps | 2644992 | -| train/ | | -| approx_kl | 0.10666618 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 206630 | -| policy_gradient_loss | 0.0922 | -| std | 0.00728 | -| value_loss | 2.22e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20665 | -| time_elapsed | 111738 | -| total_timesteps | 2645120 | -| train/ | | -| approx_kl | 0.019101117 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0051 | -| n_updates | 206640 | -| policy_gradient_loss | 0.0148 | -| std | 0.00728 | -| value_loss | 1.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20666 | -| time_elapsed | 111749 | -| total_timesteps | 2645248 | -| train/ | | -| approx_kl | 0.43379354 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.953 | -| learning_rate | 0.0003 | -| loss | 0.226 | -| n_updates | 206650 | -| policy_gradient_loss | 0.0619 | -| std | 0.00728 | -| value_loss | 0.000514 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20667 | -| time_elapsed | 111754 | -| total_timesteps | 2645376 | -| train/ | | -| approx_kl | 0.0049824296 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 206660 | -| policy_gradient_loss | 0.0021 | -| std | 0.00728 | -| value_loss | 2.26e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20668 | -| time_elapsed | 111758 | -| total_timesteps | 2645504 | -| train/ | | -| approx_kl | 0.026707415 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.00317 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 206670 | -| policy_gradient_loss | 0.00251 | -| std | 0.00728 | -| value_loss | 3.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20669 | -| time_elapsed | 111764 | -| total_timesteps | 2645632 | -| train/ | | -| approx_kl | 0.065156445 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0934 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 206680 | -| policy_gradient_loss | 0.128 | -| std | 0.00727 | -| value_loss | 1.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20670 | -| time_elapsed | 111768 | -| total_timesteps | 2645760 | -| train/ | | -| approx_kl | 0.015957456 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0643 | -| learning_rate | 0.0003 | -| loss | -0.000393 | -| n_updates | 206690 | -| policy_gradient_loss | 0.0207 | -| std | 0.00727 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 20671 | -| time_elapsed | 111773 | -| total_timesteps | 2645888 | -| train/ | | -| approx_kl | 8.798065e-05 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.000243 | -| n_updates | 206700 | -| policy_gradient_loss | 0.0281 | -| std | 0.00728 | -| value_loss | 1e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20672 | -| time_elapsed | 111776 | -| total_timesteps | 2646016 | -| train/ | | -| approx_kl | 0.0010273764 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 206710 | -| policy_gradient_loss | 0.0247 | -| std | 0.00728 | -| value_loss | 5.53e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20673 | -| time_elapsed | 111788 | -| total_timesteps | 2646144 | -| train/ | | -| approx_kl | 0.15721822 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | 0.00245 | -| n_updates | 206720 | -| policy_gradient_loss | -0.00953 | -| std | 0.00728 | -| value_loss | 0.00131 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20674 | -| time_elapsed | 111792 | -| total_timesteps | 2646272 | -| train/ | | -| approx_kl | 0.020345181 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 206730 | -| policy_gradient_loss | 0.0205 | -| std | 0.00728 | -| value_loss | 8.59e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20675 | -| time_elapsed | 111797 | -| total_timesteps | 2646400 | -| train/ | | -| approx_kl | 0.2345157 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.00778 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 206740 | -| policy_gradient_loss | 0.121 | -| std | 0.00728 | -| value_loss | 1.56e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20676 | -| time_elapsed | 111803 | -| total_timesteps | 2646528 | -| train/ | | -| approx_kl | 0.17201754 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 206750 | -| policy_gradient_loss | 0.11 | -| std | 0.00728 | -| value_loss | 1.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20677 | -| time_elapsed | 111808 | -| total_timesteps | 2646656 | -| train/ | | -| approx_kl | 0.026463607 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 206760 | -| policy_gradient_loss | 0.0235 | -| std | 0.00728 | -| value_loss | 7.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20678 | -| time_elapsed | 111812 | -| total_timesteps | 2646784 | -| train/ | | -| approx_kl | 0.13745734 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 206770 | -| policy_gradient_loss | 0.0155 | -| std | 0.00728 | -| value_loss | 4.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 20679 | -| time_elapsed | 111817 | -| total_timesteps | 2646912 | -| train/ | | -| approx_kl | 0.012372242 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0689 | -| learning_rate | 0.0003 | -| loss | 0.00293 | -| n_updates | 206780 | -| policy_gradient_loss | 0.00103 | -| std | 0.00729 | -| value_loss | 3.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20680 | -| time_elapsed | 111822 | -| total_timesteps | 2647040 | -| train/ | | -| approx_kl | 0.020143388 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0946 | -| learning_rate | 0.0003 | -| loss | 0.00311 | -| n_updates | 206790 | -| policy_gradient_loss | 0.0223 | -| std | 0.00729 | -| value_loss | 3.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20681 | -| time_elapsed | 111831 | -| total_timesteps | 2647168 | -| train/ | | -| approx_kl | 0.10954503 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.798 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 206800 | -| policy_gradient_loss | 0.0149 | -| std | 0.00728 | -| value_loss | 0.00596 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20682 | -| time_elapsed | 111836 | -| total_timesteps | 2647296 | -| train/ | | -| approx_kl | 0.11965724 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 206810 | -| policy_gradient_loss | 0.0196 | -| std | 0.00729 | -| value_loss | 8.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20683 | -| time_elapsed | 111841 | -| total_timesteps | 2647424 | -| train/ | | -| approx_kl | 0.01727767 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.00872 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 206820 | -| policy_gradient_loss | 0.0102 | -| std | 0.00729 | -| value_loss | 1.7e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20684 | -| time_elapsed | 111845 | -| total_timesteps | 2647552 | -| train/ | | -| approx_kl | 0.22048914 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 206830 | -| policy_gradient_loss | 0.113 | -| std | 0.0073 | -| value_loss | 9.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20685 | -| time_elapsed | 111850 | -| total_timesteps | 2647680 | -| train/ | | -| approx_kl | 0.045699567 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0699 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 206840 | -| policy_gradient_loss | 0.0254 | -| std | 0.00729 | -| value_loss | 2.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20686 | -| time_elapsed | 111855 | -| total_timesteps | 2647808 | -| train/ | | -| approx_kl | 0.13522041 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.373 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 206850 | -| policy_gradient_loss | 0.0169 | -| std | 0.00728 | -| value_loss | 3.58e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20687 | -| time_elapsed | 111861 | -| total_timesteps | 2647936 | -| train/ | | -| approx_kl | 0.013127422 | -| clip_fraction | 0.0945 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | 0.00687 | -| learning_rate | 0.0003 | -| loss | -0.00122 | -| n_updates | 206860 | -| policy_gradient_loss | -0.000819 | -| std | 0.00728 | -| value_loss | 4.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20688 | -| time_elapsed | 111866 | -| total_timesteps | 2648064 | -| train/ | | -| approx_kl | 0.012834325 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.5 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 206870 | -| policy_gradient_loss | -0.00721 | -| std | 0.00727 | -| value_loss | 1.44e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20689 | -| time_elapsed | 111877 | -| total_timesteps | 2648192 | -| train/ | | -| approx_kl | 0.09881989 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 206880 | -| policy_gradient_loss | 0.00805 | -| std | 0.00727 | -| value_loss | 0.000197 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20690 | -| time_elapsed | 111883 | -| total_timesteps | 2648320 | -| train/ | | -| approx_kl | 0.03949327 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0929 | -| learning_rate | 0.0003 | -| loss | 0.00985 | -| n_updates | 206890 | -| policy_gradient_loss | 0.0195 | -| std | 0.00727 | -| value_loss | 4.1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20691 | -| time_elapsed | 111887 | -| total_timesteps | 2648448 | -| train/ | | -| approx_kl | 0.021690974 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.009 | -| learning_rate | 0.0003 | -| loss | 0.00323 | -| n_updates | 206900 | -| policy_gradient_loss | 0.0187 | -| std | 0.00726 | -| value_loss | 6.97e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20692 | -| time_elapsed | 111892 | -| total_timesteps | 2648576 | -| train/ | | -| approx_kl | 0.3275364 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.054 | -| n_updates | 206910 | -| policy_gradient_loss | 0.0227 | -| std | 0.00726 | -| value_loss | 5.52e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20693 | -| time_elapsed | 111896 | -| total_timesteps | 2648704 | -| train/ | | -| approx_kl | 0.05349958 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 206920 | -| policy_gradient_loss | 0.0533 | -| std | 0.00726 | -| value_loss | 5.02e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20694 | -| time_elapsed | 111899 | -| total_timesteps | 2648832 | -| train/ | | -| approx_kl | 0.1897928 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.0667 | -| n_updates | 206930 | -| policy_gradient_loss | 0.0343 | -| std | 0.00727 | -| value_loss | 1.62e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 20695 | -| time_elapsed | 111904 | -| total_timesteps | 2648960 | -| train/ | | -| approx_kl | 0.0010725814 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 206940 | -| policy_gradient_loss | 0.00763 | -| std | 0.00727 | -| value_loss | 1.12e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20696 | -| time_elapsed | 111909 | -| total_timesteps | 2649088 | -| train/ | | -| approx_kl | 2.6961789e-06 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0909 | -| learning_rate | 0.0003 | -| loss | -0.000246 | -| n_updates | 206950 | -| policy_gradient_loss | 0.0088 | -| std | 0.00725 | -| value_loss | 8.87e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20697 | -| time_elapsed | 111919 | -| total_timesteps | 2649216 | -| train/ | | -| approx_kl | 0.00022994727 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.00219 | -| n_updates | 206960 | -| policy_gradient_loss | -0.00263 | -| std | 0.00724 | -| value_loss | 0.000316 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20698 | -| time_elapsed | 111924 | -| total_timesteps | 2649344 | -| train/ | | -| approx_kl | 0.05106979 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 206970 | -| policy_gradient_loss | 0.0561 | -| std | 0.00724 | -| value_loss | 5.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20699 | -| time_elapsed | 111929 | -| total_timesteps | 2649472 | -| train/ | | -| approx_kl | 0.06682751 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.0115 | -| learning_rate | 0.0003 | -| loss | 0.0516 | -| n_updates | 206980 | -| policy_gradient_loss | 0.0227 | -| std | 0.00724 | -| value_loss | 8.54e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20700 | -| time_elapsed | 111935 | -| total_timesteps | 2649600 | -| train/ | | -| approx_kl | 0.049278583 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 206990 | -| policy_gradient_loss | 0.0428 | -| std | 0.00724 | -| value_loss | 2.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20701 | -| time_elapsed | 111940 | -| total_timesteps | 2649728 | -| train/ | | -| approx_kl | 0.064064845 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0709 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 207000 | -| policy_gradient_loss | 0.00722 | -| std | 0.00723 | -| value_loss | 5.8e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20702 | -| time_elapsed | 111944 | -| total_timesteps | 2649856 | -| train/ | | -| approx_kl | 0.0115814945 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -2.68 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 207010 | -| policy_gradient_loss | -0.00261 | -| std | 0.00722 | -| value_loss | 9.65e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 20703 | -| time_elapsed | 111949 | -| total_timesteps | 2649984 | -| train/ | | -| approx_kl | 0.022421677 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.00494 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 207020 | -| policy_gradient_loss | 0.12 | -| std | 0.00722 | -| value_loss | 2.85e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20704 | -| time_elapsed | 111954 | -| total_timesteps | 2650112 | -| train/ | | -| approx_kl | 0.077368945 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0883 | -| n_updates | 207030 | -| policy_gradient_loss | 0.0868 | -| std | 0.00721 | -| value_loss | 1.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20705 | -| time_elapsed | 111965 | -| total_timesteps | 2650240 | -| train/ | | -| approx_kl | 0.12015397 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 207040 | -| policy_gradient_loss | 0.0948 | -| std | 0.00721 | -| value_loss | 0.00424 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20706 | -| time_elapsed | 111971 | -| total_timesteps | 2650368 | -| train/ | | -| approx_kl | 0.023227796 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -6.42 | -| learning_rate | 0.0003 | -| loss | -0.00377 | -| n_updates | 207050 | -| policy_gradient_loss | 0.0113 | -| std | 0.00722 | -| value_loss | 1.86e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20707 | -| time_elapsed | 111977 | -| total_timesteps | 2650496 | -| train/ | | -| approx_kl | 0.053399984 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | -0.0323 | -| n_updates | 207060 | -| policy_gradient_loss | -0.0164 | -| std | 0.00722 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20708 | -| time_elapsed | 111981 | -| total_timesteps | 2650624 | -| train/ | | -| approx_kl | 0.0022909162 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | -0.00341 | -| n_updates | 207070 | -| policy_gradient_loss | 0.0174 | -| std | 0.00722 | -| value_loss | 2.21e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20709 | -| time_elapsed | 111986 | -| total_timesteps | 2650752 | -| train/ | | -| approx_kl | 0.14055806 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.0696 | -| n_updates | 207080 | -| policy_gradient_loss | 0.018 | -| std | 0.00722 | -| value_loss | 1.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 20710 | -| time_elapsed | 111991 | -| total_timesteps | 2650880 | -| train/ | | -| approx_kl | 0.014136497 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.000358 | -| n_updates | 207090 | -| policy_gradient_loss | -0.000235 | -| std | 0.00721 | -| value_loss | 8.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20711 | -| time_elapsed | 111996 | -| total_timesteps | 2651008 | -| train/ | | -| approx_kl | 0.019622112 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0829 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 207100 | -| policy_gradient_loss | 0.0136 | -| std | 0.00721 | -| value_loss | 6.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20712 | -| time_elapsed | 112007 | -| total_timesteps | 2651136 | -| train/ | | -| approx_kl | 0.03677278 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.000622 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 207110 | -| policy_gradient_loss | 0.0235 | -| std | 0.00721 | -| value_loss | 0.00228 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20713 | -| time_elapsed | 112012 | -| total_timesteps | 2651264 | -| train/ | | -| approx_kl | 0.0038677705 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.467 | -| learning_rate | 0.0003 | -| loss | 0.00881 | -| n_updates | 207120 | -| policy_gradient_loss | 0.0206 | -| std | 0.0072 | -| value_loss | 1.72e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20714 | -| time_elapsed | 112016 | -| total_timesteps | 2651392 | -| train/ | | -| approx_kl | 0.07251613 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -4.15 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 207130 | -| policy_gradient_loss | 0.0144 | -| std | 0.0072 | -| value_loss | 3.45e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20715 | -| time_elapsed | 112021 | -| total_timesteps | 2651520 | -| train/ | | -| approx_kl | 0.0036457404 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -4.01 | -| learning_rate | 0.0003 | -| loss | 0.00297 | -| n_updates | 207140 | -| policy_gradient_loss | 0.00368 | -| std | 0.0072 | -| value_loss | 2.08e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20716 | -| time_elapsed | 112026 | -| total_timesteps | 2651648 | -| train/ | | -| approx_kl | 0.14162311 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | 0.0803 | -| n_updates | 207150 | -| policy_gradient_loss | 0.108 | -| std | 0.0072 | -| value_loss | 2.07e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20717 | -| time_elapsed | 112029 | -| total_timesteps | 2651776 | -| train/ | | -| approx_kl | 0.0258506 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.00817 | -| n_updates | 207160 | -| policy_gradient_loss | 0.0163 | -| std | 0.0072 | -| value_loss | 9.59e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 20718 | -| time_elapsed | 112033 | -| total_timesteps | 2651904 | -| train/ | | -| approx_kl | 0.5169009 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 207170 | -| policy_gradient_loss | 0.0415 | -| std | 0.0072 | -| value_loss | 6.14e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20719 | -| time_elapsed | 112038 | -| total_timesteps | 2652032 | -| train/ | | -| approx_kl | 0.031121664 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 207180 | -| policy_gradient_loss | -0.00903 | -| std | 0.0072 | -| value_loss | 4.14e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20720 | -| time_elapsed | 112046 | -| total_timesteps | 2652160 | -| train/ | | -| approx_kl | 0.0041144593 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.831 | -| learning_rate | 0.0003 | -| loss | -0.00158 | -| n_updates | 207190 | -| policy_gradient_loss | 0.00127 | -| std | 0.0072 | -| value_loss | 0.00423 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20721 | -| time_elapsed | 112051 | -| total_timesteps | 2652288 | -| train/ | | -| approx_kl | 0.010652423 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | -0.00515 | -| n_updates | 207200 | -| policy_gradient_loss | 0.00231 | -| std | 0.0072 | -| value_loss | 1.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20722 | -| time_elapsed | 112057 | -| total_timesteps | 2652416 | -| train/ | | -| approx_kl | 0.062779985 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 207210 | -| policy_gradient_loss | 0.00943 | -| std | 0.0072 | -| value_loss | 3.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20723 | -| time_elapsed | 112062 | -| total_timesteps | 2652544 | -| train/ | | -| approx_kl | 0.036429502 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | 0.00019 | -| n_updates | 207220 | -| policy_gradient_loss | 0.00121 | -| std | 0.0072 | -| value_loss | 2.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20724 | -| time_elapsed | 112067 | -| total_timesteps | 2652672 | -| train/ | | -| approx_kl | 0.006213833 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 207230 | -| policy_gradient_loss | 0.0042 | -| std | 0.0072 | -| value_loss | 1.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20725 | -| time_elapsed | 112072 | -| total_timesteps | 2652800 | -| train/ | | -| approx_kl | 0.031357132 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 207240 | -| policy_gradient_loss | 0.0863 | -| std | 0.0072 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 20726 | -| time_elapsed | 112076 | -| total_timesteps | 2652928 | -| train/ | | -| approx_kl | 0.010218654 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.0049 | -| n_updates | 207250 | -| policy_gradient_loss | 0.0287 | -| std | 0.0072 | -| value_loss | 8.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20727 | -| time_elapsed | 112082 | -| total_timesteps | 2653056 | -| train/ | | -| approx_kl | 0.122770295 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 207260 | -| policy_gradient_loss | 0.0106 | -| std | 0.0072 | -| value_loss | 5.78e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20728 | -| time_elapsed | 112090 | -| total_timesteps | 2653184 | -| train/ | | -| approx_kl | 0.007001526 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 207270 | -| policy_gradient_loss | 0.00741 | -| std | 0.0072 | -| value_loss | 0.00189 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20729 | -| time_elapsed | 112095 | -| total_timesteps | 2653312 | -| train/ | | -| approx_kl | 0.19725528 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.00361 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 207280 | -| policy_gradient_loss | 0.11 | -| std | 0.0072 | -| value_loss | 5.59e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20730 | -| time_elapsed | 112099 | -| total_timesteps | 2653440 | -| train/ | | -| approx_kl | 0.0469771 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.00279 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 207290 | -| policy_gradient_loss | 0.0273 | -| std | 0.0072 | -| value_loss | 1.15e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20731 | -| time_elapsed | 112103 | -| total_timesteps | 2653568 | -| train/ | | -| approx_kl | 0.4004275 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 207300 | -| policy_gradient_loss | 0.0373 | -| std | 0.0072 | -| value_loss | 8.22e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20732 | -| time_elapsed | 112108 | -| total_timesteps | 2653696 | -| train/ | | -| approx_kl | 0.03307287 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 207310 | -| policy_gradient_loss | 0.00791 | -| std | 0.0072 | -| value_loss | 5.15e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20733 | -| time_elapsed | 112113 | -| total_timesteps | 2653824 | -| train/ | | -| approx_kl | 0.051712494 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 207320 | -| policy_gradient_loss | 0.0171 | -| std | 0.0072 | -| value_loss | 3.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 20734 | -| time_elapsed | 112118 | -| total_timesteps | 2653952 | -| train/ | | -| approx_kl | 0.00712193 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.084 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 207330 | -| policy_gradient_loss | 0.000917 | -| std | 0.0072 | -| value_loss | 2.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20735 | -| time_elapsed | 112123 | -| total_timesteps | 2654080 | -| train/ | | -| approx_kl | 0.028084466 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 207340 | -| policy_gradient_loss | 0.0945 | -| std | 0.0072 | -| value_loss | 1.43e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20736 | -| time_elapsed | 112133 | -| total_timesteps | 2654208 | -| train/ | | -| approx_kl | 0.09064084 | -| clip_fraction | 0.671 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 207350 | -| policy_gradient_loss | 0.076 | -| std | 0.0072 | -| value_loss | 0.00297 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20737 | -| time_elapsed | 112136 | -| total_timesteps | 2654336 | -| train/ | | -| approx_kl | 0.09071844 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.51 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0795 | -| n_updates | 207360 | -| policy_gradient_loss | 0.0997 | -| std | 0.0072 | -| value_loss | 8.75e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20738 | -| time_elapsed | 112140 | -| total_timesteps | 2654464 | -| train/ | | -| approx_kl | 0.022026144 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 207370 | -| policy_gradient_loss | 0.0204 | -| std | 0.00719 | -| value_loss | 3.6e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20739 | -| time_elapsed | 112143 | -| total_timesteps | 2654592 | -| train/ | | -| approx_kl | 0.49445096 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.372 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 207380 | -| policy_gradient_loss | 0.0405 | -| std | 0.00719 | -| value_loss | 4.55e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20740 | -| time_elapsed | 112148 | -| total_timesteps | 2654720 | -| train/ | | -| approx_kl | 0.04293272 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.00876 | -| n_updates | 207390 | -| policy_gradient_loss | 0.00516 | -| std | 0.00719 | -| value_loss | 3.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20741 | -| time_elapsed | 112152 | -| total_timesteps | 2654848 | -| train/ | | -| approx_kl | 0.047075786 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 207400 | -| policy_gradient_loss | 0.0164 | -| std | 0.00719 | -| value_loss | 1.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20742 | -| time_elapsed | 112156 | -| total_timesteps | 2654976 | -| train/ | | -| approx_kl | 0.043729346 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.0253 | -| n_updates | 207410 | -| policy_gradient_loss | 0.0121 | -| std | 0.00718 | -| value_loss | 9.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20743 | -| time_elapsed | 112161 | -| total_timesteps | 2655104 | -| train/ | | -| approx_kl | 0.038109556 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0813 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 207420 | -| policy_gradient_loss | 0.00557 | -| std | 0.00718 | -| value_loss | 6.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20744 | -| time_elapsed | 112173 | -| total_timesteps | 2655232 | -| train/ | | -| approx_kl | 0.008920211 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -2.57 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 207430 | -| policy_gradient_loss | -0.0117 | -| std | 0.00718 | -| value_loss | 0.00427 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20745 | -| time_elapsed | 112178 | -| total_timesteps | 2655360 | -| train/ | | -| approx_kl | 0.00969369 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.588 | -| learning_rate | 0.0003 | -| loss | 0.00805 | -| n_updates | 207440 | -| policy_gradient_loss | 0.0121 | -| std | 0.00717 | -| value_loss | 7.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20746 | -| time_elapsed | 112183 | -| total_timesteps | 2655488 | -| train/ | | -| approx_kl | 0.06745993 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -2.44 | -| learning_rate | 0.0003 | -| loss | 0.00967 | -| n_updates | 207450 | -| policy_gradient_loss | 0.0181 | -| std | 0.00716 | -| value_loss | 6.59e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20747 | -| time_elapsed | 112188 | -| total_timesteps | 2655616 | -| train/ | | -| approx_kl | 0.10951142 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -129 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 207460 | -| policy_gradient_loss | 0.0234 | -| std | 0.00715 | -| value_loss | 3.89e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20748 | -| time_elapsed | 112193 | -| total_timesteps | 2655744 | -| train/ | | -| approx_kl | 0.0033090957 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.00539 | -| n_updates | 207470 | -| policy_gradient_loss | 0.00705 | -| std | 0.00715 | -| value_loss | 4.64e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20749 | -| time_elapsed | 112198 | -| total_timesteps | 2655872 | -| train/ | | -| approx_kl | 0.20101207 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 207480 | -| policy_gradient_loss | 0.0311 | -| std | 0.00715 | -| value_loss | 4.37e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20750 | -| time_elapsed | 112204 | -| total_timesteps | 2656000 | -| train/ | | -| approx_kl | 0.0022101905 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00793 | -| n_updates | 207490 | -| policy_gradient_loss | 0.00259 | -| std | 0.00715 | -| value_loss | 5.33e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20751 | -| time_elapsed | 112208 | -| total_timesteps | 2656128 | -| train/ | | -| approx_kl | 0.04358718 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.0086 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 207500 | -| policy_gradient_loss | 0.0192 | -| std | 0.00715 | -| value_loss | 2.41e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20752 | -| time_elapsed | 112219 | -| total_timesteps | 2656256 | -| train/ | | -| approx_kl | 0.03371045 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.0631 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 207510 | -| policy_gradient_loss | 0.0238 | -| std | 0.00715 | -| value_loss | 0.0024 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20753 | -| time_elapsed | 112224 | -| total_timesteps | 2656384 | -| train/ | | -| approx_kl | 0.50934625 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -2.65 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 207520 | -| policy_gradient_loss | 0.0492 | -| std | 0.00715 | -| value_loss | 2.43e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20754 | -| time_elapsed | 112228 | -| total_timesteps | 2656512 | -| train/ | | -| approx_kl | 0.031619515 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.539 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 207530 | -| policy_gradient_loss | -0.000241 | -| std | 0.00715 | -| value_loss | 9e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20755 | -| time_elapsed | 112234 | -| total_timesteps | 2656640 | -| train/ | | -| approx_kl | 0.044051442 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 207540 | -| policy_gradient_loss | -0.003 | -| std | 0.00715 | -| value_loss | 1.64e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20756 | -| time_elapsed | 112239 | -| total_timesteps | 2656768 | -| train/ | | -| approx_kl | 0.009587809 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 207550 | -| policy_gradient_loss | 0.00552 | -| std | 0.00715 | -| value_loss | 1.08e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 20757 | -| time_elapsed | 112244 | -| total_timesteps | 2656896 | -| train/ | | -| approx_kl | 0.094055295 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.00821 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 207560 | -| policy_gradient_loss | 0.00805 | -| std | 0.00715 | -| value_loss | 9.05e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20758 | -| time_elapsed | 112249 | -| total_timesteps | 2657024 | -| train/ | | -| approx_kl | 0.0068938863 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 207570 | -| policy_gradient_loss | 0.00734 | -| std | 0.00715 | -| value_loss | 5.39e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20759 | -| time_elapsed | 112258 | -| total_timesteps | 2657152 | -| train/ | | -| approx_kl | 0.17497738 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | 0.0351 | -| n_updates | 207580 | -| policy_gradient_loss | -0.00369 | -| std | 0.00714 | -| value_loss | 5.99e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20760 | -| time_elapsed | 112263 | -| total_timesteps | 2657280 | -| train/ | | -| approx_kl | 0.1663972 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.0702 | -| n_updates | 207590 | -| policy_gradient_loss | 0.0164 | -| std | 0.00714 | -| value_loss | 7.44e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20761 | -| time_elapsed | 112267 | -| total_timesteps | 2657408 | -| train/ | | -| approx_kl | 0.017578356 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 207600 | -| policy_gradient_loss | 0.0293 | -| std | 0.00713 | -| value_loss | 6.3e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20762 | -| time_elapsed | 112271 | -| total_timesteps | 2657536 | -| train/ | | -| approx_kl | 0.31544492 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.00192 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 207610 | -| policy_gradient_loss | 0.164 | -| std | 0.00713 | -| value_loss | 1.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20763 | -| time_elapsed | 112276 | -| total_timesteps | 2657664 | -| train/ | | -| approx_kl | 0.038736045 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0792 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 207620 | -| policy_gradient_loss | 0.0147 | -| std | 0.00713 | -| value_loss | 1.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20764 | -| time_elapsed | 112280 | -| total_timesteps | 2657792 | -| train/ | | -| approx_kl | 0.48876923 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 207630 | -| policy_gradient_loss | 0.0487 | -| std | 0.00713 | -| value_loss | 9.76e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 20765 | -| time_elapsed | 112285 | -| total_timesteps | 2657920 | -| train/ | | -| approx_kl | 0.041287612 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 207640 | -| policy_gradient_loss | 0.00873 | -| std | 0.00714 | -| value_loss | 6.74e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20766 | -| time_elapsed | 112289 | -| total_timesteps | 2658048 | -| train/ | | -| approx_kl | 0.043293625 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 207650 | -| policy_gradient_loss | 0.0107 | -| std | 0.00713 | -| value_loss | 4.52e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20767 | -| time_elapsed | 112297 | -| total_timesteps | 2658176 | -| train/ | | -| approx_kl | 0.046548396 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | 0.00244 | -| n_updates | 207660 | -| policy_gradient_loss | 0.00011 | -| std | 0.00713 | -| value_loss | 0.00493 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20768 | -| time_elapsed | 112302 | -| total_timesteps | 2658304 | -| train/ | | -| approx_kl | 0.04298565 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 207670 | -| policy_gradient_loss | 0.0148 | -| std | 0.00711 | -| value_loss | 1.3e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20769 | -| time_elapsed | 112307 | -| total_timesteps | 2658432 | -| train/ | | -| approx_kl | 0.0062597226 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 207680 | -| policy_gradient_loss | 0.00336 | -| std | 0.0071 | -| value_loss | 2.02e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20770 | -| time_elapsed | 112311 | -| total_timesteps | 2658560 | -| train/ | | -| approx_kl | 0.061887942 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 207690 | -| policy_gradient_loss | 0.0144 | -| std | 0.00708 | -| value_loss | 6.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20771 | -| time_elapsed | 112316 | -| total_timesteps | 2658688 | -| train/ | | -| approx_kl | 0.036974926 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.00944 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 207700 | -| policy_gradient_loss | 0.0101 | -| std | 0.00708 | -| value_loss | 1.62e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20772 | -| time_elapsed | 112321 | -| total_timesteps | 2658816 | -| train/ | | -| approx_kl | 0.0058559477 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 207710 | -| policy_gradient_loss | 0.00145 | -| std | 0.00708 | -| value_loss | 1.78e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 20773 | -| time_elapsed | 112325 | -| total_timesteps | 2658944 | -| train/ | | -| approx_kl | 0.025361944 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | 0.052 | -| n_updates | 207720 | -| policy_gradient_loss | 0.0782 | -| std | 0.00708 | -| value_loss | 6.14e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20774 | -| time_elapsed | 112329 | -| total_timesteps | 2659072 | -| train/ | | -| approx_kl | 0.0789582 | -| clip_fraction | 0.632 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 207730 | -| policy_gradient_loss | 0.0917 | -| std | 0.00709 | -| value_loss | 2.21e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20775 | -| time_elapsed | 112338 | -| total_timesteps | 2659200 | -| train/ | | -| approx_kl | 0.0066061164 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.901 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 207740 | -| policy_gradient_loss | -0.000384 | -| std | 0.00709 | -| value_loss | 0.00204 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20776 | -| time_elapsed | 112342 | -| total_timesteps | 2659328 | -| train/ | | -| approx_kl | 0.49132267 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.214 | -| n_updates | 207750 | -| policy_gradient_loss | 0.0607 | -| std | 0.00709 | -| value_loss | 7.42e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20777 | -| time_elapsed | 112346 | -| total_timesteps | 2659456 | -| train/ | | -| approx_kl | 0.0055107493 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.00561 | -| learning_rate | 0.0003 | -| loss | -0.00736 | -| n_updates | 207760 | -| policy_gradient_loss | 0.00341 | -| std | 0.00709 | -| value_loss | 1.05e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20778 | -| time_elapsed | 112351 | -| total_timesteps | 2659584 | -| train/ | | -| approx_kl | 0.057285495 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0833 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 207770 | -| policy_gradient_loss | 0.00963 | -| std | 0.00709 | -| value_loss | 1.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20779 | -| time_elapsed | 112356 | -| total_timesteps | 2659712 | -| train/ | | -| approx_kl | 0.010495327 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 207780 | -| policy_gradient_loss | 0.00303 | -| std | 0.00709 | -| value_loss | 5.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20780 | -| time_elapsed | 112360 | -| total_timesteps | 2659840 | -| train/ | | -| approx_kl | 0.002196629 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 207790 | -| policy_gradient_loss | 0.00465 | -| std | 0.00709 | -| value_loss | 3.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 20781 | -| time_elapsed | 112364 | -| total_timesteps | 2659968 | -| train/ | | -| approx_kl | 0.036983624 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 207800 | -| policy_gradient_loss | 0.000274 | -| std | 0.00709 | -| value_loss | 3.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20782 | -| time_elapsed | 112369 | -| total_timesteps | 2660096 | -| train/ | | -| approx_kl | 0.090424076 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.0755 | -| n_updates | 207810 | -| policy_gradient_loss | 0.135 | -| std | 0.00709 | -| value_loss | 2.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20783 | -| time_elapsed | 112380 | -| total_timesteps | 2660224 | -| train/ | | -| approx_kl | 0.12293591 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -2.41 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 207820 | -| policy_gradient_loss | 0.0592 | -| std | 0.00709 | -| value_loss | 0.00417 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20784 | -| time_elapsed | 112385 | -| total_timesteps | 2660352 | -| train/ | | -| approx_kl | 0.16135019 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 207830 | -| policy_gradient_loss | 0.0713 | -| std | 0.00709 | -| value_loss | 4.02e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20785 | -| time_elapsed | 112390 | -| total_timesteps | 2660480 | -| train/ | | -| approx_kl | 0.095562294 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.00306 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 207840 | -| policy_gradient_loss | 0.0968 | -| std | 0.0071 | -| value_loss | 1.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20786 | -| time_elapsed | 112396 | -| total_timesteps | 2660608 | -| train/ | | -| approx_kl | 0.026047118 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0743 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 207850 | -| policy_gradient_loss | 0.0281 | -| std | 0.00709 | -| value_loss | 5.59e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20787 | -| time_elapsed | 112401 | -| total_timesteps | 2660736 | -| train/ | | -| approx_kl | 0.3947588 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.472 | -| learning_rate | 0.0003 | -| loss | 0.0915 | -| n_updates | 207860 | -| policy_gradient_loss | 0.0318 | -| std | 0.0071 | -| value_loss | 1.42e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20788 | -| time_elapsed | 112406 | -| total_timesteps | 2660864 | -| train/ | | -| approx_kl | 0.034643356 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 207870 | -| policy_gradient_loss | -0.00684 | -| std | 0.00711 | -| value_loss | 4.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 20789 | -| time_elapsed | 112412 | -| total_timesteps | 2660992 | -| train/ | | -| approx_kl | 0.006998687 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.00434 | -| n_updates | 207880 | -| policy_gradient_loss | 0.00855 | -| std | 0.00711 | -| value_loss | 1.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20790 | -| time_elapsed | 112416 | -| total_timesteps | 2661120 | -| train/ | | -| approx_kl | 0.063544095 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0847 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 207890 | -| policy_gradient_loss | 0.0299 | -| std | 0.00711 | -| value_loss | 9.33e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20791 | -| time_elapsed | 112429 | -| total_timesteps | 2661248 | -| train/ | | -| approx_kl | 0.14244363 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 207900 | -| policy_gradient_loss | 0.0173 | -| std | 0.00711 | -| value_loss | 0.00278 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20792 | -| time_elapsed | 112435 | -| total_timesteps | 2661376 | -| train/ | | -| approx_kl | 0.03750365 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.294 | -| learning_rate | 0.0003 | -| loss | 4.2e-05 | -| n_updates | 207910 | -| policy_gradient_loss | 0.0204 | -| std | 0.0071 | -| value_loss | 5.58e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20793 | -| time_elapsed | 112439 | -| total_timesteps | 2661504 | -| train/ | | -| approx_kl | 0.08440158 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0884 | -| n_updates | 207920 | -| policy_gradient_loss | 0.0505 | -| std | 0.0071 | -| value_loss | 9.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20794 | -| time_elapsed | 112444 | -| total_timesteps | 2661632 | -| train/ | | -| approx_kl | 0.030263055 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0767 | -| learning_rate | 0.0003 | -| loss | 0.00296 | -| n_updates | 207930 | -| policy_gradient_loss | 0.0252 | -| std | 0.0071 | -| value_loss | 6.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20795 | -| time_elapsed | 112448 | -| total_timesteps | 2661760 | -| train/ | | -| approx_kl | 0.11209333 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | 0.077 | -| n_updates | 207940 | -| policy_gradient_loss | 0.0552 | -| std | 0.00711 | -| value_loss | 9.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20796 | -| time_elapsed | 112452 | -| total_timesteps | 2661888 | -| train/ | | -| approx_kl | 0.011701953 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0063 | -| n_updates | 207950 | -| policy_gradient_loss | 0.00955 | -| std | 0.00711 | -| value_loss | 8.79e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20797 | -| time_elapsed | 112457 | -| total_timesteps | 2662016 | -| train/ | | -| approx_kl | 0.0007420657 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.00384 | -| n_updates | 207960 | -| policy_gradient_loss | 0.00237 | -| std | 0.00712 | -| value_loss | 2.06e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20798 | -| time_elapsed | 112469 | -| total_timesteps | 2662144 | -| train/ | | -| approx_kl | 0.0028771092 | -| clip_fraction | 0.167 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 207970 | -| policy_gradient_loss | -0.00404 | -| std | 0.00711 | -| value_loss | 0.00337 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20799 | -| time_elapsed | 112477 | -| total_timesteps | 2662272 | -| train/ | | -| approx_kl | 0.05421198 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 207980 | -| policy_gradient_loss | 0.0291 | -| std | 0.00711 | -| value_loss | 8.81e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20800 | -| time_elapsed | 112483 | -| total_timesteps | 2662400 | -| train/ | | -| approx_kl | 0.70025796 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.271 | -| n_updates | 207990 | -| policy_gradient_loss | 0.154 | -| std | 0.00711 | -| value_loss | 1.64e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20801 | -| time_elapsed | 112488 | -| total_timesteps | 2662528 | -| train/ | | -| approx_kl | 0.0050657815 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 208000 | -| policy_gradient_loss | 0.0208 | -| std | 0.00711 | -| value_loss | 8.16e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20802 | -| time_elapsed | 112492 | -| total_timesteps | 2662656 | -| train/ | | -| approx_kl | 0.059060458 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.00957 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 208010 | -| policy_gradient_loss | 0.0143 | -| std | 0.0071 | -| value_loss | 9.53e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20803 | -| time_elapsed | 112497 | -| total_timesteps | 2662784 | -| train/ | | -| approx_kl | 0.004006547 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 208020 | -| policy_gradient_loss | 0.00738 | -| std | 0.0071 | -| value_loss | 5.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 20804 | -| time_elapsed | 112504 | -| total_timesteps | 2662912 | -| train/ | | -| approx_kl | 0.040440787 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 208030 | -| policy_gradient_loss | 0.0184 | -| std | 0.0071 | -| value_loss | 1.75e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20805 | -| time_elapsed | 112508 | -| total_timesteps | 2663040 | -| train/ | | -| approx_kl | 0.0017155926 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.000208 | -| n_updates | 208040 | -| policy_gradient_loss | 0.0233 | -| std | 0.00709 | -| value_loss | 1.07e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20806 | -| time_elapsed | 112517 | -| total_timesteps | 2663168 | -| train/ | | -| approx_kl | 0.21736006 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -6.62 | -| learning_rate | 0.0003 | -| loss | 0.0897 | -| n_updates | 208050 | -| policy_gradient_loss | 0.053 | -| std | 0.00708 | -| value_loss | 0.00561 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20807 | -| time_elapsed | 112522 | -| total_timesteps | 2663296 | -| train/ | | -| approx_kl | 0.0039795875 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | -0.00771 | -| n_updates | 208060 | -| policy_gradient_loss | 0.0266 | -| std | 0.00708 | -| value_loss | 1.64e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20808 | -| time_elapsed | 112525 | -| total_timesteps | 2663424 | -| train/ | | -| approx_kl | 0.46833694 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.00675 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 208070 | -| policy_gradient_loss | 0.115 | -| std | 0.00708 | -| value_loss | 9.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20809 | -| time_elapsed | 112530 | -| total_timesteps | 2663552 | -| train/ | | -| approx_kl | 0.018739114 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0902 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 208080 | -| policy_gradient_loss | -0.00439 | -| std | 0.00709 | -| value_loss | 1.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20810 | -| time_elapsed | 112535 | -| total_timesteps | 2663680 | -| train/ | | -| approx_kl | 0.018224236 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 208090 | -| policy_gradient_loss | 0.0199 | -| std | 0.00709 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20811 | -| time_elapsed | 112540 | -| total_timesteps | 2663808 | -| train/ | | -| approx_kl | 0.23854765 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.00383 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 208100 | -| policy_gradient_loss | 0.134 | -| std | 0.0071 | -| value_loss | 3.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20812 | -| time_elapsed | 112545 | -| total_timesteps | 2663936 | -| train/ | | -| approx_kl | 0.15751162 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 208110 | -| policy_gradient_loss | 0.11 | -| std | 0.0071 | -| value_loss | 2.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20813 | -| time_elapsed | 112549 | -| total_timesteps | 2664064 | -| train/ | | -| approx_kl | 0.096276306 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | 0.0747 | -| n_updates | 208120 | -| policy_gradient_loss | 0.0771 | -| std | 0.0071 | -| value_loss | 1.4e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20814 | -| time_elapsed | 112558 | -| total_timesteps | 2664192 | -| train/ | | -| approx_kl | 0.18864454 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -5.16 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 208130 | -| policy_gradient_loss | 0.166 | -| std | 0.0071 | -| value_loss | 0.00511 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20815 | -| time_elapsed | 112563 | -| total_timesteps | 2664320 | -| train/ | | -| approx_kl | 0.12540144 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0745 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 208140 | -| policy_gradient_loss | 0.117 | -| std | 0.0071 | -| value_loss | 7.8e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20816 | -| time_elapsed | 112567 | -| total_timesteps | 2664448 | -| train/ | | -| approx_kl | 0.1418112 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.00898 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 208150 | -| policy_gradient_loss | 0.0889 | -| std | 0.0071 | -| value_loss | 1.67e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20817 | -| time_elapsed | 112573 | -| total_timesteps | 2664576 | -| train/ | | -| approx_kl | 0.0242203 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 208160 | -| policy_gradient_loss | 0.0138 | -| std | 0.0071 | -| value_loss | 9.19e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20818 | -| time_elapsed | 112578 | -| total_timesteps | 2664704 | -| train/ | | -| approx_kl | 0.12522005 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.0773 | -| n_updates | 208170 | -| policy_gradient_loss | 0.0192 | -| std | 0.0071 | -| value_loss | 6.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20819 | -| time_elapsed | 112583 | -| total_timesteps | 2664832 | -| train/ | | -| approx_kl | 0.012963368 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.00556 | -| n_updates | 208180 | -| policy_gradient_loss | 0.00212 | -| std | 0.0071 | -| value_loss | 3.94e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 20820 | -| time_elapsed | 112586 | -| total_timesteps | 2664960 | -| train/ | | -| approx_kl | 0.016737277 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0847 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 208190 | -| policy_gradient_loss | 0.00807 | -| std | 0.0071 | -| value_loss | 5.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20821 | -| time_elapsed | 112591 | -| total_timesteps | 2665088 | -| train/ | | -| approx_kl | 0.20871359 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 208200 | -| policy_gradient_loss | 0.0816 | -| std | 0.0071 | -| value_loss | 1.63e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20822 | -| time_elapsed | 112600 | -| total_timesteps | 2665216 | -| train/ | | -| approx_kl | 0.14877006 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.687 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 208210 | -| policy_gradient_loss | 0.0139 | -| std | 0.0071 | -| value_loss | 0.00349 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20823 | -| time_elapsed | 112605 | -| total_timesteps | 2665344 | -| train/ | | -| approx_kl | 0.14311633 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | 0.0729 | -| n_updates | 208220 | -| policy_gradient_loss | 0.0747 | -| std | 0.00711 | -| value_loss | 7.97e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20824 | -| time_elapsed | 112610 | -| total_timesteps | 2665472 | -| train/ | | -| approx_kl | 0.10685794 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.72 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 208230 | -| policy_gradient_loss | 0.0718 | -| std | 0.00711 | -| value_loss | 3.23e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20825 | -| time_elapsed | 112615 | -| total_timesteps | 2665600 | -| train/ | | -| approx_kl | 0.023267124 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.333 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 208240 | -| policy_gradient_loss | 0.0189 | -| std | 0.00711 | -| value_loss | 2.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20826 | -| time_elapsed | 112620 | -| total_timesteps | 2665728 | -| train/ | | -| approx_kl | 0.001453144 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.000331 | -| n_updates | 208250 | -| policy_gradient_loss | 0.0237 | -| std | 0.00711 | -| value_loss | 1.05e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20827 | -| time_elapsed | 112625 | -| total_timesteps | 2665856 | -| train/ | | -| approx_kl | 0.6457578 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 208260 | -| policy_gradient_loss | 0.0519 | -| std | 0.0071 | -| value_loss | 4.28e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20828 | -| time_elapsed | 112631 | -| total_timesteps | 2665984 | -| train/ | | -| approx_kl | 0.0002565994 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.00248 | -| n_updates | 208270 | -| policy_gradient_loss | -0.000759 | -| std | 0.0071 | -| value_loss | 2.28e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20829 | -| time_elapsed | 112636 | -| total_timesteps | 2666112 | -| train/ | | -| approx_kl | 0.006432472 | -| clip_fraction | 0.168 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 6.49e-05 | -| n_updates | 208280 | -| policy_gradient_loss | 0.00407 | -| std | 0.00711 | -| value_loss | 2.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20830 | -| time_elapsed | 112649 | -| total_timesteps | 2666240 | -| train/ | | -| approx_kl | 0.011142716 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.863 | -| learning_rate | 0.0003 | -| loss | -0.0297 | -| n_updates | 208290 | -| policy_gradient_loss | -0.0119 | -| std | 0.00711 | -| value_loss | 0.00308 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20831 | -| time_elapsed | 112655 | -| total_timesteps | 2666368 | -| train/ | | -| approx_kl | 0.0049858647 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.285 | -| learning_rate | 0.0003 | -| loss | -0.000801 | -| n_updates | 208300 | -| policy_gradient_loss | 0.00505 | -| std | 0.00712 | -| value_loss | 7.63e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20832 | -| time_elapsed | 112659 | -| total_timesteps | 2666496 | -| train/ | | -| approx_kl | 0.0012194319 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.00195 | -| n_updates | 208310 | -| policy_gradient_loss | 0.011 | -| std | 0.00712 | -| value_loss | 3.96e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20833 | -| time_elapsed | 112664 | -| total_timesteps | 2666624 | -| train/ | | -| approx_kl | 0.039264567 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 208320 | -| policy_gradient_loss | 0.00535 | -| std | 0.00712 | -| value_loss | 4.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20834 | -| time_elapsed | 112670 | -| total_timesteps | 2666752 | -| train/ | | -| approx_kl | 0.042105086 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 208330 | -| policy_gradient_loss | -0.00764 | -| std | 0.00712 | -| value_loss | 2.28e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 20835 | -| time_elapsed | 112675 | -| total_timesteps | 2666880 | -| train/ | | -| approx_kl | 0.0073244697 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.00116 | -| n_updates | 208340 | -| policy_gradient_loss | 0.00741 | -| std | 0.00712 | -| value_loss | 1.29e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20836 | -| time_elapsed | 112680 | -| total_timesteps | 2667008 | -| train/ | | -| approx_kl | 0.05420421 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 208350 | -| policy_gradient_loss | 0.00656 | -| std | 0.00712 | -| value_loss | 5.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20837 | -| time_elapsed | 112693 | -| total_timesteps | 2667136 | -| train/ | | -| approx_kl | 0.049864896 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 208360 | -| policy_gradient_loss | -0.0191 | -| std | 0.00712 | -| value_loss | 0.0011 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20838 | -| time_elapsed | 112698 | -| total_timesteps | 2667264 | -| train/ | | -| approx_kl | 0.00037628273 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.81 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 208370 | -| policy_gradient_loss | -0.00421 | -| std | 0.00712 | -| value_loss | 2.69e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20839 | -| time_elapsed | 112702 | -| total_timesteps | 2667392 | -| train/ | | -| approx_kl | 0.032873288 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 208380 | -| policy_gradient_loss | 0.00549 | -| std | 0.00712 | -| value_loss | 8.02e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20840 | -| time_elapsed | 112706 | -| total_timesteps | 2667520 | -| train/ | | -| approx_kl | 0.0065772235 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 208390 | -| policy_gradient_loss | 0.00141 | -| std | 0.00712 | -| value_loss | 4.79e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20841 | -| time_elapsed | 112711 | -| total_timesteps | 2667648 | -| train/ | | -| approx_kl | 0.06155673 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 208400 | -| policy_gradient_loss | 0.00792 | -| std | 0.00713 | -| value_loss | 2.39e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20842 | -| time_elapsed | 112715 | -| total_timesteps | 2667776 | -| train/ | | -| approx_kl | 0.08359943 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 208410 | -| policy_gradient_loss | 0.00373 | -| std | 0.00713 | -| value_loss | 4.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 20843 | -| time_elapsed | 112721 | -| total_timesteps | 2667904 | -| train/ | | -| approx_kl | 0.024271587 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.00539 | -| n_updates | 208420 | -| policy_gradient_loss | 0.00412 | -| std | 0.00713 | -| value_loss | 1.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20844 | -| time_elapsed | 112726 | -| total_timesteps | 2668032 | -| train/ | | -| approx_kl | 0.004760889 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | 0.000605 | -| n_updates | 208430 | -| policy_gradient_loss | 0.00582 | -| std | 0.00713 | -| value_loss | 2.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20845 | -| time_elapsed | 112736 | -| total_timesteps | 2668160 | -| train/ | | -| approx_kl | 0.028568733 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 208440 | -| policy_gradient_loss | -0.0118 | -| std | 0.00713 | -| value_loss | 0.00279 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20846 | -| time_elapsed | 112741 | -| total_timesteps | 2668288 | -| train/ | | -| approx_kl | 0.042999312 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.0304 | -| learning_rate | 0.0003 | -| loss | 0.00943 | -| n_updates | 208450 | -| policy_gradient_loss | 0.0277 | -| std | 0.00713 | -| value_loss | 1.68e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20847 | -| time_elapsed | 112745 | -| total_timesteps | 2668416 | -| train/ | | -| approx_kl | 0.664032 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.484 | -| learning_rate | 0.0003 | -| loss | 0.235 | -| n_updates | 208460 | -| policy_gradient_loss | 0.114 | -| std | 0.00713 | -| value_loss | 4.69e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20848 | -| time_elapsed | 112748 | -| total_timesteps | 2668544 | -| train/ | | -| approx_kl | 0.031025337 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.37 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 208470 | -| policy_gradient_loss | -0.00408 | -| std | 0.00713 | -| value_loss | 8.47e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20849 | -| time_elapsed | 112753 | -| total_timesteps | 2668672 | -| train/ | | -| approx_kl | 0.015407672 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | 0.00445 | -| n_updates | 208480 | -| policy_gradient_loss | 0.0339 | -| std | 0.00713 | -| value_loss | 4.64e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20850 | -| time_elapsed | 112757 | -| total_timesteps | 2668800 | -| train/ | | -| approx_kl | 0.17915565 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 208490 | -| policy_gradient_loss | 0.112 | -| std | 0.00713 | -| value_loss | 3.49e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 20851 | -| time_elapsed | 112763 | -| total_timesteps | 2668928 | -| train/ | | -| approx_kl | 0.16469155 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.056 | -| learning_rate | 0.0003 | -| loss | 0.0743 | -| n_updates | 208500 | -| policy_gradient_loss | 0.0709 | -| std | 0.00714 | -| value_loss | 2.04e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20852 | -| time_elapsed | 112768 | -| total_timesteps | 2669056 | -| train/ | | -| approx_kl | 0.122270666 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.07 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 208510 | -| policy_gradient_loss | 0.125 | -| std | 0.00714 | -| value_loss | 1.38e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20853 | -| time_elapsed | 112777 | -| total_timesteps | 2669184 | -| train/ | | -| approx_kl | 0.013011583 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 208520 | -| policy_gradient_loss | -0.0121 | -| std | 0.00714 | -| value_loss | 0.000282 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20854 | -| time_elapsed | 112783 | -| total_timesteps | 2669312 | -| train/ | | -| approx_kl | 0.013566135 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.552 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 208530 | -| policy_gradient_loss | 0.0174 | -| std | 0.00714 | -| value_loss | 5.11e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20855 | -| time_elapsed | 112787 | -| total_timesteps | 2669440 | -| train/ | | -| approx_kl | 0.13697213 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -1.68 | -| learning_rate | 0.0003 | -| loss | 0.0934 | -| n_updates | 208540 | -| policy_gradient_loss | 0.038 | -| std | 0.00715 | -| value_loss | 3.04e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20856 | -| time_elapsed | 112793 | -| total_timesteps | 2669568 | -| train/ | | -| approx_kl | 0.00754605 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.425 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 208550 | -| policy_gradient_loss | 0.00589 | -| std | 0.00714 | -| value_loss | 1.47e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20857 | -| time_elapsed | 112798 | -| total_timesteps | 2669696 | -| train/ | | -| approx_kl | 0.13285777 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 208560 | -| policy_gradient_loss | 0.0211 | -| std | 0.00714 | -| value_loss | 8.87e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20858 | -| time_elapsed | 112803 | -| total_timesteps | 2669824 | -| train/ | | -| approx_kl | 0.0003128806 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.000161 | -| n_updates | 208570 | -| policy_gradient_loss | 0.026 | -| std | 0.00713 | -| value_loss | 7.21e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 20859 | -| time_elapsed | 112806 | -| total_timesteps | 2669952 | -| train/ | | -| approx_kl | 0.17043923 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.00627 | -| learning_rate | 0.0003 | -| loss | 0.0738 | -| n_updates | 208580 | -| policy_gradient_loss | 0.0239 | -| std | 0.00711 | -| value_loss | 7.76e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20860 | -| time_elapsed | 112810 | -| total_timesteps | 2670080 | -| train/ | | -| approx_kl | 0.015299792 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | 0.00731 | -| n_updates | 208590 | -| policy_gradient_loss | 0.0256 | -| std | 0.00711 | -| value_loss | 6.92e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20861 | -| time_elapsed | 112820 | -| total_timesteps | 2670208 | -| train/ | | -| approx_kl | 0.48862246 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.36 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 208600 | -| policy_gradient_loss | 0.0176 | -| std | 0.00711 | -| value_loss | 0.00243 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20862 | -| time_elapsed | 112825 | -| total_timesteps | 2670336 | -| train/ | | -| approx_kl | 0.09718711 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 208610 | -| policy_gradient_loss | 0.0255 | -| std | 0.00711 | -| value_loss | 1.41e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20863 | -| time_elapsed | 112831 | -| total_timesteps | 2670464 | -| train/ | | -| approx_kl | 5.3970143e-07 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 4.89e-06 | -| n_updates | 208620 | -| policy_gradient_loss | 0.0236 | -| std | 0.00711 | -| value_loss | 3.37e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20864 | -| time_elapsed | 112835 | -| total_timesteps | 2670592 | -| train/ | | -| approx_kl | 0.17579621 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.068 | -| n_updates | 208630 | -| policy_gradient_loss | 0.0198 | -| std | 0.00712 | -| value_loss | 2.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20865 | -| time_elapsed | 112839 | -| total_timesteps | 2670720 | -| train/ | | -| approx_kl | 0.014884198 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 208640 | -| policy_gradient_loss | 0.0202 | -| std | 0.00712 | -| value_loss | 1.03e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20866 | -| time_elapsed | 112844 | -| total_timesteps | 2670848 | -| train/ | | -| approx_kl | 0.24836819 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0761 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 208650 | -| policy_gradient_loss | 0.115 | -| std | 0.00712 | -| value_loss | 6.59e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 20867 | -| time_elapsed | 112848 | -| total_timesteps | 2670976 | -| train/ | | -| approx_kl | 0.04608345 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 208660 | -| policy_gradient_loss | 0.0323 | -| std | 0.00712 | -| value_loss | 3.63e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20868 | -| time_elapsed | 112852 | -| total_timesteps | 2671104 | -| train/ | | -| approx_kl | 0.13869385 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0678 | -| n_updates | 208670 | -| policy_gradient_loss | 0.019 | -| std | 0.00712 | -| value_loss | 2.46e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20869 | -| time_elapsed | 112862 | -| total_timesteps | 2671232 | -| train/ | | -| approx_kl | 0.017349778 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 208680 | -| policy_gradient_loss | 0.0033 | -| std | 0.00712 | -| value_loss | 0.00232 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20870 | -| time_elapsed | 112868 | -| total_timesteps | 2671360 | -| train/ | | -| approx_kl | 0.20330274 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.334 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 208690 | -| policy_gradient_loss | 0.11 | -| std | 0.00712 | -| value_loss | 9.86e-06 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20871 | -| time_elapsed | 112872 | -| total_timesteps | 2671488 | -| train/ | | -| approx_kl | 0.220403 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.0055 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 208700 | -| policy_gradient_loss | 0.146 | -| std | 0.00712 | -| value_loss | 1.26e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20872 | -| time_elapsed | 112876 | -| total_timesteps | 2671616 | -| train/ | | -| approx_kl | 0.12513849 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 208710 | -| policy_gradient_loss | 0.108 | -| std | 0.00712 | -| value_loss | 7.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20873 | -| time_elapsed | 112880 | -| total_timesteps | 2671744 | -| train/ | | -| approx_kl | 0.025729444 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 208720 | -| policy_gradient_loss | 0.0218 | -| std | 0.00712 | -| value_loss | 3.96e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 20874 | -| time_elapsed | 112886 | -| total_timesteps | 2671872 | -| train/ | | -| approx_kl | 0.15946053 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 208730 | -| policy_gradient_loss | 0.0169 | -| std | 0.00712 | -| value_loss | 2.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20875 | -| time_elapsed | 112891 | -| total_timesteps | 2672000 | -| train/ | | -| approx_kl | 0.011189818 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 208740 | -| policy_gradient_loss | -0.00179 | -| std | 0.00712 | -| value_loss | 2.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20876 | -| time_elapsed | 112897 | -| total_timesteps | 2672128 | -| train/ | | -| approx_kl | 0.012407608 | -| clip_fraction | 0.0875 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.00644 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 208750 | -| policy_gradient_loss | 0.000867 | -| std | 0.00713 | -| value_loss | 7.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20877 | -| time_elapsed | 112911 | -| total_timesteps | 2672256 | -| train/ | | -| approx_kl | 0.012096455 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.853 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 208760 | -| policy_gradient_loss | 0.00414 | -| std | 0.00715 | -| value_loss | 0.00324 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20878 | -| time_elapsed | 112917 | -| total_timesteps | 2672384 | -| train/ | | -| approx_kl | 0.08440108 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.095 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 208770 | -| policy_gradient_loss | 0.0261 | -| std | 0.00716 | -| value_loss | 7.22e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20879 | -| time_elapsed | 112921 | -| total_timesteps | 2672512 | -| train/ | | -| approx_kl | 2.777297e-05 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.000404 | -| n_updates | 208780 | -| policy_gradient_loss | 0.0204 | -| std | 0.00716 | -| value_loss | 1.36e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20880 | -| time_elapsed | 112926 | -| total_timesteps | 2672640 | -| train/ | | -| approx_kl | 0.16381116 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0991 | -| learning_rate | 0.0003 | -| loss | 0.0732 | -| n_updates | 208790 | -| policy_gradient_loss | 0.0192 | -| std | 0.00716 | -| value_loss | 8.76e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20881 | -| time_elapsed | 112930 | -| total_timesteps | 2672768 | -| train/ | | -| approx_kl | 0.1432711 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 208800 | -| policy_gradient_loss | 0.0121 | -| std | 0.00716 | -| value_loss | 1.33e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 20882 | -| time_elapsed | 112935 | -| total_timesteps | 2672896 | -| train/ | | -| approx_kl | 0.054543834 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 208810 | -| policy_gradient_loss | 0.02 | -| std | 0.00716 | -| value_loss | 3.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20883 | -| time_elapsed | 112940 | -| total_timesteps | 2673024 | -| train/ | | -| approx_kl | 0.030181503 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 208820 | -| policy_gradient_loss | 0.0235 | -| std | 0.00716 | -| value_loss | 4.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20884 | -| time_elapsed | 112951 | -| total_timesteps | 2673152 | -| train/ | | -| approx_kl | 0.0016896846 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.908 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 208830 | -| policy_gradient_loss | 0.00636 | -| std | 0.00716 | -| value_loss | 0.00163 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20885 | -| time_elapsed | 112957 | -| total_timesteps | 2673280 | -| train/ | | -| approx_kl | 0.009958519 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | -0.0072 | -| n_updates | 208840 | -| policy_gradient_loss | 0.0117 | -| std | 0.00716 | -| value_loss | 2.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20886 | -| time_elapsed | 112960 | -| total_timesteps | 2673408 | -| train/ | | -| approx_kl | 0.11808242 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0667 | -| n_updates | 208850 | -| policy_gradient_loss | 0.0109 | -| std | 0.00715 | -| value_loss | 2.85e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20887 | -| time_elapsed | 112965 | -| total_timesteps | 2673536 | -| train/ | | -| approx_kl | 0.0057587023 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.00928 | -| n_updates | 208860 | -| policy_gradient_loss | 0.015 | -| std | 0.00715 | -| value_loss | 1.72e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20888 | -| time_elapsed | 112970 | -| total_timesteps | 2673664 | -| train/ | | -| approx_kl | 0.013792386 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.000925 | -| n_updates | 208870 | -| policy_gradient_loss | -0.000805 | -| std | 0.00715 | -| value_loss | 6.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20889 | -| time_elapsed | 112973 | -| total_timesteps | 2673792 | -| train/ | | -| approx_kl | 0.010621764 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0961 | -| learning_rate | 0.0003 | -| loss | 0.00186 | -| n_updates | 208880 | -| policy_gradient_loss | 0.00039 | -| std | 0.00715 | -| value_loss | 2.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 20890 | -| time_elapsed | 112975 | -| total_timesteps | 2673920 | -| train/ | | -| approx_kl | 0.024019707 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 208890 | -| policy_gradient_loss | 0.0234 | -| std | 0.00715 | -| value_loss | 1.19e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20891 | -| time_elapsed | 112979 | -| total_timesteps | 2674048 | -| train/ | | -| approx_kl | 0.2091097 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 208900 | -| policy_gradient_loss | 0.119 | -| std | 0.00715 | -| value_loss | 3.05e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20892 | -| time_elapsed | 112988 | -| total_timesteps | 2674176 | -| train/ | | -| approx_kl | 0.038703322 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | 0.00578 | -| n_updates | 208910 | -| policy_gradient_loss | 0.0107 | -| std | 0.00715 | -| value_loss | 0.00184 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20893 | -| time_elapsed | 112993 | -| total_timesteps | 2674304 | -| train/ | | -| approx_kl | 0.18286358 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -3.41 | -| learning_rate | 0.0003 | -| loss | 0.0795 | -| n_updates | 208920 | -| policy_gradient_loss | 0.0201 | -| std | 0.00715 | -| value_loss | 4.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20894 | -| time_elapsed | 112998 | -| total_timesteps | 2674432 | -| train/ | | -| approx_kl | 0.010720324 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | -8.35e-05 | -| n_updates | 208930 | -| policy_gradient_loss | -0.000328 | -| std | 0.00714 | -| value_loss | 2.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20895 | -| time_elapsed | 113002 | -| total_timesteps | 2674560 | -| train/ | | -| approx_kl | 0.010460897 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0712 | -| learning_rate | 0.0003 | -| loss | -0.005 | -| n_updates | 208940 | -| policy_gradient_loss | -0.00275 | -| std | 0.00714 | -| value_loss | 3.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20896 | -| time_elapsed | 113007 | -| total_timesteps | 2674688 | -| train/ | | -| approx_kl | 0.010068218 | -| clip_fraction | 0.0742 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0146 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 208950 | -| policy_gradient_loss | -0.00233 | -| std | 0.00714 | -| value_loss | 9.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20897 | -| time_elapsed | 113011 | -| total_timesteps | 2674816 | -| train/ | | -| approx_kl | 0.008429866 | -| clip_fraction | 0.0547 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0844 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 208960 | -| policy_gradient_loss | -0.000683 | -| std | 0.00713 | -| value_loss | 7.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 20898 | -| time_elapsed | 113016 | -| total_timesteps | 2674944 | -| train/ | | -| approx_kl | 0.018020676 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.00573 | -| n_updates | 208970 | -| policy_gradient_loss | 0.0241 | -| std | 0.00713 | -| value_loss | 3.44e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20899 | -| time_elapsed | 113021 | -| total_timesteps | 2675072 | -| train/ | | -| approx_kl | 0.11790131 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 208980 | -| policy_gradient_loss | 0.0344 | -| std | 0.00714 | -| value_loss | 1.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20900 | -| time_elapsed | 113028 | -| total_timesteps | 2675200 | -| train/ | | -| approx_kl | 0.013791656 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | 0.834 | -| learning_rate | 0.0003 | -| loss | -0.0144 | -| n_updates | 208990 | -| policy_gradient_loss | -0.0108 | -| std | 0.00714 | -| value_loss | 0.00434 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20901 | -| time_elapsed | 113032 | -| total_timesteps | 2675328 | -| train/ | | -| approx_kl | 0.09355187 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 209000 | -| policy_gradient_loss | 0.00476 | -| std | 0.00713 | -| value_loss | 5.7e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20902 | -| time_elapsed | 113038 | -| total_timesteps | 2675456 | -| train/ | | -| approx_kl | 0.0279884 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 209010 | -| policy_gradient_loss | 0.00123 | -| std | 0.00713 | -| value_loss | 6.38e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20903 | -| time_elapsed | 113044 | -| total_timesteps | 2675584 | -| train/ | | -| approx_kl | 0.0044349693 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | -0.00986 | -| n_updates | 209020 | -| policy_gradient_loss | 0.00224 | -| std | 0.00713 | -| value_loss | 6.23e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20904 | -| time_elapsed | 113048 | -| total_timesteps | 2675712 | -| train/ | | -| approx_kl | 0.08115514 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.52 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 209030 | -| policy_gradient_loss | 0.00735 | -| std | 0.00713 | -| value_loss | 2.62e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20905 | -| time_elapsed | 113054 | -| total_timesteps | 2675840 | -| train/ | | -| approx_kl | 0.0059990897 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0088 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 209040 | -| policy_gradient_loss | 0.001 | -| std | 0.00711 | -| value_loss | 1.27e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20906 | -| time_elapsed | 113058 | -| total_timesteps | 2675968 | -| train/ | | -| approx_kl | 0.019904673 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.00775 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 209050 | -| policy_gradient_loss | 0.0263 | -| std | 0.00708 | -| value_loss | 6.98e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20907 | -| time_elapsed | 113064 | -| total_timesteps | 2676096 | -| train/ | | -| approx_kl | 1.042187 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.00467 | -| learning_rate | 0.0003 | -| loss | 0.394 | -| n_updates | 209060 | -| policy_gradient_loss | 0.292 | -| std | 0.00706 | -| value_loss | 0.000243 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20908 | -| time_elapsed | 113076 | -| total_timesteps | 2676224 | -| train/ | | -| approx_kl | 0.0054995413 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 209070 | -| policy_gradient_loss | 0.0104 | -| std | 0.00706 | -| value_loss | 0.00323 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20909 | -| time_elapsed | 113082 | -| total_timesteps | 2676352 | -| train/ | | -| approx_kl | 0.07245138 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -1.76 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 209080 | -| policy_gradient_loss | 0.0119 | -| std | 0.00706 | -| value_loss | 8.33e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20910 | -| time_elapsed | 113087 | -| total_timesteps | 2676480 | -| train/ | | -| approx_kl | 7.035537e-05 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -2.1 | -| learning_rate | 0.0003 | -| loss | -0.000208 | -| n_updates | 209090 | -| policy_gradient_loss | 0.0158 | -| std | 0.00706 | -| value_loss | 5.3e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20911 | -| time_elapsed | 113093 | -| total_timesteps | 2676608 | -| train/ | | -| approx_kl | 0.15885657 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 209100 | -| policy_gradient_loss | 0.0158 | -| std | 0.00706 | -| value_loss | 3.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20912 | -| time_elapsed | 113098 | -| total_timesteps | 2676736 | -| train/ | | -| approx_kl | 0.022087647 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -153 | -| learning_rate | 0.0003 | -| loss | 0.0031 | -| n_updates | 209110 | -| policy_gradient_loss | 0.0186 | -| std | 0.00706 | -| value_loss | 1.87e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20913 | -| time_elapsed | 113103 | -| total_timesteps | 2676864 | -| train/ | | -| approx_kl | 0.21256205 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.925 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 209120 | -| policy_gradient_loss | 0.13 | -| std | 0.00706 | -| value_loss | 3.73e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 20914 | -| time_elapsed | 113108 | -| total_timesteps | 2676992 | -| train/ | | -| approx_kl | 0.043054916 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 209130 | -| policy_gradient_loss | 0.0143 | -| std | 0.00706 | -| value_loss | 3.54e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20915 | -| time_elapsed | 113112 | -| total_timesteps | 2677120 | -| train/ | | -| approx_kl | 0.48424548 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 209140 | -| policy_gradient_loss | 0.0495 | -| std | 0.00707 | -| value_loss | 1.33e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20916 | -| time_elapsed | 113123 | -| total_timesteps | 2677248 | -| train/ | | -| approx_kl | 0.0023388104 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -3.78 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 209150 | -| policy_gradient_loss | -0.0111 | -| std | 0.00707 | -| value_loss | 0.00482 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20917 | -| time_elapsed | 113128 | -| total_timesteps | 2677376 | -| train/ | | -| approx_kl | 0.044741508 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 209160 | -| policy_gradient_loss | 0.0186 | -| std | 0.00707 | -| value_loss | 2.2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20918 | -| time_elapsed | 113133 | -| total_timesteps | 2677504 | -| train/ | | -| approx_kl | 0.053488895 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.212 | -| learning_rate | 0.0003 | -| loss | 0.00874 | -| n_updates | 209170 | -| policy_gradient_loss | 0.0037 | -| std | 0.00707 | -| value_loss | 1.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20919 | -| time_elapsed | 113138 | -| total_timesteps | 2677632 | -| train/ | | -| approx_kl | 0.043094683 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 209180 | -| policy_gradient_loss | 0.0115 | -| std | 0.00707 | -| value_loss | 4.96e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20920 | -| time_elapsed | 113143 | -| total_timesteps | 2677760 | -| train/ | | -| approx_kl | 0.04807947 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0843 | -| learning_rate | 0.0003 | -| loss | 0.00224 | -| n_updates | 209190 | -| policy_gradient_loss | 0.00103 | -| std | 0.00707 | -| value_loss | 3.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 20921 | -| time_elapsed | 113148 | -| total_timesteps | 2677888 | -| train/ | | -| approx_kl | 0.034430556 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.000115 | -| n_updates | 209200 | -| policy_gradient_loss | -0.000201 | -| std | 0.00707 | -| value_loss | 2.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20922 | -| time_elapsed | 113153 | -| total_timesteps | 2678016 | -| train/ | | -| approx_kl | 0.006895945 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | 4.29e-05 | -| n_updates | 209210 | -| policy_gradient_loss | 0.00461 | -| std | 0.00707 | -| value_loss | 3.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20923 | -| time_elapsed | 113167 | -| total_timesteps | 2678144 | -| train/ | | -| approx_kl | 0.14773746 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.895 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 209220 | -| policy_gradient_loss | -0.00255 | -| std | 0.00707 | -| value_loss | 0.00223 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20924 | -| time_elapsed | 113172 | -| total_timesteps | 2678272 | -| train/ | | -| approx_kl | 0.058857623 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.000819 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 209230 | -| policy_gradient_loss | 0.00593 | -| std | 0.00707 | -| value_loss | 0.000167 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20925 | -| time_elapsed | 113177 | -| total_timesteps | 2678400 | -| train/ | | -| approx_kl | 0.015486281 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 209240 | -| policy_gradient_loss | 0.0653 | -| std | 0.00706 | -| value_loss | 0.00056 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20926 | -| time_elapsed | 113183 | -| total_timesteps | 2678528 | -| train/ | | -| approx_kl | 0.010129979 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 209250 | -| policy_gradient_loss | 0.00358 | -| std | 0.00707 | -| value_loss | 4.17e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20927 | -| time_elapsed | 113187 | -| total_timesteps | 2678656 | -| train/ | | -| approx_kl | 0.031026859 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 209260 | -| policy_gradient_loss | 0.0533 | -| std | 0.00707 | -| value_loss | 1.99e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20928 | -| time_elapsed | 113191 | -| total_timesteps | 2678784 | -| train/ | | -| approx_kl | 0.14073595 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0865 | -| n_updates | 209270 | -| policy_gradient_loss | 0.0383 | -| std | 0.00707 | -| value_loss | 1.19e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 20929 | -| time_elapsed | 113196 | -| total_timesteps | 2678912 | -| train/ | | -| approx_kl | 0.014795785 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0682 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 209280 | -| policy_gradient_loss | 0.00915 | -| std | 0.00707 | -| value_loss | 7.88e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20930 | -| time_elapsed | 113202 | -| total_timesteps | 2679040 | -| train/ | | -| approx_kl | 0.03152612 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 209290 | -| policy_gradient_loss | 0.0728 | -| std | 0.00707 | -| value_loss | 4.14e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20931 | -| time_elapsed | 113209 | -| total_timesteps | 2679168 | -| train/ | | -| approx_kl | 0.005635433 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 209300 | -| policy_gradient_loss | -0.000665 | -| std | 0.00707 | -| value_loss | 0.00332 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20932 | -| time_elapsed | 113214 | -| total_timesteps | 2679296 | -| train/ | | -| approx_kl | 0.1280712 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0761 | -| n_updates | 209310 | -| policy_gradient_loss | 0.0225 | -| std | 0.00707 | -| value_loss | 1.77e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20933 | -| time_elapsed | 113219 | -| total_timesteps | 2679424 | -| train/ | | -| approx_kl | 0.01355451 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.53 | -| explained_variance | 0.0115 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 209320 | -| policy_gradient_loss | -0.00321 | -| std | 0.00707 | -| value_loss | 2.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20934 | -| time_elapsed | 113224 | -| total_timesteps | 2679552 | -| train/ | | -| approx_kl | 0.014389107 | -| clip_fraction | 0.0836 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.00463 | -| n_updates | 209330 | -| policy_gradient_loss | 0.00166 | -| std | 0.00703 | -| value_loss | 0.000315 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20935 | -| time_elapsed | 113229 | -| total_timesteps | 2679680 | -| train/ | | -| approx_kl | 0.013484916 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 209340 | -| policy_gradient_loss | 0.00445 | -| std | 0.007 | -| value_loss | 0.00549 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20936 | -| time_elapsed | 113234 | -| total_timesteps | 2679808 | -| train/ | | -| approx_kl | 0.0014576092 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0095 | -| n_updates | 209350 | -| policy_gradient_loss | 0.0103 | -| std | 0.00699 | -| value_loss | 0.000113 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20937 | -| time_elapsed | 113239 | -| total_timesteps | 2679936 | -| train/ | | -| approx_kl | 0.015019929 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 209360 | -| policy_gradient_loss | 0.0226 | -| std | 0.00698 | -| value_loss | 8.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20938 | -| time_elapsed | 113244 | -| total_timesteps | 2680064 | -| train/ | | -| approx_kl | 0.31165636 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 209370 | -| policy_gradient_loss | 0.213 | -| std | 0.00698 | -| value_loss | 9.12e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20939 | -| time_elapsed | 113252 | -| total_timesteps | 2680192 | -| train/ | | -| approx_kl | 0.023089705 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.808 | -| learning_rate | 0.0003 | -| loss | -0.0233 | -| n_updates | 209380 | -| policy_gradient_loss | 0.00886 | -| std | 0.00698 | -| value_loss | 0.00119 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20940 | -| time_elapsed | 113257 | -| total_timesteps | 2680320 | -| train/ | | -| approx_kl | 0.18391214 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 209390 | -| policy_gradient_loss | 0.0134 | -| std | 0.00698 | -| value_loss | 4.93e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20941 | -| time_elapsed | 113260 | -| total_timesteps | 2680448 | -| train/ | | -| approx_kl | 0.01603026 | -| clip_fraction | 0.0969 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.00586 | -| n_updates | 209400 | -| policy_gradient_loss | 0.00168 | -| std | 0.00698 | -| value_loss | 3.4e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20942 | -| time_elapsed | 113264 | -| total_timesteps | 2680576 | -| train/ | | -| approx_kl | 0.014600404 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 209410 | -| policy_gradient_loss | -0.00672 | -| std | 0.00698 | -| value_loss | 2.6e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20943 | -| time_elapsed | 113267 | -| total_timesteps | 2680704 | -| train/ | | -| approx_kl | 0.025096517 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00727 | -| n_updates | 209420 | -| policy_gradient_loss | 0.0291 | -| std | 0.00698 | -| value_loss | 2.43e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20944 | -| time_elapsed | 113272 | -| total_timesteps | 2680832 | -| train/ | | -| approx_kl | 0.105836555 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 209430 | -| policy_gradient_loss | 0.0188 | -| std | 0.00698 | -| value_loss | 2.38e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 20945 | -| time_elapsed | 113274 | -| total_timesteps | 2680960 | -| train/ | | -| approx_kl | 0.007937798 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.00977 | -| n_updates | 209440 | -| policy_gradient_loss | 0.0143 | -| std | 0.00698 | -| value_loss | 1.68e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20946 | -| time_elapsed | 113279 | -| total_timesteps | 2681088 | -| train/ | | -| approx_kl | 0.24378651 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 209450 | -| policy_gradient_loss | 0.171 | -| std | 0.00698 | -| value_loss | 1.11e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20947 | -| time_elapsed | 113290 | -| total_timesteps | 2681216 | -| train/ | | -| approx_kl | 0.27007127 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -4.38 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 209460 | -| policy_gradient_loss | 0.0277 | -| std | 0.00698 | -| value_loss | 0.0045 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20948 | -| time_elapsed | 113295 | -| total_timesteps | 2681344 | -| train/ | | -| approx_kl | 0.061992854 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 209470 | -| policy_gradient_loss | 0.0181 | -| std | 0.00698 | -| value_loss | 3.25e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20949 | -| time_elapsed | 113300 | -| total_timesteps | 2681472 | -| train/ | | -| approx_kl | 0.0035013217 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 209480 | -| policy_gradient_loss | 0.00816 | -| std | 0.00698 | -| value_loss | 1.39e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20950 | -| time_elapsed | 113305 | -| total_timesteps | 2681600 | -| train/ | | -| approx_kl | 0.04337937 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 209490 | -| policy_gradient_loss | 0.0182 | -| std | 0.00698 | -| value_loss | 1.02e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20951 | -| time_elapsed | 113308 | -| total_timesteps | 2681728 | -| train/ | | -| approx_kl | 0.11172103 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0557 | -| n_updates | 209500 | -| policy_gradient_loss | 0.0157 | -| std | 0.00698 | -| value_loss | 8.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20952 | -| time_elapsed | 113313 | -| total_timesteps | 2681856 | -| train/ | | -| approx_kl | 0.014542041 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 209510 | -| policy_gradient_loss | -0.004 | -| std | 0.00698 | -| value_loss | 7.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20953 | -| time_elapsed | 113317 | -| total_timesteps | 2681984 | -| train/ | | -| approx_kl | 0.030481089 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 209520 | -| policy_gradient_loss | 0.0367 | -| std | 0.00698 | -| value_loss | 6.38e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20954 | -| time_elapsed | 113321 | -| total_timesteps | 2682112 | -| train/ | | -| approx_kl | 0.10130312 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.069 | -| n_updates | 209530 | -| policy_gradient_loss | 0.0319 | -| std | 0.00698 | -| value_loss | 3.71e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20955 | -| time_elapsed | 113334 | -| total_timesteps | 2682240 | -| train/ | | -| approx_kl | 0.01211729 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 209540 | -| policy_gradient_loss | 0.0084 | -| std | 0.00698 | -| value_loss | 7.43e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20956 | -| time_elapsed | 113338 | -| total_timesteps | 2682368 | -| train/ | | -| approx_kl | 0.005423858 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 209550 | -| policy_gradient_loss | 0.0304 | -| std | 0.00698 | -| value_loss | 2.85e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20957 | -| time_elapsed | 113343 | -| total_timesteps | 2682496 | -| train/ | | -| approx_kl | 0.4233449 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 209560 | -| policy_gradient_loss | 0.0617 | -| std | 0.00698 | -| value_loss | 2.06e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20958 | -| time_elapsed | 113347 | -| total_timesteps | 2682624 | -| train/ | | -| approx_kl | 0.048669033 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 209570 | -| policy_gradient_loss | 0.0114 | -| std | 0.00698 | -| value_loss | 1.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20959 | -| time_elapsed | 113352 | -| total_timesteps | 2682752 | -| train/ | | -| approx_kl | 0.043987673 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 209580 | -| policy_gradient_loss | 0.00966 | -| std | 0.00698 | -| value_loss | 1.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 20960 | -| time_elapsed | 113357 | -| total_timesteps | 2682880 | -| train/ | | -| approx_kl | 0.04217765 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 209590 | -| policy_gradient_loss | 0.0146 | -| std | 0.00698 | -| value_loss | 7.79e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20961 | -| time_elapsed | 113361 | -| total_timesteps | 2683008 | -| train/ | | -| approx_kl | 0.0066430657 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 209600 | -| policy_gradient_loss | 0.00466 | -| std | 0.00699 | -| value_loss | 5.61e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20962 | -| time_elapsed | 113373 | -| total_timesteps | 2683136 | -| train/ | | -| approx_kl | 0.047888093 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 209610 | -| policy_gradient_loss | 0.00159 | -| std | 0.00699 | -| value_loss | 0.0042 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20963 | -| time_elapsed | 113377 | -| total_timesteps | 2683264 | -| train/ | | -| approx_kl | 0.48612857 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.357 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 209620 | -| policy_gradient_loss | 0.0467 | -| std | 0.00699 | -| value_loss | 3.46e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20964 | -| time_elapsed | 113383 | -| total_timesteps | 2683392 | -| train/ | | -| approx_kl | 0.0397924 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | 0.00971 | -| n_updates | 209630 | -| policy_gradient_loss | 0.00487 | -| std | 0.00699 | -| value_loss | 2.38e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20965 | -| time_elapsed | 113387 | -| total_timesteps | 2683520 | -| train/ | | -| approx_kl | 0.006190897 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 209640 | -| policy_gradient_loss | 0.00263 | -| std | 0.007 | -| value_loss | 8.8e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20966 | -| time_elapsed | 113392 | -| total_timesteps | 2683648 | -| train/ | | -| approx_kl | 0.0017391187 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | -0.000297 | -| n_updates | 209650 | -| policy_gradient_loss | 0.00619 | -| std | 0.007 | -| value_loss | 5.19e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20967 | -| time_elapsed | 113395 | -| total_timesteps | 2683776 | -| train/ | | -| approx_kl | 0.038476583 | -| clip_fraction | 0.633 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0455 | -| n_updates | 209660 | -| policy_gradient_loss | 0.0908 | -| std | 0.007 | -| value_loss | 9.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 20968 | -| time_elapsed | 113401 | -| total_timesteps | 2683904 | -| train/ | | -| approx_kl | 0.011071093 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.000996 | -| learning_rate | 0.0003 | -| loss | -0.00254 | -| n_updates | 209670 | -| policy_gradient_loss | 0.0289 | -| std | 0.007 | -| value_loss | 6.4e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20969 | -| time_elapsed | 113406 | -| total_timesteps | 2684032 | -| train/ | | -| approx_kl | 0.17537111 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.0447 | -| n_updates | 209680 | -| policy_gradient_loss | 0.0117 | -| std | 0.007 | -| value_loss | 4.09e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20970 | -| time_elapsed | 113416 | -| total_timesteps | 2684160 | -| train/ | | -| approx_kl | 0.0026085074 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.782 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 209690 | -| policy_gradient_loss | -0.0031 | -| std | 0.007 | -| value_loss | 0.000903 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20971 | -| time_elapsed | 113420 | -| total_timesteps | 2684288 | -| train/ | | -| approx_kl | 0.48959497 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.00927 | -| learning_rate | 0.0003 | -| loss | 0.218 | -| n_updates | 209700 | -| policy_gradient_loss | 0.0764 | -| std | 0.007 | -| value_loss | 3.96e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20972 | -| time_elapsed | 113425 | -| total_timesteps | 2684416 | -| train/ | | -| approx_kl | 0.06461902 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.977 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 209710 | -| policy_gradient_loss | 0.016 | -| std | 0.00701 | -| value_loss | 8.53e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20973 | -| time_elapsed | 113430 | -| total_timesteps | 2684544 | -| train/ | | -| approx_kl | 0.009734041 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.000496 | -| learning_rate | 0.0003 | -| loss | -7.27e-06 | -| n_updates | 209720 | -| policy_gradient_loss | 0.00654 | -| std | 0.00701 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20974 | -| time_elapsed | 113433 | -| total_timesteps | 2684672 | -| train/ | | -| approx_kl | 0.0007028044 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 209730 | -| policy_gradient_loss | 0.00353 | -| std | 0.007 | -| value_loss | 9.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20975 | -| time_elapsed | 113438 | -| total_timesteps | 2684800 | -| train/ | | -| approx_kl | 0.050200745 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.0298 | -| n_updates | 209740 | -| policy_gradient_loss | -0.0162 | -| std | 0.007 | -| value_loss | 7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20976 | -| time_elapsed | 113442 | -| total_timesteps | 2684928 | -| train/ | | -| approx_kl | 0.008327898 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.00814 | -| n_updates | 209750 | -| policy_gradient_loss | 0.00456 | -| std | 0.007 | -| value_loss | 6.21e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20977 | -| time_elapsed | 113445 | -| total_timesteps | 2685056 | -| train/ | | -| approx_kl | 0.002044227 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | -0.00601 | -| n_updates | 209760 | -| policy_gradient_loss | 0.00634 | -| std | 0.007 | -| value_loss | 4.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20978 | -| time_elapsed | 113451 | -| total_timesteps | 2685184 | -| train/ | | -| approx_kl | 0.057236332 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.131 | -| learning_rate | 0.0003 | -| loss | 0.000858 | -| n_updates | 209770 | -| policy_gradient_loss | -0.00765 | -| std | 0.00701 | -| value_loss | 0.00261 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20979 | -| time_elapsed | 113456 | -| total_timesteps | 2685312 | -| train/ | | -| approx_kl | 0.4817545 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.771 | -| learning_rate | 0.0003 | -| loss | 0.205 | -| n_updates | 209780 | -| policy_gradient_loss | 0.0675 | -| std | 0.00702 | -| value_loss | 2.86e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20980 | -| time_elapsed | 113458 | -| total_timesteps | 2685440 | -| train/ | | -| approx_kl | 0.064150415 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 209790 | -| policy_gradient_loss | 0.0143 | -| std | 0.00702 | -| value_loss | 2.98e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20981 | -| time_elapsed | 113461 | -| total_timesteps | 2685568 | -| train/ | | -| approx_kl | 0.035661884 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 209800 | -| policy_gradient_loss | 0.00846 | -| std | 0.00702 | -| value_loss | 2.96e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20982 | -| time_elapsed | 113465 | -| total_timesteps | 2685696 | -| train/ | | -| approx_kl | 0.0073929937 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 209810 | -| policy_gradient_loss | 0.00636 | -| std | 0.00703 | -| value_loss | 2.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20983 | -| time_elapsed | 113468 | -| total_timesteps | 2685824 | -| train/ | | -| approx_kl | 0.068057835 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 209820 | -| policy_gradient_loss | 0.00846 | -| std | 0.00703 | -| value_loss | 1.88e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 20984 | -| time_elapsed | 113473 | -| total_timesteps | 2685952 | -| train/ | | -| approx_kl | 0.038426448 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 209830 | -| policy_gradient_loss | 0.01 | -| std | 0.00702 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20985 | -| time_elapsed | 113477 | -| total_timesteps | 2686080 | -| train/ | | -| approx_kl | 0.006121255 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 209840 | -| policy_gradient_loss | 0.00565 | -| std | 0.00702 | -| value_loss | 9.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20986 | -| time_elapsed | 113484 | -| total_timesteps | 2686208 | -| train/ | | -| approx_kl | 0.017000232 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | 0.00892 | -| n_updates | 209850 | -| policy_gradient_loss | 0.00297 | -| std | 0.00701 | -| value_loss | 0.0025 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20987 | -| time_elapsed | 113488 | -| total_timesteps | 2686336 | -| train/ | | -| approx_kl | 0.009682715 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | -0.00498 | -| n_updates | 209860 | -| policy_gradient_loss | -0.00235 | -| std | 0.007 | -| value_loss | 1.66e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20988 | -| time_elapsed | 113492 | -| total_timesteps | 2686464 | -| train/ | | -| approx_kl | 0.023132984 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0681 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 209870 | -| policy_gradient_loss | 0.0154 | -| std | 0.00699 | -| value_loss | 3.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20989 | -| time_elapsed | 113495 | -| total_timesteps | 2686592 | -| train/ | | -| approx_kl | 0.10737366 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 209880 | -| policy_gradient_loss | 0.0289 | -| std | 0.007 | -| value_loss | 1.99e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20990 | -| time_elapsed | 113498 | -| total_timesteps | 2686720 | -| train/ | | -| approx_kl | 0.115522854 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.0675 | -| n_updates | 209890 | -| policy_gradient_loss | 0.0224 | -| std | 0.007 | -| value_loss | 1.63e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20991 | -| time_elapsed | 113503 | -| total_timesteps | 2686848 | -| train/ | | -| approx_kl | 0.1495478 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.0648 | -| n_updates | 209900 | -| policy_gradient_loss | 0.0309 | -| std | 0.007 | -| value_loss | 1.24e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 20992 | -| time_elapsed | 113507 | -| total_timesteps | 2686976 | -| train/ | | -| approx_kl | 0.046256747 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.0095 | -| n_updates | 209910 | -| policy_gradient_loss | 0.0176 | -| std | 0.007 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20993 | -| time_elapsed | 113511 | -| total_timesteps | 2687104 | -| train/ | | -| approx_kl | 0.041062854 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.00534 | -| n_updates | 209920 | -| policy_gradient_loss | 0.0341 | -| std | 0.007 | -| value_loss | 8.85e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20994 | -| time_elapsed | 113522 | -| total_timesteps | 2687232 | -| train/ | | -| approx_kl | 0.0040866514 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.898 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 209930 | -| policy_gradient_loss | 0.0171 | -| std | 0.007 | -| value_loss | 0.000926 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20995 | -| time_elapsed | 113525 | -| total_timesteps | 2687360 | -| train/ | | -| approx_kl | 0.009757899 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 209940 | -| policy_gradient_loss | 0.0232 | -| std | 0.007 | -| value_loss | 0.000136 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20996 | -| time_elapsed | 113529 | -| total_timesteps | 2687488 | -| train/ | | -| approx_kl | 0.0036362857 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0847 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 209950 | -| policy_gradient_loss | 0.0222 | -| std | 0.007 | -| value_loss | 2.69e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20997 | -| time_elapsed | 113534 | -| total_timesteps | 2687616 | -| train/ | | -| approx_kl | 0.053744797 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.00405 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 209960 | -| policy_gradient_loss | 0.0146 | -| std | 0.007 | -| value_loss | 7.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20998 | -| time_elapsed | 113539 | -| total_timesteps | 2687744 | -| train/ | | -| approx_kl | 0.13500684 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.0513 | -| n_updates | 209970 | -| policy_gradient_loss | 0.0348 | -| std | 0.007 | -| value_loss | 4.55e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 20999 | -| time_elapsed | 113544 | -| total_timesteps | 2687872 | -| train/ | | -| approx_kl | 0.35277933 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 209980 | -| policy_gradient_loss | 0.144 | -| std | 0.00701 | -| value_loss | 4.17e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21000 | -| time_elapsed | 113548 | -| total_timesteps | 2688000 | -| train/ | | -| approx_kl | 0.058430217 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 209990 | -| policy_gradient_loss | 0.0217 | -| std | 0.00701 | -| value_loss | 3.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21001 | -| time_elapsed | 113554 | -| total_timesteps | 2688128 | -| train/ | | -| approx_kl | 0.13834338 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.00379 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 210000 | -| policy_gradient_loss | 0.0159 | -| std | 0.007 | -| value_loss | 1.64e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21002 | -| time_elapsed | 113562 | -| total_timesteps | 2688256 | -| train/ | | -| approx_kl | 0.03416691 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | 0.00298 | -| n_updates | 210010 | -| policy_gradient_loss | -0.00116 | -| std | 0.00699 | -| value_loss | 0.0011 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21003 | -| time_elapsed | 113566 | -| total_timesteps | 2688384 | -| train/ | | -| approx_kl | 0.24810547 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.54 | -| explained_variance | -0.00893 | -| learning_rate | 0.0003 | -| loss | 0.0838 | -| n_updates | 210020 | -| policy_gradient_loss | 0.0284 | -| std | 0.00699 | -| value_loss | 1.37e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21004 | -| time_elapsed | 113571 | -| total_timesteps | 2688512 | -| train/ | | -| approx_kl | 0.12548009 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.00489 | -| learning_rate | 0.0003 | -| loss | 0.0764 | -| n_updates | 210030 | -| policy_gradient_loss | 0.0129 | -| std | 0.00698 | -| value_loss | 4.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21005 | -| time_elapsed | 113576 | -| total_timesteps | 2688640 | -| train/ | | -| approx_kl | 0.037577964 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 210040 | -| policy_gradient_loss | 0.0336 | -| std | 0.00697 | -| value_loss | 1.69e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21006 | -| time_elapsed | 113581 | -| total_timesteps | 2688768 | -| train/ | | -| approx_kl | 0.09417948 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.405 | -| learning_rate | 0.0003 | -| loss | 0.0455 | -| n_updates | 210050 | -| policy_gradient_loss | 0.0206 | -| std | 0.00697 | -| value_loss | 3.8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21007 | -| time_elapsed | 113586 | -| total_timesteps | 2688896 | -| train/ | | -| approx_kl | 0.59708124 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0027 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 210060 | -| policy_gradient_loss | 0.0425 | -| std | 0.00697 | -| value_loss | 1.08e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21008 | -| time_elapsed | 113590 | -| total_timesteps | 2689024 | -| train/ | | -| approx_kl | 0.02911178 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 210070 | -| policy_gradient_loss | 0.00843 | -| std | 0.00697 | -| value_loss | 7.79e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21009 | -| time_elapsed | 113602 | -| total_timesteps | 2689152 | -| train/ | | -| approx_kl | 0.017599965 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.822 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 210080 | -| policy_gradient_loss | -0.00908 | -| std | 0.00697 | -| value_loss | 0.00459 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21010 | -| time_elapsed | 113606 | -| total_timesteps | 2689280 | -| train/ | | -| approx_kl | 0.07504821 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.00664 | -| learning_rate | 0.0003 | -| loss | 0.00276 | -| n_updates | 210090 | -| policy_gradient_loss | -0.00253 | -| std | 0.00697 | -| value_loss | 0.000122 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21011 | -| time_elapsed | 113609 | -| total_timesteps | 2689408 | -| train/ | | -| approx_kl | 0.04219217 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.0099 | -| learning_rate | 0.0003 | -| loss | 0.00474 | -| n_updates | 210100 | -| policy_gradient_loss | 0.00354 | -| std | 0.00697 | -| value_loss | 7.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21012 | -| time_elapsed | 113614 | -| total_timesteps | 2689536 | -| train/ | | -| approx_kl | 0.00775229 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.00693 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 210110 | -| policy_gradient_loss | 0.00695 | -| std | 0.00697 | -| value_loss | 3.83e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21013 | -| time_elapsed | 113618 | -| total_timesteps | 2689664 | -| train/ | | -| approx_kl | 0.0011255783 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 210120 | -| policy_gradient_loss | 0.0119 | -| std | 0.00697 | -| value_loss | 2.87e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21014 | -| time_elapsed | 113621 | -| total_timesteps | 2689792 | -| train/ | | -| approx_kl | 0.0043247244 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 210130 | -| policy_gradient_loss | 0.00376 | -| std | 0.00697 | -| value_loss | 2.06e-06 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21015 | -| time_elapsed | 113625 | -| total_timesteps | 2689920 | -| train/ | | -| approx_kl | 0.000103489496 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.000617 | -| n_updates | 210140 | -| policy_gradient_loss | 0.0248 | -| std | 0.00697 | -| value_loss | 1.41e-06 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21016 | -| time_elapsed | 113629 | -| total_timesteps | 2690048 | -| train/ | | -| approx_kl | 0.65832424 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | 0.251 | -| n_updates | 210150 | -| policy_gradient_loss | 0.16 | -| std | 0.00698 | -| value_loss | 7.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21017 | -| time_elapsed | 113639 | -| total_timesteps | 2690176 | -| train/ | | -| approx_kl | 0.13417408 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.849 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 210160 | -| policy_gradient_loss | -0.00773 | -| std | 0.00698 | -| value_loss | 0.0029 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21018 | -| time_elapsed | 113644 | -| total_timesteps | 2690304 | -| train/ | | -| approx_kl | 0.017947834 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 0.00693 | -| n_updates | 210170 | -| policy_gradient_loss | 0.0227 | -| std | 0.00697 | -| value_loss | 2.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21019 | -| time_elapsed | 113648 | -| total_timesteps | 2690432 | -| train/ | | -| approx_kl | 0.004241648 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -2.45 | -| learning_rate | 0.0003 | -| loss | -0.000504 | -| n_updates | 210180 | -| policy_gradient_loss | 0.0174 | -| std | 0.00696 | -| value_loss | 6.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21020 | -| time_elapsed | 113652 | -| total_timesteps | 2690560 | -| train/ | | -| approx_kl | 0.03398126 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.00341 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 210190 | -| policy_gradient_loss | 0.0525 | -| std | 0.00695 | -| value_loss | 1.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21021 | -| time_elapsed | 113657 | -| total_timesteps | 2690688 | -| train/ | | -| approx_kl | 0.16667964 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.00711 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 210200 | -| policy_gradient_loss | 0.0407 | -| std | 0.00695 | -| value_loss | 1.58e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21022 | -| time_elapsed | 113661 | -| total_timesteps | 2690816 | -| train/ | | -| approx_kl | 0.048554096 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 210210 | -| policy_gradient_loss | 0.0727 | -| std | 0.00695 | -| value_loss | 1.53e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21023 | -| time_elapsed | 113666 | -| total_timesteps | 2690944 | -| train/ | | -| approx_kl | 0.017646208 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 210220 | -| policy_gradient_loss | 0.00348 | -| std | 0.00695 | -| value_loss | 1.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21024 | -| time_elapsed | 113671 | -| total_timesteps | 2691072 | -| train/ | | -| approx_kl | 0.028104307 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 210230 | -| policy_gradient_loss | 0.0552 | -| std | 0.00694 | -| value_loss | 5.58e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21025 | -| time_elapsed | 113679 | -| total_timesteps | 2691200 | -| train/ | | -| approx_kl | 0.0045019905 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.886 | -| learning_rate | 0.0003 | -| loss | -0.00766 | -| n_updates | 210240 | -| policy_gradient_loss | 0.0744 | -| std | 0.00694 | -| value_loss | 0.00108 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21026 | -| time_elapsed | 113684 | -| total_timesteps | 2691328 | -| train/ | | -| approx_kl | 1.1345768 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.378 | -| learning_rate | 0.0003 | -| loss | 0.384 | -| n_updates | 210250 | -| policy_gradient_loss | 0.219 | -| std | 0.00694 | -| value_loss | 8.97e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21027 | -| time_elapsed | 113689 | -| total_timesteps | 2691456 | -| train/ | | -| approx_kl | 0.03483389 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.00828 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 210260 | -| policy_gradient_loss | 0.0748 | -| std | 0.00693 | -| value_loss | 1.71e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21028 | -| time_elapsed | 113695 | -| total_timesteps | 2691584 | -| train/ | | -| approx_kl | 0.23065823 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 210270 | -| policy_gradient_loss | 0.0422 | -| std | 0.00693 | -| value_loss | 8.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21029 | -| time_elapsed | 113699 | -| total_timesteps | 2691712 | -| train/ | | -| approx_kl | 0.048649475 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0602 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 210280 | -| policy_gradient_loss | 0.0548 | -| std | 0.00694 | -| value_loss | 4.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21030 | -| time_elapsed | 113703 | -| total_timesteps | 2691840 | -| train/ | | -| approx_kl | 0.22744186 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0863 | -| learning_rate | 0.0003 | -| loss | 0.0925 | -| n_updates | 210290 | -| policy_gradient_loss | 0.0427 | -| std | 0.00694 | -| value_loss | 4.55e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21031 | -| time_elapsed | 113708 | -| total_timesteps | 2691968 | -| train/ | | -| approx_kl | 0.048797596 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 210300 | -| policy_gradient_loss | 0.0643 | -| std | 0.00694 | -| value_loss | 3.28e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21032 | -| time_elapsed | 113713 | -| total_timesteps | 2692096 | -| train/ | | -| approx_kl | 0.05010731 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 210310 | -| policy_gradient_loss | 0.0376 | -| std | 0.00694 | -| value_loss | 2.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21033 | -| time_elapsed | 113721 | -| total_timesteps | 2692224 | -| train/ | | -| approx_kl | 0.19979225 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | 0.0991 | -| n_updates | 210320 | -| policy_gradient_loss | 0.0458 | -| std | 0.00694 | -| value_loss | 0.000172 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21034 | -| time_elapsed | 113725 | -| total_timesteps | 2692352 | -| train/ | | -| approx_kl | 0.040980864 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.00717 | -| learning_rate | 0.0003 | -| loss | 0.0057 | -| n_updates | 210330 | -| policy_gradient_loss | 0.0687 | -| std | 0.00694 | -| value_loss | 1.86e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21035 | -| time_elapsed | 113730 | -| total_timesteps | 2692480 | -| train/ | | -| approx_kl | 0.016292905 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | -0.00777 | -| n_updates | 210340 | -| policy_gradient_loss | 0.0117 | -| std | 0.00694 | -| value_loss | 8.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21036 | -| time_elapsed | 113733 | -| total_timesteps | 2692608 | -| train/ | | -| approx_kl | 0.026189249 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0101 | -| learning_rate | 0.0003 | -| loss | -0.00508 | -| n_updates | 210350 | -| policy_gradient_loss | 0.0333 | -| std | 0.00694 | -| value_loss | 4.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21037 | -| time_elapsed | 113738 | -| total_timesteps | 2692736 | -| train/ | | -| approx_kl | 0.002114331 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 210360 | -| policy_gradient_loss | 0.00776 | -| std | 0.00694 | -| value_loss | 3.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21038 | -| time_elapsed | 113743 | -| total_timesteps | 2692864 | -| train/ | | -| approx_kl | 0.24413621 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 210370 | -| policy_gradient_loss | 0.0227 | -| std | 0.00694 | -| value_loss | 2.58e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21039 | -| time_elapsed | 113749 | -| total_timesteps | 2692992 | -| train/ | | -| approx_kl | 0.03127009 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 210380 | -| policy_gradient_loss | 0.0461 | -| std | 0.00694 | -| value_loss | 2.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21040 | -| time_elapsed | 113754 | -| total_timesteps | 2693120 | -| train/ | | -| approx_kl | 0.18731149 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 210390 | -| policy_gradient_loss | 0.0507 | -| std | 0.00694 | -| value_loss | 1.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21041 | -| time_elapsed | 113766 | -| total_timesteps | 2693248 | -| train/ | | -| approx_kl | 0.042996142 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 210400 | -| policy_gradient_loss | 0.0262 | -| std | 0.00694 | -| value_loss | 0.000252 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21042 | -| time_elapsed | 113771 | -| total_timesteps | 2693376 | -| train/ | | -| approx_kl | 0.018377148 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.00293 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 210410 | -| policy_gradient_loss | 0.0195 | -| std | 0.00694 | -| value_loss | 1.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21043 | -| time_elapsed | 113775 | -| total_timesteps | 2693504 | -| train/ | | -| approx_kl | 0.041548703 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.0135 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 210420 | -| policy_gradient_loss | 0.0746 | -| std | 0.00694 | -| value_loss | 3.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21044 | -| time_elapsed | 113780 | -| total_timesteps | 2693632 | -| train/ | | -| approx_kl | 0.18306921 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.044 | -| n_updates | 210430 | -| policy_gradient_loss | 0.0423 | -| std | 0.00694 | -| value_loss | 2.89e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21045 | -| time_elapsed | 113786 | -| total_timesteps | 2693760 | -| train/ | | -| approx_kl | 0.0028940793 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 210440 | -| policy_gradient_loss | 0.0142 | -| std | 0.00694 | -| value_loss | 1.51e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21046 | -| time_elapsed | 113791 | -| total_timesteps | 2693888 | -| train/ | | -| approx_kl | 0.023835268 | -| clip_fraction | 0.581 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0597 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 210450 | -| policy_gradient_loss | 0.0911 | -| std | 0.00695 | -| value_loss | 1.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21047 | -| time_elapsed | 113797 | -| total_timesteps | 2694016 | -| train/ | | -| approx_kl | 0.01140381 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.0049 | -| n_updates | 210460 | -| policy_gradient_loss | 0.0294 | -| std | 0.00695 | -| value_loss | 8.71e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21048 | -| time_elapsed | 113809 | -| total_timesteps | 2694144 | -| train/ | | -| approx_kl | 0.18208793 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 210470 | -| policy_gradient_loss | 0.00235 | -| std | 0.00695 | -| value_loss | 0.00067 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21049 | -| time_elapsed | 113815 | -| total_timesteps | 2694272 | -| train/ | | -| approx_kl | 0.06285995 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 210480 | -| policy_gradient_loss | 0.00585 | -| std | 0.00693 | -| value_loss | 8.55e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21050 | -| time_elapsed | 113820 | -| total_timesteps | 2694400 | -| train/ | | -| approx_kl | 0.04400085 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -158 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 210490 | -| policy_gradient_loss | 6.85e-05 | -| std | 0.00692 | -| value_loss | 3.8e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21051 | -| time_elapsed | 113825 | -| total_timesteps | 2694528 | -| train/ | | -| approx_kl | 0.1078513 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.671 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 210500 | -| policy_gradient_loss | 0.0164 | -| std | 0.00692 | -| value_loss | 9.52e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21052 | -| time_elapsed | 113831 | -| total_timesteps | 2694656 | -| train/ | | -| approx_kl | 0.0005472726 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.55 | -| explained_variance | -0.00615 | -| learning_rate | 0.0003 | -| loss | -0.0039 | -| n_updates | 210510 | -| policy_gradient_loss | 0.023 | -| std | 0.00692 | -| value_loss | 7.3e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21053 | -| time_elapsed | 113833 | -| total_timesteps | 2694784 | -| train/ | | -| approx_kl | 0.17422709 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 210520 | -| policy_gradient_loss | 0.0309 | -| std | 0.00689 | -| value_loss | 3.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21054 | -| time_elapsed | 113838 | -| total_timesteps | 2694912 | -| train/ | | -| approx_kl | 0.014537426 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -3.08 | -| learning_rate | 0.0003 | -| loss | -0.00246 | -| n_updates | 210530 | -| policy_gradient_loss | -0.00159 | -| std | 0.00688 | -| value_loss | 7.26e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21055 | -| time_elapsed | 113843 | -| total_timesteps | 2695040 | -| train/ | | -| approx_kl | 0.011819209 | -| clip_fraction | 0.0867 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -6.75 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 210540 | -| policy_gradient_loss | -0.0101 | -| std | 0.00688 | -| value_loss | 7.75e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21056 | -| time_elapsed | 113852 | -| total_timesteps | 2695168 | -| train/ | | -| approx_kl | 0.09750295 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.0171 | -| n_updates | 210550 | -| policy_gradient_loss | -0.00539 | -| std | 0.00688 | -| value_loss | 0.00301 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21057 | -| time_elapsed | 113858 | -| total_timesteps | 2695296 | -| train/ | | -| approx_kl | 0.0311156 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | 0.236 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 210560 | -| policy_gradient_loss | 0.0271 | -| std | 0.00688 | -| value_loss | 2.6e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21058 | -| time_elapsed | 113861 | -| total_timesteps | 2695424 | -| train/ | | -| approx_kl | 0.08802435 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.00348 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 210570 | -| policy_gradient_loss | 0.0657 | -| std | 0.00687 | -| value_loss | 6.51e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21059 | -| time_elapsed | 113865 | -| total_timesteps | 2695552 | -| train/ | | -| approx_kl | 0.00067983475 | -| clip_fraction | 0.564 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | -0.00029 | -| n_updates | 210580 | -| policy_gradient_loss | 0.0788 | -| std | 0.00687 | -| value_loss | 1.7e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21060 | -| time_elapsed | 113870 | -| total_timesteps | 2695680 | -| train/ | | -| approx_kl | 0.019379081 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 210590 | -| policy_gradient_loss | 0.0463 | -| std | 0.00687 | -| value_loss | 2.42e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21061 | -| time_elapsed | 113875 | -| total_timesteps | 2695808 | -| train/ | | -| approx_kl | 0.27180028 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 210600 | -| policy_gradient_loss | 0.142 | -| std | 0.00687 | -| value_loss | 1.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21062 | -| time_elapsed | 113881 | -| total_timesteps | 2695936 | -| train/ | | -| approx_kl | 0.16621795 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 210610 | -| policy_gradient_loss | 0.137 | -| std | 0.00687 | -| value_loss | 1.47e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21063 | -| time_elapsed | 113886 | -| total_timesteps | 2696064 | -| train/ | | -| approx_kl | 0.027461 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 210620 | -| policy_gradient_loss | 0.0204 | -| std | 0.00687 | -| value_loss | 1.13e-07 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21064 | -| time_elapsed | 113894 | -| total_timesteps | 2696192 | -| train/ | | -| approx_kl | 0.01409468 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | 0.834 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 210630 | -| policy_gradient_loss | -0.00882 | -| std | 0.00687 | -| value_loss | 0.00418 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21065 | -| time_elapsed | 113899 | -| total_timesteps | 2696320 | -| train/ | | -| approx_kl | 0.072063416 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -1.69 | -| learning_rate | 0.0003 | -| loss | 0.0668 | -| n_updates | 210640 | -| policy_gradient_loss | 0.0792 | -| std | 0.00687 | -| value_loss | 1.71e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21066 | -| time_elapsed | 113903 | -| total_timesteps | 2696448 | -| train/ | | -| approx_kl | 0.01859631 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.00618 | -| n_updates | 210650 | -| policy_gradient_loss | 0.0294 | -| std | 0.00687 | -| value_loss | 3.86e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21067 | -| time_elapsed | 113908 | -| total_timesteps | 2696576 | -| train/ | | -| approx_kl | 0.39502066 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | 0.00329 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 210660 | -| policy_gradient_loss | 0.0481 | -| std | 0.00687 | -| value_loss | 1.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21068 | -| time_elapsed | 113911 | -| total_timesteps | 2696704 | -| train/ | | -| approx_kl | 0.008445968 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.003 | -| n_updates | 210670 | -| policy_gradient_loss | 0.00528 | -| std | 0.00687 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21069 | -| time_elapsed | 113915 | -| total_timesteps | 2696832 | -| train/ | | -| approx_kl | 0.002509992 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 210680 | -| policy_gradient_loss | 0.00838 | -| std | 0.00687 | -| value_loss | 8.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21070 | -| time_elapsed | 113920 | -| total_timesteps | 2696960 | -| train/ | | -| approx_kl | 0.04455383 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 210690 | -| policy_gradient_loss | 0.142 | -| std | 0.00688 | -| value_loss | 6.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21071 | -| time_elapsed | 113924 | -| total_timesteps | 2697088 | -| train/ | | -| approx_kl | 0.07990463 | -| clip_fraction | 0.664 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.0576 | -| n_updates | 210700 | -| policy_gradient_loss | 0.133 | -| std | 0.00688 | -| value_loss | 4.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21072 | -| time_elapsed | 113935 | -| total_timesteps | 2697216 | -| train/ | | -| approx_kl | 0.14558195 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | 0.805 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 210710 | -| policy_gradient_loss | 0.0814 | -| std | 0.00688 | -| value_loss | 0.00547 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21073 | -| time_elapsed | 113940 | -| total_timesteps | 2697344 | -| train/ | | -| approx_kl | 0.024939481 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -1e-05 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 210720 | -| policy_gradient_loss | 0.0258 | -| std | 0.00688 | -| value_loss | 2.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21074 | -| time_elapsed | 113944 | -| total_timesteps | 2697472 | -| train/ | | -| approx_kl | 0.16077965 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.0905 | -| n_updates | 210730 | -| policy_gradient_loss | 0.0228 | -| std | 0.00688 | -| value_loss | 7.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21075 | -| time_elapsed | 113948 | -| total_timesteps | 2697600 | -| train/ | | -| approx_kl | 0.015225848 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.0014 | -| n_updates | 210740 | -| policy_gradient_loss | 5.03e-05 | -| std | 0.00688 | -| value_loss | 4.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21076 | -| time_elapsed | 113952 | -| total_timesteps | 2697728 | -| train/ | | -| approx_kl | 0.013486228 | -| clip_fraction | 0.106 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 210750 | -| policy_gradient_loss | -0.00375 | -| std | 0.00687 | -| value_loss | 3.72e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21077 | -| time_elapsed | 113956 | -| total_timesteps | 2697856 | -| train/ | | -| approx_kl | 0.0944848 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.56 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.0574 | -| n_updates | 210760 | -| policy_gradient_loss | 0.0265 | -| std | 0.00685 | -| value_loss | 1.24e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21078 | -| time_elapsed | 113961 | -| total_timesteps | 2697984 | -| train/ | | -| approx_kl | 0.12816057 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -1.99 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 210770 | -| policy_gradient_loss | 0.00857 | -| std | 0.00684 | -| value_loss | 2.15e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21079 | -| time_elapsed | 113964 | -| total_timesteps | 2698112 | -| train/ | | -| approx_kl | 0.0009432649 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.00335 | -| n_updates | 210780 | -| policy_gradient_loss | 0.0251 | -| std | 0.00684 | -| value_loss | 2.17e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21080 | -| time_elapsed | 113975 | -| total_timesteps | 2698240 | -| train/ | | -| approx_kl | 0.29198727 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 210790 | -| policy_gradient_loss | 0.0723 | -| std | 0.00683 | -| value_loss | 0.000691 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21081 | -| time_elapsed | 113981 | -| total_timesteps | 2698368 | -| train/ | | -| approx_kl | 0.07485975 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.00309 | -| learning_rate | 0.0003 | -| loss | 0.0339 | -| n_updates | 210800 | -| policy_gradient_loss | 0.0211 | -| std | 0.00683 | -| value_loss | 1.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21082 | -| time_elapsed | 113986 | -| total_timesteps | 2698496 | -| train/ | | -| approx_kl | 0.101759575 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.00619 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 210810 | -| policy_gradient_loss | 0.0183 | -| std | 0.00684 | -| value_loss | 2.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21083 | -| time_elapsed | 113991 | -| total_timesteps | 2698624 | -| train/ | | -| approx_kl | 0.026824558 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.00334 | -| n_updates | 210820 | -| policy_gradient_loss | 0.026 | -| std | 0.00684 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21084 | -| time_elapsed | 113995 | -| total_timesteps | 2698752 | -| train/ | | -| approx_kl | 0.105603576 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.0564 | -| n_updates | 210830 | -| policy_gradient_loss | 0.0284 | -| std | 0.00684 | -| value_loss | 9.07e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21085 | -| time_elapsed | 114001 | -| total_timesteps | 2698880 | -| train/ | | -| approx_kl | 0.0054358635 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0689 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 210840 | -| policy_gradient_loss | 0.0212 | -| std | 0.00684 | -| value_loss | 1.68e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21086 | -| time_elapsed | 114005 | -| total_timesteps | 2699008 | -| train/ | | -| approx_kl | 0.18919846 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | 0.0771 | -| n_updates | 210850 | -| policy_gradient_loss | 0.0188 | -| std | 0.00683 | -| value_loss | 2.78e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21087 | -| time_elapsed | 114017 | -| total_timesteps | 2699136 | -| train/ | | -| approx_kl | 0.058007155 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.795 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 210860 | -| policy_gradient_loss | -0.00639 | -| std | 0.00683 | -| value_loss | 0.000843 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21088 | -| time_elapsed | 114022 | -| total_timesteps | 2699264 | -| train/ | | -| approx_kl | 0.20770398 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 210870 | -| policy_gradient_loss | 0.0204 | -| std | 0.00683 | -| value_loss | 4.03e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21089 | -| time_elapsed | 114027 | -| total_timesteps | 2699392 | -| train/ | | -| approx_kl | 0.0015151948 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | -0.000939 | -| n_updates | 210880 | -| policy_gradient_loss | 0.0178 | -| std | 0.00683 | -| value_loss | 2.3e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21090 | -| time_elapsed | 114032 | -| total_timesteps | 2699520 | -| train/ | | -| approx_kl | 2.3432076e-06 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | -8.91e-05 | -| n_updates | 210890 | -| policy_gradient_loss | 0.00624 | -| std | 0.00682 | -| value_loss | 9.29e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21091 | -| time_elapsed | 114037 | -| total_timesteps | 2699648 | -| train/ | | -| approx_kl | 0.055942763 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.035 | -| n_updates | 210900 | -| policy_gradient_loss | 0.0586 | -| std | 0.00682 | -| value_loss | 1.27e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21092 | -| time_elapsed | 114041 | -| total_timesteps | 2699776 | -| train/ | | -| approx_kl | 0.250847 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -12.6 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 210910 | -| policy_gradient_loss | 0.0173 | -| std | 0.00682 | -| value_loss | 5.29e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21093 | -| time_elapsed | 114046 | -| total_timesteps | 2699904 | -| train/ | | -| approx_kl | 0.053390834 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -4.19 | -| learning_rate | 0.0003 | -| loss | 0.00636 | -| n_updates | 210920 | -| policy_gradient_loss | 0.0371 | -| std | 0.00682 | -| value_loss | 9.23e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21094 | -| time_elapsed | 114051 | -| total_timesteps | 2700032 | -| train/ | | -| approx_kl | 0.2292208 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | 0.0922 | -| n_updates | 210930 | -| policy_gradient_loss | 0.04 | -| std | 0.00682 | -| value_loss | 3.04e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21095 | -| time_elapsed | 114061 | -| total_timesteps | 2700160 | -| train/ | | -| approx_kl | 0.0058755 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.821 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 210940 | -| policy_gradient_loss | 0.0195 | -| std | 0.00682 | -| value_loss | 0.00442 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21096 | -| time_elapsed | 114065 | -| total_timesteps | 2700288 | -| train/ | | -| approx_kl | 0.18800537 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.586 | -| learning_rate | 0.0003 | -| loss | 0.0802 | -| n_updates | 210950 | -| policy_gradient_loss | 0.0371 | -| std | 0.00682 | -| value_loss | 6.75e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21097 | -| time_elapsed | 114069 | -| total_timesteps | 2700416 | -| train/ | | -| approx_kl | 0.050854042 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.00584 | -| learning_rate | 0.0003 | -| loss | 0.00518 | -| n_updates | 210960 | -| policy_gradient_loss | 0.0654 | -| std | 0.00682 | -| value_loss | 1.75e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21098 | -| time_elapsed | 114072 | -| total_timesteps | 2700544 | -| train/ | | -| approx_kl | 0.00026581762 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0016 | -| learning_rate | 0.0003 | -| loss | 0.00235 | -| n_updates | 210970 | -| policy_gradient_loss | 0.0897 | -| std | 0.00682 | -| value_loss | 9.72e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21099 | -| time_elapsed | 114076 | -| total_timesteps | 2700672 | -| train/ | | -| approx_kl | 0.11026342 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0691 | -| n_updates | 210980 | -| policy_gradient_loss | 0.153 | -| std | 0.00683 | -| value_loss | 4.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21100 | -| time_elapsed | 114079 | -| total_timesteps | 2700800 | -| train/ | | -| approx_kl | 0.07957223 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 210990 | -| policy_gradient_loss | 0.0324 | -| std | 0.00683 | -| value_loss | 3.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21101 | -| time_elapsed | 114082 | -| total_timesteps | 2700928 | -| train/ | | -| approx_kl | 0.12615694 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | 0.054 | -| n_updates | 211000 | -| policy_gradient_loss | 0.0235 | -| std | 0.00683 | -| value_loss | 2.47e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21102 | -| time_elapsed | 114088 | -| total_timesteps | 2701056 | -| train/ | | -| approx_kl | 0.00080642663 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 211010 | -| policy_gradient_loss | 0.0274 | -| std | 0.00683 | -| value_loss | 2.15e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21103 | -| time_elapsed | 114098 | -| total_timesteps | 2701184 | -| train/ | | -| approx_kl | 0.40295753 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -4.93 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 211020 | -| policy_gradient_loss | 0.011 | -| std | 0.00683 | -| value_loss | 0.00405 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21104 | -| time_elapsed | 114103 | -| total_timesteps | 2701312 | -| train/ | | -| approx_kl | 0.07981465 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 211030 | -| policy_gradient_loss | 0.00861 | -| std | 0.00683 | -| value_loss | 6.41e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21105 | -| time_elapsed | 114108 | -| total_timesteps | 2701440 | -| train/ | | -| approx_kl | 0.012468129 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.00586 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 211040 | -| policy_gradient_loss | 0.00116 | -| std | 0.00684 | -| value_loss | 8.53e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21106 | -| time_elapsed | 114114 | -| total_timesteps | 2701568 | -| train/ | | -| approx_kl | 0.052090216 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 211050 | -| policy_gradient_loss | 0.00529 | -| std | 0.00684 | -| value_loss | 3.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21107 | -| time_elapsed | 114120 | -| total_timesteps | 2701696 | -| train/ | | -| approx_kl | 0.038687028 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 211060 | -| policy_gradient_loss | 0.00716 | -| std | 0.00684 | -| value_loss | 2.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21108 | -| time_elapsed | 114125 | -| total_timesteps | 2701824 | -| train/ | | -| approx_kl | 0.007125032 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 211070 | -| policy_gradient_loss | 0.00465 | -| std | 0.00684 | -| value_loss | 1.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21109 | -| time_elapsed | 114131 | -| total_timesteps | 2701952 | -| train/ | | -| approx_kl | 0.0015853397 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | -0.0019 | -| n_updates | 211080 | -| policy_gradient_loss | 0.00656 | -| std | 0.00684 | -| value_loss | 1.26e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21110 | -| time_elapsed | 114137 | -| total_timesteps | 2702080 | -| train/ | | -| approx_kl | 8.4750354e-07 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0576 | -| learning_rate | 0.0003 | -| loss | 5.07e-05 | -| n_updates | 211090 | -| policy_gradient_loss | 0.0417 | -| std | 0.00684 | -| value_loss | 8.91e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21111 | -| time_elapsed | 114145 | -| total_timesteps | 2702208 | -| train/ | | -| approx_kl | 0.14774294 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.639 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 211100 | -| policy_gradient_loss | 0.0427 | -| std | 0.00684 | -| value_loss | 0.00824 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21112 | -| time_elapsed | 114150 | -| total_timesteps | 2702336 | -| train/ | | -| approx_kl | 9.261584e-05 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.725 | -| learning_rate | 0.0003 | -| loss | 0.000148 | -| n_updates | 211110 | -| policy_gradient_loss | 0.0113 | -| std | 0.00682 | -| value_loss | 0.000153 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21113 | -| time_elapsed | 114155 | -| total_timesteps | 2702464 | -| train/ | | -| approx_kl | 8.722767e-06 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.738 | -| learning_rate | 0.0003 | -| loss | 0.000143 | -| n_updates | 211120 | -| policy_gradient_loss | 0.037 | -| std | 0.0068 | -| value_loss | 3.73e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21114 | -| time_elapsed | 114160 | -| total_timesteps | 2702592 | -| train/ | | -| approx_kl | 0.22034916 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | 0.0122 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 211130 | -| policy_gradient_loss | 0.0492 | -| std | 0.00679 | -| value_loss | 1e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21115 | -| time_elapsed | 114164 | -| total_timesteps | 2702720 | -| train/ | | -| approx_kl | 0.04694908 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 211140 | -| policy_gradient_loss | 0.0417 | -| std | 0.00679 | -| value_loss | 8.39e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21116 | -| time_elapsed | 114168 | -| total_timesteps | 2702848 | -| train/ | | -| approx_kl | 0.9815295 | -| clip_fraction | 0.765 | -| clip_range | 0.2 | -| entropy_loss | 3.57 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.315 | -| n_updates | 211150 | -| policy_gradient_loss | 0.412 | -| std | 0.00678 | -| value_loss | 5.18e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21117 | -| time_elapsed | 114171 | -| total_timesteps | 2702976 | -| train/ | | -| approx_kl | 0.05934056 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 211160 | -| policy_gradient_loss | 0.00846 | -| std | 0.00677 | -| value_loss | 0.000281 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21118 | -| time_elapsed | 114174 | -| total_timesteps | 2703104 | -| train/ | | -| approx_kl | 0.048497047 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 211170 | -| policy_gradient_loss | 0.00867 | -| std | 0.00676 | -| value_loss | 0.0086 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21119 | -| time_elapsed | 114183 | -| total_timesteps | 2703232 | -| train/ | | -| approx_kl | 0.017039556 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.672 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 211180 | -| policy_gradient_loss | 0.0055 | -| std | 0.00675 | -| value_loss | 0.00537 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21120 | -| time_elapsed | 114187 | -| total_timesteps | 2703360 | -| train/ | | -| approx_kl | 0.057205066 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 211190 | -| policy_gradient_loss | 0.0179 | -| std | 0.00675 | -| value_loss | 0.000451 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21121 | -| time_elapsed | 114190 | -| total_timesteps | 2703488 | -| train/ | | -| approx_kl | 0.0442759 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 211200 | -| policy_gradient_loss | 0.0133 | -| std | 0.00675 | -| value_loss | 0.000213 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21122 | -| time_elapsed | 114195 | -| total_timesteps | 2703616 | -| train/ | | -| approx_kl | 0.042706158 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 211210 | -| policy_gradient_loss | 0.00593 | -| std | 0.00674 | -| value_loss | 0.000204 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21123 | -| time_elapsed | 114199 | -| total_timesteps | 2703744 | -| train/ | | -| approx_kl | 0.0074053514 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.000781 | -| n_updates | 211220 | -| policy_gradient_loss | 0.00567 | -| std | 0.00674 | -| value_loss | 0.00015 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21124 | -| time_elapsed | 114203 | -| total_timesteps | 2703872 | -| train/ | | -| approx_kl | 0.0009168959 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 0.00674 | -| n_updates | 211230 | -| policy_gradient_loss | 0.0038 | -| std | 0.00674 | -| value_loss | 0.000131 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21125 | -| time_elapsed | 114207 | -| total_timesteps | 2704000 | -| train/ | | -| approx_kl | 0.004816703 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 211240 | -| policy_gradient_loss | 0.00528 | -| std | 0.00674 | -| value_loss | 9.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21126 | -| time_elapsed | 114212 | -| total_timesteps | 2704128 | -| train/ | | -| approx_kl | 0.035360318 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.00435 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 211250 | -| policy_gradient_loss | 0.0924 | -| std | 0.00674 | -| value_loss | 0.000495 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21127 | -| time_elapsed | 114223 | -| total_timesteps | 2704256 | -| train/ | | -| approx_kl | 0.1140018 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | 0.0804 | -| n_updates | 211260 | -| policy_gradient_loss | 0.051 | -| std | 0.00674 | -| value_loss | 0.000663 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21128 | -| time_elapsed | 114227 | -| total_timesteps | 2704384 | -| train/ | | -| approx_kl | 0.1731107 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.0955 | -| n_updates | 211270 | -| policy_gradient_loss | 0.143 | -| std | 0.00674 | -| value_loss | 2.34e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21129 | -| time_elapsed | 114232 | -| total_timesteps | 2704512 | -| train/ | | -| approx_kl | 0.1283099 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0897 | -| learning_rate | 0.0003 | -| loss | 0.0919 | -| n_updates | 211280 | -| policy_gradient_loss | 0.103 | -| std | 0.00674 | -| value_loss | 2.23e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21130 | -| time_elapsed | 114237 | -| total_timesteps | 2704640 | -| train/ | | -| approx_kl | 0.028556217 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.00315 | -| n_updates | 211290 | -| policy_gradient_loss | 0.0234 | -| std | 0.00674 | -| value_loss | 2.26e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21131 | -| time_elapsed | 114241 | -| total_timesteps | 2704768 | -| train/ | | -| approx_kl | 0.5058274 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 211300 | -| policy_gradient_loss | 0.0523 | -| std | 0.00674 | -| value_loss | 2.03e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21132 | -| time_elapsed | 114246 | -| total_timesteps | 2704896 | -| train/ | | -| approx_kl | 0.010460798 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 211310 | -| policy_gradient_loss | 0.00756 | -| std | 0.00675 | -| value_loss | 1.73e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21133 | -| time_elapsed | 114251 | -| total_timesteps | 2705024 | -| train/ | | -| approx_kl | 0.07344775 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 211320 | -| policy_gradient_loss | 0.0198 | -| std | 0.00675 | -| value_loss | 1.23e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21134 | -| time_elapsed | 114261 | -| total_timesteps | 2705152 | -| train/ | | -| approx_kl | 0.012197845 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 211330 | -| policy_gradient_loss | 0.001 | -| std | 0.00675 | -| value_loss | 0.000232 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21135 | -| time_elapsed | 114267 | -| total_timesteps | 2705280 | -| train/ | | -| approx_kl | 0.03969204 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.0185 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 211340 | -| policy_gradient_loss | 0.0114 | -| std | 0.00674 | -| value_loss | 4.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21136 | -| time_elapsed | 114271 | -| total_timesteps | 2705408 | -| train/ | | -| approx_kl | 0.008087459 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.000325 | -| n_updates | 211350 | -| policy_gradient_loss | 0.00671 | -| std | 0.00674 | -| value_loss | 4.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21137 | -| time_elapsed | 114276 | -| total_timesteps | 2705536 | -| train/ | | -| approx_kl | 0.07944071 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0383 | -| n_updates | 211360 | -| policy_gradient_loss | 0.0142 | -| std | 0.00673 | -| value_loss | 3.76e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21138 | -| time_elapsed | 114281 | -| total_timesteps | 2705664 | -| train/ | | -| approx_kl | 0.010949016 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 211370 | -| policy_gradient_loss | 0.00472 | -| std | 0.00673 | -| value_loss | 3.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21139 | -| time_elapsed | 114286 | -| total_timesteps | 2705792 | -| train/ | | -| approx_kl | 0.002793213 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 211380 | -| policy_gradient_loss | 0.00827 | -| std | 0.00673 | -| value_loss | 2.13e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21140 | -| time_elapsed | 114291 | -| total_timesteps | 2705920 | -| train/ | | -| approx_kl | 7.874332e-06 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | -2.21e-05 | -| n_updates | 211390 | -| policy_gradient_loss | 0.0248 | -| std | 0.00673 | -| value_loss | 1.12e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21141 | -| time_elapsed | 114296 | -| total_timesteps | 2706048 | -| train/ | | -| approx_kl | 0.6177321 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0734 | -| learning_rate | 0.0003 | -| loss | 0.257 | -| n_updates | 211400 | -| policy_gradient_loss | 0.14 | -| std | 0.00672 | -| value_loss | 1.16e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21142 | -| time_elapsed | 114305 | -| total_timesteps | 2706176 | -| train/ | | -| approx_kl | 0.0007832586 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 211410 | -| policy_gradient_loss | -0.0116 | -| std | 0.00671 | -| value_loss | 0.00105 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21143 | -| time_elapsed | 114311 | -| total_timesteps | 2706304 | -| train/ | | -| approx_kl | 0.004103881 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | -0.000473 | -| n_updates | 211420 | -| policy_gradient_loss | 0.0901 | -| std | 0.0067 | -| value_loss | 4.92e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21144 | -| time_elapsed | 114315 | -| total_timesteps | 2706432 | -| train/ | | -| approx_kl | 0.008800031 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 211430 | -| policy_gradient_loss | 0.0111 | -| std | 0.00669 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21145 | -| time_elapsed | 114320 | -| total_timesteps | 2706560 | -| train/ | | -| approx_kl | 0.047216926 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | 0.0319 | -| n_updates | 211440 | -| policy_gradient_loss | 0.0822 | -| std | 0.00669 | -| value_loss | 3.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21146 | -| time_elapsed | 114325 | -| total_timesteps | 2706688 | -| train/ | | -| approx_kl | 0.0030882102 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.00857 | -| learning_rate | 0.0003 | -| loss | -0.00527 | -| n_updates | 211450 | -| policy_gradient_loss | 0.0641 | -| std | 0.00669 | -| value_loss | 2.93e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21147 | -| time_elapsed | 114329 | -| total_timesteps | 2706816 | -| train/ | | -| approx_kl | 1.1326106 | -| clip_fraction | 0.739 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.00607 | -| learning_rate | 0.0003 | -| loss | 0.317 | -| n_updates | 211460 | -| policy_gradient_loss | 0.208 | -| std | 0.00669 | -| value_loss | 1.31e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21148 | -| time_elapsed | 114334 | -| total_timesteps | 2706944 | -| train/ | | -| approx_kl | 0.027245868 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.935 | -| learning_rate | 0.0003 | -| loss | -0.000489 | -| n_updates | 211470 | -| policy_gradient_loss | 0.00572 | -| std | 0.0067 | -| value_loss | 3.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21149 | -| time_elapsed | 114338 | -| total_timesteps | 2707072 | -| train/ | | -| approx_kl | 0.103850804 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0564 | -| learning_rate | 0.0003 | -| loss | 0.0995 | -| n_updates | 211480 | -| policy_gradient_loss | 0.0184 | -| std | 0.0067 | -| value_loss | 2.35e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21150 | -| time_elapsed | 114346 | -| total_timesteps | 2707200 | -| train/ | | -| approx_kl | 0.08672374 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.776 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 211490 | -| policy_gradient_loss | -0.0102 | -| std | 0.0067 | -| value_loss | 0.00553 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21151 | -| time_elapsed | 114351 | -| total_timesteps | 2707328 | -| train/ | | -| approx_kl | 0.00036334107 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 211500 | -| policy_gradient_loss | 0.0266 | -| std | 0.0067 | -| value_loss | 1.11e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21152 | -| time_elapsed | 114355 | -| total_timesteps | 2707456 | -| train/ | | -| approx_kl | 0.17275833 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.00883 | -| learning_rate | 0.0003 | -| loss | 0.0437 | -| n_updates | 211510 | -| policy_gradient_loss | 0.015 | -| std | 0.0067 | -| value_loss | 2.73e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21153 | -| time_elapsed | 114361 | -| total_timesteps | 2707584 | -| train/ | | -| approx_kl | 0.025089853 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.00759 | -| n_updates | 211520 | -| policy_gradient_loss | 0.0311 | -| std | 0.0067 | -| value_loss | 1.83e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21154 | -| time_elapsed | 114365 | -| total_timesteps | 2707712 | -| train/ | | -| approx_kl | 0.14198746 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 211530 | -| policy_gradient_loss | 0.0357 | -| std | 0.0067 | -| value_loss | 1.68e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21155 | -| time_elapsed | 114369 | -| total_timesteps | 2707840 | -| train/ | | -| approx_kl | 0.006978711 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 211540 | -| policy_gradient_loss | 0.00701 | -| std | 0.0067 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21156 | -| time_elapsed | 114374 | -| total_timesteps | 2707968 | -| train/ | | -| approx_kl | 0.058932357 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 211550 | -| policy_gradient_loss | 0.026 | -| std | 0.00671 | -| value_loss | 8e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21157 | -| time_elapsed | 114379 | -| total_timesteps | 2708096 | -| train/ | | -| approx_kl | 0.1587076 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 211560 | -| policy_gradient_loss | 0.0297 | -| std | 0.0067 | -| value_loss | 1.08e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21158 | -| time_elapsed | 114389 | -| total_timesteps | 2708224 | -| train/ | | -| approx_kl | 0.010655144 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.722 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 211570 | -| policy_gradient_loss | 0.00561 | -| std | 0.0067 | -| value_loss | 0.00851 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21159 | -| time_elapsed | 114393 | -| total_timesteps | 2708352 | -| train/ | | -| approx_kl | 0.0014110273 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | -0.0016 | -| n_updates | 211580 | -| policy_gradient_loss | 0.0371 | -| std | 0.0067 | -| value_loss | 4.89e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21160 | -| time_elapsed | 114398 | -| total_timesteps | 2708480 | -| train/ | | -| approx_kl | 0.0034367293 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.000823 | -| n_updates | 211590 | -| policy_gradient_loss | 0.0377 | -| std | 0.0067 | -| value_loss | 3.93e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21161 | -| time_elapsed | 114402 | -| total_timesteps | 2708608 | -| train/ | | -| approx_kl | 0.0027968967 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 1.38e-05 | -| n_updates | 211600 | -| policy_gradient_loss | 0.0297 | -| std | 0.00669 | -| value_loss | 1.92e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21162 | -| time_elapsed | 114406 | -| total_timesteps | 2708736 | -| train/ | | -| approx_kl | 0.72440296 | -| clip_fraction | 0.752 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.304 | -| n_updates | 211610 | -| policy_gradient_loss | 0.171 | -| std | 0.00669 | -| value_loss | 1.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21163 | -| time_elapsed | 114409 | -| total_timesteps | 2708864 | -| train/ | | -| approx_kl | 0.026396407 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 211620 | -| policy_gradient_loss | -0.00734 | -| std | 0.00669 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21164 | -| time_elapsed | 114414 | -| total_timesteps | 2708992 | -| train/ | | -| approx_kl | 0.017185349 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 211630 | -| policy_gradient_loss | 0.023 | -| std | 0.00669 | -| value_loss | 1.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21165 | -| time_elapsed | 114418 | -| total_timesteps | 2709120 | -| train/ | | -| approx_kl | 0.29851848 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.225 | -| n_updates | 211640 | -| policy_gradient_loss | 0.155 | -| std | 0.00669 | -| value_loss | 1.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21166 | -| time_elapsed | 114432 | -| total_timesteps | 2709248 | -| train/ | | -| approx_kl | 0.15770295 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | 0.0865 | -| n_updates | 211650 | -| policy_gradient_loss | 0.0931 | -| std | 0.00669 | -| value_loss | 0.00366 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21167 | -| time_elapsed | 114437 | -| total_timesteps | 2709376 | -| train/ | | -| approx_kl | 0.13441858 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.00732 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 211660 | -| policy_gradient_loss | 0.126 | -| std | 0.00669 | -| value_loss | 1.37e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21168 | -| time_elapsed | 114442 | -| total_timesteps | 2709504 | -| train/ | | -| approx_kl | 0.15834783 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 211670 | -| policy_gradient_loss | 0.12 | -| std | 0.00669 | -| value_loss | 6.47e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21169 | -| time_elapsed | 114446 | -| total_timesteps | 2709632 | -| train/ | | -| approx_kl | 0.11579412 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.000913 | -| learning_rate | 0.0003 | -| loss | 0.0913 | -| n_updates | 211680 | -| policy_gradient_loss | 0.107 | -| std | 0.0067 | -| value_loss | 4.49e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21170 | -| time_elapsed | 114450 | -| total_timesteps | 2709760 | -| train/ | | -| approx_kl | 0.026285693 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 211690 | -| policy_gradient_loss | 0.0242 | -| std | 0.00669 | -| value_loss | 1.97e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21171 | -| time_elapsed | 114454 | -| total_timesteps | 2709888 | -| train/ | | -| approx_kl | 0.0018601562 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 211700 | -| policy_gradient_loss | 0.0297 | -| std | 0.0067 | -| value_loss | 1.61e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21172 | -| time_elapsed | 114458 | -| total_timesteps | 2710016 | -| train/ | | -| approx_kl | 0.55272067 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0943 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 211710 | -| policy_gradient_loss | 0.0518 | -| std | 0.00671 | -| value_loss | 9.14e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21173 | -| time_elapsed | 114470 | -| total_timesteps | 2710144 | -| train/ | | -| approx_kl | 0.16951291 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 211720 | -| policy_gradient_loss | -0.00877 | -| std | 0.00672 | -| value_loss | 0.000443 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21174 | -| time_elapsed | 114474 | -| total_timesteps | 2710272 | -| train/ | | -| approx_kl | 0.058657955 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.691 | -| learning_rate | 0.0003 | -| loss | 0.0594 | -| n_updates | 211730 | -| policy_gradient_loss | 0.0103 | -| std | 0.00673 | -| value_loss | 3.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21175 | -| time_elapsed | 114478 | -| total_timesteps | 2710400 | -| train/ | | -| approx_kl | 0.24973822 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 211740 | -| policy_gradient_loss | 0.0362 | -| std | 0.00674 | -| value_loss | 2.01e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21176 | -| time_elapsed | 114483 | -| total_timesteps | 2710528 | -| train/ | | -| approx_kl | 0.062622465 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.00799 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 211750 | -| policy_gradient_loss | 0.0642 | -| std | 0.00674 | -| value_loss | 4.81e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21177 | -| time_elapsed | 114488 | -| total_timesteps | 2710656 | -| train/ | | -| approx_kl | 0.0931703 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.00121 | -| learning_rate | 0.0003 | -| loss | 0.0711 | -| n_updates | 211760 | -| policy_gradient_loss | 0.0316 | -| std | 0.00674 | -| value_loss | 1.62e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21178 | -| time_elapsed | 114491 | -| total_timesteps | 2710784 | -| train/ | | -| approx_kl | 0.12233795 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.0578 | -| n_updates | 211770 | -| policy_gradient_loss | 0.0164 | -| std | 0.00674 | -| value_loss | 1.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21179 | -| time_elapsed | 114494 | -| total_timesteps | 2710912 | -| train/ | | -| approx_kl | 0.035585128 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 211780 | -| policy_gradient_loss | 0.0149 | -| std | 0.00674 | -| value_loss | 1.09e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21180 | -| time_elapsed | 114498 | -| total_timesteps | 2711040 | -| train/ | | -| approx_kl | 0.261832 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 211790 | -| policy_gradient_loss | 0.114 | -| std | 0.00674 | -| value_loss | 8.81e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21181 | -| time_elapsed | 114508 | -| total_timesteps | 2711168 | -| train/ | | -| approx_kl | 0.04750481 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.00755 | -| n_updates | 211800 | -| policy_gradient_loss | 0.00903 | -| std | 0.00674 | -| value_loss | 0.000455 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21182 | -| time_elapsed | 114514 | -| total_timesteps | 2711296 | -| train/ | | -| approx_kl | 0.18552643 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 211810 | -| policy_gradient_loss | 0.0283 | -| std | 0.00674 | -| value_loss | 1.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21183 | -| time_elapsed | 114519 | -| total_timesteps | 2711424 | -| train/ | | -| approx_kl | 0.023067512 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 211820 | -| policy_gradient_loss | 0.0177 | -| std | 0.00674 | -| value_loss | 5.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21184 | -| time_elapsed | 114522 | -| total_timesteps | 2711552 | -| train/ | | -| approx_kl | 0.08458148 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.00508 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 211830 | -| policy_gradient_loss | 0.0127 | -| std | 0.00674 | -| value_loss | 3.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21185 | -| time_elapsed | 114526 | -| total_timesteps | 2711680 | -| train/ | | -| approx_kl | 0.023074865 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0499 | -| n_updates | 211840 | -| policy_gradient_loss | -0.00878 | -| std | 0.00674 | -| value_loss | 2.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21186 | -| time_elapsed | 114530 | -| total_timesteps | 2711808 | -| train/ | | -| approx_kl | 0.003513168 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0805 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 211850 | -| policy_gradient_loss | 0.0326 | -| std | 0.00674 | -| value_loss | 2.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 21187 | -| time_elapsed | 114535 | -| total_timesteps | 2711936 | -| train/ | | -| approx_kl | 0.48744595 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 211860 | -| policy_gradient_loss | 0.0648 | -| std | 0.00673 | -| value_loss | 3.71e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21188 | -| time_elapsed | 114540 | -| total_timesteps | 2712064 | -| train/ | | -| approx_kl | 0.06340404 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0938 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 211870 | -| policy_gradient_loss | 0.0138 | -| std | 0.00674 | -| value_loss | 2.86e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21189 | -| time_elapsed | 114547 | -| total_timesteps | 2712192 | -| train/ | | -| approx_kl | 0.0029622465 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 211880 | -| policy_gradient_loss | -0.00379 | -| std | 0.00674 | -| value_loss | 4.65e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21190 | -| time_elapsed | 114553 | -| total_timesteps | 2712320 | -| train/ | | -| approx_kl | 0.05321706 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.0129 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 211890 | -| policy_gradient_loss | 0.0104 | -| std | 0.00674 | -| value_loss | 1.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21191 | -| time_elapsed | 114558 | -| total_timesteps | 2712448 | -| train/ | | -| approx_kl | 0.03669028 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.0127 | -| learning_rate | 0.0003 | -| loss | -0.00357 | -| n_updates | 211900 | -| policy_gradient_loss | 0.000861 | -| std | 0.00674 | -| value_loss | 5.03e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21192 | -| time_elapsed | 114562 | -| total_timesteps | 2712576 | -| train/ | | -| approx_kl | 0.007045024 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.00997 | -| learning_rate | 0.0003 | -| loss | -0.000869 | -| n_updates | 211910 | -| policy_gradient_loss | 0.00688 | -| std | 0.00674 | -| value_loss | 2.8e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21193 | -| time_elapsed | 114567 | -| total_timesteps | 2712704 | -| train/ | | -| approx_kl | 0.06937927 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.047 | -| n_updates | 211920 | -| policy_gradient_loss | 0.0191 | -| std | 0.00674 | -| value_loss | 1.73e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21194 | -| time_elapsed | 114572 | -| total_timesteps | 2712832 | -| train/ | | -| approx_kl | 0.035415523 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | -0.00639 | -| n_updates | 211930 | -| policy_gradient_loss | -0.00154 | -| std | 0.00674 | -| value_loss | 1.38e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21195 | -| time_elapsed | 114576 | -| total_timesteps | 2712960 | -| train/ | | -| approx_kl | 4.0092506e-05 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 211940 | -| policy_gradient_loss | 0.00173 | -| std | 0.00674 | -| value_loss | 1.23e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21196 | -| time_elapsed | 114580 | -| total_timesteps | 2713088 | -| train/ | | -| approx_kl | 0.039536554 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 211950 | -| policy_gradient_loss | 0.0108 | -| std | 0.00674 | -| value_loss | 7.24e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21197 | -| time_elapsed | 114588 | -| total_timesteps | 2713216 | -| train/ | | -| approx_kl | 0.00012645777 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.767 | -| learning_rate | 0.0003 | -| loss | -0.00542 | -| n_updates | 211960 | -| policy_gradient_loss | -0.0024 | -| std | 0.00674 | -| value_loss | 0.00626 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21198 | -| time_elapsed | 114594 | -| total_timesteps | 2713344 | -| train/ | | -| approx_kl | 0.0048929253 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 211970 | -| policy_gradient_loss | 0.00639 | -| std | 0.00673 | -| value_loss | 1.29e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21199 | -| time_elapsed | 114600 | -| total_timesteps | 2713472 | -| train/ | | -| approx_kl | 0.00033685146 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.00221 | -| n_updates | 211980 | -| policy_gradient_loss | 0.00274 | -| std | 0.00673 | -| value_loss | 2.8e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21200 | -| time_elapsed | 114604 | -| total_timesteps | 2713600 | -| train/ | | -| approx_kl | 0.042294804 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.431 | -| learning_rate | 0.0003 | -| loss | 0.00697 | -| n_updates | 211990 | -| policy_gradient_loss | 0.00245 | -| std | 0.00673 | -| value_loss | 4.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21201 | -| time_elapsed | 114608 | -| total_timesteps | 2713728 | -| train/ | | -| approx_kl | 0.009075474 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 212000 | -| policy_gradient_loss | 0.00237 | -| std | 0.00672 | -| value_loss | 3.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21202 | -| time_elapsed | 114613 | -| total_timesteps | 2713856 | -| train/ | | -| approx_kl | 0.07064737 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 212010 | -| policy_gradient_loss | 0.00732 | -| std | 0.00672 | -| value_loss | 2.54e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 21203 | -| time_elapsed | 114618 | -| total_timesteps | 2713984 | -| train/ | | -| approx_kl | 0.010769344 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.00629 | -| n_updates | 212020 | -| policy_gradient_loss | 0.00994 | -| std | 0.00672 | -| value_loss | 1.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21204 | -| time_elapsed | 114623 | -| total_timesteps | 2714112 | -| train/ | | -| approx_kl | 0.07099213 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | 0.0448 | -| n_updates | 212030 | -| policy_gradient_loss | 0.0179 | -| std | 0.00672 | -| value_loss | 1.41e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21205 | -| time_elapsed | 114634 | -| total_timesteps | 2714240 | -| train/ | | -| approx_kl | 0.0066096485 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | -0.00606 | -| n_updates | 212040 | -| policy_gradient_loss | 0.00662 | -| std | 0.00672 | -| value_loss | 0.00498 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21206 | -| time_elapsed | 114639 | -| total_timesteps | 2714368 | -| train/ | | -| approx_kl | 0.0022267448 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.00355 | -| n_updates | 212050 | -| policy_gradient_loss | 0.00597 | -| std | 0.00672 | -| value_loss | 5.32e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21207 | -| time_elapsed | 114644 | -| total_timesteps | 2714496 | -| train/ | | -| approx_kl | 0.056863263 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.00397 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 212060 | -| policy_gradient_loss | 0.00985 | -| std | 0.00672 | -| value_loss | 5.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21208 | -| time_elapsed | 114649 | -| total_timesteps | 2714624 | -| train/ | | -| approx_kl | 0.04268868 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0344 | -| n_updates | 212070 | -| policy_gradient_loss | 0.017 | -| std | 0.00672 | -| value_loss | 3.05e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21209 | -| time_elapsed | 114654 | -| total_timesteps | 2714752 | -| train/ | | -| approx_kl | 0.052168444 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 212080 | -| policy_gradient_loss | 0.0194 | -| std | 0.00672 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21210 | -| time_elapsed | 114658 | -| total_timesteps | 2714880 | -| train/ | | -| approx_kl | 0.049559556 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 212090 | -| policy_gradient_loss | 0.0122 | -| std | 0.00672 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21211 | -| time_elapsed | 114663 | -| total_timesteps | 2715008 | -| train/ | | -| approx_kl | 0.008623326 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | -0.0743 | -| learning_rate | 0.0003 | -| loss | -0.00996 | -| n_updates | 212100 | -| policy_gradient_loss | 0.00505 | -| std | 0.00672 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21212 | -| time_elapsed | 114672 | -| total_timesteps | 2715136 | -| train/ | | -| approx_kl | 0.009072799 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 212110 | -| policy_gradient_loss | -0.0105 | -| std | 0.00672 | -| value_loss | 0.00326 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21213 | -| time_elapsed | 114676 | -| total_timesteps | 2715264 | -| train/ | | -| approx_kl | 0.012527859 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.58 | -| explained_variance | 0.511 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 212120 | -| policy_gradient_loss | 0.00104 | -| std | 0.00672 | -| value_loss | 1.72e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21214 | -| time_elapsed | 114679 | -| total_timesteps | 2715392 | -| train/ | | -| approx_kl | 0.013297709 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.000237 | -| learning_rate | 0.0003 | -| loss | 0.00699 | -| n_updates | 212130 | -| policy_gradient_loss | 0.0113 | -| std | 0.00668 | -| value_loss | 1.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21215 | -| time_elapsed | 114683 | -| total_timesteps | 2715520 | -| train/ | | -| approx_kl | 0.051907845 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.00541 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 212140 | -| policy_gradient_loss | 0.0273 | -| std | 0.00667 | -| value_loss | 3.83e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21216 | -| time_elapsed | 114688 | -| total_timesteps | 2715648 | -| train/ | | -| approx_kl | 1.2445157 | -| clip_fraction | 0.76 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | 0.323 | -| n_updates | 212150 | -| policy_gradient_loss | 0.173 | -| std | 0.00666 | -| value_loss | 1.02e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21217 | -| time_elapsed | 114693 | -| total_timesteps | 2715776 | -| train/ | | -| approx_kl | 0.0628828 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | 0.057 | -| n_updates | 212160 | -| policy_gradient_loss | 0.00791 | -| std | 0.00666 | -| value_loss | 4.77e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21218 | -| time_elapsed | 114698 | -| total_timesteps | 2715904 | -| train/ | | -| approx_kl | 0.25585198 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | 0.0821 | -| n_updates | 212170 | -| policy_gradient_loss | 0.0196 | -| std | 0.00665 | -| value_loss | 6.07e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21219 | -| time_elapsed | 114704 | -| total_timesteps | 2716032 | -| train/ | | -| approx_kl | 0.018550433 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.326 | -| learning_rate | 0.0003 | -| loss | 0.000826 | -| n_updates | 212180 | -| policy_gradient_loss | 0.0319 | -| std | 0.00664 | -| value_loss | 1.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21220 | -| time_elapsed | 114716 | -| total_timesteps | 2716160 | -| train/ | | -| approx_kl | 0.04625335 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | -0.00821 | -| n_updates | 212190 | -| policy_gradient_loss | -0.000577 | -| std | 0.00664 | -| value_loss | 0.00299 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21221 | -| time_elapsed | 114720 | -| total_timesteps | 2716288 | -| train/ | | -| approx_kl | 0.5636433 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 212200 | -| policy_gradient_loss | 0.0568 | -| std | 0.00664 | -| value_loss | 3.82e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21222 | -| time_elapsed | 114725 | -| total_timesteps | 2716416 | -| train/ | | -| approx_kl | 0.010890666 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -14.4 | -| learning_rate | 0.0003 | -| loss | -0.000977 | -| n_updates | 212210 | -| policy_gradient_loss | 0.00404 | -| std | 0.00664 | -| value_loss | 1.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21223 | -| time_elapsed | 114730 | -| total_timesteps | 2716544 | -| train/ | | -| approx_kl | 0.0028681546 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.000519 | -| learning_rate | 0.0003 | -| loss | -0.00092 | -| n_updates | 212220 | -| policy_gradient_loss | 0.00803 | -| std | 0.00664 | -| value_loss | 8.88e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21224 | -| time_elapsed | 114735 | -| total_timesteps | 2716672 | -| train/ | | -| approx_kl | 0.035044175 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 212230 | -| policy_gradient_loss | 0.104 | -| std | 0.00664 | -| value_loss | 8.11e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21225 | -| time_elapsed | 114739 | -| total_timesteps | 2716800 | -| train/ | | -| approx_kl | 0.08889447 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0767 | -| n_updates | 212240 | -| policy_gradient_loss | 0.109 | -| std | 0.00665 | -| value_loss | 5.62e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21226 | -| time_elapsed | 114743 | -| total_timesteps | 2716928 | -| train/ | | -| approx_kl | 0.12150989 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 212250 | -| policy_gradient_loss | 0.146 | -| std | 0.00665 | -| value_loss | 4.78e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21227 | -| time_elapsed | 114748 | -| total_timesteps | 2717056 | -| train/ | | -| approx_kl | 0.122517705 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.0748 | -| n_updates | 212260 | -| policy_gradient_loss | 0.0621 | -| std | 0.00665 | -| value_loss | 3.85e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21228 | -| time_elapsed | 114757 | -| total_timesteps | 2717184 | -| train/ | | -| approx_kl | 0.027483733 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.0069 | -| n_updates | 212270 | -| policy_gradient_loss | 0.0106 | -| std | 0.00665 | -| value_loss | 0.000998 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21229 | -| time_elapsed | 114761 | -| total_timesteps | 2717312 | -| train/ | | -| approx_kl | 0.17523395 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.654 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 212280 | -| policy_gradient_loss | 0.0096 | -| std | 0.00665 | -| value_loss | 1.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21230 | -| time_elapsed | 114765 | -| total_timesteps | 2717440 | -| train/ | | -| approx_kl | 0.027150635 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | 0.00336 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 212290 | -| policy_gradient_loss | 0.0527 | -| std | 0.00665 | -| value_loss | 7.72e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21231 | -| time_elapsed | 114769 | -| total_timesteps | 2717568 | -| train/ | | -| approx_kl | 0.34612674 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | 0.277 | -| n_updates | 212300 | -| policy_gradient_loss | 0.147 | -| std | 0.00665 | -| value_loss | 8.66e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21232 | -| time_elapsed | 114772 | -| total_timesteps | 2717696 | -| train/ | | -| approx_kl | 0.04629172 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.59 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.00539 | -| n_updates | 212310 | -| policy_gradient_loss | 0.0178 | -| std | 0.00665 | -| value_loss | 7.74e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21233 | -| time_elapsed | 114777 | -| total_timesteps | 2717824 | -| train/ | | -| approx_kl | 0.0012206556 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 212320 | -| policy_gradient_loss | 0.029 | -| std | 0.00664 | -| value_loss | 6.46e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21234 | -| time_elapsed | 114780 | -| total_timesteps | 2717952 | -| train/ | | -| approx_kl | 0.21047775 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | 0.0729 | -| n_updates | 212330 | -| policy_gradient_loss | 0.0175 | -| std | 0.00663 | -| value_loss | 1.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21235 | -| time_elapsed | 114783 | -| total_timesteps | 2718080 | -| train/ | | -| approx_kl | 0.022940252 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0946 | -| learning_rate | 0.0003 | -| loss | -0.00438 | -| n_updates | 212340 | -| policy_gradient_loss | -0.00447 | -| std | 0.00663 | -| value_loss | 1.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21236 | -| time_elapsed | 114793 | -| total_timesteps | 2718208 | -| train/ | | -| approx_kl | 0.011701388 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.726 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 212350 | -| policy_gradient_loss | 0.00364 | -| std | 0.00663 | -| value_loss | 0.00248 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21237 | -| time_elapsed | 114797 | -| total_timesteps | 2718336 | -| train/ | | -| approx_kl | 9.76813e-05 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.65 | -| learning_rate | 0.0003 | -| loss | 0.000465 | -| n_updates | 212360 | -| policy_gradient_loss | 0.0191 | -| std | 0.00663 | -| value_loss | 1.44e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21238 | -| time_elapsed | 114802 | -| total_timesteps | 2718464 | -| train/ | | -| approx_kl | 0.0013638041 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00141 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 212370 | -| policy_gradient_loss | 0.0264 | -| std | 0.00663 | -| value_loss | 7.49e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21239 | -| time_elapsed | 114807 | -| total_timesteps | 2718592 | -| train/ | | -| approx_kl | 0.6101469 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0977 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 212380 | -| policy_gradient_loss | 0.062 | -| std | 0.00663 | -| value_loss | 6.33e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21240 | -| time_elapsed | 114813 | -| total_timesteps | 2718720 | -| train/ | | -| approx_kl | 0.0058813416 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 212390 | -| policy_gradient_loss | 0.00638 | -| std | 0.00663 | -| value_loss | 5.98e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21241 | -| time_elapsed | 114818 | -| total_timesteps | 2718848 | -| train/ | | -| approx_kl | 0.037430115 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 212400 | -| policy_gradient_loss | 0.103 | -| std | 0.00664 | -| value_loss | 2.65e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21242 | -| time_elapsed | 114823 | -| total_timesteps | 2718976 | -| train/ | | -| approx_kl | 0.089266196 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 212410 | -| policy_gradient_loss | 0.0763 | -| std | 0.00664 | -| value_loss | 2.1e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21243 | -| time_elapsed | 114829 | -| total_timesteps | 2719104 | -| train/ | | -| approx_kl | 0.017583018 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.00827 | -| n_updates | 212420 | -| policy_gradient_loss | 0.0209 | -| std | 0.00664 | -| value_loss | 1.85e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21244 | -| time_elapsed | 114840 | -| total_timesteps | 2719232 | -| train/ | | -| approx_kl | 0.20501956 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | 0.0709 | -| n_updates | 212430 | -| policy_gradient_loss | 0.0205 | -| std | 0.00664 | -| value_loss | 0.000833 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21245 | -| time_elapsed | 114845 | -| total_timesteps | 2719360 | -| train/ | | -| approx_kl | 0.014586899 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.63 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 212440 | -| policy_gradient_loss | -0.00263 | -| std | 0.00664 | -| value_loss | 6.11e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21246 | -| time_elapsed | 114850 | -| total_timesteps | 2719488 | -| train/ | | -| approx_kl | 0.02909302 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 212450 | -| policy_gradient_loss | 0.0379 | -| std | 0.00664 | -| value_loss | 6.71e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21247 | -| time_elapsed | 114856 | -| total_timesteps | 2719616 | -| train/ | | -| approx_kl | 0.31919017 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.205 | -| n_updates | 212460 | -| policy_gradient_loss | 0.183 | -| std | 0.00664 | -| value_loss | 5.77e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21248 | -| time_elapsed | 114860 | -| total_timesteps | 2719744 | -| train/ | | -| approx_kl | 0.16815181 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.0987 | -| n_updates | 212470 | -| policy_gradient_loss | 0.13 | -| std | 0.00664 | -| value_loss | 3.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21249 | -| time_elapsed | 114865 | -| total_timesteps | 2719872 | -| train/ | | -| approx_kl | 0.11446982 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.0961 | -| n_updates | 212480 | -| policy_gradient_loss | 0.0956 | -| std | 0.00664 | -| value_loss | 1.37e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21250 | -| time_elapsed | 114869 | -| total_timesteps | 2720000 | -| train/ | | -| approx_kl | 0.025056636 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 212490 | -| policy_gradient_loss | 0.0185 | -| std | 0.00664 | -| value_loss | 1.34e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21251 | -| time_elapsed | 114874 | -| total_timesteps | 2720128 | -| train/ | | -| approx_kl | 0.48290676 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00361 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 212500 | -| policy_gradient_loss | 0.064 | -| std | 0.00664 | -| value_loss | 7.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21252 | -| time_elapsed | 114884 | -| total_timesteps | 2720256 | -| train/ | | -| approx_kl | 0.016922146 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | -0.00966 | -| n_updates | 212510 | -| policy_gradient_loss | -0.00158 | -| std | 0.00664 | -| value_loss | 0.000439 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21253 | -| time_elapsed | 114889 | -| total_timesteps | 2720384 | -| train/ | | -| approx_kl | 0.054723542 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 212520 | -| policy_gradient_loss | 0.0141 | -| std | 0.00663 | -| value_loss | 2.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21254 | -| time_elapsed | 114894 | -| total_timesteps | 2720512 | -| train/ | | -| approx_kl | 0.039399214 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0989 | -| learning_rate | 0.0003 | -| loss | 0.0049 | -| n_updates | 212530 | -| policy_gradient_loss | 0.00269 | -| std | 0.00662 | -| value_loss | 7.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21255 | -| time_elapsed | 114899 | -| total_timesteps | 2720640 | -| train/ | | -| approx_kl | 0.048839547 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 212540 | -| policy_gradient_loss | 0.0136 | -| std | 0.00662 | -| value_loss | 2.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21256 | -| time_elapsed | 114904 | -| total_timesteps | 2720768 | -| train/ | | -| approx_kl | 0.008059323 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 212550 | -| policy_gradient_loss | 0.0087 | -| std | 0.00661 | -| value_loss | 9.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 21257 | -| time_elapsed | 114908 | -| total_timesteps | 2720896 | -| train/ | | -| approx_kl | 0.09644869 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.785 | -| learning_rate | 0.0003 | -| loss | 0.00444 | -| n_updates | 212560 | -| policy_gradient_loss | 0.0246 | -| std | 0.00661 | -| value_loss | 3.83e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21258 | -| time_elapsed | 114914 | -| total_timesteps | 2721024 | -| train/ | | -| approx_kl | 1.0648159 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.349 | -| n_updates | 212570 | -| policy_gradient_loss | 0.217 | -| std | 0.00661 | -| value_loss | 1.89e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21259 | -| time_elapsed | 114925 | -| total_timesteps | 2721152 | -| train/ | | -| approx_kl | 0.1847496 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 212580 | -| policy_gradient_loss | 0.00561 | -| std | 0.0066 | -| value_loss | 0.000864 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21260 | -| time_elapsed | 114933 | -| total_timesteps | 2721280 | -| train/ | | -| approx_kl | 0.095954254 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.555 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 212590 | -| policy_gradient_loss | 0.0243 | -| std | 0.0066 | -| value_loss | 6.23e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21261 | -| time_elapsed | 114939 | -| total_timesteps | 2721408 | -| train/ | | -| approx_kl | 0.3863661 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00981 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 212600 | -| policy_gradient_loss | 0.155 | -| std | 0.0066 | -| value_loss | 2.33e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21262 | -| time_elapsed | 114944 | -| total_timesteps | 2721536 | -| train/ | | -| approx_kl | 0.0007451363 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -6.85e-05 | -| n_updates | 212610 | -| policy_gradient_loss | 0.0292 | -| std | 0.00657 | -| value_loss | 0.000316 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21263 | -| time_elapsed | 114950 | -| total_timesteps | 2721664 | -| train/ | | -| approx_kl | 0.21250923 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 212620 | -| policy_gradient_loss | 0.0807 | -| std | 0.00656 | -| value_loss | 0.000424 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21264 | -| time_elapsed | 114954 | -| total_timesteps | 2721792 | -| train/ | | -| approx_kl | 0.037659097 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.909 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 212630 | -| policy_gradient_loss | 0.0207 | -| std | 0.00656 | -| value_loss | 3.08e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 21265 | -| time_elapsed | 114959 | -| total_timesteps | 2721920 | -| train/ | | -| approx_kl | 0.49650496 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.0122 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 212640 | -| policy_gradient_loss | 0.0548 | -| std | 0.00655 | -| value_loss | 1.11e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21266 | -| time_elapsed | 114966 | -| total_timesteps | 2722048 | -| train/ | | -| approx_kl | 0.011772878 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 212650 | -| policy_gradient_loss | 0.00212 | -| std | 0.00655 | -| value_loss | 7.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21267 | -| time_elapsed | 114973 | -| total_timesteps | 2722176 | -| train/ | | -| approx_kl | 0.018301712 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.27 | -| learning_rate | 0.0003 | -| loss | -0.0261 | -| n_updates | 212660 | -| policy_gradient_loss | -0.00957 | -| std | 0.00655 | -| value_loss | 0.00168 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21268 | -| time_elapsed | 114979 | -| total_timesteps | 2722304 | -| train/ | | -| approx_kl | 0.09212491 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.000772 | -| n_updates | 212670 | -| policy_gradient_loss | -0.00975 | -| std | 0.00655 | -| value_loss | 5.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21269 | -| time_elapsed | 114985 | -| total_timesteps | 2722432 | -| train/ | | -| approx_kl | 0.04434205 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.888 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 212680 | -| policy_gradient_loss | 0.0117 | -| std | 0.00655 | -| value_loss | 1.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21270 | -| time_elapsed | 114991 | -| total_timesteps | 2722560 | -| train/ | | -| approx_kl | 0.04960848 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0833 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 212690 | -| policy_gradient_loss | 0.00725 | -| std | 0.00656 | -| value_loss | 7.98e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21271 | -| time_elapsed | 114996 | -| total_timesteps | 2722688 | -| train/ | | -| approx_kl | 0.009813833 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 212700 | -| policy_gradient_loss | 0.00802 | -| std | 0.00655 | -| value_loss | 5.91e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21272 | -| time_elapsed | 115002 | -| total_timesteps | 2722816 | -| train/ | | -| approx_kl | 0.05790699 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.000702 | -| n_updates | 212710 | -| policy_gradient_loss | -0.004 | -| std | 0.00655 | -| value_loss | 4.99e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21273 | -| time_elapsed | 115006 | -| total_timesteps | 2722944 | -| train/ | | -| approx_kl | 0.03494572 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 212720 | -| policy_gradient_loss | 0.00935 | -| std | 0.00655 | -| value_loss | 3.21e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21274 | -| time_elapsed | 115010 | -| total_timesteps | 2723072 | -| train/ | | -| approx_kl | 0.0070962 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 212730 | -| policy_gradient_loss | 0.00542 | -| std | 0.00656 | -| value_loss | 1.87e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21275 | -| time_elapsed | 115020 | -| total_timesteps | 2723200 | -| train/ | | -| approx_kl | 0.07631502 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | -0.00984 | -| n_updates | 212740 | -| policy_gradient_loss | -0.0116 | -| std | 0.00658 | -| value_loss | 0.00021 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21276 | -| time_elapsed | 115025 | -| total_timesteps | 2723328 | -| train/ | | -| approx_kl | 0.0070167077 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 212750 | -| policy_gradient_loss | 0.00674 | -| std | 0.00659 | -| value_loss | 9.08e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21277 | -| time_elapsed | 115030 | -| total_timesteps | 2723456 | -| train/ | | -| approx_kl | 0.064889744 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.014 | -| learning_rate | 0.0003 | -| loss | 0.00473 | -| n_updates | 212760 | -| policy_gradient_loss | -0.00269 | -| std | 0.00659 | -| value_loss | 2.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21278 | -| time_elapsed | 115035 | -| total_timesteps | 2723584 | -| train/ | | -| approx_kl | 0.01231325 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 212770 | -| policy_gradient_loss | 0.000284 | -| std | 0.00659 | -| value_loss | 1.99e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21279 | -| time_elapsed | 115038 | -| total_timesteps | 2723712 | -| train/ | | -| approx_kl | 0.0005322676 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.000761 | -| n_updates | 212780 | -| policy_gradient_loss | 0.0376 | -| std | 0.00659 | -| value_loss | 1.06e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21280 | -| time_elapsed | 115044 | -| total_timesteps | 2723840 | -| train/ | | -| approx_kl | 0.16732758 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 212790 | -| policy_gradient_loss | 0.0507 | -| std | 0.00659 | -| value_loss | 7.91e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 21281 | -| time_elapsed | 115049 | -| total_timesteps | 2723968 | -| train/ | | -| approx_kl | 0.24039593 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 212800 | -| policy_gradient_loss | 0.0338 | -| std | 0.0066 | -| value_loss | 5.84e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21282 | -| time_elapsed | 115054 | -| total_timesteps | 2724096 | -| train/ | | -| approx_kl | 0.0014005271 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.000441 | -| n_updates | 212810 | -| policy_gradient_loss | 0.0307 | -| std | 0.00659 | -| value_loss | 3.98e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21283 | -| time_elapsed | 115065 | -| total_timesteps | 2724224 | -| train/ | | -| approx_kl | 0.038700625 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | 0.00825 | -| n_updates | 212820 | -| policy_gradient_loss | -0.00151 | -| std | 0.00659 | -| value_loss | 0.000695 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21284 | -| time_elapsed | 115070 | -| total_timesteps | 2724352 | -| train/ | | -| approx_kl | 0.14359845 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 212830 | -| policy_gradient_loss | 0.0258 | -| std | 0.00659 | -| value_loss | 1.39e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21285 | -| time_elapsed | 115075 | -| total_timesteps | 2724480 | -| train/ | | -| approx_kl | 0.00078039663 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00926 | -| learning_rate | 0.0003 | -| loss | -0.00368 | -| n_updates | 212840 | -| policy_gradient_loss | 0.0203 | -| std | 0.00659 | -| value_loss | 2.8e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21286 | -| time_elapsed | 115078 | -| total_timesteps | 2724608 | -| train/ | | -| approx_kl | 0.49520975 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 212850 | -| policy_gradient_loss | 0.0516 | -| std | 0.00659 | -| value_loss | 1.6e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21287 | -| time_elapsed | 115083 | -| total_timesteps | 2724736 | -| train/ | | -| approx_kl | 0.013336444 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.00482 | -| n_updates | 212860 | -| policy_gradient_loss | 0.00993 | -| std | 0.00659 | -| value_loss | 8.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21288 | -| time_elapsed | 115087 | -| total_timesteps | 2724864 | -| train/ | | -| approx_kl | 0.06715186 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0388 | -| n_updates | 212870 | -| policy_gradient_loss | 0.0161 | -| std | 0.00659 | -| value_loss | 4.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 21289 | -| time_elapsed | 115092 | -| total_timesteps | 2724992 | -| train/ | | -| approx_kl | 0.009305075 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0913 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 212880 | -| policy_gradient_loss | 0.00143 | -| std | 0.00659 | -| value_loss | 4.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21290 | -| time_elapsed | 115096 | -| total_timesteps | 2725120 | -| train/ | | -| approx_kl | 0.03040555 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.0294 | -| n_updates | 212890 | -| policy_gradient_loss | 0.0969 | -| std | 0.00659 | -| value_loss | 2.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21291 | -| time_elapsed | 115107 | -| total_timesteps | 2725248 | -| train/ | | -| approx_kl | 0.20381023 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.808 | -| learning_rate | 0.0003 | -| loss | 0.0435 | -| n_updates | 212900 | -| policy_gradient_loss | 0.0461 | -| std | 0.00659 | -| value_loss | 0.000729 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21292 | -| time_elapsed | 115111 | -| total_timesteps | 2725376 | -| train/ | | -| approx_kl | 0.2727501 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -6.46 | -| learning_rate | 0.0003 | -| loss | 0.087 | -| n_updates | 212910 | -| policy_gradient_loss | 0.0524 | -| std | 0.00659 | -| value_loss | 6.47e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21293 | -| time_elapsed | 115116 | -| total_timesteps | 2725504 | -| train/ | | -| approx_kl | 0.23913264 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -2.82 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 212920 | -| policy_gradient_loss | 0.148 | -| std | 0.00659 | -| value_loss | 6.41e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21294 | -| time_elapsed | 115121 | -| total_timesteps | 2725632 | -| train/ | | -| approx_kl | 0.032085408 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 212930 | -| policy_gradient_loss | 0.0244 | -| std | 0.0066 | -| value_loss | 2e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21295 | -| time_elapsed | 115125 | -| total_timesteps | 2725760 | -| train/ | | -| approx_kl | 0.17214996 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0789 | -| learning_rate | 0.0003 | -| loss | 0.0388 | -| n_updates | 212940 | -| policy_gradient_loss | 0.0118 | -| std | 0.0066 | -| value_loss | 1.38e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 21296 | -| time_elapsed | 115130 | -| total_timesteps | 2725888 | -| train/ | | -| approx_kl | 0.02335352 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | -0.00779 | -| n_updates | 212950 | -| policy_gradient_loss | 0.0218 | -| std | 0.0066 | -| value_loss | 1.08e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21297 | -| time_elapsed | 115135 | -| total_timesteps | 2726016 | -| train/ | | -| approx_kl | 0.31096473 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 212960 | -| policy_gradient_loss | 0.11 | -| std | 0.0066 | -| value_loss | 9.03e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21298 | -| time_elapsed | 115146 | -| total_timesteps | 2726144 | -| train/ | | -| approx_kl | 0.0019530952 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.723 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 212970 | -| policy_gradient_loss | 0.00115 | -| std | 0.0066 | -| value_loss | 0.000926 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21299 | -| time_elapsed | 115149 | -| total_timesteps | 2726272 | -| train/ | | -| approx_kl | 0.28349406 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.35 | -| learning_rate | 0.0003 | -| loss | 0.0964 | -| n_updates | 212980 | -| policy_gradient_loss | 0.0239 | -| std | 0.0066 | -| value_loss | 1.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21300 | -| time_elapsed | 115153 | -| total_timesteps | 2726400 | -| train/ | | -| approx_kl | 0.015678946 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00693 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 212990 | -| policy_gradient_loss | 0.026 | -| std | 0.0066 | -| value_loss | 2.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21301 | -| time_elapsed | 115157 | -| total_timesteps | 2726528 | -| train/ | | -| approx_kl | 0.10962045 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 213000 | -| policy_gradient_loss | 0.00656 | -| std | 0.0066 | -| value_loss | 1.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21302 | -| time_elapsed | 115161 | -| total_timesteps | 2726656 | -| train/ | | -| approx_kl | 9.802496e-05 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | -0.000125 | -| n_updates | 213010 | -| policy_gradient_loss | 0.0294 | -| std | 0.0066 | -| value_loss | 7.54e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21303 | -| time_elapsed | 115166 | -| total_timesteps | 2726784 | -| train/ | | -| approx_kl | 0.5622126 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 213020 | -| policy_gradient_loss | 0.0633 | -| std | 0.00661 | -| value_loss | 1.13e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 21304 | -| time_elapsed | 115170 | -| total_timesteps | 2726912 | -| train/ | | -| approx_kl | 0.0106919035 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.000693 | -| n_updates | 213030 | -| policy_gradient_loss | 0.00537 | -| std | 0.00661 | -| value_loss | 5.53e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21305 | -| time_elapsed | 115175 | -| total_timesteps | 2727040 | -| train/ | | -| approx_kl | 0.003125825 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.0044 | -| n_updates | 213040 | -| policy_gradient_loss | 0.00954 | -| std | 0.00661 | -| value_loss | 3.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21306 | -| time_elapsed | 115185 | -| total_timesteps | 2727168 | -| train/ | | -| approx_kl | 0.018156627 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.958 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 213050 | -| policy_gradient_loss | -0.000643 | -| std | 0.00661 | -| value_loss | 0.000525 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21307 | -| time_elapsed | 115190 | -| total_timesteps | 2727296 | -| train/ | | -| approx_kl | 0.075141795 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.0484 | -| n_updates | 213060 | -| policy_gradient_loss | 0.113 | -| std | 0.00661 | -| value_loss | 5.79e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21308 | -| time_elapsed | 115194 | -| total_timesteps | 2727424 | -| train/ | | -| approx_kl | 0.09363063 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | 0.0803 | -| n_updates | 213070 | -| policy_gradient_loss | 0.105 | -| std | 0.00661 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21309 | -| time_elapsed | 115197 | -| total_timesteps | 2727552 | -| train/ | | -| approx_kl | 0.022546029 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.000561 | -| learning_rate | 0.0003 | -| loss | -0.0036 | -| n_updates | 213080 | -| policy_gradient_loss | 0.0257 | -| std | 0.00661 | -| value_loss | 6.08e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21310 | -| time_elapsed | 115201 | -| total_timesteps | 2727680 | -| train/ | | -| approx_kl | 0.00019438611 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.000257 | -| n_updates | 213090 | -| policy_gradient_loss | 0.026 | -| std | 0.00661 | -| value_loss | 2.46e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21311 | -| time_elapsed | 115205 | -| total_timesteps | 2727808 | -| train/ | | -| approx_kl | 0.0010932777 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 213100 | -| policy_gradient_loss | 0.0279 | -| std | 0.00661 | -| value_loss | 1.89e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21312 | -| time_elapsed | 115210 | -| total_timesteps | 2727936 | -| train/ | | -| approx_kl | 0.0027511315 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 213110 | -| policy_gradient_loss | 0.0387 | -| std | 0.0066 | -| value_loss | 9.81e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21313 | -| time_elapsed | 115214 | -| total_timesteps | 2728064 | -| train/ | | -| approx_kl | 0.3926458 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 213120 | -| policy_gradient_loss | 0.0477 | -| std | 0.0066 | -| value_loss | 9.74e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21314 | -| time_elapsed | 115222 | -| total_timesteps | 2728192 | -| train/ | | -| approx_kl | 0.060412966 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 213130 | -| policy_gradient_loss | -0.000497 | -| std | 0.0066 | -| value_loss | 0.00404 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21315 | -| time_elapsed | 115228 | -| total_timesteps | 2728320 | -| train/ | | -| approx_kl | 0.0015035663 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.00163 | -| n_updates | 213140 | -| policy_gradient_loss | 0.0166 | -| std | 0.00659 | -| value_loss | 7.66e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21316 | -| time_elapsed | 115232 | -| total_timesteps | 2728448 | -| train/ | | -| approx_kl | 0.17521621 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | 0.0351 | -| n_updates | 213150 | -| policy_gradient_loss | 0.0108 | -| std | 0.00659 | -| value_loss | 2.31e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21317 | -| time_elapsed | 115235 | -| total_timesteps | 2728576 | -| train/ | | -| approx_kl | 0.0031557484 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0877 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 213160 | -| policy_gradient_loss | 0.0229 | -| std | 0.00659 | -| value_loss | 1.2e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21318 | -| time_elapsed | 115239 | -| total_timesteps | 2728704 | -| train/ | | -| approx_kl | 0.16735926 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 213170 | -| policy_gradient_loss | 0.0168 | -| std | 0.00659 | -| value_loss | 1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21319 | -| time_elapsed | 115243 | -| total_timesteps | 2728832 | -| train/ | | -| approx_kl | 0.015669426 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 213180 | -| policy_gradient_loss | -0.00833 | -| std | 0.00659 | -| value_loss | 5.94e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 21320 | -| time_elapsed | 115247 | -| total_timesteps | 2728960 | -| train/ | | -| approx_kl | 0.0109148435 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0771 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 213190 | -| policy_gradient_loss | -0.00178 | -| std | 0.00659 | -| value_loss | 3.53e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21321 | -| time_elapsed | 115252 | -| total_timesteps | 2729088 | -| train/ | | -| approx_kl | 0.012635778 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0848 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 213200 | -| policy_gradient_loss | -0.00176 | -| std | 0.00659 | -| value_loss | 2.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21322 | -| time_elapsed | 115262 | -| total_timesteps | 2729216 | -| train/ | | -| approx_kl | 0.0056981095 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 213210 | -| policy_gradient_loss | 0.00538 | -| std | 0.00659 | -| value_loss | 0.0002 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21323 | -| time_elapsed | 115267 | -| total_timesteps | 2729344 | -| train/ | | -| approx_kl | 0.22958466 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 213220 | -| policy_gradient_loss | 0.105 | -| std | 0.00659 | -| value_loss | 1.46e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21324 | -| time_elapsed | 115272 | -| total_timesteps | 2729472 | -| train/ | | -| approx_kl | 0.17345 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 213230 | -| policy_gradient_loss | 0.113 | -| std | 0.00659 | -| value_loss | 2.75e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21325 | -| time_elapsed | 115276 | -| total_timesteps | 2729600 | -| train/ | | -| approx_kl | 0.02976081 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0652 | -| learning_rate | 0.0003 | -| loss | 0.00655 | -| n_updates | 213240 | -| policy_gradient_loss | 0.0216 | -| std | 0.00659 | -| value_loss | 2.08e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21326 | -| time_elapsed | 115281 | -| total_timesteps | 2729728 | -| train/ | | -| approx_kl | 0.16445182 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0437 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 213250 | -| policy_gradient_loss | 0.0139 | -| std | 0.00659 | -| value_loss | 1.6e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21327 | -| time_elapsed | 115285 | -| total_timesteps | 2729856 | -| train/ | | -| approx_kl | 0.014774047 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.00582 | -| n_updates | 213260 | -| policy_gradient_loss | 0.00223 | -| std | 0.00659 | -| value_loss | 9.64e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 21328 | -| time_elapsed | 115289 | -| total_timesteps | 2729984 | -| train/ | | -| approx_kl | 0.023006601 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 213270 | -| policy_gradient_loss | 0.0318 | -| std | 0.0066 | -| value_loss | 5.84e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21329 | -| time_elapsed | 115295 | -| total_timesteps | 2730112 | -| train/ | | -| approx_kl | 0.3063769 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 213280 | -| policy_gradient_loss | 0.147 | -| std | 0.0066 | -| value_loss | 5.27e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21330 | -| time_elapsed | 115306 | -| total_timesteps | 2730240 | -| train/ | | -| approx_kl | 0.3235157 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.0359 | -| learning_rate | 0.0003 | -| loss | 0.0599 | -| n_updates | 213290 | -| policy_gradient_loss | 0.0425 | -| std | 0.0066 | -| value_loss | 0.00221 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21331 | -| time_elapsed | 115312 | -| total_timesteps | 2730368 | -| train/ | | -| approx_kl | 0.08773806 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 213300 | -| policy_gradient_loss | 0.0205 | -| std | 0.0066 | -| value_loss | 3e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21332 | -| time_elapsed | 115317 | -| total_timesteps | 2730496 | -| train/ | | -| approx_kl | 6.354833e-05 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00841 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 213310 | -| policy_gradient_loss | 0.0272 | -| std | 0.0066 | -| value_loss | 4.22e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21333 | -| time_elapsed | 115322 | -| total_timesteps | 2730624 | -| train/ | | -| approx_kl | 0.15424602 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 213320 | -| policy_gradient_loss | 0.0158 | -| std | 0.0066 | -| value_loss | 2.1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21334 | -| time_elapsed | 115325 | -| total_timesteps | 2730752 | -| train/ | | -| approx_kl | 0.019473571 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | 0.00323 | -| n_updates | 213330 | -| policy_gradient_loss | 0.000309 | -| std | 0.0066 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21335 | -| time_elapsed | 115328 | -| total_timesteps | 2730880 | -| train/ | | -| approx_kl | 0.015115368 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0483 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 213340 | -| policy_gradient_loss | -0.00794 | -| std | 0.0066 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21336 | -| time_elapsed | 115334 | -| total_timesteps | 2731008 | -| train/ | | -| approx_kl | 0.014948862 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.000417 | -| n_updates | 213350 | -| policy_gradient_loss | 0.00012 | -| std | 0.0066 | -| value_loss | 6.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21337 | -| time_elapsed | 115346 | -| total_timesteps | 2731136 | -| train/ | | -| approx_kl | 0.004238549 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 213360 | -| policy_gradient_loss | 0.00629 | -| std | 0.0066 | -| value_loss | 0.00225 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21338 | -| time_elapsed | 115351 | -| total_timesteps | 2731264 | -| train/ | | -| approx_kl | 0.06402085 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.259 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 213370 | -| policy_gradient_loss | 0.0208 | -| std | 0.0066 | -| value_loss | 8.39e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21339 | -| time_elapsed | 115356 | -| total_timesteps | 2731392 | -| train/ | | -| approx_kl | 0.15598367 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.0674 | -| n_updates | 213380 | -| policy_gradient_loss | 0.0196 | -| std | 0.0066 | -| value_loss | 9.7e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21340 | -| time_elapsed | 115363 | -| total_timesteps | 2731520 | -| train/ | | -| approx_kl | 0.01357431 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 213390 | -| policy_gradient_loss | -0.0068 | -| std | 0.0066 | -| value_loss | 3.27e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21341 | -| time_elapsed | 115370 | -| total_timesteps | 2731648 | -| train/ | | -| approx_kl | 0.0133062005 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.00567 | -| n_updates | 213400 | -| policy_gradient_loss | 0.00274 | -| std | 0.0066 | -| value_loss | 2.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21342 | -| time_elapsed | 115375 | -| total_timesteps | 2731776 | -| train/ | | -| approx_kl | 0.011339909 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 213410 | -| policy_gradient_loss | -0.0065 | -| std | 0.00659 | -| value_loss | 1.44e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21343 | -| time_elapsed | 115379 | -| total_timesteps | 2731904 | -| train/ | | -| approx_kl | 0.0239176 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | -0.000909 | -| n_updates | 213420 | -| policy_gradient_loss | 0.026 | -| std | 0.00659 | -| value_loss | 9.43e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21344 | -| time_elapsed | 115383 | -| total_timesteps | 2732032 | -| train/ | | -| approx_kl | 0.2430317 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 213430 | -| policy_gradient_loss | 0.126 | -| std | 0.0066 | -| value_loss | 1.26e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21345 | -| time_elapsed | 115392 | -| total_timesteps | 2732160 | -| train/ | | -| approx_kl | 0.019298304 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -2.76 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 213440 | -| policy_gradient_loss | 0.0111 | -| std | 0.0066 | -| value_loss | 0.00393 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21346 | -| time_elapsed | 115398 | -| total_timesteps | 2732288 | -| train/ | | -| approx_kl | 0.45829076 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.212 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 213450 | -| policy_gradient_loss | 0.0509 | -| std | 0.0066 | -| value_loss | 2.97e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21347 | -| time_elapsed | 115402 | -| total_timesteps | 2732416 | -| train/ | | -| approx_kl | 0.005850425 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00458 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 213460 | -| policy_gradient_loss | 0.00402 | -| std | 0.00661 | -| value_loss | 9.78e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21348 | -| time_elapsed | 115406 | -| total_timesteps | 2732544 | -| train/ | | -| approx_kl | 0.07634345 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.21 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 213470 | -| policy_gradient_loss | 0.0185 | -| std | 0.00661 | -| value_loss | 1.64e-06 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21349 | -| time_elapsed | 115411 | -| total_timesteps | 2732672 | -| train/ | | -| approx_kl | 0.041983 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00961 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 213480 | -| policy_gradient_loss | 0.0117 | -| std | 0.00661 | -| value_loss | 2.46e-07 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21350 | -| time_elapsed | 115417 | -| total_timesteps | 2732800 | -| train/ | | -| approx_kl | 0.0072068656 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 213490 | -| policy_gradient_loss | 0.00885 | -| std | 0.00661 | -| value_loss | 1.83e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 21351 | -| time_elapsed | 115422 | -| total_timesteps | 2732928 | -| train/ | | -| approx_kl | 0.0016975198 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0527 | -| learning_rate | 0.0003 | -| loss | -0.0002 | -| n_updates | 213500 | -| policy_gradient_loss | 0.00633 | -| std | 0.00661 | -| value_loss | 6.18e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21352 | -| time_elapsed | 115427 | -| total_timesteps | 2733056 | -| train/ | | -| approx_kl | 0.036858834 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 213510 | -| policy_gradient_loss | 0.102 | -| std | 0.00661 | -| value_loss | 7.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21353 | -| time_elapsed | 115436 | -| total_timesteps | 2733184 | -| train/ | | -| approx_kl | 0.078755304 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.428 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 213520 | -| policy_gradient_loss | 0.0395 | -| std | 0.00661 | -| value_loss | 0.00245 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21354 | -| time_elapsed | 115441 | -| total_timesteps | 2733312 | -| train/ | | -| approx_kl | 0.092960276 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -5.71 | -| learning_rate | 0.0003 | -| loss | 0.081 | -| n_updates | 213530 | -| policy_gradient_loss | 0.0806 | -| std | 0.00661 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21355 | -| time_elapsed | 115445 | -| total_timesteps | 2733440 | -| train/ | | -| approx_kl | 0.11696429 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 213540 | -| policy_gradient_loss | 0.118 | -| std | 0.00661 | -| value_loss | 1.75e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21356 | -| time_elapsed | 115450 | -| total_timesteps | 2733568 | -| train/ | | -| approx_kl | 0.14555588 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.0076 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 213550 | -| policy_gradient_loss | 0.128 | -| std | 0.00661 | -| value_loss | 7.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21357 | -| time_elapsed | 115453 | -| total_timesteps | 2733696 | -| train/ | | -| approx_kl | 0.14655387 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 213560 | -| policy_gradient_loss | 0.15 | -| std | 0.00661 | -| value_loss | 4.52e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21358 | -| time_elapsed | 115457 | -| total_timesteps | 2733824 | -| train/ | | -| approx_kl | 0.02137521 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 213570 | -| policy_gradient_loss | 0.022 | -| std | 0.0066 | -| value_loss | 1.32e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21359 | -| time_elapsed | 115460 | -| total_timesteps | 2733952 | -| train/ | | -| approx_kl | 0.16224064 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -69.1 | -| learning_rate | 0.0003 | -| loss | 0.0521 | -| n_updates | 213580 | -| policy_gradient_loss | 0.0171 | -| std | 0.00659 | -| value_loss | 2.38e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21360 | -| time_elapsed | 115464 | -| total_timesteps | 2734080 | -| train/ | | -| approx_kl | 0.016928645 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 213590 | -| policy_gradient_loss | 0.00531 | -| std | 0.00659 | -| value_loss | 7.02e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21361 | -| time_elapsed | 115475 | -| total_timesteps | 2734208 | -| train/ | | -| approx_kl | 0.011690298 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.421 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 213600 | -| policy_gradient_loss | 0.00438 | -| std | 0.00659 | -| value_loss | 0.00172 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21362 | -| time_elapsed | 115480 | -| total_timesteps | 2734336 | -| train/ | | -| approx_kl | 0.21081847 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.4 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 213610 | -| policy_gradient_loss | 0.123 | -| std | 0.00659 | -| value_loss | 8.9e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21363 | -| time_elapsed | 115484 | -| total_timesteps | 2734464 | -| train/ | | -| approx_kl | 0.1878995 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 213620 | -| policy_gradient_loss | 0.126 | -| std | 0.00659 | -| value_loss | 1.94e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21364 | -| time_elapsed | 115488 | -| total_timesteps | 2734592 | -| train/ | | -| approx_kl | 0.031895168 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00557 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 213630 | -| policy_gradient_loss | 0.0234 | -| std | 0.00659 | -| value_loss | 1.19e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21365 | -| time_elapsed | 115493 | -| total_timesteps | 2734720 | -| train/ | | -| approx_kl | 0.5324248 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.195 | -| n_updates | 213640 | -| policy_gradient_loss | 0.0615 | -| std | 0.00659 | -| value_loss | 5.36e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21366 | -| time_elapsed | 115498 | -| total_timesteps | 2734848 | -| train/ | | -| approx_kl | 0.011295771 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | -8.5e-05 | -| n_updates | 213650 | -| policy_gradient_loss | 0.00742 | -| std | 0.0066 | -| value_loss | 4.19e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21367 | -| time_elapsed | 115502 | -| total_timesteps | 2734976 | -| train/ | | -| approx_kl | 0.0026939753 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | -0.000868 | -| n_updates | 213660 | -| policy_gradient_loss | 0.00837 | -| std | 0.00659 | -| value_loss | 2.3e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21368 | -| time_elapsed | 115507 | -| total_timesteps | 2735104 | -| train/ | | -| approx_kl | 6.761402e-06 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | 8.81e-05 | -| n_updates | 213670 | -| policy_gradient_loss | 0.0282 | -| std | 0.00659 | -| value_loss | 3.04e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21369 | -| time_elapsed | 115518 | -| total_timesteps | 2735232 | -| train/ | | -| approx_kl | 0.38747016 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | 0.0933 | -| n_updates | 213680 | -| policy_gradient_loss | 0.024 | -| std | 0.00659 | -| value_loss | 0.00317 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21370 | -| time_elapsed | 115523 | -| total_timesteps | 2735360 | -| train/ | | -| approx_kl | 0.0069744014 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 213690 | -| policy_gradient_loss | 0.0071 | -| std | 0.00659 | -| value_loss | 5.73e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21371 | -| time_elapsed | 115528 | -| total_timesteps | 2735488 | -| train/ | | -| approx_kl | 0.07584402 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00884 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 213700 | -| policy_gradient_loss | 0.00862 | -| std | 0.00658 | -| value_loss | 3.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21372 | -| time_elapsed | 115533 | -| total_timesteps | 2735616 | -| train/ | | -| approx_kl | 0.015984187 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.083 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 213710 | -| policy_gradient_loss | 0.0112 | -| std | 0.00658 | -| value_loss | 3.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21373 | -| time_elapsed | 115539 | -| total_timesteps | 2735744 | -| train/ | | -| approx_kl | 0.054730587 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.000625 | -| n_updates | 213720 | -| policy_gradient_loss | -0.00403 | -| std | 0.00659 | -| value_loss | 3.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21374 | -| time_elapsed | 115544 | -| total_timesteps | 2735872 | -| train/ | | -| approx_kl | 0.013028884 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 213730 | -| policy_gradient_loss | 0.00687 | -| std | 0.00659 | -| value_loss | 2.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21375 | -| time_elapsed | 115548 | -| total_timesteps | 2736000 | -| train/ | | -| approx_kl | 0.0031328406 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 213740 | -| policy_gradient_loss | 0.0085 | -| std | 0.00659 | -| value_loss | 1.68e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21376 | -| time_elapsed | 115552 | -| total_timesteps | 2736128 | -| train/ | | -| approx_kl | 8.4405765e-06 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00785 | -| learning_rate | 0.0003 | -| loss | 0.000316 | -| n_updates | 213750 | -| policy_gradient_loss | 0.0424 | -| std | 0.00658 | -| value_loss | 5.33e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21377 | -| time_elapsed | 115560 | -| total_timesteps | 2736256 | -| train/ | | -| approx_kl | 0.29963103 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.94 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 213760 | -| policy_gradient_loss | 0.0269 | -| std | 0.00658 | -| value_loss | 0.000935 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21378 | -| time_elapsed | 115565 | -| total_timesteps | 2736384 | -| train/ | | -| approx_kl | 0.006067943 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | -0.0099 | -| n_updates | 213770 | -| policy_gradient_loss | 0.00724 | -| std | 0.00658 | -| value_loss | 1.16e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21379 | -| time_elapsed | 115569 | -| total_timesteps | 2736512 | -| train/ | | -| approx_kl | 8.854829e-05 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.00205 | -| learning_rate | 0.0003 | -| loss | 0.000456 | -| n_updates | 213780 | -| policy_gradient_loss | 0.0295 | -| std | 0.00659 | -| value_loss | 2.03e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21380 | -| time_elapsed | 115574 | -| total_timesteps | 2736640 | -| train/ | | -| approx_kl | 0.13626282 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | 0.0903 | -| n_updates | 213790 | -| policy_gradient_loss | 0.0441 | -| std | 0.00659 | -| value_loss | 5.8e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21381 | -| time_elapsed | 115578 | -| total_timesteps | 2736768 | -| train/ | | -| approx_kl | 0.0011322876 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.000491 | -| n_updates | 213800 | -| policy_gradient_loss | 0.011 | -| std | 0.00659 | -| value_loss | 3.69e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21382 | -| time_elapsed | 115583 | -| total_timesteps | 2736896 | -| train/ | | -| approx_kl | 0.009282992 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0176 | -| n_updates | 213810 | -| policy_gradient_loss | 0.00202 | -| std | 0.00659 | -| value_loss | 4.6e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21383 | -| time_elapsed | 115587 | -| total_timesteps | 2737024 | -| train/ | | -| approx_kl | 0.18062125 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 213820 | -| policy_gradient_loss | 0.026 | -| std | 0.00659 | -| value_loss | 1.59e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21384 | -| time_elapsed | 115598 | -| total_timesteps | 2737152 | -| train/ | | -| approx_kl | 0.1565876 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 213830 | -| policy_gradient_loss | 0.00689 | -| std | 0.00658 | -| value_loss | 2.82e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21385 | -| time_elapsed | 115603 | -| total_timesteps | 2737280 | -| train/ | | -| approx_kl | 0.026204258 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 213840 | -| policy_gradient_loss | 0.0337 | -| std | 0.00658 | -| value_loss | 4.41e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21386 | -| time_elapsed | 115608 | -| total_timesteps | 2737408 | -| train/ | | -| approx_kl | 0.275585 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 213850 | -| policy_gradient_loss | 0.12 | -| std | 0.00658 | -| value_loss | 1.57e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21387 | -| time_elapsed | 115613 | -| total_timesteps | 2737536 | -| train/ | | -| approx_kl | 0.18491396 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 213860 | -| policy_gradient_loss | 0.158 | -| std | 0.00658 | -| value_loss | 1.33e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21388 | -| time_elapsed | 115618 | -| total_timesteps | 2737664 | -| train/ | | -| approx_kl | 0.1543004 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0942 | -| n_updates | 213870 | -| policy_gradient_loss | 0.13 | -| std | 0.00658 | -| value_loss | 1.01e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21389 | -| time_elapsed | 115622 | -| total_timesteps | 2737792 | -| train/ | | -| approx_kl | 0.026200578 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.0096 | -| n_updates | 213880 | -| policy_gradient_loss | 0.0244 | -| std | 0.00658 | -| value_loss | 7.82e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21390 | -| time_elapsed | 115626 | -| total_timesteps | 2737920 | -| train/ | | -| approx_kl | 0.14487457 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 213890 | -| policy_gradient_loss | 0.0163 | -| std | 0.00658 | -| value_loss | 5.09e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21391 | -| time_elapsed | 115630 | -| total_timesteps | 2738048 | -| train/ | | -| approx_kl | 0.01661668 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.0019 | -| n_updates | 213900 | -| policy_gradient_loss | 0.000334 | -| std | 0.00658 | -| value_loss | 3.16e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21392 | -| time_elapsed | 115639 | -| total_timesteps | 2738176 | -| train/ | | -| approx_kl | 0.014704995 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.573 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 213910 | -| policy_gradient_loss | 0.000171 | -| std | 0.00658 | -| value_loss | 0.00158 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21393 | -| time_elapsed | 115644 | -| total_timesteps | 2738304 | -| train/ | | -| approx_kl | 0.63152826 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.599 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 213920 | -| policy_gradient_loss | 0.0707 | -| std | 0.00658 | -| value_loss | 2.23e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21394 | -| time_elapsed | 115649 | -| total_timesteps | 2738432 | -| train/ | | -| approx_kl | 0.052654248 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 213930 | -| policy_gradient_loss | 0.0157 | -| std | 0.00658 | -| value_loss | 2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21395 | -| time_elapsed | 115654 | -| total_timesteps | 2738560 | -| train/ | | -| approx_kl | 0.04116637 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 213940 | -| policy_gradient_loss | 0.00858 | -| std | 0.00658 | -| value_loss | 1.7e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21396 | -| time_elapsed | 115659 | -| total_timesteps | 2738688 | -| train/ | | -| approx_kl | 0.0563265 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 213950 | -| policy_gradient_loss | 0.00877 | -| std | 0.00658 | -| value_loss | 1.08e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21397 | -| time_elapsed | 115663 | -| total_timesteps | 2738816 | -| train/ | | -| approx_kl | 0.009384451 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.000138 | -| n_updates | 213960 | -| policy_gradient_loss | 0.00807 | -| std | 0.00658 | -| value_loss | 5.92e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21398 | -| time_elapsed | 115666 | -| total_timesteps | 2738944 | -| train/ | | -| approx_kl | 0.0023367335 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 213970 | -| policy_gradient_loss | 0.00882 | -| std | 0.00658 | -| value_loss | 3.9e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21399 | -| time_elapsed | 115671 | -| total_timesteps | 2739072 | -| train/ | | -| approx_kl | 1.671724e-06 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -2.82e-06 | -| n_updates | 213980 | -| policy_gradient_loss | 0.0406 | -| std | 0.00658 | -| value_loss | 2.44e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21400 | -| time_elapsed | 115680 | -| total_timesteps | 2739200 | -| train/ | | -| approx_kl | 1.0173506 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | 0.332 | -| n_updates | 213990 | -| policy_gradient_loss | 0.136 | -| std | 0.00658 | -| value_loss | 4.08e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21401 | -| time_elapsed | 115684 | -| total_timesteps | 2739328 | -| train/ | | -| approx_kl | 0.008374182 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 214000 | -| policy_gradient_loss | 0.0215 | -| std | 0.00658 | -| value_loss | 1.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21402 | -| time_elapsed | 115688 | -| total_timesteps | 2739456 | -| train/ | | -| approx_kl | 0.26360694 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | 0.00907 | -| learning_rate | 0.0003 | -| loss | 0.218 | -| n_updates | 214010 | -| policy_gradient_loss | 0.16 | -| std | 0.00658 | -| value_loss | 4.74e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21403 | -| time_elapsed | 115691 | -| total_timesteps | 2739584 | -| train/ | | -| approx_kl | 0.23170352 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.6 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 214020 | -| policy_gradient_loss | 0.167 | -| std | 0.00658 | -| value_loss | 4.39e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21404 | -| time_elapsed | 115694 | -| total_timesteps | 2739712 | -| train/ | | -| approx_kl | 0.14011586 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0848 | -| n_updates | 214030 | -| policy_gradient_loss | 0.147 | -| std | 0.00658 | -| value_loss | 2.98e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21405 | -| time_elapsed | 115699 | -| total_timesteps | 2739840 | -| train/ | | -| approx_kl | 0.14357649 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 214040 | -| policy_gradient_loss | 0.1 | -| std | 0.00658 | -| value_loss | 1.06e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 21406 | -| time_elapsed | 115704 | -| total_timesteps | 2739968 | -| train/ | | -| approx_kl | 0.034214005 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 214050 | -| policy_gradient_loss | 0.0314 | -| std | 0.00658 | -| value_loss | 7.95e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21407 | -| time_elapsed | 115708 | -| total_timesteps | 2740096 | -| train/ | | -| approx_kl | 0.046451777 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 214060 | -| policy_gradient_loss | -0.00324 | -| std | 0.00657 | -| value_loss | 1.63e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21408 | -| time_elapsed | 115717 | -| total_timesteps | 2740224 | -| train/ | | -| approx_kl | 0.042134333 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.00387 | -| n_updates | 214070 | -| policy_gradient_loss | 0.00221 | -| std | 0.00657 | -| value_loss | 0.000121 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21409 | -| time_elapsed | 115721 | -| total_timesteps | 2740352 | -| train/ | | -| approx_kl | 0.008359982 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | 0.00658 | -| n_updates | 214080 | -| policy_gradient_loss | 0.0324 | -| std | 0.00657 | -| value_loss | 1.03e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21410 | -| time_elapsed | 115726 | -| total_timesteps | 2740480 | -| train/ | | -| approx_kl | 0.0021500448 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.00602 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 214090 | -| policy_gradient_loss | -0.000136 | -| std | 0.00657 | -| value_loss | 1.81e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21411 | -| time_elapsed | 115731 | -| total_timesteps | 2740608 | -| train/ | | -| approx_kl | 0.09735106 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 214100 | -| policy_gradient_loss | 0.0474 | -| std | 0.00657 | -| value_loss | 1.24e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21412 | -| time_elapsed | 115737 | -| total_timesteps | 2740736 | -| train/ | | -| approx_kl | 0.40311006 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.258 | -| n_updates | 214110 | -| policy_gradient_loss | 0.179 | -| std | 0.00657 | -| value_loss | 1.02e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21413 | -| time_elapsed | 115743 | -| total_timesteps | 2740864 | -| train/ | | -| approx_kl | 0.054211766 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 214120 | -| policy_gradient_loss | 0.0239 | -| std | 0.00657 | -| value_loss | 8.72e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21414 | -| time_elapsed | 115748 | -| total_timesteps | 2740992 | -| train/ | | -| approx_kl | 0.53163105 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 214130 | -| policy_gradient_loss | 0.0401 | -| std | 0.00657 | -| value_loss | 6.02e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21415 | -| time_elapsed | 115754 | -| total_timesteps | 2741120 | -| train/ | | -| approx_kl | 0.040091746 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 214140 | -| policy_gradient_loss | 0.0123 | -| std | 0.00657 | -| value_loss | 3.07e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21416 | -| time_elapsed | 115764 | -| total_timesteps | 2741248 | -| train/ | | -| approx_kl | 0.0028206888 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 214150 | -| policy_gradient_loss | -0.00775 | -| std | 0.00657 | -| value_loss | 0.00455 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21417 | -| time_elapsed | 115769 | -| total_timesteps | 2741376 | -| train/ | | -| approx_kl | 0.07045587 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0393 | -| n_updates | 214160 | -| policy_gradient_loss | 0.0146 | -| std | 0.00657 | -| value_loss | 4.71e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21418 | -| time_elapsed | 115774 | -| total_timesteps | 2741504 | -| train/ | | -| approx_kl | 0.048504803 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.00927 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 214170 | -| policy_gradient_loss | 0.00998 | -| std | 0.00657 | -| value_loss | 4.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21419 | -| time_elapsed | 115779 | -| total_timesteps | 2741632 | -| train/ | | -| approx_kl | 0.04732234 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.0235 | -| n_updates | 214180 | -| policy_gradient_loss | 0.0109 | -| std | 0.00657 | -| value_loss | 2.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21420 | -| time_elapsed | 115783 | -| total_timesteps | 2741760 | -| train/ | | -| approx_kl | 0.008827665 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0968 | -| learning_rate | 0.0003 | -| loss | -0.00552 | -| n_updates | 214190 | -| policy_gradient_loss | 0.00484 | -| std | 0.00657 | -| value_loss | 3.38e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21421 | -| time_elapsed | 115787 | -| total_timesteps | 2741888 | -| train/ | | -| approx_kl | 0.0026760856 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | -4.53e-05 | -| n_updates | 214200 | -| policy_gradient_loss | 0.0102 | -| std | 0.00656 | -| value_loss | 4.53e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21422 | -| time_elapsed | 115791 | -| total_timesteps | 2742016 | -| train/ | | -| approx_kl | 0.1394581 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 214210 | -| policy_gradient_loss | 0.12 | -| std | 0.00655 | -| value_loss | 0.0109 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21423 | -| time_elapsed | 115803 | -| total_timesteps | 2742144 | -| train/ | | -| approx_kl | 0.0017774571 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.00844 | -| n_updates | 214220 | -| policy_gradient_loss | 0.00761 | -| std | 0.00655 | -| value_loss | 0.00652 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21424 | -| time_elapsed | 115808 | -| total_timesteps | 2742272 | -| train/ | | -| approx_kl | 0.006316272 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.00249 | -| learning_rate | 0.0003 | -| loss | -0.004 | -| n_updates | 214230 | -| policy_gradient_loss | 0.0392 | -| std | 0.00655 | -| value_loss | 0.000409 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21425 | -| time_elapsed | 115812 | -| total_timesteps | 2742400 | -| train/ | | -| approx_kl | 0.68873006 | -| clip_fraction | 0.747 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.249 | -| n_updates | 214240 | -| policy_gradient_loss | 0.15 | -| std | 0.00655 | -| value_loss | 0.000191 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21426 | -| time_elapsed | 115816 | -| total_timesteps | 2742528 | -| train/ | | -| approx_kl | 0.009783626 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 214250 | -| policy_gradient_loss | 0.0268 | -| std | 0.00655 | -| value_loss | 0.000111 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21427 | -| time_elapsed | 115822 | -| total_timesteps | 2742656 | -| train/ | | -| approx_kl | 0.081136584 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0527 | -| n_updates | 214260 | -| policy_gradient_loss | 0.0265 | -| std | 0.00655 | -| value_loss | 7.58e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21428 | -| time_elapsed | 115827 | -| total_timesteps | 2742784 | -| train/ | | -| approx_kl | 0.17341602 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.0494 | -| n_updates | 214270 | -| policy_gradient_loss | 0.0212 | -| std | 0.00655 | -| value_loss | 6.15e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21429 | -| time_elapsed | 115831 | -| total_timesteps | 2742912 | -| train/ | | -| approx_kl | 0.02805648 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 214280 | -| policy_gradient_loss | 0.0283 | -| std | 0.00655 | -| value_loss | 4.75e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21430 | -| time_elapsed | 115835 | -| total_timesteps | 2743040 | -| train/ | | -| approx_kl | 0.11122753 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.0422 | -| n_updates | 214290 | -| policy_gradient_loss | 0.0207 | -| std | 0.00655 | -| value_loss | 3.29e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21431 | -| time_elapsed | 115846 | -| total_timesteps | 2743168 | -| train/ | | -| approx_kl | 0.5187592 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | 0.0765 | -| n_updates | 214300 | -| policy_gradient_loss | 0.0225 | -| std | 0.00656 | -| value_loss | 0.00316 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21432 | -| time_elapsed | 115850 | -| total_timesteps | 2743296 | -| train/ | | -| approx_kl | 0.0017337254 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.00604 | -| learning_rate | 0.0003 | -| loss | -0.000488 | -| n_updates | 214310 | -| policy_gradient_loss | 0.00904 | -| std | 0.00655 | -| value_loss | 1.48e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21433 | -| time_elapsed | 115855 | -| total_timesteps | 2743424 | -| train/ | | -| approx_kl | 0.08705485 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 214320 | -| policy_gradient_loss | 0.00953 | -| std | 0.00654 | -| value_loss | 1.64e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21434 | -| time_elapsed | 115859 | -| total_timesteps | 2743552 | -| train/ | | -| approx_kl | 0.00051674293 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.000198 | -| n_updates | 214330 | -| policy_gradient_loss | 0.0127 | -| std | 0.00654 | -| value_loss | 1.26e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21435 | -| time_elapsed | 115864 | -| total_timesteps | 2743680 | -| train/ | | -| approx_kl | 0.20775591 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 214340 | -| policy_gradient_loss | 0.0341 | -| std | 0.00653 | -| value_loss | 1.04e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21436 | -| time_elapsed | 115868 | -| total_timesteps | 2743808 | -| train/ | | -| approx_kl | 0.24170613 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.00892 | -| learning_rate | 0.0003 | -| loss | 0.0619 | -| n_updates | 214350 | -| policy_gradient_loss | 0.02 | -| std | 0.00653 | -| value_loss | 5.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21437 | -| time_elapsed | 115873 | -| total_timesteps | 2743936 | -| train/ | | -| approx_kl | 0.017699152 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 214360 | -| policy_gradient_loss | -0.00746 | -| std | 0.00653 | -| value_loss | 4.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21438 | -| time_elapsed | 115878 | -| total_timesteps | 2744064 | -| train/ | | -| approx_kl | 0.023098305 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.0188 | -| n_updates | 214370 | -| policy_gradient_loss | 0.0124 | -| std | 0.00653 | -| value_loss | 3.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21439 | -| time_elapsed | 115886 | -| total_timesteps | 2744192 | -| train/ | | -| approx_kl | 0.050749674 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 214380 | -| policy_gradient_loss | -0.00475 | -| std | 0.00653 | -| value_loss | 0.00331 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21440 | -| time_elapsed | 115890 | -| total_timesteps | 2744320 | -| train/ | | -| approx_kl | 6.117858e-06 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | 8.55e-05 | -| n_updates | 214390 | -| policy_gradient_loss | 0.0256 | -| std | 0.00653 | -| value_loss | 5.33e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21441 | -| time_elapsed | 115894 | -| total_timesteps | 2744448 | -| train/ | | -| approx_kl | 0.60486877 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.868 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 214400 | -| policy_gradient_loss | 0.0484 | -| std | 0.00653 | -| value_loss | 1.88e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21442 | -| time_elapsed | 115897 | -| total_timesteps | 2744576 | -| train/ | | -| approx_kl | 0.05121019 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0727 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 214410 | -| policy_gradient_loss | 0.012 | -| std | 0.00653 | -| value_loss | 2.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21443 | -| time_elapsed | 115902 | -| total_timesteps | 2744704 | -| train/ | | -| approx_kl | 0.009208072 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -8.9e-05 | -| learning_rate | 0.0003 | -| loss | 0.002 | -| n_updates | 214420 | -| policy_gradient_loss | 0.00774 | -| std | 0.00652 | -| value_loss | 5.5e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21444 | -| time_elapsed | 115906 | -| total_timesteps | 2744832 | -| train/ | | -| approx_kl | 0.0699301 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -1.03 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 214430 | -| policy_gradient_loss | 0.00355 | -| std | 0.00651 | -| value_loss | 1.63e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21445 | -| time_elapsed | 115910 | -| total_timesteps | 2744960 | -| train/ | | -| approx_kl | 0.0103095705 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00606 | -| n_updates | 214440 | -| policy_gradient_loss | 0.00323 | -| std | 0.00651 | -| value_loss | 9.25e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21446 | -| time_elapsed | 115913 | -| total_timesteps | 2745088 | -| train/ | | -| approx_kl | 0.0028487653 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | -0.000521 | -| n_updates | 214450 | -| policy_gradient_loss | 0.00843 | -| std | 0.0065 | -| value_loss | 5.11e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21447 | -| time_elapsed | 115923 | -| total_timesteps | 2745216 | -| train/ | | -| approx_kl | 0.07578052 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.64 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 214460 | -| policy_gradient_loss | -0.00207 | -| std | 0.0065 | -| value_loss | 0.00122 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21448 | -| time_elapsed | 115927 | -| total_timesteps | 2745344 | -| train/ | | -| approx_kl | 1.0296509 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | 0.383 | -| n_updates | 214470 | -| policy_gradient_loss | 0.146 | -| std | 0.0065 | -| value_loss | 9.5e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21449 | -| time_elapsed | 115931 | -| total_timesteps | 2745472 | -| train/ | | -| approx_kl | 0.0023590392 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 214480 | -| policy_gradient_loss | 0.0181 | -| std | 0.00651 | -| value_loss | 1.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21450 | -| time_elapsed | 115936 | -| total_timesteps | 2745600 | -| train/ | | -| approx_kl | 0.16051975 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.0501 | -| n_updates | 214490 | -| policy_gradient_loss | 0.0148 | -| std | 0.00651 | -| value_loss | 9.84e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21451 | -| time_elapsed | 115940 | -| total_timesteps | 2745728 | -| train/ | | -| approx_kl | 0.021753844 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 214500 | -| policy_gradient_loss | 0.0335 | -| std | 0.00651 | -| value_loss | 6.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21452 | -| time_elapsed | 115945 | -| total_timesteps | 2745856 | -| train/ | | -| approx_kl | 0.101810254 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 214510 | -| policy_gradient_loss | 0.0268 | -| std | 0.00651 | -| value_loss | 3.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21453 | -| time_elapsed | 115950 | -| total_timesteps | 2745984 | -| train/ | | -| approx_kl | 0.112470135 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0929 | -| learning_rate | 0.0003 | -| loss | 0.0767 | -| n_updates | 214520 | -| policy_gradient_loss | 0.0213 | -| std | 0.00651 | -| value_loss | 3.58e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21454 | -| time_elapsed | 115955 | -| total_timesteps | 2746112 | -| train/ | | -| approx_kl | 0.011621838 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.00626 | -| n_updates | 214530 | -| policy_gradient_loss | -0.0029 | -| std | 0.00651 | -| value_loss | 1.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21455 | -| time_elapsed | 115967 | -| total_timesteps | 2746240 | -| train/ | | -| approx_kl | 0.006706586 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 214540 | -| policy_gradient_loss | 0.00307 | -| std | 0.00651 | -| value_loss | 0.00117 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21456 | -| time_elapsed | 115971 | -| total_timesteps | 2746368 | -| train/ | | -| approx_kl | 0.00018970761 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.822 | -| learning_rate | 0.0003 | -| loss | 0.000306 | -| n_updates | 214550 | -| policy_gradient_loss | 0.0272 | -| std | 0.00651 | -| value_loss | 4.67e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21457 | -| time_elapsed | 115976 | -| total_timesteps | 2746496 | -| train/ | | -| approx_kl | 0.00097574294 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | -0.000635 | -| n_updates | 214560 | -| policy_gradient_loss | 0.0281 | -| std | 0.00651 | -| value_loss | 1.65e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21458 | -| time_elapsed | 115980 | -| total_timesteps | 2746624 | -| train/ | | -| approx_kl | 0.03742938 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 214570 | -| policy_gradient_loss | 0.0382 | -| std | 0.00651 | -| value_loss | 0.000135 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21459 | -| time_elapsed | 115985 | -| total_timesteps | 2746752 | -| train/ | | -| approx_kl | 0.1488325 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 214580 | -| policy_gradient_loss | 0.0687 | -| std | 0.00651 | -| value_loss | 0.000394 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21460 | -| time_elapsed | 115990 | -| total_timesteps | 2746880 | -| train/ | | -| approx_kl | 0.20266294 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 214590 | -| policy_gradient_loss | 0.0325 | -| std | 0.00651 | -| value_loss | 7.35e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21461 | -| time_elapsed | 115995 | -| total_timesteps | 2747008 | -| train/ | | -| approx_kl | 0.5576581 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00591 | -| learning_rate | 0.0003 | -| loss | 0.215 | -| n_updates | 214600 | -| policy_gradient_loss | 0.06 | -| std | 0.00651 | -| value_loss | 2.85e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21462 | -| time_elapsed | 116007 | -| total_timesteps | 2747136 | -| train/ | | -| approx_kl | 0.0074021453 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.52 | -| learning_rate | 0.0003 | -| loss | -0.00948 | -| n_updates | 214610 | -| policy_gradient_loss | 0.00181 | -| std | 0.00651 | -| value_loss | 0.00157 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21463 | -| time_elapsed | 116011 | -| total_timesteps | 2747264 | -| train/ | | -| approx_kl | 0.08176032 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 214620 | -| policy_gradient_loss | 0.0138 | -| std | 0.00651 | -| value_loss | 9.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21464 | -| time_elapsed | 116015 | -| total_timesteps | 2747392 | -| train/ | | -| approx_kl | 0.044564057 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0865 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 214630 | -| policy_gradient_loss | 0.0168 | -| std | 0.0065 | -| value_loss | 1.31e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21465 | -| time_elapsed | 116020 | -| total_timesteps | 2747520 | -| train/ | | -| approx_kl | 0.0054690544 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00994 | -| learning_rate | 0.0003 | -| loss | -0.000194 | -| n_updates | 214640 | -| policy_gradient_loss | 0.00479 | -| std | 0.0065 | -| value_loss | 5.08e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21466 | -| time_elapsed | 116025 | -| total_timesteps | 2747648 | -| train/ | | -| approx_kl | 0.0026105973 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 214650 | -| policy_gradient_loss | 0.0109 | -| std | 0.00651 | -| value_loss | 1.74e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21467 | -| time_elapsed | 116030 | -| total_timesteps | 2747776 | -| train/ | | -| approx_kl | 0.049977366 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 214660 | -| policy_gradient_loss | 0.113 | -| std | 0.00651 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21468 | -| time_elapsed | 116035 | -| total_timesteps | 2747904 | -| train/ | | -| approx_kl | 0.0130601805 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 214670 | -| policy_gradient_loss | 0.0287 | -| std | 0.00651 | -| value_loss | 1.09e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21469 | -| time_elapsed | 116040 | -| total_timesteps | 2748032 | -| train/ | | -| approx_kl | 0.5801103 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 214680 | -| policy_gradient_loss | 0.0684 | -| std | 0.00651 | -| value_loss | 9.8e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21470 | -| time_elapsed | 116048 | -| total_timesteps | 2748160 | -| train/ | | -| approx_kl | 0.0027941498 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.879 | -| learning_rate | 0.0003 | -| loss | -0.0199 | -| n_updates | 214690 | -| policy_gradient_loss | -0.0105 | -| std | 0.00651 | -| value_loss | 0.0024 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21471 | -| time_elapsed | 116052 | -| total_timesteps | 2748288 | -| train/ | | -| approx_kl | 0.003703007 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00316 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 214700 | -| policy_gradient_loss | 0.03 | -| std | 0.00651 | -| value_loss | 7.19e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21472 | -| time_elapsed | 116057 | -| total_timesteps | 2748416 | -| train/ | | -| approx_kl | 0.5238177 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00382 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 214710 | -| policy_gradient_loss | 0.059 | -| std | 0.00651 | -| value_loss | 1.47e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21473 | -| time_elapsed | 116061 | -| total_timesteps | 2748544 | -| train/ | | -| approx_kl | 0.05910957 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 214720 | -| policy_gradient_loss | 0.0182 | -| std | 0.00651 | -| value_loss | 9.17e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21474 | -| time_elapsed | 116065 | -| total_timesteps | 2748672 | -| train/ | | -| approx_kl | 0.05571776 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.0329 | -| n_updates | 214730 | -| policy_gradient_loss | 0.0159 | -| std | 0.00652 | -| value_loss | 8.79e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21475 | -| time_elapsed | 116068 | -| total_timesteps | 2748800 | -| train/ | | -| approx_kl | 0.04909535 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.0326 | -| n_updates | 214740 | -| policy_gradient_loss | 0.0156 | -| std | 0.00652 | -| value_loss | 4.34e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 21476 | -| time_elapsed | 116072 | -| total_timesteps | 2748928 | -| train/ | | -| approx_kl | 0.05354974 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0695 | -| learning_rate | 0.0003 | -| loss | 0.00355 | -| n_updates | 214750 | -| policy_gradient_loss | 0.00158 | -| std | 0.00651 | -| value_loss | 3.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21477 | -| time_elapsed | 116077 | -| total_timesteps | 2749056 | -| train/ | | -| approx_kl | 0.008569805 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 214760 | -| policy_gradient_loss | 0.00624 | -| std | 0.00651 | -| value_loss | 2.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21478 | -| time_elapsed | 116087 | -| total_timesteps | 2749184 | -| train/ | | -| approx_kl | 0.005102745 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 214770 | -| policy_gradient_loss | 0.00302 | -| std | 0.00649 | -| value_loss | 0.000135 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21479 | -| time_elapsed | 116091 | -| total_timesteps | 2749312 | -| train/ | | -| approx_kl | 0.03853952 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00343 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 214780 | -| policy_gradient_loss | 0.0134 | -| std | 0.00647 | -| value_loss | 3.58e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21480 | -| time_elapsed | 116096 | -| total_timesteps | 2749440 | -| train/ | | -| approx_kl | 0.048765842 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 214790 | -| policy_gradient_loss | 0.0145 | -| std | 0.00644 | -| value_loss | 3.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21481 | -| time_elapsed | 116101 | -| total_timesteps | 2749568 | -| train/ | | -| approx_kl | 0.009818872 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0621 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 214800 | -| policy_gradient_loss | 0.00598 | -| std | 0.00642 | -| value_loss | 1.61e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21482 | -| time_elapsed | 116107 | -| total_timesteps | 2749696 | -| train/ | | -| approx_kl | 0.0012786686 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00238 | -| learning_rate | 0.0003 | -| loss | 0.00645 | -| n_updates | 214810 | -| policy_gradient_loss | 0.00494 | -| std | 0.00641 | -| value_loss | 3.62e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21483 | -| time_elapsed | 116111 | -| total_timesteps | 2749824 | -| train/ | | -| approx_kl | 0.066704385 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 214820 | -| policy_gradient_loss | 0.0152 | -| std | 0.00641 | -| value_loss | 3.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 21484 | -| time_elapsed | 116115 | -| total_timesteps | 2749952 | -| train/ | | -| approx_kl | 0.05337388 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 214830 | -| policy_gradient_loss | 0.0205 | -| std | 0.00641 | -| value_loss | 1.86e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21485 | -| time_elapsed | 116120 | -| total_timesteps | 2750080 | -| train/ | | -| approx_kl | 0.009369463 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0766 | -| learning_rate | 0.0003 | -| loss | -0.000205 | -| n_updates | 214840 | -| policy_gradient_loss | 0.00735 | -| std | 0.00641 | -| value_loss | 1.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21486 | -| time_elapsed | 116127 | -| total_timesteps | 2750208 | -| train/ | | -| approx_kl | 0.032935962 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | -0.00544 | -| n_updates | 214850 | -| policy_gradient_loss | 0.0221 | -| std | 0.00641 | -| value_loss | 0.00161 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21487 | -| time_elapsed | 116132 | -| total_timesteps | 2750336 | -| train/ | | -| approx_kl | 1.53283 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | 0.729 | -| n_updates | 214860 | -| policy_gradient_loss | 0.301 | -| std | 0.00641 | -| value_loss | 9.39e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21488 | -| time_elapsed | 116137 | -| total_timesteps | 2750464 | -| train/ | | -| approx_kl | 0.028849976 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00131 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 214870 | -| policy_gradient_loss | 0.00171 | -| std | 0.00641 | -| value_loss | 2.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21489 | -| time_elapsed | 116143 | -| total_timesteps | 2750592 | -| train/ | | -| approx_kl | 0.021331258 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0161 | -| learning_rate | 0.0003 | -| loss | 0.00438 | -| n_updates | 214880 | -| policy_gradient_loss | 0.000897 | -| std | 0.0064 | -| value_loss | 7.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21490 | -| time_elapsed | 116148 | -| total_timesteps | 2750720 | -| train/ | | -| approx_kl | 0.022993669 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | 0.00977 | -| n_updates | 214890 | -| policy_gradient_loss | 0.0301 | -| std | 0.0064 | -| value_loss | 5.59e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21491 | -| time_elapsed | 116154 | -| total_timesteps | 2750848 | -| train/ | | -| approx_kl | 0.12722646 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.0767 | -| n_updates | 214900 | -| policy_gradient_loss | 0.0373 | -| std | 0.0064 | -| value_loss | 4.31e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21492 | -| time_elapsed | 116158 | -| total_timesteps | 2750976 | -| train/ | | -| approx_kl | 0.119802386 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 214910 | -| policy_gradient_loss | 0.0178 | -| std | 0.0064 | -| value_loss | 2.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21493 | -| time_elapsed | 116164 | -| total_timesteps | 2751104 | -| train/ | | -| approx_kl | 0.012372198 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | 0.00727 | -| n_updates | 214920 | -| policy_gradient_loss | 0.00381 | -| std | 0.0064 | -| value_loss | 2.2e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21494 | -| time_elapsed | 116174 | -| total_timesteps | 2751232 | -| train/ | | -| approx_kl | 0.526979 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.574 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 214930 | -| policy_gradient_loss | 0.00674 | -| std | 0.00639 | -| value_loss | 0.00141 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21495 | -| time_elapsed | 116179 | -| total_timesteps | 2751360 | -| train/ | | -| approx_kl | 0.19079764 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -5.21 | -| learning_rate | 0.0003 | -| loss | 0.0568 | -| n_updates | 214940 | -| policy_gradient_loss | 0.0173 | -| std | 0.00639 | -| value_loss | 2.63e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21496 | -| time_elapsed | 116184 | -| total_timesteps | 2751488 | -| train/ | | -| approx_kl | 0.020509649 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.00422 | -| n_updates | 214950 | -| policy_gradient_loss | 0.0215 | -| std | 0.0064 | -| value_loss | 1.59e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21497 | -| time_elapsed | 116190 | -| total_timesteps | 2751616 | -| train/ | | -| approx_kl | 0.13568035 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0656 | -| learning_rate | 0.0003 | -| loss | 0.0651 | -| n_updates | 214960 | -| policy_gradient_loss | 0.0333 | -| std | 0.0064 | -| value_loss | 1.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21498 | -| time_elapsed | 116196 | -| total_timesteps | 2751744 | -| train/ | | -| approx_kl | 0.15749538 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.0709 | -| n_updates | 214970 | -| policy_gradient_loss | 0.0215 | -| std | 0.0064 | -| value_loss | 6.56e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21499 | -| time_elapsed | 116200 | -| total_timesteps | 2751872 | -| train/ | | -| approx_kl | 0.031853136 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 214980 | -| policy_gradient_loss | 0.0356 | -| std | 0.0064 | -| value_loss | 2.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21500 | -| time_elapsed | 116205 | -| total_timesteps | 2752000 | -| train/ | | -| approx_kl | 0.24519451 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -8.95 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 214990 | -| policy_gradient_loss | 0.0758 | -| std | 0.0064 | -| value_loss | 1.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21501 | -| time_elapsed | 116210 | -| total_timesteps | 2752128 | -| train/ | | -| approx_kl | 0.18422641 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0901 | -| n_updates | 215000 | -| policy_gradient_loss | 0.0849 | -| std | 0.0064 | -| value_loss | 9.89e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21502 | -| time_elapsed | 116223 | -| total_timesteps | 2752256 | -| train/ | | -| approx_kl | 0.49618888 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.856 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 215010 | -| policy_gradient_loss | 0.114 | -| std | 0.0064 | -| value_loss | 0.00281 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21503 | -| time_elapsed | 116229 | -| total_timesteps | 2752384 | -| train/ | | -| approx_kl | 0.09974636 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 215020 | -| policy_gradient_loss | 0.0307 | -| std | 0.0064 | -| value_loss | 3.11e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21504 | -| time_elapsed | 116234 | -| total_timesteps | 2752512 | -| train/ | | -| approx_kl | 0.18321685 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00474 | -| learning_rate | 0.0003 | -| loss | 0.0847 | -| n_updates | 215030 | -| policy_gradient_loss | 0.0281 | -| std | 0.0064 | -| value_loss | 6.83e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21505 | -| time_elapsed | 116238 | -| total_timesteps | 2752640 | -| train/ | | -| approx_kl | 0.03006273 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00992 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 215040 | -| policy_gradient_loss | 0.0359 | -| std | 0.0064 | -| value_loss | 4.36e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21506 | -| time_elapsed | 116244 | -| total_timesteps | 2752768 | -| train/ | | -| approx_kl | 0.35439774 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 215050 | -| policy_gradient_loss | 0.155 | -| std | 0.00641 | -| value_loss | 1.78e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 21507 | -| time_elapsed | 116248 | -| total_timesteps | 2752896 | -| train/ | | -| approx_kl | 0.04660899 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0849 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 215060 | -| policy_gradient_loss | 0.0214 | -| std | 0.00641 | -| value_loss | 1.46e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21508 | -| time_elapsed | 116252 | -| total_timesteps | 2753024 | -| train/ | | -| approx_kl | 0.0006531221 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | 0.0015 | -| n_updates | 215070 | -| policy_gradient_loss | 0.0393 | -| std | 0.00641 | -| value_loss | 1.18e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21509 | -| time_elapsed | 116261 | -| total_timesteps | 2753152 | -| train/ | | -| approx_kl | 0.005426892 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 215080 | -| policy_gradient_loss | -0.00856 | -| std | 0.00641 | -| value_loss | 0.00325 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21510 | -| time_elapsed | 116267 | -| total_timesteps | 2753280 | -| train/ | | -| approx_kl | 0.041103736 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -5.33 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 215090 | -| policy_gradient_loss | 0.0632 | -| std | 0.00641 | -| value_loss | 6.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21511 | -| time_elapsed | 116273 | -| total_timesteps | 2753408 | -| train/ | | -| approx_kl | 0.115373306 | -| clip_fraction | 0.66 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.0861 | -| n_updates | 215100 | -| policy_gradient_loss | 0.131 | -| std | 0.00641 | -| value_loss | 6.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21512 | -| time_elapsed | 116278 | -| total_timesteps | 2753536 | -| train/ | | -| approx_kl | 0.14697257 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0741 | -| n_updates | 215110 | -| policy_gradient_loss | 0.0883 | -| std | 0.00641 | -| value_loss | 3.48e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21513 | -| time_elapsed | 116282 | -| total_timesteps | 2753664 | -| train/ | | -| approx_kl | 0.029800152 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.0096 | -| n_updates | 215120 | -| policy_gradient_loss | 0.0306 | -| std | 0.00641 | -| value_loss | 2.16e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21514 | -| time_elapsed | 116287 | -| total_timesteps | 2753792 | -| train/ | | -| approx_kl | 0.6324018 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 215130 | -| policy_gradient_loss | 0.0525 | -| std | 0.00642 | -| value_loss | 1.58e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21515 | -| time_elapsed | 116292 | -| total_timesteps | 2753920 | -| train/ | | -| approx_kl | 0.046920724 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 215140 | -| policy_gradient_loss | 0.0102 | -| std | 0.00642 | -| value_loss | 1.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21516 | -| time_elapsed | 116297 | -| total_timesteps | 2754048 | -| train/ | | -| approx_kl | 0.008518366 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 215150 | -| policy_gradient_loss | 0.00532 | -| std | 0.00642 | -| value_loss | 1.01e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21517 | -| time_elapsed | 116308 | -| total_timesteps | 2754176 | -| train/ | | -| approx_kl | 0.005873902 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 215160 | -| policy_gradient_loss | 0.045 | -| std | 0.00642 | -| value_loss | 0.00479 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21518 | -| time_elapsed | 116313 | -| total_timesteps | 2754304 | -| train/ | | -| approx_kl | 0.011281133 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.969 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 215170 | -| policy_gradient_loss | 0.0291 | -| std | 0.00642 | -| value_loss | 7.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21519 | -| time_elapsed | 116318 | -| total_timesteps | 2754432 | -| train/ | | -| approx_kl | 0.22355719 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0731 | -| n_updates | 215180 | -| policy_gradient_loss | 0.0203 | -| std | 0.00642 | -| value_loss | 5.8e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21520 | -| time_elapsed | 116323 | -| total_timesteps | 2754560 | -| train/ | | -| approx_kl | 0.02045599 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 215190 | -| policy_gradient_loss | 0.00596 | -| std | 0.00642 | -| value_loss | 3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21521 | -| time_elapsed | 116328 | -| total_timesteps | 2754688 | -| train/ | | -| approx_kl | 0.024770176 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0904 | -| learning_rate | 0.0003 | -| loss | 0.00723 | -| n_updates | 215200 | -| policy_gradient_loss | 0.0274 | -| std | 0.00643 | -| value_loss | 2.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21522 | -| time_elapsed | 116332 | -| total_timesteps | 2754816 | -| train/ | | -| approx_kl | 0.13222373 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 0.084 | -| n_updates | 215210 | -| policy_gradient_loss | 0.0382 | -| std | 0.00644 | -| value_loss | 1.57e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 21523 | -| time_elapsed | 116336 | -| total_timesteps | 2754944 | -| train/ | | -| approx_kl | 0.00019004615 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 215220 | -| policy_gradient_loss | 0.0281 | -| std | 0.00644 | -| value_loss | 1.14e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21524 | -| time_elapsed | 116341 | -| total_timesteps | 2755072 | -| train/ | | -| approx_kl | 0.5336418 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 215230 | -| policy_gradient_loss | 0.054 | -| std | 0.00644 | -| value_loss | 1e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21525 | -| time_elapsed | 116349 | -| total_timesteps | 2755200 | -| train/ | | -| approx_kl | 0.004227111 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 215240 | -| policy_gradient_loss | -0.00739 | -| std | 0.00644 | -| value_loss | 0.000508 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21526 | -| time_elapsed | 116352 | -| total_timesteps | 2755328 | -| train/ | | -| approx_kl | 0.16166788 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 215250 | -| policy_gradient_loss | 0.139 | -| std | 0.00644 | -| value_loss | 7.81e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21527 | -| time_elapsed | 116355 | -| total_timesteps | 2755456 | -| train/ | | -| approx_kl | 0.023967706 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00996 | -| learning_rate | 0.0003 | -| loss | 0.00713 | -| n_updates | 215260 | -| policy_gradient_loss | 0.0222 | -| std | 0.00644 | -| value_loss | 8.31e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21528 | -| time_elapsed | 116358 | -| total_timesteps | 2755584 | -| train/ | | -| approx_kl | 0.00041847676 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.00245 | -| n_updates | 215270 | -| policy_gradient_loss | 0.0354 | -| std | 0.00644 | -| value_loss | 5.11e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21529 | -| time_elapsed | 116362 | -| total_timesteps | 2755712 | -| train/ | | -| approx_kl | 0.50883627 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 215280 | -| policy_gradient_loss | 0.0625 | -| std | 0.00644 | -| value_loss | 4.44e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21530 | -| time_elapsed | 116366 | -| total_timesteps | 2755840 | -| train/ | | -| approx_kl | 0.056082472 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 215290 | -| policy_gradient_loss | 0.0174 | -| std | 0.00644 | -| value_loss | 3.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 21531 | -| time_elapsed | 116372 | -| total_timesteps | 2755968 | -| train/ | | -| approx_kl | 0.009738382 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 215300 | -| policy_gradient_loss | 0.00727 | -| std | 0.00644 | -| value_loss | 2.17e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21532 | -| time_elapsed | 116378 | -| total_timesteps | 2756096 | -| train/ | | -| approx_kl | 0.0010336358 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 215310 | -| policy_gradient_loss | 0.00524 | -| std | 0.00644 | -| value_loss | 1.71e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21533 | -| time_elapsed | 116388 | -| total_timesteps | 2756224 | -| train/ | | -| approx_kl | 0.02653766 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.847 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 215320 | -| policy_gradient_loss | -0.00046 | -| std | 0.00644 | -| value_loss | 0.00286 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21534 | -| time_elapsed | 116392 | -| total_timesteps | 2756352 | -| train/ | | -| approx_kl | 0.0024575074 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 215330 | -| policy_gradient_loss | 0.0107 | -| std | 0.00644 | -| value_loss | 3.57e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21535 | -| time_elapsed | 116397 | -| total_timesteps | 2756480 | -| train/ | | -| approx_kl | 3.8133003e-06 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.00024 | -| n_updates | 215340 | -| policy_gradient_loss | 0.0321 | -| std | 0.00644 | -| value_loss | 2.34e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21536 | -| time_elapsed | 116401 | -| total_timesteps | 2756608 | -| train/ | | -| approx_kl | 0.79252565 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.223 | -| n_updates | 215350 | -| policy_gradient_loss | 0.178 | -| std | 0.00644 | -| value_loss | 1.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21537 | -| time_elapsed | 116405 | -| total_timesteps | 2756736 | -| train/ | | -| approx_kl | 0.011046882 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | -0.0155 | -| n_updates | 215360 | -| policy_gradient_loss | 0.0162 | -| std | 0.00644 | -| value_loss | 1.29e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21538 | -| time_elapsed | 116411 | -| total_timesteps | 2756864 | -| train/ | | -| approx_kl | 0.2540651 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 215370 | -| policy_gradient_loss | 0.134 | -| std | 0.00644 | -| value_loss | 8.59e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 21539 | -| time_elapsed | 116415 | -| total_timesteps | 2756992 | -| train/ | | -| approx_kl | 0.043421857 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 215380 | -| policy_gradient_loss | 0.0246 | -| std | 0.00644 | -| value_loss | 5.49e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21540 | -| time_elapsed | 116418 | -| total_timesteps | 2757120 | -| train/ | | -| approx_kl | 0.0008570859 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 215390 | -| policy_gradient_loss | 0.0301 | -| std | 0.00644 | -| value_loss | 3.66e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21541 | -| time_elapsed | 116429 | -| total_timesteps | 2757248 | -| train/ | | -| approx_kl | 0.019009387 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.00926 | -| n_updates | 215400 | -| policy_gradient_loss | 0.0128 | -| std | 0.00644 | -| value_loss | 0.000194 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21542 | -| time_elapsed | 116434 | -| total_timesteps | 2757376 | -| train/ | | -| approx_kl | 0.22087133 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00937 | -| learning_rate | 0.0003 | -| loss | 0.0756 | -| n_updates | 215410 | -| policy_gradient_loss | 0.0242 | -| std | 0.00644 | -| value_loss | 1.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21543 | -| time_elapsed | 116438 | -| total_timesteps | 2757504 | -| train/ | | -| approx_kl | 0.023293532 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.000757 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 215420 | -| policy_gradient_loss | 0.0368 | -| std | 0.00644 | -| value_loss | 5.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21544 | -| time_elapsed | 116445 | -| total_timesteps | 2757632 | -| train/ | | -| approx_kl | 0.114524536 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 215430 | -| policy_gradient_loss | 0.0308 | -| std | 0.00644 | -| value_loss | 4.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21545 | -| time_elapsed | 116450 | -| total_timesteps | 2757760 | -| train/ | | -| approx_kl | 0.17297098 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.0968 | -| n_updates | 215440 | -| policy_gradient_loss | 0.0336 | -| std | 0.00644 | -| value_loss | 2.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 21546 | -| time_elapsed | 116454 | -| total_timesteps | 2757888 | -| train/ | | -| approx_kl | 0.033027634 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 215450 | -| policy_gradient_loss | 0.0365 | -| std | 0.00644 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21547 | -| time_elapsed | 116461 | -| total_timesteps | 2758016 | -| train/ | | -| approx_kl | 0.32036817 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 215460 | -| policy_gradient_loss | 0.144 | -| std | 0.00644 | -| value_loss | 1.46e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21548 | -| time_elapsed | 116474 | -| total_timesteps | 2758144 | -| train/ | | -| approx_kl | 0.02404583 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 215470 | -| policy_gradient_loss | 0.00703 | -| std | 0.00644 | -| value_loss | 0.000492 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21549 | -| time_elapsed | 116479 | -| total_timesteps | 2758272 | -| train/ | | -| approx_kl | 0.17972617 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.09 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 215480 | -| policy_gradient_loss | 0.0172 | -| std | 0.00644 | -| value_loss | 1.07e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21550 | -| time_elapsed | 116482 | -| total_timesteps | 2758400 | -| train/ | | -| approx_kl | 0.01782978 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00396 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 215490 | -| policy_gradient_loss | 0.00584 | -| std | 0.00644 | -| value_loss | 2.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21551 | -| time_elapsed | 116487 | -| total_timesteps | 2758528 | -| train/ | | -| approx_kl | 0.027762042 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.00478 | -| n_updates | 215500 | -| policy_gradient_loss | 0.0313 | -| std | 0.00644 | -| value_loss | 1.19e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21552 | -| time_elapsed | 116492 | -| total_timesteps | 2758656 | -| train/ | | -| approx_kl | 0.2517079 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 215510 | -| policy_gradient_loss | 0.15 | -| std | 0.00644 | -| value_loss | 2.88e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21553 | -| time_elapsed | 116496 | -| total_timesteps | 2758784 | -| train/ | | -| approx_kl | 0.18477929 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 215520 | -| policy_gradient_loss | 0.141 | -| std | 0.00644 | -| value_loss | 2.56e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21554 | -| time_elapsed | 116501 | -| total_timesteps | 2758912 | -| train/ | | -| approx_kl | 0.14477304 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 215530 | -| policy_gradient_loss | 0.126 | -| std | 0.00644 | -| value_loss | 1.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21555 | -| time_elapsed | 116506 | -| total_timesteps | 2759040 | -| train/ | | -| approx_kl | 0.03451976 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 215540 | -| policy_gradient_loss | 0.0334 | -| std | 0.00644 | -| value_loss | 1.42e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21556 | -| time_elapsed | 116517 | -| total_timesteps | 2759168 | -| train/ | | -| approx_kl | 0.5329459 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.786 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 215550 | -| policy_gradient_loss | 0.0499 | -| std | 0.00644 | -| value_loss | 0.00224 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21557 | -| time_elapsed | 116521 | -| total_timesteps | 2759296 | -| train/ | | -| approx_kl | 0.06573608 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | 0.000635 | -| n_updates | 215560 | -| policy_gradient_loss | -0.00154 | -| std | 0.00644 | -| value_loss | 1.45e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21558 | -| time_elapsed | 116525 | -| total_timesteps | 2759424 | -| train/ | | -| approx_kl | 0.009415941 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00258 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 215570 | -| policy_gradient_loss | 0.00436 | -| std | 0.00644 | -| value_loss | 3.63e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21559 | -| time_elapsed | 116530 | -| total_timesteps | 2759552 | -| train/ | | -| approx_kl | 0.0014398689 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00787 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 215580 | -| policy_gradient_loss | 0.0116 | -| std | 0.00646 | -| value_loss | 2.7e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21560 | -| time_elapsed | 116534 | -| total_timesteps | 2759680 | -| train/ | | -| approx_kl | 0.041938826 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -6.39 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 215590 | -| policy_gradient_loss | 0.0446 | -| std | 0.00647 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21561 | -| time_elapsed | 116538 | -| total_timesteps | 2759808 | -| train/ | | -| approx_kl | 0.0109560955 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 215600 | -| policy_gradient_loss | 0.0268 | -| std | 0.00649 | -| value_loss | 3.12e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 21562 | -| time_elapsed | 116542 | -| total_timesteps | 2759936 | -| train/ | | -| approx_kl | 0.72239757 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 0.194 | -| n_updates | 215610 | -| policy_gradient_loss | 0.0576 | -| std | 0.00649 | -| value_loss | 3.8e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21563 | -| time_elapsed | 116546 | -| total_timesteps | 2760064 | -| train/ | | -| approx_kl | 0.05356045 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 215620 | -| policy_gradient_loss | 0.00816 | -| std | 0.00649 | -| value_loss | 1.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21564 | -| time_elapsed | 116555 | -| total_timesteps | 2760192 | -| train/ | | -| approx_kl | 0.028468499 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | -0.0166 | -| n_updates | 215630 | -| policy_gradient_loss | -0.00625 | -| std | 0.00649 | -| value_loss | 0.000158 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21565 | -| time_elapsed | 116560 | -| total_timesteps | 2760320 | -| train/ | | -| approx_kl | 0.0037556137 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.0057 | -| n_updates | 215640 | -| policy_gradient_loss | 0.0109 | -| std | 0.00649 | -| value_loss | 9.08e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21566 | -| time_elapsed | 116564 | -| total_timesteps | 2760448 | -| train/ | | -| approx_kl | 0.0636247 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 215650 | -| policy_gradient_loss | 0.0157 | -| std | 0.00649 | -| value_loss | 1.57e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21567 | -| time_elapsed | 116569 | -| total_timesteps | 2760576 | -| train/ | | -| approx_kl | 0.009622667 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -34.2 | -| learning_rate | 0.0003 | -| loss | 0.00154 | -| n_updates | 215660 | -| policy_gradient_loss | 0.00458 | -| std | 0.00649 | -| value_loss | 4.86e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21568 | -| time_elapsed | 116574 | -| total_timesteps | 2760704 | -| train/ | | -| approx_kl | 0.07195952 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 215670 | -| policy_gradient_loss | 0.0116 | -| std | 0.00649 | -| value_loss | 3.69e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21569 | -| time_elapsed | 116578 | -| total_timesteps | 2760832 | -| train/ | | -| approx_kl | 0.041138932 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 215680 | -| policy_gradient_loss | -0.00698 | -| std | 0.00649 | -| value_loss | 2.22e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 21570 | -| time_elapsed | 116582 | -| total_timesteps | 2760960 | -| train/ | | -| approx_kl | 0.007892928 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0478 | -| learning_rate | 0.0003 | -| loss | 0.000629 | -| n_updates | 215690 | -| policy_gradient_loss | 0.00725 | -| std | 0.00649 | -| value_loss | 1.21e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21571 | -| time_elapsed | 116587 | -| total_timesteps | 2761088 | -| train/ | | -| approx_kl | 0.0022864402 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 215700 | -| policy_gradient_loss | 0.00951 | -| std | 0.00649 | -| value_loss | 7.67e-11 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21572 | -| time_elapsed | 116595 | -| total_timesteps | 2761216 | -| train/ | | -| approx_kl | 0.035446253 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 215710 | -| policy_gradient_loss | 0.0082 | -| std | 0.00649 | -| value_loss | 0.000241 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21573 | -| time_elapsed | 116600 | -| total_timesteps | 2761344 | -| train/ | | -| approx_kl | 0.10331478 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 215720 | -| policy_gradient_loss | 0.025 | -| std | 0.00649 | -| value_loss | 7.01e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21574 | -| time_elapsed | 116604 | -| total_timesteps | 2761472 | -| train/ | | -| approx_kl | 0.71813655 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 215730 | -| policy_gradient_loss | 0.0394 | -| std | 0.0065 | -| value_loss | 3.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21575 | -| time_elapsed | 116608 | -| total_timesteps | 2761600 | -| train/ | | -| approx_kl | 0.036732666 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 215740 | -| policy_gradient_loss | 0.0133 | -| std | 0.0065 | -| value_loss | 3.76e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21576 | -| time_elapsed | 116612 | -| total_timesteps | 2761728 | -| train/ | | -| approx_kl | 0.0053426847 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 215750 | -| policy_gradient_loss | 0.00564 | -| std | 0.0065 | -| value_loss | 1.27e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21577 | -| time_elapsed | 116617 | -| total_timesteps | 2761856 | -| train/ | | -| approx_kl | 0.00019739429 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0662 | -| learning_rate | 0.0003 | -| loss | 0.000266 | -| n_updates | 215760 | -| policy_gradient_loss | 0.0395 | -| std | 0.0065 | -| value_loss | 4.13e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21578 | -| time_elapsed | 116620 | -| total_timesteps | 2761984 | -| train/ | | -| approx_kl | 0.7913343 | -| clip_fraction | 0.776 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.313 | -| n_updates | 215770 | -| policy_gradient_loss | 0.213 | -| std | 0.00651 | -| value_loss | 8.83e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21579 | -| time_elapsed | 116625 | -| total_timesteps | 2762112 | -| train/ | | -| approx_kl | 0.03127117 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 215780 | -| policy_gradient_loss | -0.00697 | -| std | 0.00651 | -| value_loss | 3.9e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21580 | -| time_elapsed | 116636 | -| total_timesteps | 2762240 | -| train/ | | -| approx_kl | 0.012354834 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | -0.00483 | -| n_updates | 215790 | -| policy_gradient_loss | 0.00331 | -| std | 0.00651 | -| value_loss | 0.000689 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21581 | -| time_elapsed | 116643 | -| total_timesteps | 2762368 | -| train/ | | -| approx_kl | 0.013150831 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 215800 | -| policy_gradient_loss | 0.0387 | -| std | 0.00651 | -| value_loss | 2.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21582 | -| time_elapsed | 116648 | -| total_timesteps | 2762496 | -| train/ | | -| approx_kl | 0.09667507 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 215810 | -| policy_gradient_loss | 0.0316 | -| std | 0.00651 | -| value_loss | 3.02e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21583 | -| time_elapsed | 116653 | -| total_timesteps | 2762624 | -| train/ | | -| approx_kl | 0.0060370793 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 215820 | -| policy_gradient_loss | 0.00648 | -| std | 0.00651 | -| value_loss | 1.48e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21584 | -| time_elapsed | 116658 | -| total_timesteps | 2762752 | -| train/ | | -| approx_kl | 0.25279987 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0069 | -| learning_rate | 0.0003 | -| loss | 0.179 | -| n_updates | 215830 | -| policy_gradient_loss | 0.142 | -| std | 0.00651 | -| value_loss | 3.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21585 | -| time_elapsed | 116663 | -| total_timesteps | 2762880 | -| train/ | | -| approx_kl | 0.14110154 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 215840 | -| policy_gradient_loss | 0.11 | -| std | 0.00651 | -| value_loss | 2.75e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21586 | -| time_elapsed | 116667 | -| total_timesteps | 2763008 | -| train/ | | -| approx_kl | 0.17602503 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 215850 | -| policy_gradient_loss | 0.185 | -| std | 0.00652 | -| value_loss | 2.23e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21587 | -| time_elapsed | 116679 | -| total_timesteps | 2763136 | -| train/ | | -| approx_kl | 0.024358634 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.603 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 215860 | -| policy_gradient_loss | 0.00355 | -| std | 0.00652 | -| value_loss | 0.00285 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21588 | -| time_elapsed | 116684 | -| total_timesteps | 2763264 | -| train/ | | -| approx_kl | 0.622291 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.0234 | -| learning_rate | 0.0003 | -| loss | 0.251 | -| n_updates | 215870 | -| policy_gradient_loss | 0.0838 | -| std | 0.00652 | -| value_loss | 0.0272 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21589 | -| time_elapsed | 116690 | -| total_timesteps | 2763392 | -| train/ | | -| approx_kl | 0.049282968 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.47 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 215880 | -| policy_gradient_loss | 0.0124 | -| std | 0.00651 | -| value_loss | 0.000155 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21590 | -| time_elapsed | 116695 | -| total_timesteps | 2763520 | -| train/ | | -| approx_kl | 0.0101958085 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 215890 | -| policy_gradient_loss | 0.0058 | -| std | 0.00651 | -| value_loss | 1.63e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21591 | -| time_elapsed | 116700 | -| total_timesteps | 2763648 | -| train/ | | -| approx_kl | 0.035064917 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 215900 | -| policy_gradient_loss | 0.0155 | -| std | 0.00651 | -| value_loss | 6.32e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21592 | -| time_elapsed | 116705 | -| total_timesteps | 2763776 | -| train/ | | -| approx_kl | 0.1773676 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.075 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 215910 | -| policy_gradient_loss | 0.0283 | -| std | 0.00651 | -| value_loss | 4.43e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 21593 | -| time_elapsed | 116709 | -| total_timesteps | 2763904 | -| train/ | | -| approx_kl | 0.6003377 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 215920 | -| policy_gradient_loss | 0.0441 | -| std | 0.00651 | -| value_loss | 1.39e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21594 | -| time_elapsed | 116714 | -| total_timesteps | 2764032 | -| train/ | | -| approx_kl | 0.051907193 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 215930 | -| policy_gradient_loss | 0.00734 | -| std | 0.00651 | -| value_loss | 1.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21595 | -| time_elapsed | 116724 | -| total_timesteps | 2764160 | -| train/ | | -| approx_kl | 0.030704085 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -3.9 | -| learning_rate | 0.0003 | -| loss | -0.0277 | -| n_updates | 215940 | -| policy_gradient_loss | -0.00471 | -| std | 0.00651 | -| value_loss | 0.00415 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21596 | -| time_elapsed | 116729 | -| total_timesteps | 2764288 | -| train/ | | -| approx_kl | 0.011014121 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 215950 | -| policy_gradient_loss | 0.0405 | -| std | 0.00651 | -| value_loss | 4.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21597 | -| time_elapsed | 116734 | -| total_timesteps | 2764416 | -| train/ | | -| approx_kl | 0.18194257 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00532 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 215960 | -| policy_gradient_loss | 0.0668 | -| std | 0.00651 | -| value_loss | 7.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21598 | -| time_elapsed | 116740 | -| total_timesteps | 2764544 | -| train/ | | -| approx_kl | 0.04787128 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 215970 | -| policy_gradient_loss | 0.0638 | -| std | 0.0065 | -| value_loss | 4.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21599 | -| time_elapsed | 116744 | -| total_timesteps | 2764672 | -| train/ | | -| approx_kl | 0.12427503 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.0961 | -| n_updates | 215980 | -| policy_gradient_loss | 0.0505 | -| std | 0.0065 | -| value_loss | 2.24e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21600 | -| time_elapsed | 116750 | -| total_timesteps | 2764800 | -| train/ | | -| approx_kl | 0.0063016606 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0942 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 215990 | -| policy_gradient_loss | 0.00485 | -| std | 0.0065 | -| value_loss | 1.62e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21601 | -| time_elapsed | 116756 | -| total_timesteps | 2764928 | -| train/ | | -| approx_kl | 0.034252785 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 216000 | -| policy_gradient_loss | 0.0365 | -| std | 0.0065 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21602 | -| time_elapsed | 116760 | -| total_timesteps | 2765056 | -| train/ | | -| approx_kl | 0.14279455 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | 0.0758 | -| n_updates | 216010 | -| policy_gradient_loss | 0.0591 | -| std | 0.00651 | -| value_loss | 2.29e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21603 | -| time_elapsed | 116771 | -| total_timesteps | 2765184 | -| train/ | | -| approx_kl | 0.0060408674 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 216020 | -| policy_gradient_loss | 0.00813 | -| std | 0.00651 | -| value_loss | 0.000344 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21604 | -| time_elapsed | 116775 | -| total_timesteps | 2765312 | -| train/ | | -| approx_kl | 0.26486573 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -1.22 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 216030 | -| policy_gradient_loss | 0.0707 | -| std | 0.00651 | -| value_loss | 5.11e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21605 | -| time_elapsed | 116780 | -| total_timesteps | 2765440 | -| train/ | | -| approx_kl | 0.012114335 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0516 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 216040 | -| policy_gradient_loss | 0.0108 | -| std | 0.00651 | -| value_loss | 7.5e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21606 | -| time_elapsed | 116784 | -| total_timesteps | 2765568 | -| train/ | | -| approx_kl | 0.2650913 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.235 | -| n_updates | 216050 | -| policy_gradient_loss | 0.0421 | -| std | 0.00651 | -| value_loss | 3.35e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21607 | -| time_elapsed | 116790 | -| total_timesteps | 2765696 | -| train/ | | -| approx_kl | 0.002003002 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -25.7 | -| learning_rate | 0.0003 | -| loss | 0.00088 | -| n_updates | 216060 | -| policy_gradient_loss | 0.000477 | -| std | 0.00652 | -| value_loss | 2.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21608 | -| time_elapsed | 116794 | -| total_timesteps | 2765824 | -| train/ | | -| approx_kl | 0.22867452 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.00965 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 216070 | -| policy_gradient_loss | 0.177 | -| std | 0.00652 | -| value_loss | 4.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21609 | -| time_elapsed | 116799 | -| total_timesteps | 2765952 | -| train/ | | -| approx_kl | 0.041287336 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.00085 | -| n_updates | 216080 | -| policy_gradient_loss | 0.0256 | -| std | 0.00652 | -| value_loss | 1.26e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21610 | -| time_elapsed | 116804 | -| total_timesteps | 2766080 | -| train/ | | -| approx_kl | 0.0015532929 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.0024 | -| learning_rate | 0.0003 | -| loss | 0.00499 | -| n_updates | 216090 | -| policy_gradient_loss | 0.0346 | -| std | 0.00652 | -| value_loss | 6.2e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21611 | -| time_elapsed | 116813 | -| total_timesteps | 2766208 | -| train/ | | -| approx_kl | 0.2934997 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 216100 | -| policy_gradient_loss | 0.0161 | -| std | 0.00652 | -| value_loss | 0.000744 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21612 | -| time_elapsed | 116818 | -| total_timesteps | 2766336 | -| train/ | | -| approx_kl | 0.033245526 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | -0.00572 | -| n_updates | 216110 | -| policy_gradient_loss | 0.0221 | -| std | 0.00652 | -| value_loss | 1.12e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21613 | -| time_elapsed | 116822 | -| total_timesteps | 2766464 | -| train/ | | -| approx_kl | 0.8227218 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.00137 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 216120 | -| policy_gradient_loss | 0.209 | -| std | 0.00652 | -| value_loss | 1.06e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21614 | -| time_elapsed | 116827 | -| total_timesteps | 2766592 | -| train/ | | -| approx_kl | 0.029466407 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 216130 | -| policy_gradient_loss | 0.0024 | -| std | 0.00652 | -| value_loss | 5.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21615 | -| time_elapsed | 116833 | -| total_timesteps | 2766720 | -| train/ | | -| approx_kl | 0.021333866 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 216140 | -| policy_gradient_loss | 0.0324 | -| std | 0.00652 | -| value_loss | 3.57e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21616 | -| time_elapsed | 116839 | -| total_timesteps | 2766848 | -| train/ | | -| approx_kl | 0.27240843 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.213 | -| n_updates | 216150 | -| policy_gradient_loss | 0.157 | -| std | 0.00652 | -| value_loss | 3.3e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21617 | -| time_elapsed | 116843 | -| total_timesteps | 2766976 | -| train/ | | -| approx_kl | 0.044050094 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 216160 | -| policy_gradient_loss | 0.028 | -| std | 0.00652 | -| value_loss | 1.82e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21618 | -| time_elapsed | 116847 | -| total_timesteps | 2767104 | -| train/ | | -| approx_kl | 0.7298099 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 216170 | -| policy_gradient_loss | 0.0489 | -| std | 0.00652 | -| value_loss | 1.46e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21619 | -| time_elapsed | 116858 | -| total_timesteps | 2767232 | -| train/ | | -| approx_kl | 0.013267549 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.389 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 216180 | -| policy_gradient_loss | -0.0111 | -| std | 0.00652 | -| value_loss | 0.00163 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21620 | -| time_elapsed | 116863 | -| total_timesteps | 2767360 | -| train/ | | -| approx_kl | 0.09083556 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 216190 | -| policy_gradient_loss | 0.00245 | -| std | 0.00652 | -| value_loss | 3.24e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21621 | -| time_elapsed | 116867 | -| total_timesteps | 2767488 | -| train/ | | -| approx_kl | 0.0017211861 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.00714 | -| learning_rate | 0.0003 | -| loss | -0.00914 | -| n_updates | 216200 | -| policy_gradient_loss | -0.00615 | -| std | 0.00652 | -| value_loss | 2.99e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21622 | -| time_elapsed | 116872 | -| total_timesteps | 2767616 | -| train/ | | -| approx_kl | 0.050171968 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.000623 | -| n_updates | 216210 | -| policy_gradient_loss | 0.00127 | -| std | 0.00653 | -| value_loss | 1.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21623 | -| time_elapsed | 116877 | -| total_timesteps | 2767744 | -| train/ | | -| approx_kl | 0.008757013 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0985 | -| learning_rate | 0.0003 | -| loss | -0.00704 | -| n_updates | 216220 | -| policy_gradient_loss | 0.00646 | -| std | 0.00653 | -| value_loss | 9.72e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21624 | -| time_elapsed | 116882 | -| total_timesteps | 2767872 | -| train/ | | -| approx_kl | 0.0018801205 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 216230 | -| policy_gradient_loss | 0.00637 | -| std | 0.00653 | -| value_loss | 5.46e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21625 | -| time_elapsed | 116887 | -| total_timesteps | 2768000 | -| train/ | | -| approx_kl | 0.0838023 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 216240 | -| policy_gradient_loss | 0.00886 | -| std | 0.00652 | -| value_loss | 4.72e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21626 | -| time_elapsed | 116892 | -| total_timesteps | 2768128 | -| train/ | | -| approx_kl | 0.042265892 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | 0.00507 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 216250 | -| policy_gradient_loss | 0.0387 | -| std | 0.00652 | -| value_loss | 2.25e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21627 | -| time_elapsed | 116901 | -| total_timesteps | 2768256 | -| train/ | | -| approx_kl | 0.6980494 | -| clip_fraction | 0.757 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 216260 | -| policy_gradient_loss | 0.0818 | -| std | 0.00651 | -| value_loss | 0.00397 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21628 | -| time_elapsed | 116906 | -| total_timesteps | 2768384 | -| train/ | | -| approx_kl | 0.022670222 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.332 | -| learning_rate | 0.0003 | -| loss | -0.00265 | -| n_updates | 216270 | -| policy_gradient_loss | -0.00395 | -| std | 0.00651 | -| value_loss | 7.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21629 | -| time_elapsed | 116910 | -| total_timesteps | 2768512 | -| train/ | | -| approx_kl | 0.017428562 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 216280 | -| policy_gradient_loss | -0.0065 | -| std | 0.0065 | -| value_loss | 5.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21630 | -| time_elapsed | 116913 | -| total_timesteps | 2768640 | -| train/ | | -| approx_kl | 0.024516033 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0854 | -| learning_rate | 0.0003 | -| loss | 0.00745 | -| n_updates | 216290 | -| policy_gradient_loss | 0.0282 | -| std | 0.0065 | -| value_loss | 4.03e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21631 | -| time_elapsed | 116918 | -| total_timesteps | 2768768 | -| train/ | | -| approx_kl | 0.117066875 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | 0.0615 | -| n_updates | 216300 | -| policy_gradient_loss | 0.0308 | -| std | 0.00649 | -| value_loss | 2.55e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 21632 | -| time_elapsed | 116923 | -| total_timesteps | 2768896 | -| train/ | | -| approx_kl | 0.13878207 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0713 | -| learning_rate | 0.0003 | -| loss | 0.0578 | -| n_updates | 216310 | -| policy_gradient_loss | 0.0222 | -| std | 0.00649 | -| value_loss | 1.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21633 | -| time_elapsed | 116928 | -| total_timesteps | 2769024 | -| train/ | | -| approx_kl | 0.02709945 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 216320 | -| policy_gradient_loss | 0.0275 | -| std | 0.00649 | -| value_loss | 1.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21634 | -| time_elapsed | 116940 | -| total_timesteps | 2769152 | -| train/ | | -| approx_kl | 0.38542593 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.811 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 216330 | -| policy_gradient_loss | 0.0777 | -| std | 0.00649 | -| value_loss | 0.0051 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21635 | -| time_elapsed | 116946 | -| total_timesteps | 2769280 | -| train/ | | -| approx_kl | 0.079228535 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.218 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 216340 | -| policy_gradient_loss | 0.0313 | -| std | 0.00649 | -| value_loss | 8.71e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21636 | -| time_elapsed | 116950 | -| total_timesteps | 2769408 | -| train/ | | -| approx_kl | 0.12552057 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | 0.049 | -| n_updates | 216350 | -| policy_gradient_loss | 0.0154 | -| std | 0.00649 | -| value_loss | 2.02e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21637 | -| time_elapsed | 116955 | -| total_timesteps | 2769536 | -| train/ | | -| approx_kl | 0.02785295 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.248 | -| learning_rate | 0.0003 | -| loss | 0.00872 | -| n_updates | 216360 | -| policy_gradient_loss | 0.0347 | -| std | 0.00648 | -| value_loss | 9.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21638 | -| time_elapsed | 116960 | -| total_timesteps | 2769664 | -| train/ | | -| approx_kl | 0.24224037 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 216370 | -| policy_gradient_loss | 0.113 | -| std | 0.00648 | -| value_loss | 1.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21639 | -| time_elapsed | 116965 | -| total_timesteps | 2769792 | -| train/ | | -| approx_kl | 0.04994214 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0778 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 216380 | -| policy_gradient_loss | 0.0248 | -| std | 0.00648 | -| value_loss | 8.56e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21640 | -| time_elapsed | 116970 | -| total_timesteps | 2769920 | -| train/ | | -| approx_kl | 0.00056183105 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0785 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 216390 | -| policy_gradient_loss | 0.0267 | -| std | 0.00648 | -| value_loss | 5e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21641 | -| time_elapsed | 116976 | -| total_timesteps | 2770048 | -| train/ | | -| approx_kl | 0.62246156 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 216400 | -| policy_gradient_loss | 0.0593 | -| std | 0.00648 | -| value_loss | 5.08e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21642 | -| time_elapsed | 116985 | -| total_timesteps | 2770176 | -| train/ | | -| approx_kl | 0.001559014 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 216410 | -| policy_gradient_loss | -0.00323 | -| std | 0.00648 | -| value_loss | 0.00095 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21643 | -| time_elapsed | 116989 | -| total_timesteps | 2770304 | -| train/ | | -| approx_kl | 0.060387738 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.219 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 216420 | -| policy_gradient_loss | 0.144 | -| std | 0.00648 | -| value_loss | 8.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21644 | -| time_elapsed | 116993 | -| total_timesteps | 2770432 | -| train/ | | -| approx_kl | 0.107822716 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00835 | -| learning_rate | 0.0003 | -| loss | 0.0684 | -| n_updates | 216430 | -| policy_gradient_loss | 0.133 | -| std | 0.00648 | -| value_loss | 1.28e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21645 | -| time_elapsed | 116999 | -| total_timesteps | 2770560 | -| train/ | | -| approx_kl | 0.14470583 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -4.18 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 216440 | -| policy_gradient_loss | 0.0487 | -| std | 0.00648 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21646 | -| time_elapsed | 117003 | -| total_timesteps | 2770688 | -| train/ | | -| approx_kl | 0.028072955 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -8.07 | -| learning_rate | 0.0003 | -| loss | 0.00222 | -| n_updates | 216450 | -| policy_gradient_loss | 0.0166 | -| std | 0.00648 | -| value_loss | 2.55e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21647 | -| time_elapsed | 117008 | -| total_timesteps | 2770816 | -| train/ | | -| approx_kl | 0.00035671936 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.00128 | -| n_updates | 216460 | -| policy_gradient_loss | 0.0285 | -| std | 0.00648 | -| value_loss | 4.09e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 21648 | -| time_elapsed | 117012 | -| total_timesteps | 2770944 | -| train/ | | -| approx_kl | 0.0011450979 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.000756 | -| n_updates | 216470 | -| policy_gradient_loss | 0.0304 | -| std | 0.00648 | -| value_loss | 1.36e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21649 | -| time_elapsed | 117016 | -| total_timesteps | 2771072 | -| train/ | | -| approx_kl | 0.0022454225 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | -0.000142 | -| n_updates | 216480 | -| policy_gradient_loss | 0.039 | -| std | 0.00646 | -| value_loss | 1.84e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21650 | -| time_elapsed | 117024 | -| total_timesteps | 2771200 | -| train/ | | -| approx_kl | 0.29586706 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | 0.0915 | -| n_updates | 216490 | -| policy_gradient_loss | 0.0199 | -| std | 0.00646 | -| value_loss | 8.83e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21651 | -| time_elapsed | 117029 | -| total_timesteps | 2771328 | -| train/ | | -| approx_kl | 0.07139097 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.18 | -| learning_rate | 0.0003 | -| loss | 0.00845 | -| n_updates | 216500 | -| policy_gradient_loss | 0.000209 | -| std | 0.00645 | -| value_loss | 2.74e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21652 | -| time_elapsed | 117034 | -| total_timesteps | 2771456 | -| train/ | | -| approx_kl | 0.0122974925 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00581 | -| n_updates | 216510 | -| policy_gradient_loss | 0.00631 | -| std | 0.00645 | -| value_loss | 1.5e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21653 | -| time_elapsed | 117038 | -| total_timesteps | 2771584 | -| train/ | | -| approx_kl | 0.0745164 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00842 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 216520 | -| policy_gradient_loss | 0.00451 | -| std | 0.00645 | -| value_loss | 1.03e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21654 | -| time_elapsed | 117043 | -| total_timesteps | 2771712 | -| train/ | | -| approx_kl | 0.046679318 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 216530 | -| policy_gradient_loss | 0.0128 | -| std | 0.00645 | -| value_loss | 7.03e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21655 | -| time_elapsed | 117049 | -| total_timesteps | 2771840 | -| train/ | | -| approx_kl | 0.054839555 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 216540 | -| policy_gradient_loss | 0.0464 | -| std | 0.00646 | -| value_loss | 3.07e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 21656 | -| time_elapsed | 117053 | -| total_timesteps | 2771968 | -| train/ | | -| approx_kl | 0.03323266 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.488 | -| learning_rate | 0.0003 | -| loss | 0.00839 | -| n_updates | 216550 | -| policy_gradient_loss | 0.033 | -| std | 0.00646 | -| value_loss | 2.53e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21657 | -| time_elapsed | 117057 | -| total_timesteps | 2772096 | -| train/ | | -| approx_kl | 0.15081538 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 216560 | -| policy_gradient_loss | 0.066 | -| std | 0.00646 | -| value_loss | 8.95e-11 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21658 | -| time_elapsed | 117066 | -| total_timesteps | 2772224 | -| train/ | | -| approx_kl | 0.0017732321 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 216570 | -| policy_gradient_loss | -0.00647 | -| std | 0.00646 | -| value_loss | 0.00398 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21659 | -| time_elapsed | 117071 | -| total_timesteps | 2772352 | -| train/ | | -| approx_kl | 0.03824144 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 216580 | -| policy_gradient_loss | 0.0103 | -| std | 0.00646 | -| value_loss | 9.26e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21660 | -| time_elapsed | 117076 | -| total_timesteps | 2772480 | -| train/ | | -| approx_kl | 0.010665503 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.00484 | -| n_updates | 216590 | -| policy_gradient_loss | 0.00961 | -| std | 0.00645 | -| value_loss | 3.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21661 | -| time_elapsed | 117081 | -| total_timesteps | 2772608 | -| train/ | | -| approx_kl | 0.002809675 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.778 | -| learning_rate | 0.0003 | -| loss | -0.00193 | -| n_updates | 216600 | -| policy_gradient_loss | 0.00721 | -| std | 0.00645 | -| value_loss | 2.13e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21662 | -| time_elapsed | 117087 | -| total_timesteps | 2772736 | -| train/ | | -| approx_kl | 4.5327004e-05 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.000488 | -| n_updates | 216610 | -| policy_gradient_loss | 0.0344 | -| std | 0.00647 | -| value_loss | 3.33e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21663 | -| time_elapsed | 117091 | -| total_timesteps | 2772864 | -| train/ | | -| approx_kl | 0.15049674 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 216620 | -| policy_gradient_loss | 0.044 | -| std | 0.00649 | -| value_loss | 3.35e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 21664 | -| time_elapsed | 117095 | -| total_timesteps | 2772992 | -| train/ | | -| approx_kl | 0.0012466153 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.00275 | -| n_updates | 216630 | -| policy_gradient_loss | 0.0142 | -| std | 0.00648 | -| value_loss | 4.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21665 | -| time_elapsed | 117100 | -| total_timesteps | 2773120 | -| train/ | | -| approx_kl | 0.008716787 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.416 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 216640 | -| policy_gradient_loss | 0.00703 | -| std | 0.00648 | -| value_loss | 1.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21666 | -| time_elapsed | 117112 | -| total_timesteps | 2773248 | -| train/ | | -| approx_kl | 0.28300628 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.705 | -| learning_rate | 0.0003 | -| loss | 0.0457 | -| n_updates | 216650 | -| policy_gradient_loss | -0.00414 | -| std | 0.00648 | -| value_loss | 0.00132 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21667 | -| time_elapsed | 117116 | -| total_timesteps | 2773376 | -| train/ | | -| approx_kl | 0.5607381 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -11.8 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 216660 | -| policy_gradient_loss | 0.00658 | -| std | 0.00648 | -| value_loss | 5.77e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21668 | -| time_elapsed | 117121 | -| total_timesteps | 2773504 | -| train/ | | -| approx_kl | 0.013151865 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 216670 | -| policy_gradient_loss | 0.0044 | -| std | 0.00648 | -| value_loss | 5.37e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21669 | -| time_elapsed | 117126 | -| total_timesteps | 2773632 | -| train/ | | -| approx_kl | 0.0032508308 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 216680 | -| policy_gradient_loss | 0.00852 | -| std | 0.00648 | -| value_loss | 3.44e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21670 | -| time_elapsed | 117129 | -| total_timesteps | 2773760 | -| train/ | | -| approx_kl | 0.04055104 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.0462 | -| n_updates | 216690 | -| policy_gradient_loss | 0.0864 | -| std | 0.00649 | -| value_loss | 2.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21671 | -| time_elapsed | 117135 | -| total_timesteps | 2773888 | -| train/ | | -| approx_kl | 0.011098606 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 216700 | -| policy_gradient_loss | 0.0288 | -| std | 0.00649 | -| value_loss | 2.25e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21672 | -| time_elapsed | 117141 | -| total_timesteps | 2774016 | -| train/ | | -| approx_kl | 0.21255529 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0834 | -| n_updates | 216710 | -| policy_gradient_loss | 0.0211 | -| std | 0.00649 | -| value_loss | 1.47e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21673 | -| time_elapsed | 117151 | -| total_timesteps | 2774144 | -| train/ | | -| approx_kl | 0.013085416 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.481 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 216720 | -| policy_gradient_loss | -0.0117 | -| std | 0.00649 | -| value_loss | 0.00294 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21674 | -| time_elapsed | 117156 | -| total_timesteps | 2774272 | -| train/ | | -| approx_kl | 0.15933101 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.485 | -| learning_rate | 0.0003 | -| loss | 0.0399 | -| n_updates | 216730 | -| policy_gradient_loss | 0.0126 | -| std | 0.00649 | -| value_loss | 0.000118 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21675 | -| time_elapsed | 117161 | -| total_timesteps | 2774400 | -| train/ | | -| approx_kl | 0.015905462 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | 0.00027 | -| n_updates | 216740 | -| policy_gradient_loss | -0.000234 | -| std | 0.00648 | -| value_loss | 2.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21676 | -| time_elapsed | 117166 | -| total_timesteps | 2774528 | -| train/ | | -| approx_kl | 0.02456869 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | -0.000355 | -| n_updates | 216750 | -| policy_gradient_loss | 0.0272 | -| std | 0.00648 | -| value_loss | 1.52e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21677 | -| time_elapsed | 117171 | -| total_timesteps | 2774656 | -| train/ | | -| approx_kl | 0.28879905 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 216760 | -| policy_gradient_loss | 0.141 | -| std | 0.00648 | -| value_loss | 4.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21678 | -| time_elapsed | 117173 | -| total_timesteps | 2774784 | -| train/ | | -| approx_kl | 0.057791084 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 216770 | -| policy_gradient_loss | 0.0277 | -| std | 0.00647 | -| value_loss | 1.43e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21679 | -| time_elapsed | 117177 | -| total_timesteps | 2774912 | -| train/ | | -| approx_kl | 0.00052759936 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 6.6e-05 | -| n_updates | 216780 | -| policy_gradient_loss | 0.0281 | -| std | 0.00648 | -| value_loss | 6.35e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21680 | -| time_elapsed | 117182 | -| total_timesteps | 2775040 | -| train/ | | -| approx_kl | 0.0034302864 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | 0.000408 | -| n_updates | 216790 | -| policy_gradient_loss | 0.025 | -| std | 0.00646 | -| value_loss | 9.9e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21681 | -| time_elapsed | 117191 | -| total_timesteps | 2775168 | -| train/ | | -| approx_kl | 0.04177594 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | -0.0038 | -| n_updates | 216800 | -| policy_gradient_loss | 0.028 | -| std | 0.00645 | -| value_loss | 3.46e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21682 | -| time_elapsed | 117196 | -| total_timesteps | 2775296 | -| train/ | | -| approx_kl | 0.004281267 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 216810 | -| policy_gradient_loss | 0.00889 | -| std | 0.00643 | -| value_loss | 1.73e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21683 | -| time_elapsed | 117201 | -| total_timesteps | 2775424 | -| train/ | | -| approx_kl | 4.1083433e-05 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | -9.75e-05 | -| n_updates | 216820 | -| policy_gradient_loss | 0.0206 | -| std | 0.00643 | -| value_loss | 3.09e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21684 | -| time_elapsed | 117205 | -| total_timesteps | 2775552 | -| train/ | | -| approx_kl | 0.00032216404 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | -0.000439 | -| n_updates | 216830 | -| policy_gradient_loss | 0.00912 | -| std | 0.00643 | -| value_loss | 2.18e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21685 | -| time_elapsed | 117208 | -| total_timesteps | 2775680 | -| train/ | | -| approx_kl | 0.07147206 | -| clip_fraction | 0.594 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 216840 | -| policy_gradient_loss | 0.0701 | -| std | 0.00643 | -| value_loss | 1.1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21686 | -| time_elapsed | 117212 | -| total_timesteps | 2775808 | -| train/ | | -| approx_kl | 0.028123975 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 216850 | -| policy_gradient_loss | 0.017 | -| std | 0.00644 | -| value_loss | 4.44e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21687 | -| time_elapsed | 117216 | -| total_timesteps | 2775936 | -| train/ | | -| approx_kl | 0.033653714 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | -0.0268 | -| n_updates | 216860 | -| policy_gradient_loss | 0.0178 | -| std | 0.00644 | -| value_loss | 4.15e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21688 | -| time_elapsed | 117221 | -| total_timesteps | 2776064 | -| train/ | | -| approx_kl | 0.2214218 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.000307 | -| learning_rate | 0.0003 | -| loss | 0.0569 | -| n_updates | 216870 | -| policy_gradient_loss | 0.04 | -| std | 0.00644 | -| value_loss | 1.14e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21689 | -| time_elapsed | 117228 | -| total_timesteps | 2776192 | -| train/ | | -| approx_kl | 0.026214145 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.831 | -| learning_rate | 0.0003 | -| loss | -0.00755 | -| n_updates | 216880 | -| policy_gradient_loss | -0.00692 | -| std | 0.00644 | -| value_loss | 0.00415 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21690 | -| time_elapsed | 117232 | -| total_timesteps | 2776320 | -| train/ | | -| approx_kl | 0.053994145 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | 0.0365 | -| n_updates | 216890 | -| policy_gradient_loss | 0.0976 | -| std | 0.00643 | -| value_loss | 9.75e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21691 | -| time_elapsed | 117237 | -| total_timesteps | 2776448 | -| train/ | | -| approx_kl | 0.01948224 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00859 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 216900 | -| policy_gradient_loss | 0.0176 | -| std | 0.00643 | -| value_loss | 3.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21692 | -| time_elapsed | 117242 | -| total_timesteps | 2776576 | -| train/ | | -| approx_kl | 0.15901467 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.0871 | -| n_updates | 216910 | -| policy_gradient_loss | 0.0346 | -| std | 0.00643 | -| value_loss | 1.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21693 | -| time_elapsed | 117247 | -| total_timesteps | 2776704 | -| train/ | | -| approx_kl | 0.048800386 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 216920 | -| policy_gradient_loss | 0.0541 | -| std | 0.00643 | -| value_loss | 5.91e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21694 | -| time_elapsed | 117251 | -| total_timesteps | 2776832 | -| train/ | | -| approx_kl | 0.0022458732 | -| clip_fraction | 0.569 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0648 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 216930 | -| policy_gradient_loss | 0.0792 | -| std | 0.00643 | -| value_loss | 3.53e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21695 | -| time_elapsed | 117255 | -| total_timesteps | 2776960 | -| train/ | | -| approx_kl | 0.15620437 | -| clip_fraction | 0.694 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0716 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 216940 | -| policy_gradient_loss | 0.176 | -| std | 0.00643 | -| value_loss | 3.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21696 | -| time_elapsed | 117259 | -| total_timesteps | 2777088 | -| train/ | | -| approx_kl | 0.087205715 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0577 | -| n_updates | 216950 | -| policy_gradient_loss | 0.0472 | -| std | 0.00642 | -| value_loss | 4.02e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21697 | -| time_elapsed | 117270 | -| total_timesteps | 2777216 | -| train/ | | -| approx_kl | 0.55393 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | 0.0849 | -| n_updates | 216960 | -| policy_gradient_loss | 0.0412 | -| std | 0.00641 | -| value_loss | 0.000985 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21698 | -| time_elapsed | 117275 | -| total_timesteps | 2777344 | -| train/ | | -| approx_kl | 0.28089467 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.3 | -| learning_rate | 0.0003 | -| loss | 0.0721 | -| n_updates | 216970 | -| policy_gradient_loss | 0.0634 | -| std | 0.00641 | -| value_loss | 2.81e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21699 | -| time_elapsed | 117281 | -| total_timesteps | 2777472 | -| train/ | | -| approx_kl | 0.054814838 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 216980 | -| policy_gradient_loss | 0.0205 | -| std | 0.00641 | -| value_loss | 3.31e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21700 | -| time_elapsed | 117288 | -| total_timesteps | 2777600 | -| train/ | | -| approx_kl | 0.4804734 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.0906 | -| n_updates | 216990 | -| policy_gradient_loss | 0.0232 | -| std | 0.00642 | -| value_loss | 1.5e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21701 | -| time_elapsed | 117293 | -| total_timesteps | 2777728 | -| train/ | | -| approx_kl | 0.040560134 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 217000 | -| policy_gradient_loss | 0.00624 | -| std | 0.00643 | -| value_loss | 1.35e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21702 | -| time_elapsed | 117297 | -| total_timesteps | 2777856 | -| train/ | | -| approx_kl | 0.0073571024 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00563 | -| learning_rate | 0.0003 | -| loss | -0.00353 | -| n_updates | 217010 | -| policy_gradient_loss | 0.00249 | -| std | 0.00644 | -| value_loss | 6.65e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21703 | -| time_elapsed | 117303 | -| total_timesteps | 2777984 | -| train/ | | -| approx_kl | 0.0012472048 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.00852 | -| n_updates | 217020 | -| policy_gradient_loss | 0.00171 | -| std | 0.00644 | -| value_loss | 6.62e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21704 | -| time_elapsed | 117309 | -| total_timesteps | 2778112 | -| train/ | | -| approx_kl | 0.05643639 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.00552 | -| n_updates | 217030 | -| policy_gradient_loss | 0.00107 | -| std | 0.00644 | -| value_loss | 3.92e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21705 | -| time_elapsed | 117322 | -| total_timesteps | 2778240 | -| train/ | | -| approx_kl | 0.068336904 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.484 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 217040 | -| policy_gradient_loss | -0.00884 | -| std | 0.00644 | -| value_loss | 0.00149 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21706 | -| time_elapsed | 117326 | -| total_timesteps | 2778368 | -| train/ | | -| approx_kl | 0.031832617 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 217050 | -| policy_gradient_loss | 0.0115 | -| std | 0.00644 | -| value_loss | 4.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21707 | -| time_elapsed | 117330 | -| total_timesteps | 2778496 | -| train/ | | -| approx_kl | 0.061087526 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 217060 | -| policy_gradient_loss | 0.0154 | -| std | 0.00645 | -| value_loss | 1.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21708 | -| time_elapsed | 117334 | -| total_timesteps | 2778624 | -| train/ | | -| approx_kl | 0.051806502 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 217070 | -| policy_gradient_loss | 0.00871 | -| std | 0.00644 | -| value_loss | 2.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21709 | -| time_elapsed | 117339 | -| total_timesteps | 2778752 | -| train/ | | -| approx_kl | 0.05151008 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00969 | -| learning_rate | 0.0003 | -| loss | 0.00604 | -| n_updates | 217080 | -| policy_gradient_loss | 0.00247 | -| std | 0.00644 | -| value_loss | 6.07e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 21710 | -| time_elapsed | 117343 | -| total_timesteps | 2778880 | -| train/ | | -| approx_kl | 0.010209672 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 217090 | -| policy_gradient_loss | 0.0053 | -| std | 0.00644 | -| value_loss | 4.18e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21711 | -| time_elapsed | 117347 | -| total_timesteps | 2779008 | -| train/ | | -| approx_kl | 0.0024554832 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | -0.000299 | -| n_updates | 217100 | -| policy_gradient_loss | 0.00998 | -| std | 0.00644 | -| value_loss | 8.03e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21712 | -| time_elapsed | 117359 | -| total_timesteps | 2779136 | -| train/ | | -| approx_kl | 0.026793592 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 217110 | -| policy_gradient_loss | -0.00755 | -| std | 0.00643 | -| value_loss | 0.000802 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21713 | -| time_elapsed | 117366 | -| total_timesteps | 2779264 | -| train/ | | -| approx_kl | 0.0018433835 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.051 | -| learning_rate | 0.0003 | -| loss | -0.00943 | -| n_updates | 217120 | -| policy_gradient_loss | 0.0335 | -| std | 0.00643 | -| value_loss | 0.00259 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21714 | -| time_elapsed | 117371 | -| total_timesteps | 2779392 | -| train/ | | -| approx_kl | 0.8444875 | -| clip_fraction | 0.782 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.368 | -| learning_rate | 0.0003 | -| loss | 0.268 | -| n_updates | 217130 | -| policy_gradient_loss | 0.224 | -| std | 0.00643 | -| value_loss | 0.000462 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21715 | -| time_elapsed | 117377 | -| total_timesteps | 2779520 | -| train/ | | -| approx_kl | 0.029331494 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.00792 | -| n_updates | 217140 | -| policy_gradient_loss | 0.000775 | -| std | 0.00643 | -| value_loss | 5.63e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21716 | -| time_elapsed | 117382 | -| total_timesteps | 2779648 | -| train/ | | -| approx_kl | 0.013007002 | -| clip_fraction | 0.0727 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 217150 | -| policy_gradient_loss | -0.00188 | -| std | 0.00643 | -| value_loss | 2.23e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21717 | -| time_elapsed | 117386 | -| total_timesteps | 2779776 | -| train/ | | -| approx_kl | 0.030147502 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0727 | -| learning_rate | 0.0003 | -| loss | 0.00795 | -| n_updates | 217160 | -| policy_gradient_loss | 0.0309 | -| std | 0.00643 | -| value_loss | 1.58e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 21718 | -| time_elapsed | 117391 | -| total_timesteps | 2779904 | -| train/ | | -| approx_kl | 0.11971749 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 217170 | -| policy_gradient_loss | 0.0229 | -| std | 0.00643 | -| value_loss | 1.39e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21719 | -| time_elapsed | 117394 | -| total_timesteps | 2780032 | -| train/ | | -| approx_kl | 0.007404257 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 217180 | -| policy_gradient_loss | 0.00884 | -| std | 0.00643 | -| value_loss | 9.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21720 | -| time_elapsed | 117403 | -| total_timesteps | 2780160 | -| train/ | | -| approx_kl | 0.08306318 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 217190 | -| policy_gradient_loss | 0.00143 | -| std | 0.00643 | -| value_loss | 0.0003 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21721 | -| time_elapsed | 117407 | -| total_timesteps | 2780288 | -| train/ | | -| approx_kl | 0.5445104 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 217200 | -| policy_gradient_loss | 0.0604 | -| std | 0.00643 | -| value_loss | 2.06e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21722 | -| time_elapsed | 117411 | -| total_timesteps | 2780416 | -| train/ | | -| approx_kl | 0.012466568 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 217210 | -| policy_gradient_loss | 0.00339 | -| std | 0.00642 | -| value_loss | 3.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21723 | -| time_elapsed | 117417 | -| total_timesteps | 2780544 | -| train/ | | -| approx_kl | 0.0029688268 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 217220 | -| policy_gradient_loss | 0.00689 | -| std | 0.00642 | -| value_loss | 1.13e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21724 | -| time_elapsed | 117423 | -| total_timesteps | 2780672 | -| train/ | | -| approx_kl | 1.5191268e-05 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0662 | -| learning_rate | 0.0003 | -| loss | 0.000379 | -| n_updates | 217230 | -| policy_gradient_loss | 0.0305 | -| std | 0.00642 | -| value_loss | 2.06e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21725 | -| time_elapsed | 117427 | -| total_timesteps | 2780800 | -| train/ | | -| approx_kl | 0.17610501 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 217240 | -| policy_gradient_loss | 0.0497 | -| std | 0.00642 | -| value_loss | 1.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 21726 | -| time_elapsed | 117432 | -| total_timesteps | 2780928 | -| train/ | | -| approx_kl | 0.01132777 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 217250 | -| policy_gradient_loss | 0.0141 | -| std | 0.00642 | -| value_loss | 6.62e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21727 | -| time_elapsed | 117436 | -| total_timesteps | 2781056 | -| train/ | | -| approx_kl | 1.4538411e-05 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | -0.000255 | -| n_updates | 217260 | -| policy_gradient_loss | 0.0134 | -| std | 0.00642 | -| value_loss | 5.45e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21728 | -| time_elapsed | 117443 | -| total_timesteps | 2781184 | -| train/ | | -| approx_kl | 0.0048002168 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | -0.00998 | -| n_updates | 217270 | -| policy_gradient_loss | 0.000937 | -| std | 0.0064 | -| value_loss | 0.000616 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21729 | -| time_elapsed | 117447 | -| total_timesteps | 2781312 | -| train/ | | -| approx_kl | 0.00038440851 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.000737 | -| n_updates | 217280 | -| policy_gradient_loss | 0.0276 | -| std | 0.0064 | -| value_loss | 5.6e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21730 | -| time_elapsed | 117452 | -| total_timesteps | 2781440 | -| train/ | | -| approx_kl | 0.84160966 | -| clip_fraction | 0.761 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0701 | -| learning_rate | 0.0003 | -| loss | 0.298 | -| n_updates | 217290 | -| policy_gradient_loss | 0.164 | -| std | 0.00639 | -| value_loss | 2.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21731 | -| time_elapsed | 117456 | -| total_timesteps | 2781568 | -| train/ | | -| approx_kl | 0.021613624 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 217300 | -| policy_gradient_loss | 0.00392 | -| std | 0.00639 | -| value_loss | 1.91e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21732 | -| time_elapsed | 117461 | -| total_timesteps | 2781696 | -| train/ | | -| approx_kl | 0.020047963 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.00605 | -| n_updates | 217310 | -| policy_gradient_loss | 0.0259 | -| std | 0.0064 | -| value_loss | 1.2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21733 | -| time_elapsed | 117466 | -| total_timesteps | 2781824 | -| train/ | | -| approx_kl | 0.24497518 | -| clip_fraction | 0.722 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 217320 | -| policy_gradient_loss | 0.103 | -| std | 0.0064 | -| value_loss | 8.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 21734 | -| time_elapsed | 117470 | -| total_timesteps | 2781952 | -| train/ | | -| approx_kl | 0.18384902 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 217330 | -| policy_gradient_loss | 0.139 | -| std | 0.0064 | -| value_loss | 5.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21735 | -| time_elapsed | 117476 | -| total_timesteps | 2782080 | -| train/ | | -| approx_kl | 0.031892538 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 217340 | -| policy_gradient_loss | 0.026 | -| std | 0.0064 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21736 | -| time_elapsed | 117485 | -| total_timesteps | 2782208 | -| train/ | | -| approx_kl | 0.020027023 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.539 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 217350 | -| policy_gradient_loss | 0.00714 | -| std | 0.0064 | -| value_loss | 0.00147 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21737 | -| time_elapsed | 117489 | -| total_timesteps | 2782336 | -| train/ | | -| approx_kl | 0.23473963 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 217360 | -| policy_gradient_loss | 0.00612 | -| std | 0.0064 | -| value_loss | 4.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21738 | -| time_elapsed | 117494 | -| total_timesteps | 2782464 | -| train/ | | -| approx_kl | 0.025645452 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0731 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 217370 | -| policy_gradient_loss | -0.0125 | -| std | 0.0064 | -| value_loss | 9.11e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21739 | -| time_elapsed | 117499 | -| total_timesteps | 2782592 | -| train/ | | -| approx_kl | 0.017670546 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 217380 | -| policy_gradient_loss | -0.00949 | -| std | 0.0064 | -| value_loss | 4.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21740 | -| time_elapsed | 117504 | -| total_timesteps | 2782720 | -| train/ | | -| approx_kl | 0.030124154 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0761 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 217390 | -| policy_gradient_loss | 0.0207 | -| std | 0.0064 | -| value_loss | 3.36e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21741 | -| time_elapsed | 117509 | -| total_timesteps | 2782848 | -| train/ | | -| approx_kl | 0.11010632 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | 0.0288 | -| n_updates | 217400 | -| policy_gradient_loss | 0.0169 | -| std | 0.0064 | -| value_loss | 2.46e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21742 | -| time_elapsed | 117513 | -| total_timesteps | 2782976 | -| train/ | | -| approx_kl | 0.00022752257 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | -0.00349 | -| n_updates | 217410 | -| policy_gradient_loss | 0.0289 | -| std | 0.0064 | -| value_loss | 1.84e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21743 | -| time_elapsed | 117516 | -| total_timesteps | 2783104 | -| train/ | | -| approx_kl | 0.56815565 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 217420 | -| policy_gradient_loss | 0.0551 | -| std | 0.0064 | -| value_loss | 1.12e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21744 | -| time_elapsed | 117523 | -| total_timesteps | 2783232 | -| train/ | | -| approx_kl | 0.16100061 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.73 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 217430 | -| policy_gradient_loss | -0.0105 | -| std | 0.00641 | -| value_loss | 0.00101 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21745 | -| time_elapsed | 117527 | -| total_timesteps | 2783360 | -| train/ | | -| approx_kl | 0.015774317 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 217440 | -| policy_gradient_loss | 0.0114 | -| std | 0.00641 | -| value_loss | 7.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21746 | -| time_elapsed | 117530 | -| total_timesteps | 2783488 | -| train/ | | -| approx_kl | 0.24248414 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 217450 | -| policy_gradient_loss | 0.138 | -| std | 0.00641 | -| value_loss | 6.39e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21747 | -| time_elapsed | 117535 | -| total_timesteps | 2783616 | -| train/ | | -| approx_kl | 0.14652142 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.0888 | -| n_updates | 217460 | -| policy_gradient_loss | 0.0823 | -| std | 0.00641 | -| value_loss | 3.2e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21748 | -| time_elapsed | 117539 | -| total_timesteps | 2783744 | -| train/ | | -| approx_kl | 0.17971383 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | 0.0573 | -| n_updates | 217470 | -| policy_gradient_loss | 0.0816 | -| std | 0.00644 | -| value_loss | 5.1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21749 | -| time_elapsed | 117543 | -| total_timesteps | 2783872 | -| train/ | | -| approx_kl | 0.027711133 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -3.14 | -| learning_rate | 0.0003 | -| loss | 0.00148 | -| n_updates | 217480 | -| policy_gradient_loss | 0.0171 | -| std | 0.00645 | -| value_loss | 6.08e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21750 | -| time_elapsed | 117547 | -| total_timesteps | 2784000 | -| train/ | | -| approx_kl | 0.6948028 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00398 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 217490 | -| policy_gradient_loss | 0.0621 | -| std | 0.00645 | -| value_loss | 2.06e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21751 | -| time_elapsed | 117552 | -| total_timesteps | 2784128 | -| train/ | | -| approx_kl | 0.044313397 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00361 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 217500 | -| policy_gradient_loss | 0.007 | -| std | 0.00646 | -| value_loss | 8.22e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21752 | -| time_elapsed | 117565 | -| total_timesteps | 2784256 | -| train/ | | -| approx_kl | 0.048229806 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.786 | -| learning_rate | 0.0003 | -| loss | 0.00544 | -| n_updates | 217510 | -| policy_gradient_loss | 0.013 | -| std | 0.00647 | -| value_loss | 0.0054 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21753 | -| time_elapsed | 117570 | -| total_timesteps | 2784384 | -| train/ | | -| approx_kl | 0.1579092 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 217520 | -| policy_gradient_loss | 0.0703 | -| std | 0.00648 | -| value_loss | 0.00113 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21754 | -| time_elapsed | 117573 | -| total_timesteps | 2784512 | -| train/ | | -| approx_kl | 0.04320801 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00758 | -| learning_rate | 0.0003 | -| loss | -0.0253 | -| n_updates | 217530 | -| policy_gradient_loss | 0.0108 | -| std | 0.00648 | -| value_loss | 0.000212 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21755 | -| time_elapsed | 117578 | -| total_timesteps | 2784640 | -| train/ | | -| approx_kl | 1.1131974 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | 0.277 | -| n_updates | 217540 | -| policy_gradient_loss | 0.125 | -| std | 0.00648 | -| value_loss | 9.54e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21756 | -| time_elapsed | 117584 | -| total_timesteps | 2784768 | -| train/ | | -| approx_kl | 0.007603941 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 217550 | -| policy_gradient_loss | 0.0185 | -| std | 0.00648 | -| value_loss | 6.48e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21757 | -| time_elapsed | 117590 | -| total_timesteps | 2784896 | -| train/ | | -| approx_kl | 0.0001798151 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.000788 | -| n_updates | 217560 | -| policy_gradient_loss | 0.0262 | -| std | 0.00648 | -| value_loss | 4.27e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21758 | -| time_elapsed | 117595 | -| total_timesteps | 2785024 | -| train/ | | -| approx_kl | 0.18449701 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.0788 | -| n_updates | 217570 | -| policy_gradient_loss | 0.0185 | -| std | 0.00648 | -| value_loss | 3.23e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21759 | -| time_elapsed | 117606 | -| total_timesteps | 2785152 | -| train/ | | -| approx_kl | 0.0799342 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.961 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 217580 | -| policy_gradient_loss | 0.0136 | -| std | 0.00648 | -| value_loss | 0.000474 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21760 | -| time_elapsed | 117610 | -| total_timesteps | 2785280 | -| train/ | | -| approx_kl | 0.03832314 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 217590 | -| policy_gradient_loss | 0.0233 | -| std | 0.00648 | -| value_loss | 3.31e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21761 | -| time_elapsed | 117615 | -| total_timesteps | 2785408 | -| train/ | | -| approx_kl | 0.049809728 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 217600 | -| policy_gradient_loss | 0.0284 | -| std | 0.00648 | -| value_loss | 4.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21762 | -| time_elapsed | 117620 | -| total_timesteps | 2785536 | -| train/ | | -| approx_kl | 0.40115657 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 217610 | -| policy_gradient_loss | 0.0732 | -| std | 0.00648 | -| value_loss | 1.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21763 | -| time_elapsed | 117624 | -| total_timesteps | 2785664 | -| train/ | | -| approx_kl | 0.004698484 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | -0.00814 | -| n_updates | 217620 | -| policy_gradient_loss | 0.0026 | -| std | 0.00648 | -| value_loss | 1.28e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21764 | -| time_elapsed | 117629 | -| total_timesteps | 2785792 | -| train/ | | -| approx_kl | 0.00011684606 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.055 | -| learning_rate | 0.0003 | -| loss | 0.000624 | -| n_updates | 217630 | -| policy_gradient_loss | 0.0107 | -| std | 0.00648 | -| value_loss | 7.92e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21765 | -| time_elapsed | 117635 | -| total_timesteps | 2785920 | -| train/ | | -| approx_kl | 0.0003921548 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0702 | -| learning_rate | 0.0003 | -| loss | -0.000803 | -| n_updates | 217640 | -| policy_gradient_loss | 0.0121 | -| std | 0.00648 | -| value_loss | 5.02e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21766 | -| time_elapsed | 117640 | -| total_timesteps | 2786048 | -| train/ | | -| approx_kl | 0.06734157 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0857 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 217650 | -| policy_gradient_loss | 0.0579 | -| std | 0.00648 | -| value_loss | 4.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21767 | -| time_elapsed | 117648 | -| total_timesteps | 2786176 | -| train/ | | -| approx_kl | 0.048192035 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.034 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 217660 | -| policy_gradient_loss | -0.0128 | -| std | 0.00648 | -| value_loss | 0.00222 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21768 | -| time_elapsed | 117653 | -| total_timesteps | 2786304 | -| train/ | | -| approx_kl | 0.35077193 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.623 | -| learning_rate | 0.0003 | -| loss | 0.0628 | -| n_updates | 217670 | -| policy_gradient_loss | 0.0193 | -| std | 0.00648 | -| value_loss | 3.24e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21769 | -| time_elapsed | 117659 | -| total_timesteps | 2786432 | -| train/ | | -| approx_kl | 0.16745567 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0104 | -| learning_rate | 0.0003 | -| loss | 0.0711 | -| n_updates | 217680 | -| policy_gradient_loss | 0.0124 | -| std | 0.00648 | -| value_loss | 1.54e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21770 | -| time_elapsed | 117664 | -| total_timesteps | 2786560 | -| train/ | | -| approx_kl | 0.007469024 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | 0.00701 | -| n_updates | 217690 | -| policy_gradient_loss | 0.0198 | -| std | 0.00648 | -| value_loss | 6.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21771 | -| time_elapsed | 117668 | -| total_timesteps | 2786688 | -| train/ | | -| approx_kl | 0.015742568 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 217700 | -| policy_gradient_loss | 0.0431 | -| std | 0.00648 | -| value_loss | 3.12e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21772 | -| time_elapsed | 117673 | -| total_timesteps | 2786816 | -| train/ | | -| approx_kl | 0.12004739 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.044 | -| n_updates | 217710 | -| policy_gradient_loss | 0.0241 | -| std | 0.00647 | -| value_loss | 1.54e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 21773 | -| time_elapsed | 117678 | -| total_timesteps | 2786944 | -| train/ | | -| approx_kl | 0.1937865 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | 0.0586 | -| n_updates | 217720 | -| policy_gradient_loss | 0.0204 | -| std | 0.00647 | -| value_loss | 2.42e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21774 | -| time_elapsed | 117683 | -| total_timesteps | 2787072 | -| train/ | | -| approx_kl | 0.026969116 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 217730 | -| policy_gradient_loss | 0.0315 | -| std | 0.00648 | -| value_loss | 1.24e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21775 | -| time_elapsed | 117691 | -| total_timesteps | 2787200 | -| train/ | | -| approx_kl | 0.21274522 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 217740 | -| policy_gradient_loss | 0.125 | -| std | 0.00648 | -| value_loss | 3.98e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21776 | -| time_elapsed | 117695 | -| total_timesteps | 2787328 | -| train/ | | -| approx_kl | 0.18408468 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.856 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 217750 | -| policy_gradient_loss | 0.133 | -| std | 0.00648 | -| value_loss | 1.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21777 | -| time_elapsed | 117700 | -| total_timesteps | 2787456 | -| train/ | | -| approx_kl | 0.02590163 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.00142 | -| n_updates | 217760 | -| policy_gradient_loss | 0.0191 | -| std | 0.00648 | -| value_loss | 3.08e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21778 | -| time_elapsed | 117706 | -| total_timesteps | 2787584 | -| train/ | | -| approx_kl | 0.5542801 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00646 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 217770 | -| policy_gradient_loss | 0.0546 | -| std | 0.00648 | -| value_loss | 1.5e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21779 | -| time_elapsed | 117710 | -| total_timesteps | 2787712 | -| train/ | | -| approx_kl | 0.0538233 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.0265 | -| n_updates | 217780 | -| policy_gradient_loss | 0.0139 | -| std | 0.00648 | -| value_loss | 9.83e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21780 | -| time_elapsed | 117714 | -| total_timesteps | 2787840 | -| train/ | | -| approx_kl | 0.06351856 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 217790 | -| policy_gradient_loss | 0.02 | -| std | 0.00647 | -| value_loss | 5.71e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21781 | -| time_elapsed | 117718 | -| total_timesteps | 2787968 | -| train/ | | -| approx_kl | 0.048895653 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 217800 | -| policy_gradient_loss | 0.00614 | -| std | 0.00647 | -| value_loss | 4.24e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21782 | -| time_elapsed | 117723 | -| total_timesteps | 2788096 | -| train/ | | -| approx_kl | 0.00893637 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 217810 | -| policy_gradient_loss | 0.00499 | -| std | 0.00647 | -| value_loss | 3.24e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21783 | -| time_elapsed | 117734 | -| total_timesteps | 2788224 | -| train/ | | -| approx_kl | 0.0005521318 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | 0.00476 | -| n_updates | 217820 | -| policy_gradient_loss | 0.00242 | -| std | 0.00646 | -| value_loss | 0.0032 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21784 | -| time_elapsed | 117740 | -| total_timesteps | 2788352 | -| train/ | | -| approx_kl | 0.068242 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.264 | -| learning_rate | 0.0003 | -| loss | -0.000549 | -| n_updates | 217830 | -| policy_gradient_loss | -0.00267 | -| std | 0.00646 | -| value_loss | 3.51e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21785 | -| time_elapsed | 117746 | -| total_timesteps | 2788480 | -| train/ | | -| approx_kl | 0.010522164 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.000331 | -| learning_rate | 0.0003 | -| loss | -0.000942 | -| n_updates | 217840 | -| policy_gradient_loss | 0.00751 | -| std | 0.00646 | -| value_loss | 3.61e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21786 | -| time_elapsed | 117749 | -| total_timesteps | 2788608 | -| train/ | | -| approx_kl | 0.060124 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.00317 | -| n_updates | 217850 | -| policy_gradient_loss | -0.00267 | -| std | 0.00646 | -| value_loss | 2.17e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21787 | -| time_elapsed | 117755 | -| total_timesteps | 2788736 | -| train/ | | -| approx_kl | 0.043769725 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 217860 | -| policy_gradient_loss | 0.0126 | -| std | 0.00646 | -| value_loss | 1.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21788 | -| time_elapsed | 117758 | -| total_timesteps | 2788864 | -| train/ | | -| approx_kl | 0.0078081605 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | 0.000528 | -| n_updates | 217870 | -| policy_gradient_loss | 0.00663 | -| std | 0.00646 | -| value_loss | 1.03e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21789 | -| time_elapsed | 117762 | -| total_timesteps | 2788992 | -| train/ | | -| approx_kl | 0.0026250375 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 217880 | -| policy_gradient_loss | 0.00934 | -| std | 0.00646 | -| value_loss | 6.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21790 | -| time_elapsed | 117767 | -| total_timesteps | 2789120 | -| train/ | | -| approx_kl | 0.043098036 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.0887 | -| n_updates | 217890 | -| policy_gradient_loss | 0.0819 | -| std | 0.00646 | -| value_loss | 4.14e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21791 | -| time_elapsed | 117779 | -| total_timesteps | 2789248 | -| train/ | | -| approx_kl | 0.2117879 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.462 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 217900 | -| policy_gradient_loss | 0.028 | -| std | 0.00646 | -| value_loss | 0.0016 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21792 | -| time_elapsed | 117784 | -| total_timesteps | 2789376 | -| train/ | | -| approx_kl | 0.016949086 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -21 | -| learning_rate | 0.0003 | -| loss | 0.00641 | -| n_updates | 217910 | -| policy_gradient_loss | 0.011 | -| std | 0.00647 | -| value_loss | 7.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21793 | -| time_elapsed | 117788 | -| total_timesteps | 2789504 | -| train/ | | -| approx_kl | 0.048701607 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 217920 | -| policy_gradient_loss | 0.034 | -| std | 0.00648 | -| value_loss | 7.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21794 | -| time_elapsed | 117792 | -| total_timesteps | 2789632 | -| train/ | | -| approx_kl | 0.32232958 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.244 | -| n_updates | 217930 | -| policy_gradient_loss | 0.144 | -| std | 0.00648 | -| value_loss | 3.08e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21795 | -| time_elapsed | 117797 | -| total_timesteps | 2789760 | -| train/ | | -| approx_kl | 0.055915277 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 217940 | -| policy_gradient_loss | 0.0284 | -| std | 0.00648 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21796 | -| time_elapsed | 117801 | -| total_timesteps | 2789888 | -| train/ | | -| approx_kl | 0.53618777 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 217950 | -| policy_gradient_loss | 0.0435 | -| std | 0.00648 | -| value_loss | 1.44e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21797 | -| time_elapsed | 117805 | -| total_timesteps | 2790016 | -| train/ | | -| approx_kl | 0.03706572 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.00744 | -| n_updates | 217960 | -| policy_gradient_loss | 0.00575 | -| std | 0.00648 | -| value_loss | 1.1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21798 | -| time_elapsed | 117817 | -| total_timesteps | 2790144 | -| train/ | | -| approx_kl | 0.038982287 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0186 | -| n_updates | 217970 | -| policy_gradient_loss | -0.00991 | -| std | 0.00648 | -| value_loss | 0.000467 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21799 | -| time_elapsed | 117821 | -| total_timesteps | 2790272 | -| train/ | | -| approx_kl | 0.07587997 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0218 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 217980 | -| policy_gradient_loss | 0.00756 | -| std | 0.00649 | -| value_loss | 3.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21800 | -| time_elapsed | 117827 | -| total_timesteps | 2790400 | -| train/ | | -| approx_kl | 0.010590849 | -| clip_fraction | 0.196 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 217990 | -| policy_gradient_loss | 0.00474 | -| std | 0.00648 | -| value_loss | 4.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21801 | -| time_elapsed | 117832 | -| total_timesteps | 2790528 | -| train/ | | -| approx_kl | 0.024125796 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.00931 | -| n_updates | 218000 | -| policy_gradient_loss | 0.0182 | -| std | 0.00649 | -| value_loss | 3.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21802 | -| time_elapsed | 117836 | -| total_timesteps | 2790656 | -| train/ | | -| approx_kl | 0.046601746 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.00409 | -| n_updates | 218010 | -| policy_gradient_loss | 0.0299 | -| std | 0.0065 | -| value_loss | 1.07e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21803 | -| time_elapsed | 117840 | -| total_timesteps | 2790784 | -| train/ | | -| approx_kl | 0.1162362 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0907 | -| n_updates | 218020 | -| policy_gradient_loss | 0.0505 | -| std | 0.00651 | -| value_loss | 2.13e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 21804 | -| time_elapsed | 117845 | -| total_timesteps | 2790912 | -| train/ | | -| approx_kl | 0.00016317703 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.000562 | -| n_updates | 218030 | -| policy_gradient_loss | 0.0148 | -| std | 0.00651 | -| value_loss | 1.32e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21805 | -| time_elapsed | 117850 | -| total_timesteps | 2791040 | -| train/ | | -| approx_kl | 0.040961295 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 218040 | -| policy_gradient_loss | 0.0339 | -| std | 0.00651 | -| value_loss | 8.93e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21806 | -| time_elapsed | 117859 | -| total_timesteps | 2791168 | -| train/ | | -| approx_kl | 0.13640216 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | 0.0784 | -| n_updates | 218050 | -| policy_gradient_loss | 0.047 | -| std | 0.00651 | -| value_loss | 4e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21807 | -| time_elapsed | 117864 | -| total_timesteps | 2791296 | -| train/ | | -| approx_kl | 0.037940912 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 218060 | -| policy_gradient_loss | 0.0399 | -| std | 0.00651 | -| value_loss | 2.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21808 | -| time_elapsed | 117869 | -| total_timesteps | 2791424 | -| train/ | | -| approx_kl | 0.69996995 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00354 | -| learning_rate | 0.0003 | -| loss | 0.286 | -| n_updates | 218070 | -| policy_gradient_loss | 0.146 | -| std | 0.00651 | -| value_loss | 8.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21809 | -| time_elapsed | 117872 | -| total_timesteps | 2791552 | -| train/ | | -| approx_kl | 0.009316046 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | 0.00048 | -| n_updates | 218080 | -| policy_gradient_loss | 0.0404 | -| std | 0.00651 | -| value_loss | 5.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21810 | -| time_elapsed | 117875 | -| total_timesteps | 2791680 | -| train/ | | -| approx_kl | 0.099006414 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0651 | -| n_updates | 218090 | -| policy_gradient_loss | 0.0332 | -| std | 0.0065 | -| value_loss | 6.24e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21811 | -| time_elapsed | 117879 | -| total_timesteps | 2791808 | -| train/ | | -| approx_kl | 2.03792e-05 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.000299 | -| n_updates | 218100 | -| policy_gradient_loss | 0.0424 | -| std | 0.0065 | -| value_loss | 2.89e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21812 | -| time_elapsed | 117883 | -| total_timesteps | 2791936 | -| train/ | | -| approx_kl | 0.71645296 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 218110 | -| policy_gradient_loss | 0.0731 | -| std | 0.00649 | -| value_loss | 1.83e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21813 | -| time_elapsed | 117888 | -| total_timesteps | 2792064 | -| train/ | | -| approx_kl | 0.044321742 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 218120 | -| policy_gradient_loss | 0.00693 | -| std | 0.00649 | -| value_loss | 1.37e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21814 | -| time_elapsed | 117897 | -| total_timesteps | 2792192 | -| train/ | | -| approx_kl | 0.073592044 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.504 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 218130 | -| policy_gradient_loss | -0.00869 | -| std | 0.00649 | -| value_loss | 0.00148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21815 | -| time_elapsed | 117901 | -| total_timesteps | 2792320 | -| train/ | | -| approx_kl | 0.017810494 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -2.48 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 218140 | -| policy_gradient_loss | 0.011 | -| std | 0.00649 | -| value_loss | 4.86e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21816 | -| time_elapsed | 117905 | -| total_timesteps | 2792448 | -| train/ | | -| approx_kl | 0.03446005 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -4.85 | -| learning_rate | 0.0003 | -| loss | -0.00213 | -| n_updates | 218150 | -| policy_gradient_loss | 0.0163 | -| std | 0.00649 | -| value_loss | 4.8e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21817 | -| time_elapsed | 117909 | -| total_timesteps | 2792576 | -| train/ | | -| approx_kl | 0.1694852 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 218160 | -| policy_gradient_loss | 0.0581 | -| std | 0.00649 | -| value_loss | 1.06e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21818 | -| time_elapsed | 117914 | -| total_timesteps | 2792704 | -| train/ | | -| approx_kl | 0.34207144 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.182 | -| n_updates | 218170 | -| policy_gradient_loss | 0.0916 | -| std | 0.00647 | -| value_loss | 2.54e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21819 | -| time_elapsed | 117918 | -| total_timesteps | 2792832 | -| train/ | | -| approx_kl | 0.068729855 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -4.95 | -| learning_rate | 0.0003 | -| loss | 0.006 | -| n_updates | 218180 | -| policy_gradient_loss | 0.0223 | -| std | 0.00646 | -| value_loss | 4.97e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21820 | -| time_elapsed | 117922 | -| total_timesteps | 2792960 | -| train/ | | -| approx_kl | 1.162208 | -| clip_fraction | 0.759 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.257 | -| n_updates | 218190 | -| policy_gradient_loss | 0.181 | -| std | 0.00647 | -| value_loss | 2.65e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21821 | -| time_elapsed | 117926 | -| total_timesteps | 2793088 | -| train/ | | -| approx_kl | 0.044810347 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -9.88 | -| learning_rate | 0.0003 | -| loss | -0.000147 | -| n_updates | 218200 | -| policy_gradient_loss | -0.00392 | -| std | 0.00647 | -| value_loss | 3.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21822 | -| time_elapsed | 117935 | -| total_timesteps | 2793216 | -| train/ | | -| approx_kl | 0.020461693 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.578 | -| learning_rate | 0.0003 | -| loss | -0.00101 | -| n_updates | 218210 | -| policy_gradient_loss | -0.00521 | -| std | 0.00646 | -| value_loss | 0.0117 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21823 | -| time_elapsed | 117939 | -| total_timesteps | 2793344 | -| train/ | | -| approx_kl | 0.026547994 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 218220 | -| policy_gradient_loss | 0.0292 | -| std | 0.00646 | -| value_loss | 0.000532 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21824 | -| time_elapsed | 117944 | -| total_timesteps | 2793472 | -| train/ | | -| approx_kl | 0.40422475 | -| clip_fraction | 0.728 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00524 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 218230 | -| policy_gradient_loss | 0.2 | -| std | 0.00646 | -| value_loss | 0.000112 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21825 | -| time_elapsed | 117949 | -| total_timesteps | 2793600 | -| train/ | | -| approx_kl | 0.049128767 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00575 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 218240 | -| policy_gradient_loss | 0.0191 | -| std | 0.00646 | -| value_loss | 7.61e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21826 | -| time_elapsed | 117955 | -| total_timesteps | 2793728 | -| train/ | | -| approx_kl | 0.57717705 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 218250 | -| policy_gradient_loss | 0.0547 | -| std | 0.00646 | -| value_loss | 4.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21827 | -| time_elapsed | 117960 | -| total_timesteps | 2793856 | -| train/ | | -| approx_kl | 0.010937221 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.00159 | -| n_updates | 218260 | -| policy_gradient_loss | 0.00652 | -| std | 0.00646 | -| value_loss | 2.33e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 21828 | -| time_elapsed | 117965 | -| total_timesteps | 2793984 | -| train/ | | -| approx_kl | 0.00062305434 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 218270 | -| policy_gradient_loss | -0.00101 | -| std | 0.00646 | -| value_loss | 1.9e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21829 | -| time_elapsed | 117969 | -| total_timesteps | 2794112 | -| train/ | | -| approx_kl | 0.061743222 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 218280 | -| policy_gradient_loss | 0.0174 | -| std | 0.00646 | -| value_loss | 8.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21830 | -| time_elapsed | 117981 | -| total_timesteps | 2794240 | -| train/ | | -| approx_kl | 0.020784158 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 218290 | -| policy_gradient_loss | -0.00828 | -| std | 0.00646 | -| value_loss | 0.00482 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21831 | -| time_elapsed | 117986 | -| total_timesteps | 2794368 | -| train/ | | -| approx_kl | 0.08533393 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0425 | -| n_updates | 218300 | -| policy_gradient_loss | 0.015 | -| std | 0.00646 | -| value_loss | 4.05e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21832 | -| time_elapsed | 117991 | -| total_timesteps | 2794496 | -| train/ | | -| approx_kl | 0.014219394 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00251 | -| learning_rate | 0.0003 | -| loss | 0.00178 | -| n_updates | 218310 | -| policy_gradient_loss | 0.00747 | -| std | 0.00646 | -| value_loss | 6.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21833 | -| time_elapsed | 117996 | -| total_timesteps | 2794624 | -| train/ | | -| approx_kl | 0.060348436 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0798 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 218320 | -| policy_gradient_loss | 0.0129 | -| std | 0.00646 | -| value_loss | 4.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21834 | -| time_elapsed | 118001 | -| total_timesteps | 2794752 | -| train/ | | -| approx_kl | 0.055252142 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0588 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 218330 | -| policy_gradient_loss | 0.0143 | -| std | 0.00646 | -| value_loss | 3.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21835 | -| time_elapsed | 118004 | -| total_timesteps | 2794880 | -| train/ | | -| approx_kl | 0.038114697 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 218340 | -| policy_gradient_loss | 0.00555 | -| std | 0.00646 | -| value_loss | 2.12e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21836 | -| time_elapsed | 118008 | -| total_timesteps | 2795008 | -| train/ | | -| approx_kl | 0.05543325 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0621 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 218350 | -| policy_gradient_loss | 0.0081 | -| std | 0.00646 | -| value_loss | 1.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21837 | -| time_elapsed | 118018 | -| total_timesteps | 2795136 | -| train/ | | -| approx_kl | 0.011750102 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.251 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 218360 | -| policy_gradient_loss | -0.0103 | -| std | 0.00646 | -| value_loss | 0.00177 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21838 | -| time_elapsed | 118023 | -| total_timesteps | 2795264 | -| train/ | | -| approx_kl | 0.0054163793 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0602 | -| learning_rate | 0.0003 | -| loss | 0.00379 | -| n_updates | 218370 | -| policy_gradient_loss | 0.00763 | -| std | 0.00645 | -| value_loss | 0.00298 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21839 | -| time_elapsed | 118027 | -| total_timesteps | 2795392 | -| train/ | | -| approx_kl | 0.064275526 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 218380 | -| policy_gradient_loss | -0.00137 | -| std | 0.00645 | -| value_loss | 0.000216 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21840 | -| time_elapsed | 118032 | -| total_timesteps | 2795520 | -| train/ | | -| approx_kl | 0.09215488 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0704 | -| n_updates | 218390 | -| policy_gradient_loss | 0.0319 | -| std | 0.00642 | -| value_loss | 0.00304 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21841 | -| time_elapsed | 118036 | -| total_timesteps | 2795648 | -| train/ | | -| approx_kl | 0.47679454 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -3.01 | -| learning_rate | 0.0003 | -| loss | 0.205 | -| n_updates | 218400 | -| policy_gradient_loss | 0.0579 | -| std | 0.0064 | -| value_loss | 2.14e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21842 | -| time_elapsed | 118040 | -| total_timesteps | 2795776 | -| train/ | | -| approx_kl | 0.0039761937 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.000314 | -| learning_rate | 0.0003 | -| loss | -0.000719 | -| n_updates | 218410 | -| policy_gradient_loss | 0.0182 | -| std | 0.0064 | -| value_loss | 7.42e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 21843 | -| time_elapsed | 118044 | -| total_timesteps | 2795904 | -| train/ | | -| approx_kl | 0.00705524 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0914 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 218420 | -| policy_gradient_loss | 0.00428 | -| std | 0.0064 | -| value_loss | 1.07e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21844 | -| time_elapsed | 118048 | -| total_timesteps | 2796032 | -| train/ | | -| approx_kl | 0.0054380298 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 218430 | -| policy_gradient_loss | 0.0763 | -| std | 0.0064 | -| value_loss | 3.7e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21845 | -| time_elapsed | 118057 | -| total_timesteps | 2796160 | -| train/ | | -| approx_kl | 0.06223358 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.473 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 218440 | -| policy_gradient_loss | 0.00911 | -| std | 0.0064 | -| value_loss | 0.00136 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21846 | -| time_elapsed | 118063 | -| total_timesteps | 2796288 | -| train/ | | -| approx_kl | 0.22090116 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | 0.0729 | -| n_updates | 218450 | -| policy_gradient_loss | 0.0441 | -| std | 0.0064 | -| value_loss | 2.51e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21847 | -| time_elapsed | 118068 | -| total_timesteps | 2796416 | -| train/ | | -| approx_kl | 0.0026158332 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00128 | -| n_updates | 218460 | -| policy_gradient_loss | 0.00782 | -| std | 0.0064 | -| value_loss | 1.32e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21848 | -| time_elapsed | 118073 | -| total_timesteps | 2796544 | -| train/ | | -| approx_kl | 9.011943e-06 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0997 | -| learning_rate | 0.0003 | -| loss | 0.000117 | -| n_updates | 218470 | -| policy_gradient_loss | 0.00913 | -| std | 0.00641 | -| value_loss | 1.07e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21849 | -| time_elapsed | 118079 | -| total_timesteps | 2796672 | -| train/ | | -| approx_kl | 0.08383361 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.0554 | -| n_updates | 218480 | -| policy_gradient_loss | 0.0881 | -| std | 0.00641 | -| value_loss | 7.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21850 | -| time_elapsed | 118084 | -| total_timesteps | 2796800 | -| train/ | | -| approx_kl | 0.26273334 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 218490 | -| policy_gradient_loss | 0.0346 | -| std | 0.00641 | -| value_loss | 6.46e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 21851 | -| time_elapsed | 118089 | -| total_timesteps | 2796928 | -| train/ | | -| approx_kl | 0.0011866898 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | -0.00115 | -| n_updates | 218500 | -| policy_gradient_loss | 0.0169 | -| std | 0.00641 | -| value_loss | 3.51e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21852 | -| time_elapsed | 118093 | -| total_timesteps | 2797056 | -| train/ | | -| approx_kl | 8.887146e-06 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | -0.000459 | -| n_updates | 218510 | -| policy_gradient_loss | 0.00325 | -| std | 0.00641 | -| value_loss | 2.94e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21853 | -| time_elapsed | 118101 | -| total_timesteps | 2797184 | -| train/ | | -| approx_kl | 0.007918481 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | -0.00609 | -| n_updates | 218520 | -| policy_gradient_loss | -0.00522 | -| std | 0.00641 | -| value_loss | 0.00421 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21854 | -| time_elapsed | 118106 | -| total_timesteps | 2797312 | -| train/ | | -| approx_kl | 0.0058416105 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.02 | -| learning_rate | 0.0003 | -| loss | -0.00841 | -| n_updates | 218530 | -| policy_gradient_loss | 0.00307 | -| std | 0.00641 | -| value_loss | 1.82e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21855 | -| time_elapsed | 118111 | -| total_timesteps | 2797440 | -| train/ | | -| approx_kl | 7.235631e-05 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | 0.000638 | -| n_updates | 218540 | -| policy_gradient_loss | 0.00944 | -| std | 0.00641 | -| value_loss | 6.34e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21856 | -| time_elapsed | 118115 | -| total_timesteps | 2797568 | -| train/ | | -| approx_kl | 0.079555675 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 218550 | -| policy_gradient_loss | 0.0711 | -| std | 0.00641 | -| value_loss | 5.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21857 | -| time_elapsed | 118120 | -| total_timesteps | 2797696 | -| train/ | | -| approx_kl | 0.10196283 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.0717 | -| n_updates | 218560 | -| policy_gradient_loss | 0.0317 | -| std | 0.0064 | -| value_loss | 1.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21858 | -| time_elapsed | 118125 | -| total_timesteps | 2797824 | -| train/ | | -| approx_kl | 0.10885972 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.414 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 218570 | -| policy_gradient_loss | 0.0183 | -| std | 0.0064 | -| value_loss | 1.36e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21859 | -| time_elapsed | 118130 | -| total_timesteps | 2797952 | -| train/ | | -| approx_kl | 0.004111062 | -| clip_fraction | 0.0492 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 218580 | -| policy_gradient_loss | -0.000171 | -| std | 0.0064 | -| value_loss | 5.64e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21860 | -| time_elapsed | 118135 | -| total_timesteps | 2798080 | -| train/ | | -| approx_kl | 0.039144944 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0913 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 218590 | -| policy_gradient_loss | 0.0391 | -| std | 0.00641 | -| value_loss | 5.67e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21861 | -| time_elapsed | 118145 | -| total_timesteps | 2798208 | -| train/ | | -| approx_kl | 0.020390937 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 218600 | -| policy_gradient_loss | -0.0054 | -| std | 0.00641 | -| value_loss | 0.00179 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21862 | -| time_elapsed | 118151 | -| total_timesteps | 2798336 | -| train/ | | -| approx_kl | 0.013804473 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 218610 | -| policy_gradient_loss | -0.00743 | -| std | 0.00641 | -| value_loss | 2.89e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21863 | -| time_elapsed | 118156 | -| total_timesteps | 2798464 | -| train/ | | -| approx_kl | 0.19226679 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00714 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 218620 | -| policy_gradient_loss | 0.0136 | -| std | 0.00641 | -| value_loss | 3.04e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21864 | -| time_elapsed | 118160 | -| total_timesteps | 2798592 | -| train/ | | -| approx_kl | 0.1021353 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 218630 | -| policy_gradient_loss | 0.0485 | -| std | 0.00641 | -| value_loss | 1.89e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21865 | -| time_elapsed | 118164 | -| total_timesteps | 2798720 | -| train/ | | -| approx_kl | 0.0031034946 | -| clip_fraction | 0.0797 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0857 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 218640 | -| policy_gradient_loss | 0.000374 | -| std | 0.00641 | -| value_loss | 1.32e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21866 | -| time_elapsed | 118168 | -| total_timesteps | 2798848 | -| train/ | | -| approx_kl | 0.08579158 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0918 | -| learning_rate | 0.0003 | -| loss | 0.047 | -| n_updates | 218650 | -| policy_gradient_loss | 0.00933 | -| std | 0.00642 | -| value_loss | 1.63e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21867 | -| time_elapsed | 118173 | -| total_timesteps | 2798976 | -| train/ | | -| approx_kl | 0.041706953 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 218660 | -| policy_gradient_loss | 0.03 | -| std | 0.00642 | -| value_loss | 1.2e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21868 | -| time_elapsed | 118179 | -| total_timesteps | 2799104 | -| train/ | | -| approx_kl | 0.14961194 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00562 | -| learning_rate | 0.0003 | -| loss | 0.0977 | -| n_updates | 218670 | -| policy_gradient_loss | 0.0431 | -| std | 0.00642 | -| value_loss | 8.62e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21869 | -| time_elapsed | 118188 | -| total_timesteps | 2799232 | -| train/ | | -| approx_kl | 0.05426807 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.0082 | -| n_updates | 218680 | -| policy_gradient_loss | -0.0045 | -| std | 0.00643 | -| value_loss | 0.000437 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21870 | -| time_elapsed | 118193 | -| total_timesteps | 2799360 | -| train/ | | -| approx_kl | 0.018855356 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.539 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 218690 | -| policy_gradient_loss | 0.00826 | -| std | 0.00643 | -| value_loss | 2.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21871 | -| time_elapsed | 118198 | -| total_timesteps | 2799488 | -| train/ | | -| approx_kl | 0.03594919 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 218700 | -| policy_gradient_loss | 0.0472 | -| std | 0.00643 | -| value_loss | 2.19e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21872 | -| time_elapsed | 118204 | -| total_timesteps | 2799616 | -| train/ | | -| approx_kl | 0.1785199 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 218710 | -| policy_gradient_loss | 0.0495 | -| std | 0.00643 | -| value_loss | 1.21e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21873 | -| time_elapsed | 118207 | -| total_timesteps | 2799744 | -| train/ | | -| approx_kl | 0.004211166 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 218720 | -| policy_gradient_loss | 0.00178 | -| std | 0.00643 | -| value_loss | 1.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21874 | -| time_elapsed | 118211 | -| total_timesteps | 2799872 | -| train/ | | -| approx_kl | 0.07096066 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 218730 | -| policy_gradient_loss | 0.0577 | -| std | 0.00643 | -| value_loss | 9.69e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21875 | -| time_elapsed | 118216 | -| total_timesteps | 2800000 | -| train/ | | -| approx_kl | 0.2658548 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 218740 | -| policy_gradient_loss | 0.0337 | -| std | 0.00643 | -| value_loss | 8.42e-09 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21876 | -| time_elapsed | 118221 | -| total_timesteps | 2800128 | -| train/ | | -| approx_kl | 0.0016709715 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00301 | -| learning_rate | 0.0003 | -| loss | -0.00677 | -| n_updates | 218750 | -| policy_gradient_loss | 0.00227 | -| std | 0.00643 | -| value_loss | 4.25e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21877 | -| time_elapsed | 118228 | -| total_timesteps | 2800256 | -| train/ | | -| approx_kl | 0.0007186108 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 218760 | -| policy_gradient_loss | 0.000387 | -| std | 0.00642 | -| value_loss | 0.000224 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21878 | -| time_elapsed | 118234 | -| total_timesteps | 2800384 | -| train/ | | -| approx_kl | 0.00017510541 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.252 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 218770 | -| policy_gradient_loss | 0.0154 | -| std | 0.00643 | -| value_loss | 6.99e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21879 | -| time_elapsed | 118239 | -| total_timesteps | 2800512 | -| train/ | | -| approx_kl | 5.254522e-06 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.084 | -| learning_rate | 0.0003 | -| loss | -0.000164 | -| n_updates | 218780 | -| policy_gradient_loss | 0.0113 | -| std | 0.00642 | -| value_loss | 1.52e-05 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21880 | -| time_elapsed | 118244 | -| total_timesteps | 2800640 | -| train/ | | -| approx_kl | 0.064108 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 218790 | -| policy_gradient_loss | 0.0551 | -| std | 0.00641 | -| value_loss | 0.000177 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21881 | -| time_elapsed | 118249 | -| total_timesteps | 2800768 | -| train/ | | -| approx_kl | 0.046654895 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 218800 | -| policy_gradient_loss | 0.0232 | -| std | 0.0064 | -| value_loss | 6.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21882 | -| time_elapsed | 118253 | -| total_timesteps | 2800896 | -| train/ | | -| approx_kl | 0.000724704 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 218810 | -| policy_gradient_loss | 0.106 | -| std | 0.0064 | -| value_loss | 4.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21883 | -| time_elapsed | 118256 | -| total_timesteps | 2801024 | -| train/ | | -| approx_kl | 0.025489476 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | 0.032 | -| n_updates | 218820 | -| policy_gradient_loss | 0.0432 | -| std | 0.0064 | -| value_loss | 1.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21884 | -| time_elapsed | 118265 | -| total_timesteps | 2801152 | -| train/ | | -| approx_kl | 0.36128974 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 218830 | -| policy_gradient_loss | 0.11 | -| std | 0.0064 | -| value_loss | 6.31e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21885 | -| time_elapsed | 118270 | -| total_timesteps | 2801280 | -| train/ | | -| approx_kl | 0.2091388 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.0809 | -| n_updates | 218840 | -| policy_gradient_loss | 0.0957 | -| std | 0.0064 | -| value_loss | 5.91e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21886 | -| time_elapsed | 118274 | -| total_timesteps | 2801408 | -| train/ | | -| approx_kl | 0.13647284 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.412 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 218850 | -| policy_gradient_loss | 0.118 | -| std | 0.0064 | -| value_loss | 5.34e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21887 | -| time_elapsed | 118279 | -| total_timesteps | 2801536 | -| train/ | | -| approx_kl | 0.1725815 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 218860 | -| policy_gradient_loss | 0.158 | -| std | 0.0064 | -| value_loss | 2.2e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21888 | -| time_elapsed | 118284 | -| total_timesteps | 2801664 | -| train/ | | -| approx_kl | 0.12556414 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0066 | -| learning_rate | 0.0003 | -| loss | 0.096 | -| n_updates | 218870 | -| policy_gradient_loss | 0.118 | -| std | 0.0064 | -| value_loss | 1.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21889 | -| time_elapsed | 118289 | -| total_timesteps | 2801792 | -| train/ | | -| approx_kl | 0.024917683 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | 0.00987 | -| n_updates | 218880 | -| policy_gradient_loss | 0.0242 | -| std | 0.0064 | -| value_loss | 9.03e-09 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 21890 | -| time_elapsed | 118293 | -| total_timesteps | 2801920 | -| train/ | | -| approx_kl | 0.00042603305 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.000313 | -| n_updates | 218890 | -| policy_gradient_loss | 0.0374 | -| std | 0.0064 | -| value_loss | 4.57e-09 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21891 | -| time_elapsed | 118297 | -| total_timesteps | 2802048 | -| train/ | | -| approx_kl | 0.0010616607 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 218900 | -| policy_gradient_loss | 0.0347 | -| std | 0.0064 | -| value_loss | 4.68e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21892 | -| time_elapsed | 118307 | -| total_timesteps | 2802176 | -| train/ | | -| approx_kl | 0.106679946 | -| clip_fraction | 0.6 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.828 | -| learning_rate | 0.0003 | -| loss | 0.0712 | -| n_updates | 218910 | -| policy_gradient_loss | 0.0376 | -| std | 0.0064 | -| value_loss | 0.00393 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21893 | -| time_elapsed | 118313 | -| total_timesteps | 2802304 | -| train/ | | -| approx_kl | 0.042146932 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 218920 | -| policy_gradient_loss | 0.101 | -| std | 0.0064 | -| value_loss | 2.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21894 | -| time_elapsed | 118317 | -| total_timesteps | 2802432 | -| train/ | | -| approx_kl | 0.012257058 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00217 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 218930 | -| policy_gradient_loss | 0.0265 | -| std | 0.0064 | -| value_loss | 5.66e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21895 | -| time_elapsed | 118322 | -| total_timesteps | 2802560 | -| train/ | | -| approx_kl | 0.21281299 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 218940 | -| policy_gradient_loss | 0.0284 | -| std | 0.00641 | -| value_loss | 2.1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21896 | -| time_elapsed | 118327 | -| total_timesteps | 2802688 | -| train/ | | -| approx_kl | 0.017141143 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | 0.0004 | -| n_updates | 218950 | -| policy_gradient_loss | -0.000746 | -| std | 0.00641 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21897 | -| time_elapsed | 118333 | -| total_timesteps | 2802816 | -| train/ | | -| approx_kl | 0.018210348 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | 0.00166 | -| n_updates | 218960 | -| policy_gradient_loss | 0.000334 | -| std | 0.0064 | -| value_loss | 9.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21898 | -| time_elapsed | 118337 | -| total_timesteps | 2802944 | -| train/ | | -| approx_kl | 0.031511366 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 218970 | -| policy_gradient_loss | 0.0228 | -| std | 0.0064 | -| value_loss | 8.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21899 | -| time_elapsed | 118342 | -| total_timesteps | 2803072 | -| train/ | | -| approx_kl | 0.33037812 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 218980 | -| policy_gradient_loss | 0.14 | -| std | 0.00641 | -| value_loss | 6.88e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21900 | -| time_elapsed | 118351 | -| total_timesteps | 2803200 | -| train/ | | -| approx_kl | 0.0038440358 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.803 | -| learning_rate | 0.0003 | -| loss | -0.00821 | -| n_updates | 218990 | -| policy_gradient_loss | 0.000641 | -| std | 0.0064 | -| value_loss | 0.00507 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21901 | -| time_elapsed | 118356 | -| total_timesteps | 2803328 | -| train/ | | -| approx_kl | 0.54594624 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0734 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 219000 | -| policy_gradient_loss | 0.064 | -| std | 0.0064 | -| value_loss | 2.85e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21902 | -| time_elapsed | 118361 | -| total_timesteps | 2803456 | -| train/ | | -| approx_kl | 0.10239714 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 219010 | -| policy_gradient_loss | 0.0718 | -| std | 0.00642 | -| value_loss | 4.08e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21903 | -| time_elapsed | 118366 | -| total_timesteps | 2803584 | -| train/ | | -| approx_kl | 7.920433e-05 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | -0.000922 | -| n_updates | 219020 | -| policy_gradient_loss | 0.00833 | -| std | 0.00643 | -| value_loss | 2.22e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21904 | -| time_elapsed | 118372 | -| total_timesteps | 2803712 | -| train/ | | -| approx_kl | 0.26489413 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 219030 | -| policy_gradient_loss | 0.044 | -| std | 0.00643 | -| value_loss | 1.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21905 | -| time_elapsed | 118378 | -| total_timesteps | 2803840 | -| train/ | | -| approx_kl | 0.19078255 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0709 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 219040 | -| policy_gradient_loss | 0.0182 | -| std | 0.00643 | -| value_loss | 8.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 21906 | -| time_elapsed | 118384 | -| total_timesteps | 2803968 | -| train/ | | -| approx_kl | 0.030771103 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 219050 | -| policy_gradient_loss | 0.045 | -| std | 0.00643 | -| value_loss | 5.59e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21907 | -| time_elapsed | 118389 | -| total_timesteps | 2804096 | -| train/ | | -| approx_kl | 0.1226629 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.0665 | -| n_updates | 219060 | -| policy_gradient_loss | 0.0338 | -| std | 0.00643 | -| value_loss | 5.14e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21908 | -| time_elapsed | 118399 | -| total_timesteps | 2804224 | -| train/ | | -| approx_kl | 0.015203055 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -5.97 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 219070 | -| policy_gradient_loss | -0.00109 | -| std | 0.00643 | -| value_loss | 0.00437 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21909 | -| time_elapsed | 118403 | -| total_timesteps | 2804352 | -| train/ | | -| approx_kl | 0.6074411 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -98.5 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 219080 | -| policy_gradient_loss | 0.0256 | -| std | 0.00643 | -| value_loss | 3.83e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21910 | -| time_elapsed | 118406 | -| total_timesteps | 2804480 | -| train/ | | -| approx_kl | 0.0112130195 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | 0.00423 | -| n_updates | 219090 | -| policy_gradient_loss | 0.0117 | -| std | 0.00643 | -| value_loss | 9.53e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21911 | -| time_elapsed | 118411 | -| total_timesteps | 2804608 | -| train/ | | -| approx_kl | 0.0007816097 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.39 | -| learning_rate | 0.0003 | -| loss | 0.00209 | -| n_updates | 219100 | -| policy_gradient_loss | 0.0048 | -| std | 0.00643 | -| value_loss | 3.07e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21912 | -| time_elapsed | 118417 | -| total_timesteps | 2804736 | -| train/ | | -| approx_kl | 0.06601087 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 219110 | -| policy_gradient_loss | 0.0143 | -| std | 0.00643 | -| value_loss | 2.04e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21913 | -| time_elapsed | 118421 | -| total_timesteps | 2804864 | -| train/ | | -| approx_kl | 0.04191206 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.00278 | -| n_updates | 219120 | -| policy_gradient_loss | 0.00176 | -| std | 0.00643 | -| value_loss | 3.78e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 21914 | -| time_elapsed | 118426 | -| total_timesteps | 2804992 | -| train/ | | -| approx_kl | 0.05198349 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00247 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 219130 | -| policy_gradient_loss | 0.012 | -| std | 0.00645 | -| value_loss | 1.11e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21915 | -| time_elapsed | 118431 | -| total_timesteps | 2805120 | -| train/ | | -| approx_kl | 0.0075540347 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0665 | -| learning_rate | 0.0003 | -| loss | -0.00543 | -| n_updates | 219140 | -| policy_gradient_loss | 0.00497 | -| std | 0.00645 | -| value_loss | 3.61e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21916 | -| time_elapsed | 118445 | -| total_timesteps | 2805248 | -| train/ | | -| approx_kl | 0.046439238 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0771 | -| learning_rate | 0.0003 | -| loss | -0.00708 | -| n_updates | 219150 | -| policy_gradient_loss | -0.00857 | -| std | 0.00646 | -| value_loss | 0.00205 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21917 | -| time_elapsed | 118449 | -| total_timesteps | 2805376 | -| train/ | | -| approx_kl | 3.16184e-07 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0001 | -| n_updates | 219160 | -| policy_gradient_loss | 0.000753 | -| std | 0.00646 | -| value_loss | 5.46e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21918 | -| time_elapsed | 118453 | -| total_timesteps | 2805504 | -| train/ | | -| approx_kl | 0.06470478 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00275 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 219170 | -| policy_gradient_loss | 0.0118 | -| std | 0.00646 | -| value_loss | 3.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21919 | -| time_elapsed | 118457 | -| total_timesteps | 2805632 | -| train/ | | -| approx_kl | 0.042553894 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | 0.00621 | -| n_updates | 219180 | -| policy_gradient_loss | 0.00294 | -| std | 0.00647 | -| value_loss | 3.26e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21920 | -| time_elapsed | 118461 | -| total_timesteps | 2805760 | -| train/ | | -| approx_kl | 0.008800892 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 5.42e-05 | -| n_updates | 219190 | -| policy_gradient_loss | 0.00517 | -| std | 0.00647 | -| value_loss | 1.41e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 21921 | -| time_elapsed | 118467 | -| total_timesteps | 2805888 | -| train/ | | -| approx_kl | 0.0022271373 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0877 | -| learning_rate | 0.0003 | -| loss | -0.000943 | -| n_updates | 219200 | -| policy_gradient_loss | 0.0102 | -| std | 0.00648 | -| value_loss | 8.44e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21922 | -| time_elapsed | 118472 | -| total_timesteps | 2806016 | -| train/ | | -| approx_kl | 0.040292095 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | 0.0517 | -| n_updates | 219210 | -| policy_gradient_loss | 0.084 | -| std | 0.00648 | -| value_loss | 9.96e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21923 | -| time_elapsed | 118485 | -| total_timesteps | 2806144 | -| train/ | | -| approx_kl | 0.11248699 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.894 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 219220 | -| policy_gradient_loss | 0.0679 | -| std | 0.00648 | -| value_loss | 0.00183 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21924 | -| time_elapsed | 118491 | -| total_timesteps | 2806272 | -| train/ | | -| approx_kl | 0.024570897 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0814 | -| learning_rate | 0.0003 | -| loss | 0.00515 | -| n_updates | 219230 | -| policy_gradient_loss | 0.0222 | -| std | 0.00647 | -| value_loss | 2.6e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21925 | -| time_elapsed | 118495 | -| total_timesteps | 2806400 | -| train/ | | -| approx_kl | 0.72623736 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.26 | -| n_updates | 219240 | -| policy_gradient_loss | 0.0767 | -| std | 0.00647 | -| value_loss | 4.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21926 | -| time_elapsed | 118499 | -| total_timesteps | 2806528 | -| train/ | | -| approx_kl | 0.010343924 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00312 | -| learning_rate | 0.0003 | -| loss | 0.00417 | -| n_updates | 219250 | -| policy_gradient_loss | 0.00927 | -| std | 0.00646 | -| value_loss | 2.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21927 | -| time_elapsed | 118504 | -| total_timesteps | 2806656 | -| train/ | | -| approx_kl | 0.073610604 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -6.46 | -| learning_rate | 0.0003 | -| loss | 0.00203 | -| n_updates | 219260 | -| policy_gradient_loss | -0.000323 | -| std | 0.00646 | -| value_loss | 1.76e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21928 | -| time_elapsed | 118511 | -| total_timesteps | 2806784 | -| train/ | | -| approx_kl | 0.010044157 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | 0.000527 | -| n_updates | 219270 | -| policy_gradient_loss | 0.00543 | -| std | 0.00645 | -| value_loss | 2.78e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 21929 | -| time_elapsed | 118516 | -| total_timesteps | 2806912 | -| train/ | | -| approx_kl | 0.0006954456 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0561 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 219280 | -| policy_gradient_loss | 0.00646 | -| std | 0.00645 | -| value_loss | 1.94e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21930 | -| time_elapsed | 118520 | -| total_timesteps | 2807040 | -| train/ | | -| approx_kl | 0.055787303 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0871 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 219290 | -| policy_gradient_loss | 0.00464 | -| std | 0.00645 | -| value_loss | 8.94e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21931 | -| time_elapsed | 118530 | -| total_timesteps | 2807168 | -| train/ | | -| approx_kl | 0.01689898 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 219300 | -| policy_gradient_loss | -0.00454 | -| std | 0.00645 | -| value_loss | 0.00214 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21932 | -| time_elapsed | 118535 | -| total_timesteps | 2807296 | -| train/ | | -| approx_kl | 0.07316789 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.285 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 219310 | -| policy_gradient_loss | 0.0161 | -| std | 0.00644 | -| value_loss | 2.35e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21933 | -| time_elapsed | 118539 | -| total_timesteps | 2807424 | -| train/ | | -| approx_kl | 0.011194484 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0694 | -| learning_rate | 0.0003 | -| loss | -0.00386 | -| n_updates | 219320 | -| policy_gradient_loss | 0.00639 | -| std | 0.00644 | -| value_loss | 1.06e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21934 | -| time_elapsed | 118545 | -| total_timesteps | 2807552 | -| train/ | | -| approx_kl | 0.06677338 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00675 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 219330 | -| policy_gradient_loss | 0.0141 | -| std | 0.00643 | -| value_loss | 1.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21935 | -| time_elapsed | 118550 | -| total_timesteps | 2807680 | -| train/ | | -| approx_kl | 0.00955633 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 219340 | -| policy_gradient_loss | 0.00284 | -| std | 0.00643 | -| value_loss | 7.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21936 | -| time_elapsed | 118554 | -| total_timesteps | 2807808 | -| train/ | | -| approx_kl | 0.06707955 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | -0.00304 | -| n_updates | 219350 | -| policy_gradient_loss | -0.00626 | -| std | 0.00643 | -| value_loss | 6.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 21937 | -| time_elapsed | 118559 | -| total_timesteps | 2807936 | -| train/ | | -| approx_kl | 0.015168809 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.00484 | -| n_updates | 219360 | -| policy_gradient_loss | 0.0116 | -| std | 0.00643 | -| value_loss | 3.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21938 | -| time_elapsed | 118565 | -| total_timesteps | 2808064 | -| train/ | | -| approx_kl | 0.0030146735 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | -0.00862 | -| n_updates | 219370 | -| policy_gradient_loss | 0.00764 | -| std | 0.00643 | -| value_loss | 2.87e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21939 | -| time_elapsed | 118572 | -| total_timesteps | 2808192 | -| train/ | | -| approx_kl | 0.042693477 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 219380 | -| policy_gradient_loss | 0.0814 | -| std | 0.00643 | -| value_loss | 0.013 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21940 | -| time_elapsed | 118576 | -| total_timesteps | 2808320 | -| train/ | | -| approx_kl | 0.012373799 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | 0.0039 | -| n_updates | 219390 | -| policy_gradient_loss | 0.0321 | -| std | 0.00643 | -| value_loss | 3.95e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21941 | -| time_elapsed | 118581 | -| total_timesteps | 2808448 | -| train/ | | -| approx_kl | 0.5480708 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | 0.22 | -| n_updates | 219400 | -| policy_gradient_loss | 0.0662 | -| std | 0.00643 | -| value_loss | 1.07e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21942 | -| time_elapsed | 118586 | -| total_timesteps | 2808576 | -| train/ | | -| approx_kl | 0.010339048 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00705 | -| n_updates | 219410 | -| policy_gradient_loss | 0.00562 | -| std | 0.00643 | -| value_loss | 6.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21943 | -| time_elapsed | 118592 | -| total_timesteps | 2808704 | -| train/ | | -| approx_kl | 0.061220318 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 219420 | -| policy_gradient_loss | 0.0152 | -| std | 0.00643 | -| value_loss | 3.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21944 | -| time_elapsed | 118597 | -| total_timesteps | 2808832 | -| train/ | | -| approx_kl | 0.038566798 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 219430 | -| policy_gradient_loss | 0.00882 | -| std | 0.00643 | -| value_loss | 2.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 21945 | -| time_elapsed | 118602 | -| total_timesteps | 2808960 | -| train/ | | -| approx_kl | 0.007656244 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 219440 | -| policy_gradient_loss | 0.00473 | -| std | 0.00643 | -| value_loss | 1.66e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21946 | -| time_elapsed | 118607 | -| total_timesteps | 2809088 | -| train/ | | -| approx_kl | 0.3868728 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 219450 | -| policy_gradient_loss | 0.0569 | -| std | 0.00642 | -| value_loss | 0.000423 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21947 | -| time_elapsed | 118617 | -| total_timesteps | 2809216 | -| train/ | | -| approx_kl | 0.08791756 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.855 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 219460 | -| policy_gradient_loss | 0.0143 | -| std | 0.00641 | -| value_loss | 0.00225 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21948 | -| time_elapsed | 118621 | -| total_timesteps | 2809344 | -| train/ | | -| approx_kl | 0.034551 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.77 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 219470 | -| policy_gradient_loss | -0.000202 | -| std | 0.00641 | -| value_loss | 2.39e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21949 | -| time_elapsed | 118627 | -| total_timesteps | 2809472 | -| train/ | | -| approx_kl | 0.06694873 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -9.53 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 219480 | -| policy_gradient_loss | 0.00699 | -| std | 0.00641 | -| value_loss | 6.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21950 | -| time_elapsed | 118631 | -| total_timesteps | 2809600 | -| train/ | | -| approx_kl | 0.041084573 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -156 | -| learning_rate | 0.0003 | -| loss | 0.00741 | -| n_updates | 219490 | -| policy_gradient_loss | 0.00392 | -| std | 0.00641 | -| value_loss | 6.54e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21951 | -| time_elapsed | 118636 | -| total_timesteps | 2809728 | -| train/ | | -| approx_kl | 0.008548228 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.573 | -| learning_rate | 0.0003 | -| loss | 0.000242 | -| n_updates | 219500 | -| policy_gradient_loss | 0.00701 | -| std | 0.00641 | -| value_loss | 7.43e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21952 | -| time_elapsed | 118640 | -| total_timesteps | 2809856 | -| train/ | | -| approx_kl | 0.06783668 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 219510 | -| policy_gradient_loss | 0.017 | -| std | 0.00641 | -| value_loss | 5.12e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 21953 | -| time_elapsed | 118644 | -| total_timesteps | 2809984 | -| train/ | | -| approx_kl | 0.011802037 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | 0.000396 | -| n_updates | 219520 | -| policy_gradient_loss | 0.00599 | -| std | 0.00641 | -| value_loss | 3.15e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21954 | -| time_elapsed | 118648 | -| total_timesteps | 2810112 | -| train/ | | -| approx_kl | 0.062187742 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | 0.0482 | -| n_updates | 219530 | -| policy_gradient_loss | 0.0204 | -| std | 0.00641 | -| value_loss | 1.84e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21955 | -| time_elapsed | 118658 | -| total_timesteps | 2810240 | -| train/ | | -| approx_kl | 0.011353726 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.0227 | -| n_updates | 219540 | -| policy_gradient_loss | -0.0076 | -| std | 0.00641 | -| value_loss | 0.000481 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21956 | -| time_elapsed | 118663 | -| total_timesteps | 2810368 | -| train/ | | -| approx_kl | 0.10463621 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 219550 | -| policy_gradient_loss | 0.011 | -| std | 0.00641 | -| value_loss | 3.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21957 | -| time_elapsed | 118667 | -| total_timesteps | 2810496 | -| train/ | | -| approx_kl | 0.22748539 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00176 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 219560 | -| policy_gradient_loss | 0.0393 | -| std | 0.00641 | -| value_loss | 2.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21958 | -| time_elapsed | 118672 | -| total_timesteps | 2810624 | -| train/ | | -| approx_kl | 0.15497985 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.0606 | -| n_updates | 219570 | -| policy_gradient_loss | 0.0186 | -| std | 0.00641 | -| value_loss | 1.83e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21959 | -| time_elapsed | 118677 | -| total_timesteps | 2810752 | -| train/ | | -| approx_kl | 0.025301307 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 219580 | -| policy_gradient_loss | 0.0305 | -| std | 0.00641 | -| value_loss | 1.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21960 | -| time_elapsed | 118681 | -| total_timesteps | 2810880 | -| train/ | | -| approx_kl | 0.29971468 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.223 | -| n_updates | 219590 | -| policy_gradient_loss | 0.156 | -| std | 0.00641 | -| value_loss | 1.24e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21961 | -| time_elapsed | 118685 | -| total_timesteps | 2811008 | -| train/ | | -| approx_kl | 0.14998674 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 219600 | -| policy_gradient_loss | 0.102 | -| std | 0.00641 | -| value_loss | 8.49e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21962 | -| time_elapsed | 118696 | -| total_timesteps | 2811136 | -| train/ | | -| approx_kl | 0.12335892 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.895 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 219610 | -| policy_gradient_loss | 0.0588 | -| std | 0.00641 | -| value_loss | 0.00187 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21963 | -| time_elapsed | 118702 | -| total_timesteps | 2811264 | -| train/ | | -| approx_kl | 0.13595095 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.44 | -| learning_rate | 0.0003 | -| loss | 0.0827 | -| n_updates | 219620 | -| policy_gradient_loss | 0.0741 | -| std | 0.00641 | -| value_loss | 2.93e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21964 | -| time_elapsed | 118707 | -| total_timesteps | 2811392 | -| train/ | | -| approx_kl | 0.030072918 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0116 | -| learning_rate | 0.0003 | -| loss | -0.00417 | -| n_updates | 219630 | -| policy_gradient_loss | 0.0267 | -| std | 0.00641 | -| value_loss | 1.25e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21965 | -| time_elapsed | 118713 | -| total_timesteps | 2811520 | -| train/ | | -| approx_kl | 0.20199104 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0105 | -| learning_rate | 0.0003 | -| loss | 0.083 | -| n_updates | 219640 | -| policy_gradient_loss | 0.0255 | -| std | 0.00641 | -| value_loss | 5.53e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21966 | -| time_elapsed | 118716 | -| total_timesteps | 2811648 | -| train/ | | -| approx_kl | 0.01916865 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.00293 | -| n_updates | 219650 | -| policy_gradient_loss | 0.0212 | -| std | 0.00641 | -| value_loss | 3.89e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21967 | -| time_elapsed | 118721 | -| total_timesteps | 2811776 | -| train/ | | -| approx_kl | 0.43102098 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 219660 | -| policy_gradient_loss | 0.187 | -| std | 0.00644 | -| value_loss | 2.33e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 21968 | -| time_elapsed | 118724 | -| total_timesteps | 2811904 | -| train/ | | -| approx_kl | 0.18203641 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.87 | -| learning_rate | 0.0003 | -| loss | 0.0791 | -| n_updates | 219670 | -| policy_gradient_loss | 0.104 | -| std | 0.00645 | -| value_loss | 1.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21969 | -| time_elapsed | 118728 | -| total_timesteps | 2812032 | -| train/ | | -| approx_kl | 0.030286174 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00637 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 219680 | -| policy_gradient_loss | 0.0216 | -| std | 0.00645 | -| value_loss | 3.34e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21970 | -| time_elapsed | 118738 | -| total_timesteps | 2812160 | -| train/ | | -| approx_kl | 0.13947427 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 219690 | -| policy_gradient_loss | 5.18e-05 | -| std | 0.00645 | -| value_loss | 0.00118 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21971 | -| time_elapsed | 118743 | -| total_timesteps | 2812288 | -| train/ | | -| approx_kl | 0.026910305 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.00592 | -| n_updates | 219700 | -| policy_gradient_loss | 0.0237 | -| std | 0.00645 | -| value_loss | 7.48e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21972 | -| time_elapsed | 118747 | -| total_timesteps | 2812416 | -| train/ | | -| approx_kl | 0.41417697 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.261 | -| n_updates | 219710 | -| policy_gradient_loss | 0.183 | -| std | 0.00645 | -| value_loss | 1.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21973 | -| time_elapsed | 118751 | -| total_timesteps | 2812544 | -| train/ | | -| approx_kl | 0.046209246 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00283 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 219720 | -| policy_gradient_loss | 0.0208 | -| std | 0.00645 | -| value_loss | 9.41e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21974 | -| time_elapsed | 118754 | -| total_timesteps | 2812672 | -| train/ | | -| approx_kl | 0.1959212 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0707 | -| n_updates | 219730 | -| policy_gradient_loss | 0.0223 | -| std | 0.00645 | -| value_loss | 6.15e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21975 | -| time_elapsed | 118758 | -| total_timesteps | 2812800 | -| train/ | | -| approx_kl | 0.02220545 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 219740 | -| policy_gradient_loss | 0.0324 | -| std | 0.00645 | -| value_loss | 2.91e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 21976 | -| time_elapsed | 118765 | -| total_timesteps | 2812928 | -| train/ | | -| approx_kl | 0.1533351 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0757 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 219750 | -| policy_gradient_loss | 0.0535 | -| std | 0.00646 | -| value_loss | 1.83e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21977 | -| time_elapsed | 118770 | -| total_timesteps | 2813056 | -| train/ | | -| approx_kl | 0.00014508143 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0693 | -| learning_rate | 0.0003 | -| loss | -0.000624 | -| n_updates | 219760 | -| policy_gradient_loss | 0.0216 | -| std | 0.00647 | -| value_loss | 2.73e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21978 | -| time_elapsed | 118781 | -| total_timesteps | 2813184 | -| train/ | | -| approx_kl | 0.02814636 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.478 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 219770 | -| policy_gradient_loss | -0.0144 | -| std | 0.00648 | -| value_loss | 0.00256 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21979 | -| time_elapsed | 118787 | -| total_timesteps | 2813312 | -| train/ | | -| approx_kl | 0.0031290385 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.99 | -| learning_rate | 0.0003 | -| loss | -0.00494 | -| n_updates | 219780 | -| policy_gradient_loss | 0.0025 | -| std | 0.00648 | -| value_loss | 1.12e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21980 | -| time_elapsed | 118793 | -| total_timesteps | 2813440 | -| train/ | | -| approx_kl | 7.150229e-06 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -26.5 | -| learning_rate | 0.0003 | -| loss | 5.14e-05 | -| n_updates | 219790 | -| policy_gradient_loss | 0.00747 | -| std | 0.00648 | -| value_loss | 1.91e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21981 | -| time_elapsed | 118799 | -| total_timesteps | 2813568 | -| train/ | | -| approx_kl | 0.06638466 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -1.34 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 219800 | -| policy_gradient_loss | 0.0592 | -| std | 0.00648 | -| value_loss | 1.4e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21982 | -| time_elapsed | 118804 | -| total_timesteps | 2813696 | -| train/ | | -| approx_kl | 0.13412474 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.174 | -| learning_rate | 0.0003 | -| loss | 0.0944 | -| n_updates | 219810 | -| policy_gradient_loss | 0.0425 | -| std | 0.00648 | -| value_loss | 3.07e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21983 | -| time_elapsed | 118809 | -| total_timesteps | 2813824 | -| train/ | | -| approx_kl | 0.057284094 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 219820 | -| policy_gradient_loss | 0.0112 | -| std | 0.00648 | -| value_loss | 3.51e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 21984 | -| time_elapsed | 118813 | -| total_timesteps | 2813952 | -| train/ | | -| approx_kl | 0.0017941655 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 219830 | -| policy_gradient_loss | 0.0974 | -| std | 0.00648 | -| value_loss | 1.68e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21985 | -| time_elapsed | 118817 | -| total_timesteps | 2814080 | -| train/ | | -| approx_kl | 0.026697949 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 219840 | -| policy_gradient_loss | 0.0409 | -| std | 0.00648 | -| value_loss | 1.52e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21986 | -| time_elapsed | 118825 | -| total_timesteps | 2814208 | -| train/ | | -| approx_kl | 0.13431342 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.832 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 219850 | -| policy_gradient_loss | 0.0033 | -| std | 0.00648 | -| value_loss | 0.000645 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21987 | -| time_elapsed | 118830 | -| total_timesteps | 2814336 | -| train/ | | -| approx_kl | 0.0020558294 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.457 | -| learning_rate | 0.0003 | -| loss | -0.00461 | -| n_updates | 219860 | -| policy_gradient_loss | 0.0939 | -| std | 0.00648 | -| value_loss | 2.11e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21988 | -| time_elapsed | 118835 | -| total_timesteps | 2814464 | -| train/ | | -| approx_kl | 0.029084258 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00703 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 219870 | -| policy_gradient_loss | 0.0428 | -| std | 0.00649 | -| value_loss | 9.33e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21989 | -| time_elapsed | 118840 | -| total_timesteps | 2814592 | -| train/ | | -| approx_kl | 0.33866626 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 219880 | -| policy_gradient_loss | 0.128 | -| std | 0.00649 | -| value_loss | 6.91e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21990 | -| time_elapsed | 118845 | -| total_timesteps | 2814720 | -| train/ | | -| approx_kl | 0.18527459 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 219890 | -| policy_gradient_loss | 0.105 | -| std | 0.00649 | -| value_loss | 6.38e-09 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21991 | -| time_elapsed | 118848 | -| total_timesteps | 2814848 | -| train/ | | -| approx_kl | 0.132534 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.074 | -| n_updates | 219900 | -| policy_gradient_loss | 0.115 | -| std | 0.00649 | -| value_loss | 3.54e-09 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 21992 | -| time_elapsed | 118852 | -| total_timesteps | 2814976 | -| train/ | | -| approx_kl | 0.13948233 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.1 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 219910 | -| policy_gradient_loss | 0.112 | -| std | 0.0065 | -| value_loss | 2.37e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21993 | -| time_elapsed | 118858 | -| total_timesteps | 2815104 | -| train/ | | -| approx_kl | 0.026323091 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.00275 | -| n_updates | 219920 | -| policy_gradient_loss | 0.0236 | -| std | 0.0065 | -| value_loss | 1.91e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21994 | -| time_elapsed | 118869 | -| total_timesteps | 2815232 | -| train/ | | -| approx_kl | 0.24200575 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -5.75 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 219930 | -| policy_gradient_loss | -0.00117 | -| std | 0.0065 | -| value_loss | 0.0038 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21995 | -| time_elapsed | 118876 | -| total_timesteps | 2815360 | -| train/ | | -| approx_kl | 0.044658512 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 219940 | -| policy_gradient_loss | 0.0132 | -| std | 0.0065 | -| value_loss | 4.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21996 | -| time_elapsed | 118880 | -| total_timesteps | 2815488 | -| train/ | | -| approx_kl | 0.11098438 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00915 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 219950 | -| policy_gradient_loss | 0.0168 | -| std | 0.0065 | -| value_loss | 6.12e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21997 | -| time_elapsed | 118884 | -| total_timesteps | 2815616 | -| train/ | | -| approx_kl | 0.36231828 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 219960 | -| policy_gradient_loss | 0.158 | -| std | 0.0065 | -| value_loss | 3.93e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21998 | -| time_elapsed | 118889 | -| total_timesteps | 2815744 | -| train/ | | -| approx_kl | 0.18917617 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0932 | -| n_updates | 219970 | -| policy_gradient_loss | 0.103 | -| std | 0.0065 | -| value_loss | 2.18e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 21999 | -| time_elapsed | 118895 | -| total_timesteps | 2815872 | -| train/ | | -| approx_kl | 0.039176963 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 219980 | -| policy_gradient_loss | 0.0319 | -| std | 0.0065 | -| value_loss | 1.57e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22000 | -| time_elapsed | 118900 | -| total_timesteps | 2816000 | -| train/ | | -| approx_kl | 0.2437517 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 219990 | -| policy_gradient_loss | 0.0206 | -| std | 0.0065 | -| value_loss | 8.28e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22001 | -| time_elapsed | 118905 | -| total_timesteps | 2816128 | -| train/ | | -| approx_kl | 0.022255685 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00686 | -| learning_rate | 0.0003 | -| loss | -0.00652 | -| n_updates | 220000 | -| policy_gradient_loss | 0.0251 | -| std | 0.0065 | -| value_loss | 4.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22002 | -| time_elapsed | 118915 | -| total_timesteps | 2816256 | -| train/ | | -| approx_kl | 0.002478132 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.78 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 220010 | -| policy_gradient_loss | 0.0337 | -| std | 0.0065 | -| value_loss | 0.00564 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22003 | -| time_elapsed | 118920 | -| total_timesteps | 2816384 | -| train/ | | -| approx_kl | 0.14121193 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | 0.0934 | -| n_updates | 220020 | -| policy_gradient_loss | 0.262 | -| std | 0.0065 | -| value_loss | 6.54e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22004 | -| time_elapsed | 118925 | -| total_timesteps | 2816512 | -| train/ | | -| approx_kl | 0.08021443 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 220030 | -| policy_gradient_loss | 0.0274 | -| std | 0.0065 | -| value_loss | 1.68e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22005 | -| time_elapsed | 118930 | -| total_timesteps | 2816640 | -| train/ | | -| approx_kl | 0.0009661899 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00029 | -| n_updates | 220040 | -| policy_gradient_loss | 0.0225 | -| std | 0.00649 | -| value_loss | 8.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22006 | -| time_elapsed | 118933 | -| total_timesteps | 2816768 | -| train/ | | -| approx_kl | 0.09731305 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0348 | -| n_updates | 220050 | -| policy_gradient_loss | 0.0396 | -| std | 0.00648 | -| value_loss | 5.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22007 | -| time_elapsed | 118937 | -| total_timesteps | 2816896 | -| train/ | | -| approx_kl | 0.13598543 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 220060 | -| policy_gradient_loss | 0.0241 | -| std | 0.00648 | -| value_loss | 1.81e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22008 | -| time_elapsed | 118942 | -| total_timesteps | 2817024 | -| train/ | | -| approx_kl | 0.00057862373 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 220070 | -| policy_gradient_loss | 0.02 | -| std | 0.00647 | -| value_loss | 8.45e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22009 | -| time_elapsed | 118953 | -| total_timesteps | 2817152 | -| train/ | | -| approx_kl | 0.5634042 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | 0.0802 | -| n_updates | 220080 | -| policy_gradient_loss | 0.0266 | -| std | 0.00647 | -| value_loss | 0.0032 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22010 | -| time_elapsed | 118957 | -| total_timesteps | 2817280 | -| train/ | | -| approx_kl | 0.013027625 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 220090 | -| policy_gradient_loss | 0.00728 | -| std | 0.00647 | -| value_loss | 1.63e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22011 | -| time_elapsed | 118961 | -| total_timesteps | 2817408 | -| train/ | | -| approx_kl | 0.00040566316 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.00243 | -| n_updates | 220100 | -| policy_gradient_loss | 0.00526 | -| std | 0.00647 | -| value_loss | 5.67e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22012 | -| time_elapsed | 118966 | -| total_timesteps | 2817536 | -| train/ | | -| approx_kl | 0.060883466 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.083 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 220110 | -| policy_gradient_loss | 0.0155 | -| std | 0.00647 | -| value_loss | 4.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22013 | -| time_elapsed | 118970 | -| total_timesteps | 2817664 | -| train/ | | -| approx_kl | 0.009377746 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | -0.00419 | -| n_updates | 220120 | -| policy_gradient_loss | 0.00749 | -| std | 0.00647 | -| value_loss | 2.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22014 | -| time_elapsed | 118975 | -| total_timesteps | 2817792 | -| train/ | | -| approx_kl | 0.06469344 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.0331 | -| n_updates | 220130 | -| policy_gradient_loss | 0.013 | -| std | 0.00647 | -| value_loss | 1.86e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22015 | -| time_elapsed | 118978 | -| total_timesteps | 2817920 | -| train/ | | -| approx_kl | 0.00928829 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 220140 | -| policy_gradient_loss | 0.00348 | -| std | 0.00647 | -| value_loss | 1.3e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22016 | -| time_elapsed | 118982 | -| total_timesteps | 2818048 | -| train/ | | -| approx_kl | 0.06379541 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 220150 | -| policy_gradient_loss | 0.00426 | -| std | 0.00647 | -| value_loss | 1.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22017 | -| time_elapsed | 118990 | -| total_timesteps | 2818176 | -| train/ | | -| approx_kl | 0.04003585 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | 0.00661 | -| n_updates | 220160 | -| policy_gradient_loss | 0.00366 | -| std | 0.00647 | -| value_loss | 0.00198 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22018 | -| time_elapsed | 118995 | -| total_timesteps | 2818304 | -| train/ | | -| approx_kl | 0.004186568 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 220170 | -| policy_gradient_loss | 0.00771 | -| std | 0.00646 | -| value_loss | 1.04e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22019 | -| time_elapsed | 119000 | -| total_timesteps | 2818432 | -| train/ | | -| approx_kl | 5.7655852e-05 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0118 | -| learning_rate | 0.0003 | -| loss | 0.000129 | -| n_updates | 220180 | -| policy_gradient_loss | 0.0312 | -| std | 0.00647 | -| value_loss | 1.54e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22020 | -| time_elapsed | 119004 | -| total_timesteps | 2818560 | -| train/ | | -| approx_kl | 0.17939997 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.096 | -| n_updates | 220190 | -| policy_gradient_loss | 0.052 | -| std | 0.00647 | -| value_loss | 8.64e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22021 | -| time_elapsed | 119008 | -| total_timesteps | 2818688 | -| train/ | | -| approx_kl | 0.04517839 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 220200 | -| policy_gradient_loss | 0.0463 | -| std | 0.00647 | -| value_loss | 3.72e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22022 | -| time_elapsed | 119013 | -| total_timesteps | 2818816 | -| train/ | | -| approx_kl | 0.8943127 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0962 | -| learning_rate | 0.0003 | -| loss | 0.353 | -| n_updates | 220210 | -| policy_gradient_loss | 0.193 | -| std | 0.00647 | -| value_loss | 2.14e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 22023 | -| time_elapsed | 119016 | -| total_timesteps | 2818944 | -| train/ | | -| approx_kl | 0.03662263 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 220220 | -| policy_gradient_loss | -0.0154 | -| std | 0.00647 | -| value_loss | 1.59e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22024 | -| time_elapsed | 119019 | -| total_timesteps | 2819072 | -| train/ | | -| approx_kl | 0.015962282 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.00529 | -| n_updates | 220230 | -| policy_gradient_loss | 0.00205 | -| std | 0.00645 | -| value_loss | 9.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22025 | -| time_elapsed | 119029 | -| total_timesteps | 2819200 | -| train/ | | -| approx_kl | 0.010263449 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.701 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 220240 | -| policy_gradient_loss | 0.0217 | -| std | 0.00644 | -| value_loss | 0.00213 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22026 | -| time_elapsed | 119034 | -| total_timesteps | 2819328 | -| train/ | | -| approx_kl | 0.21839057 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 220250 | -| policy_gradient_loss | 0.114 | -| std | 0.00643 | -| value_loss | 2.21e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22027 | -| time_elapsed | 119039 | -| total_timesteps | 2819456 | -| train/ | | -| approx_kl | 0.17157422 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00479 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 220260 | -| policy_gradient_loss | 0.121 | -| std | 0.00643 | -| value_loss | 4.43e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22028 | -| time_elapsed | 119044 | -| total_timesteps | 2819584 | -| train/ | | -| approx_kl | 0.03314212 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00795 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 220270 | -| policy_gradient_loss | 0.0269 | -| std | 0.00643 | -| value_loss | 2.51e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22029 | -| time_elapsed | 119049 | -| total_timesteps | 2819712 | -| train/ | | -| approx_kl | 0.13686989 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0573 | -| n_updates | 220280 | -| policy_gradient_loss | 0.0147 | -| std | 0.00643 | -| value_loss | 1.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22030 | -| time_elapsed | 119055 | -| total_timesteps | 2819840 | -| train/ | | -| approx_kl | 0.015926162 | -| clip_fraction | 0.11 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 220290 | -| policy_gradient_loss | 0.00233 | -| std | 0.00642 | -| value_loss | 9.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 22031 | -| time_elapsed | 119060 | -| total_timesteps | 2819968 | -| train/ | | -| approx_kl | 0.02211684 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | -0.000345 | -| n_updates | 220300 | -| policy_gradient_loss | 0.0196 | -| std | 0.00641 | -| value_loss | 5.32e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22032 | -| time_elapsed | 119065 | -| total_timesteps | 2820096 | -| train/ | | -| approx_kl | 0.32770652 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.195 | -| n_updates | 220310 | -| policy_gradient_loss | 0.147 | -| std | 0.0064 | -| value_loss | 1.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22033 | -| time_elapsed | 119077 | -| total_timesteps | 2820224 | -| train/ | | -| approx_kl | 0.043673016 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 220320 | -| policy_gradient_loss | 0.0082 | -| std | 0.0064 | -| value_loss | 6.06e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22034 | -| time_elapsed | 119081 | -| total_timesteps | 2820352 | -| train/ | | -| approx_kl | 0.0004493571 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.00218 | -| n_updates | 220330 | -| policy_gradient_loss | 0.0234 | -| std | 0.0064 | -| value_loss | 6.2e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22035 | -| time_elapsed | 119085 | -| total_timesteps | 2820480 | -| train/ | | -| approx_kl | 0.00097517297 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | -0.000705 | -| n_updates | 220340 | -| policy_gradient_loss | 0.0369 | -| std | 0.0064 | -| value_loss | 3.11e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22036 | -| time_elapsed | 119089 | -| total_timesteps | 2820608 | -| train/ | | -| approx_kl | 0.52714723 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 220350 | -| policy_gradient_loss | 0.0562 | -| std | 0.00639 | -| value_loss | 5.22e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22037 | -| time_elapsed | 119093 | -| total_timesteps | 2820736 | -| train/ | | -| approx_kl | 1.7695129e-07 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 9.36e-05 | -| n_updates | 220360 | -| policy_gradient_loss | -0.00482 | -| std | 0.00639 | -| value_loss | 4.02e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22038 | -| time_elapsed | 119099 | -| total_timesteps | 2820864 | -| train/ | | -| approx_kl | 0.0081011895 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | -0.00955 | -| n_updates | 220370 | -| policy_gradient_loss | 0.00574 | -| std | 0.00639 | -| value_loss | 2.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22039 | -| time_elapsed | 119103 | -| total_timesteps | 2820992 | -| train/ | | -| approx_kl | 0.039851263 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.361 | -| learning_rate | 0.0003 | -| loss | 0.039 | -| n_updates | 220380 | -| policy_gradient_loss | 0.1 | -| std | 0.00639 | -| value_loss | 4.61e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22040 | -| time_elapsed | 119106 | -| total_timesteps | 2821120 | -| train/ | | -| approx_kl | 0.10493134 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.077 | -| n_updates | 220390 | -| policy_gradient_loss | 0.13 | -| std | 0.00639 | -| value_loss | 2.59e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22041 | -| time_elapsed | 119117 | -| total_timesteps | 2821248 | -| train/ | | -| approx_kl | 0.0062050805 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 220400 | -| policy_gradient_loss | 0.0229 | -| std | 0.00639 | -| value_loss | 0.00118 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22042 | -| time_elapsed | 119122 | -| total_timesteps | 2821376 | -| train/ | | -| approx_kl | 0.22598532 | -| clip_fraction | 0.496 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 220410 | -| policy_gradient_loss | 0.0691 | -| std | 0.00639 | -| value_loss | 2.4e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22043 | -| time_elapsed | 119126 | -| total_timesteps | 2821504 | -| train/ | | -| approx_kl | 0.046838846 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0122 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 220420 | -| policy_gradient_loss | 0.0187 | -| std | 0.00639 | -| value_loss | 6.87e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22044 | -| time_elapsed | 119132 | -| total_timesteps | 2821632 | -| train/ | | -| approx_kl | 0.12018188 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0109 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 220430 | -| policy_gradient_loss | 0.0646 | -| std | 0.00639 | -| value_loss | 3.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22045 | -| time_elapsed | 119138 | -| total_timesteps | 2821760 | -| train/ | | -| approx_kl | 0.036901705 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 220440 | -| policy_gradient_loss | 0.0369 | -| std | 0.00639 | -| value_loss | 2.58e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22046 | -| time_elapsed | 119142 | -| total_timesteps | 2821888 | -| train/ | | -| approx_kl | 0.839897 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.29 | -| n_updates | 220450 | -| policy_gradient_loss | 0.163 | -| std | 0.00639 | -| value_loss | 1.38e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22047 | -| time_elapsed | 119146 | -| total_timesteps | 2822016 | -| train/ | | -| approx_kl | 0.008611055 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 220460 | -| policy_gradient_loss | 0.0262 | -| std | 0.00639 | -| value_loss | 1.25e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22048 | -| time_elapsed | 119157 | -| total_timesteps | 2822144 | -| train/ | | -| approx_kl | 0.3393949 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 220470 | -| policy_gradient_loss | 0.0827 | -| std | 0.00638 | -| value_loss | 0.0011 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22049 | -| time_elapsed | 119161 | -| total_timesteps | 2822272 | -| train/ | | -| approx_kl | 0.17569984 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0958 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 220480 | -| policy_gradient_loss | 0.107 | -| std | 0.00638 | -| value_loss | 2.57e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22050 | -| time_elapsed | 119165 | -| total_timesteps | 2822400 | -| train/ | | -| approx_kl | 0.15740915 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.00142 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 220490 | -| policy_gradient_loss | 0.131 | -| std | 0.00638 | -| value_loss | 1.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22051 | -| time_elapsed | 119171 | -| total_timesteps | 2822528 | -| train/ | | -| approx_kl | 0.029473387 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 220500 | -| policy_gradient_loss | 0.0257 | -| std | 0.00638 | -| value_loss | 7.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22052 | -| time_elapsed | 119175 | -| total_timesteps | 2822656 | -| train/ | | -| approx_kl | 0.58253634 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 220510 | -| policy_gradient_loss | 0.0589 | -| std | 0.00638 | -| value_loss | 4.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22053 | -| time_elapsed | 119178 | -| total_timesteps | 2822784 | -| train/ | | -| approx_kl | 0.058380608 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 220520 | -| policy_gradient_loss | 0.00995 | -| std | 0.00638 | -| value_loss | 4.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22054 | -| time_elapsed | 119183 | -| total_timesteps | 2822912 | -| train/ | | -| approx_kl | 0.008368547 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 220530 | -| policy_gradient_loss | 0.00713 | -| std | 0.00638 | -| value_loss | 2.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22055 | -| time_elapsed | 119188 | -| total_timesteps | 2823040 | -| train/ | | -| approx_kl | 0.07274455 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0609 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 220540 | -| policy_gradient_loss | 0.022 | -| std | 0.00639 | -| value_loss | 1.55e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22056 | -| time_elapsed | 119198 | -| total_timesteps | 2823168 | -| train/ | | -| approx_kl | 0.006145578 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.027 | -| n_updates | 220550 | -| policy_gradient_loss | -0.0142 | -| std | 0.00639 | -| value_loss | 0.000196 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22057 | -| time_elapsed | 119204 | -| total_timesteps | 2823296 | -| train/ | | -| approx_kl | 1.4999416e-05 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.000236 | -| n_updates | 220560 | -| policy_gradient_loss | 0.0183 | -| std | 0.0064 | -| value_loss | 4.48e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22058 | -| time_elapsed | 119207 | -| total_timesteps | 2823424 | -| train/ | | -| approx_kl | 0.040942367 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 220570 | -| policy_gradient_loss | 0.0368 | -| std | 0.00641 | -| value_loss | 3.55e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22059 | -| time_elapsed | 119211 | -| total_timesteps | 2823552 | -| train/ | | -| approx_kl | 0.8096515 | -| clip_fraction | 0.758 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -21.5 | -| learning_rate | 0.0003 | -| loss | 0.0763 | -| n_updates | 220580 | -| policy_gradient_loss | 0.0396 | -| std | 0.00641 | -| value_loss | 3.8e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22060 | -| time_elapsed | 119216 | -| total_timesteps | 2823680 | -| train/ | | -| approx_kl | 0.031455956 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.371 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 220590 | -| policy_gradient_loss | 0.00631 | -| std | 0.00641 | -| value_loss | 4.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22061 | -| time_elapsed | 119220 | -| total_timesteps | 2823808 | -| train/ | | -| approx_kl | 0.016105892 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | 0.00334 | -| n_updates | 220600 | -| policy_gradient_loss | 0.000919 | -| std | 0.00641 | -| value_loss | 0.000247 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22062 | -| time_elapsed | 119225 | -| total_timesteps | 2823936 | -| train/ | | -| approx_kl | 0.014237767 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00192 | -| learning_rate | 0.0003 | -| loss | -0.00401 | -| n_updates | 220610 | -| policy_gradient_loss | -0.00246 | -| std | 0.00641 | -| value_loss | 9.51e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22063 | -| time_elapsed | 119232 | -| total_timesteps | 2824064 | -| train/ | | -| approx_kl | 0.03296276 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -50.8 | -| learning_rate | 0.0003 | -| loss | 0.00581 | -| n_updates | 220620 | -| policy_gradient_loss | 0.017 | -| std | 0.00642 | -| value_loss | 1.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22064 | -| time_elapsed | 119244 | -| total_timesteps | 2824192 | -| train/ | | -| approx_kl | 0.31671855 | -| clip_fraction | 0.701 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 220630 | -| policy_gradient_loss | 0.0463 | -| std | 0.00642 | -| value_loss | 0.00209 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22065 | -| time_elapsed | 119248 | -| total_timesteps | 2824320 | -| train/ | | -| approx_kl | 0.25859654 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.71 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 220640 | -| policy_gradient_loss | 0.181 | -| std | 0.00642 | -| value_loss | 1.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22066 | -| time_elapsed | 119254 | -| total_timesteps | 2824448 | -| train/ | | -| approx_kl | 0.039039448 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 220650 | -| policy_gradient_loss | 0.0291 | -| std | 0.00642 | -| value_loss | 1.85e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22067 | -| time_elapsed | 119260 | -| total_timesteps | 2824576 | -| train/ | | -| approx_kl | 0.6461927 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.384 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 220660 | -| policy_gradient_loss | 0.046 | -| std | 0.00642 | -| value_loss | 2.1e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22068 | -| time_elapsed | 119265 | -| total_timesteps | 2824704 | -| train/ | | -| approx_kl | 0.0119707715 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 8.16e-05 | -| n_updates | 220670 | -| policy_gradient_loss | 0.0059 | -| std | 0.00642 | -| value_loss | 1.12e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22069 | -| time_elapsed | 119272 | -| total_timesteps | 2824832 | -| train/ | | -| approx_kl | 0.0028807488 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | -0.00918 | -| n_updates | 220680 | -| policy_gradient_loss | 0.0105 | -| std | 0.00642 | -| value_loss | 8.49e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22070 | -| time_elapsed | 119277 | -| total_timesteps | 2824960 | -| train/ | | -| approx_kl | 0.10134988 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 220690 | -| policy_gradient_loss | 0.0117 | -| std | 0.00642 | -| value_loss | 5.91e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22071 | -| time_elapsed | 119282 | -| total_timesteps | 2825088 | -| train/ | | -| approx_kl | 0.119389266 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 220700 | -| policy_gradient_loss | 0.0083 | -| std | 0.00642 | -| value_loss | 4.15e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22072 | -| time_elapsed | 119291 | -| total_timesteps | 2825216 | -| train/ | | -| approx_kl | 0.042488094 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 220710 | -| policy_gradient_loss | -0.0178 | -| std | 0.00642 | -| value_loss | 0.000113 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22073 | -| time_elapsed | 119295 | -| total_timesteps | 2825344 | -| train/ | | -| approx_kl | 0.056451954 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.97 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 220720 | -| policy_gradient_loss | 0.00862 | -| std | 0.00642 | -| value_loss | 3.46e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22074 | -| time_elapsed | 119300 | -| total_timesteps | 2825472 | -| train/ | | -| approx_kl | 0.009767301 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | -0.00646 | -| n_updates | 220730 | -| policy_gradient_loss | 0.00608 | -| std | 0.00642 | -| value_loss | 1.75e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22075 | -| time_elapsed | 119305 | -| total_timesteps | 2825600 | -| train/ | | -| approx_kl | 0.06724255 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0452 | -| n_updates | 220740 | -| policy_gradient_loss | 0.0183 | -| std | 0.00642 | -| value_loss | 1.24e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22076 | -| time_elapsed | 119311 | -| total_timesteps | 2825728 | -| train/ | | -| approx_kl | 0.012785056 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | 0.00233 | -| n_updates | 220750 | -| policy_gradient_loss | 0.0068 | -| std | 0.00643 | -| value_loss | 9.23e-10 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22077 | -| time_elapsed | 119317 | -| total_timesteps | 2825856 | -| train/ | | -| approx_kl | 0.0029655113 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 220760 | -| policy_gradient_loss | 0.00996 | -| std | 0.00643 | -| value_loss | 3.87e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 22078 | -| time_elapsed | 119323 | -| total_timesteps | 2825984 | -| train/ | | -| approx_kl | 0.077307895 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0794 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 220770 | -| policy_gradient_loss | 0.011 | -| std | 0.00643 | -| value_loss | 3.69e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22079 | -| time_elapsed | 119327 | -| total_timesteps | 2826112 | -| train/ | | -| approx_kl | 0.26110572 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 220780 | -| policy_gradient_loss | 0.0439 | -| std | 0.00643 | -| value_loss | 2.46e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22080 | -| time_elapsed | 119338 | -| total_timesteps | 2826240 | -| train/ | | -| approx_kl | 0.030680213 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.753 | -| learning_rate | 0.0003 | -| loss | -0.00874 | -| n_updates | 220790 | -| policy_gradient_loss | 0.0163 | -| std | 0.00643 | -| value_loss | 0.00677 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22081 | -| time_elapsed | 119342 | -| total_timesteps | 2826368 | -| train/ | | -| approx_kl | 0.54501426 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 220800 | -| policy_gradient_loss | 0.0771 | -| std | 0.00643 | -| value_loss | 5.15e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22082 | -| time_elapsed | 119346 | -| total_timesteps | 2826496 | -| train/ | | -| approx_kl | 0.05435855 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 220810 | -| policy_gradient_loss | 0.0152 | -| std | 0.00643 | -| value_loss | 3.56e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22083 | -| time_elapsed | 119350 | -| total_timesteps | 2826624 | -| train/ | | -| approx_kl | 0.039576516 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0932 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 220820 | -| policy_gradient_loss | -0.00966 | -| std | 0.00643 | -| value_loss | 3.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22084 | -| time_elapsed | 119353 | -| total_timesteps | 2826752 | -| train/ | | -| approx_kl | 0.009834859 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.00345 | -| n_updates | 220830 | -| policy_gradient_loss | 0.0107 | -| std | 0.00642 | -| value_loss | 2.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 22085 | -| time_elapsed | 119358 | -| total_timesteps | 2826880 | -| train/ | | -| approx_kl | 0.073686495 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 220840 | -| policy_gradient_loss | 0.00369 | -| std | 0.00642 | -| value_loss | 3.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22086 | -| time_elapsed | 119363 | -| total_timesteps | 2827008 | -| train/ | | -| approx_kl | 0.047064446 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.00591 | -| n_updates | 220850 | -| policy_gradient_loss | 0.00497 | -| std | 0.00642 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22087 | -| time_elapsed | 119373 | -| total_timesteps | 2827136 | -| train/ | | -| approx_kl | 0.045040835 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.0251 | -| n_updates | 220860 | -| policy_gradient_loss | -0.0114 | -| std | 0.00642 | -| value_loss | 6.46e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22088 | -| time_elapsed | 119377 | -| total_timesteps | 2827264 | -| train/ | | -| approx_kl | 0.0008677654 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0855 | -| learning_rate | 0.0003 | -| loss | -0.000125 | -| n_updates | 220870 | -| policy_gradient_loss | 0.03 | -| std | 0.00642 | -| value_loss | 0.0012 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22089 | -| time_elapsed | 119381 | -| total_timesteps | 2827392 | -| train/ | | -| approx_kl | 0.8514774 | -| clip_fraction | 0.76 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0989 | -| learning_rate | 0.0003 | -| loss | 0.338 | -| n_updates | 220880 | -| policy_gradient_loss | 0.211 | -| std | 0.00642 | -| value_loss | 1.61e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22090 | -| time_elapsed | 119385 | -| total_timesteps | 2827520 | -| train/ | | -| approx_kl | 0.013403278 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00191 | -| learning_rate | 0.0003 | -| loss | -0.00722 | -| n_updates | 220890 | -| policy_gradient_loss | 0.0254 | -| std | 0.00642 | -| value_loss | 5.6e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22091 | -| time_elapsed | 119390 | -| total_timesteps | 2827648 | -| train/ | | -| approx_kl | 0.09113759 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0586 | -| n_updates | 220900 | -| policy_gradient_loss | 0.0284 | -| std | 0.00641 | -| value_loss | 1.07e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22092 | -| time_elapsed | 119396 | -| total_timesteps | 2827776 | -| train/ | | -| approx_kl | 0.1544731 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | 0.0805 | -| n_updates | 220910 | -| policy_gradient_loss | 0.0249 | -| std | 0.00641 | -| value_loss | 1.94e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 22093 | -| time_elapsed | 119401 | -| total_timesteps | 2827904 | -| train/ | | -| approx_kl | 0.022873692 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 220920 | -| policy_gradient_loss | 0.0199 | -| std | 0.0064 | -| value_loss | 3.47e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22094 | -| time_elapsed | 119406 | -| total_timesteps | 2828032 | -| train/ | | -| approx_kl | 0.13500986 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0472 | -| n_updates | 220930 | -| policy_gradient_loss | 0.0257 | -| std | 0.0064 | -| value_loss | 2.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22095 | -| time_elapsed | 119417 | -| total_timesteps | 2828160 | -| train/ | | -| approx_kl | 0.04349309 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.927 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 220940 | -| policy_gradient_loss | -0.0151 | -| std | 0.0064 | -| value_loss | 0.00105 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22096 | -| time_elapsed | 119423 | -| total_timesteps | 2828288 | -| train/ | | -| approx_kl | 0.2418113 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 220950 | -| policy_gradient_loss | 0.0834 | -| std | 0.0064 | -| value_loss | 6.26e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22097 | -| time_elapsed | 119426 | -| total_timesteps | 2828416 | -| train/ | | -| approx_kl | 0.20950477 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 220960 | -| policy_gradient_loss | 0.058 | -| std | 0.0064 | -| value_loss | 1.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22098 | -| time_elapsed | 119431 | -| total_timesteps | 2828544 | -| train/ | | -| approx_kl | 0.044239067 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.00274 | -| n_updates | 220970 | -| policy_gradient_loss | 0.0609 | -| std | 0.00639 | -| value_loss | 1.06e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22099 | -| time_elapsed | 119435 | -| total_timesteps | 2828672 | -| train/ | | -| approx_kl | 0.00033976277 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | 0.00092 | -| n_updates | 220980 | -| policy_gradient_loss | 0.0977 | -| std | 0.00639 | -| value_loss | 7.26e-07 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22100 | -| time_elapsed | 119439 | -| total_timesteps | 2828800 | -| train/ | | -| approx_kl | 0.135269 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 220990 | -| policy_gradient_loss | 0.178 | -| std | 0.0064 | -| value_loss | 5.44e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22101 | -| time_elapsed | 119443 | -| total_timesteps | 2828928 | -| train/ | | -| approx_kl | 0.020227911 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 221000 | -| policy_gradient_loss | 0.0275 | -| std | 0.0064 | -| value_loss | 4.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22102 | -| time_elapsed | 119447 | -| total_timesteps | 2829056 | -| train/ | | -| approx_kl | 0.018632894 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 221010 | -| policy_gradient_loss | -0.011 | -| std | 0.0064 | -| value_loss | 1.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22103 | -| time_elapsed | 119454 | -| total_timesteps | 2829184 | -| train/ | | -| approx_kl | 0.06415057 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 221020 | -| policy_gradient_loss | -0.00765 | -| std | 0.0064 | -| value_loss | 0.000686 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22104 | -| time_elapsed | 119459 | -| total_timesteps | 2829312 | -| train/ | | -| approx_kl | 0.029708175 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | 0.00569 | -| n_updates | 221030 | -| policy_gradient_loss | 0.0359 | -| std | 0.0064 | -| value_loss | 7.05e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22105 | -| time_elapsed | 119464 | -| total_timesteps | 2829440 | -| train/ | | -| approx_kl | 0.007881883 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | -0.000569 | -| n_updates | 221040 | -| policy_gradient_loss | 0.0379 | -| std | 0.0064 | -| value_loss | 4.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22106 | -| time_elapsed | 119469 | -| total_timesteps | 2829568 | -| train/ | | -| approx_kl | 0.13892697 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 221050 | -| policy_gradient_loss | 0.0108 | -| std | 0.0064 | -| value_loss | 2.79e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22107 | -| time_elapsed | 119474 | -| total_timesteps | 2829696 | -| train/ | | -| approx_kl | 0.17607534 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0501 | -| learning_rate | 0.0003 | -| loss | 0.0872 | -| n_updates | 221060 | -| policy_gradient_loss | 0.0153 | -| std | 0.0064 | -| value_loss | 1.63e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22108 | -| time_elapsed | 119479 | -| total_timesteps | 2829824 | -| train/ | | -| approx_kl | 0.036153633 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 0.0277 | -| n_updates | 221070 | -| policy_gradient_loss | 0.0216 | -| std | 0.0064 | -| value_loss | 2.93e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22109 | -| time_elapsed | 119484 | -| total_timesteps | 2829952 | -| train/ | | -| approx_kl | 0.6494425 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -4.98 | -| learning_rate | 0.0003 | -| loss | 0.068 | -| n_updates | 221080 | -| policy_gradient_loss | 0.0515 | -| std | 0.00641 | -| value_loss | 2.42e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22110 | -| time_elapsed | 119489 | -| total_timesteps | 2830080 | -| train/ | | -| approx_kl | 0.09433632 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | 0.0505 | -| n_updates | 221090 | -| policy_gradient_loss | 0.0325 | -| std | 0.00641 | -| value_loss | 4.76e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22111 | -| time_elapsed | 119498 | -| total_timesteps | 2830208 | -| train/ | | -| approx_kl | 0.022546858 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.799 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 221100 | -| policy_gradient_loss | 0.00538 | -| std | 0.00641 | -| value_loss | 0.00538 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22112 | -| time_elapsed | 119502 | -| total_timesteps | 2830336 | -| train/ | | -| approx_kl | 0.4034765 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 221110 | -| policy_gradient_loss | 0.152 | -| std | 0.00642 | -| value_loss | 3.97e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22113 | -| time_elapsed | 119505 | -| total_timesteps | 2830464 | -| train/ | | -| approx_kl | 0.074375644 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 221120 | -| policy_gradient_loss | 0.0165 | -| std | 0.00642 | -| value_loss | 8.67e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22114 | -| time_elapsed | 119509 | -| total_timesteps | 2830592 | -| train/ | | -| approx_kl | 9.166123e-05 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.000903 | -| n_updates | 221130 | -| policy_gradient_loss | 0.0289 | -| std | 0.00641 | -| value_loss | 5.27e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22115 | -| time_elapsed | 119514 | -| total_timesteps | 2830720 | -| train/ | | -| approx_kl | 0.00024225516 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.000358 | -| n_updates | 221140 | -| policy_gradient_loss | 0.0284 | -| std | 0.00641 | -| value_loss | 9.02e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22116 | -| time_elapsed | 119519 | -| total_timesteps | 2830848 | -| train/ | | -| approx_kl | 0.2112979 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.303 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 221150 | -| policy_gradient_loss | 0.0245 | -| std | 0.0064 | -| value_loss | 2.78e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22117 | -| time_elapsed | 119524 | -| total_timesteps | 2830976 | -| train/ | | -| approx_kl | 0.021024467 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 221160 | -| policy_gradient_loss | -0.00449 | -| std | 0.0064 | -| value_loss | 4.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22118 | -| time_elapsed | 119529 | -| total_timesteps | 2831104 | -| train/ | | -| approx_kl | 0.018241862 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0796 | -| learning_rate | 0.0003 | -| loss | 0.00332 | -| n_updates | 221170 | -| policy_gradient_loss | 0.0227 | -| std | 0.00639 | -| value_loss | 2.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22119 | -| time_elapsed | 119542 | -| total_timesteps | 2831232 | -| train/ | | -| approx_kl | 0.23899087 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 221180 | -| policy_gradient_loss | 0.118 | -| std | 0.00639 | -| value_loss | 0.00155 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22120 | -| time_elapsed | 119547 | -| total_timesteps | 2831360 | -| train/ | | -| approx_kl | 0.0616208 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.00835 | -| n_updates | 221190 | -| policy_gradient_loss | 0.0232 | -| std | 0.00639 | -| value_loss | 2.31e-05 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22121 | -| time_elapsed | 119553 | -| total_timesteps | 2831488 | -| train/ | | -| approx_kl | 0.543602 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0126 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 221200 | -| policy_gradient_loss | 0.0441 | -| std | 0.00639 | -| value_loss | 6.07e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22122 | -| time_elapsed | 119559 | -| total_timesteps | 2831616 | -| train/ | | -| approx_kl | 0.04495193 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 221210 | -| policy_gradient_loss | 0.0123 | -| std | 0.00639 | -| value_loss | 3.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22123 | -| time_elapsed | 119565 | -| total_timesteps | 2831744 | -| train/ | | -| approx_kl | 0.057638127 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.0319 | -| n_updates | 221220 | -| policy_gradient_loss | 0.0147 | -| std | 0.00639 | -| value_loss | 2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.982 | -| time/ | | -| fps | 23 | -| iterations | 22124 | -| time_elapsed | 119571 | -| total_timesteps | 2831872 | -| train/ | | -| approx_kl | 0.04889073 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 221230 | -| policy_gradient_loss | 0.0104 | -| std | 0.00639 | -| value_loss | 1.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22125 | -| time_elapsed | 119577 | -| total_timesteps | 2832000 | -| train/ | | -| approx_kl | 0.057305176 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 221240 | -| policy_gradient_loss | 0.0123 | -| std | 0.00639 | -| value_loss | 9.92e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22126 | -| time_elapsed | 119581 | -| total_timesteps | 2832128 | -| train/ | | -| approx_kl | 0.009269615 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00494 | -| learning_rate | 0.0003 | -| loss | 0.00273 | -| n_updates | 221250 | -| policy_gradient_loss | 0.013 | -| std | 0.00638 | -| value_loss | 4.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22127 | -| time_elapsed | 119592 | -| total_timesteps | 2832256 | -| train/ | | -| approx_kl | 0.01964513 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 221260 | -| policy_gradient_loss | -0.00562 | -| std | 0.00638 | -| value_loss | 0.00173 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22128 | -| time_elapsed | 119599 | -| total_timesteps | 2832384 | -| train/ | | -| approx_kl | 0.03472161 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.00641 | -| n_updates | 221270 | -| policy_gradient_loss | 0.00626 | -| std | 0.00638 | -| value_loss | 7.72e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22129 | -| time_elapsed | 119605 | -| total_timesteps | 2832512 | -| train/ | | -| approx_kl | 0.05106213 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 221280 | -| policy_gradient_loss | 0.00393 | -| std | 0.00638 | -| value_loss | 1.15e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22130 | -| time_elapsed | 119609 | -| total_timesteps | 2832640 | -| train/ | | -| approx_kl | 0.010246459 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.00583 | -| n_updates | 221290 | -| policy_gradient_loss | 0.00625 | -| std | 0.00638 | -| value_loss | 6.83e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22131 | -| time_elapsed | 119614 | -| total_timesteps | 2832768 | -| train/ | | -| approx_kl | 0.0029561208 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 221300 | -| policy_gradient_loss | 0.00832 | -| std | 0.00639 | -| value_loss | 1.05e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 22132 | -| time_elapsed | 119620 | -| total_timesteps | 2832896 | -| train/ | | -| approx_kl | 0.10570519 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 221310 | -| policy_gradient_loss | 0.013 | -| std | 0.00641 | -| value_loss | 3.73e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22133 | -| time_elapsed | 119626 | -| total_timesteps | 2833024 | -| train/ | | -| approx_kl | 0.010598015 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0916 | -| learning_rate | 0.0003 | -| loss | 0.00708 | -| n_updates | 221320 | -| policy_gradient_loss | 0.00843 | -| std | 0.00641 | -| value_loss | 1.78e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22134 | -| time_elapsed | 119636 | -| total_timesteps | 2833152 | -| train/ | | -| approx_kl | 0.026586894 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.372 | -| learning_rate | 0.0003 | -| loss | -0.0242 | -| n_updates | 221330 | -| policy_gradient_loss | -0.00332 | -| std | 0.0064 | -| value_loss | 0.00189 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22135 | -| time_elapsed | 119642 | -| total_timesteps | 2833280 | -| train/ | | -| approx_kl | 0.732006 | -| clip_fraction | 0.769 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.12 | -| learning_rate | 0.0003 | -| loss | 0.226 | -| n_updates | 221340 | -| policy_gradient_loss | 0.356 | -| std | 0.0064 | -| value_loss | 7.39e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22136 | -| time_elapsed | 119647 | -| total_timesteps | 2833408 | -| train/ | | -| approx_kl | 0.013153584 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -4.86 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 221350 | -| policy_gradient_loss | 0.0173 | -| std | 0.0064 | -| value_loss | 1.46e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22137 | -| time_elapsed | 119652 | -| total_timesteps | 2833536 | -| train/ | | -| approx_kl | 0.25604284 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 221360 | -| policy_gradient_loss | 0.102 | -| std | 0.0064 | -| value_loss | 1.34e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22138 | -| time_elapsed | 119657 | -| total_timesteps | 2833664 | -| train/ | | -| approx_kl | 0.042805005 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 221370 | -| policy_gradient_loss | 0.0212 | -| std | 0.0064 | -| value_loss | 1.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22139 | -| time_elapsed | 119662 | -| total_timesteps | 2833792 | -| train/ | | -| approx_kl | 0.53517205 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 221380 | -| policy_gradient_loss | 0.0608 | -| std | 0.0064 | -| value_loss | 5.92e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 22140 | -| time_elapsed | 119667 | -| total_timesteps | 2833920 | -| train/ | | -| approx_kl | 0.0111590335 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.00256 | -| n_updates | 221390 | -| policy_gradient_loss | 0.00559 | -| std | 0.0064 | -| value_loss | 1.18e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22141 | -| time_elapsed | 119671 | -| total_timesteps | 2834048 | -| train/ | | -| approx_kl | 0.0030120863 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.282 | -| learning_rate | 0.0003 | -| loss | -0.00635 | -| n_updates | 221400 | -| policy_gradient_loss | 0.00861 | -| std | 0.00639 | -| value_loss | 2.1e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22142 | -| time_elapsed | 119681 | -| total_timesteps | 2834176 | -| train/ | | -| approx_kl | 0.00155462 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 221410 | -| policy_gradient_loss | 0.00975 | -| std | 0.00639 | -| value_loss | 0.00229 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22143 | -| time_elapsed | 119685 | -| total_timesteps | 2834304 | -| train/ | | -| approx_kl | 0.1650888 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.0723 | -| n_updates | 221420 | -| policy_gradient_loss | 0.0497 | -| std | 0.00641 | -| value_loss | 0.0001 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22144 | -| time_elapsed | 119690 | -| total_timesteps | 2834432 | -| train/ | | -| approx_kl | 0.00095175626 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 221430 | -| policy_gradient_loss | 0.0255 | -| std | 0.00642 | -| value_loss | 0.000623 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22145 | -| time_elapsed | 119695 | -| total_timesteps | 2834560 | -| train/ | | -| approx_kl | 0.11397782 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -156 | -| learning_rate | 0.0003 | -| loss | -0.00011 | -| n_updates | 221440 | -| policy_gradient_loss | 0.00194 | -| std | 0.00642 | -| value_loss | 0.00122 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22146 | -| time_elapsed | 119700 | -| total_timesteps | 2834688 | -| train/ | | -| approx_kl | 0.025421096 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.466 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 221450 | -| policy_gradient_loss | 0.0317 | -| std | 0.00642 | -| value_loss | 6.02e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22147 | -| time_elapsed | 119704 | -| total_timesteps | 2834816 | -| train/ | | -| approx_kl | 0.5250919 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.587 | -| learning_rate | 0.0003 | -| loss | 0.256 | -| n_updates | 221460 | -| policy_gradient_loss | 0.163 | -| std | 0.00642 | -| value_loss | 3.83e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22148 | -| time_elapsed | 119709 | -| total_timesteps | 2834944 | -| train/ | | -| approx_kl | 0.07715331 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 221470 | -| policy_gradient_loss | 0.0175 | -| std | 0.00642 | -| value_loss | 1.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22149 | -| time_elapsed | 119715 | -| total_timesteps | 2835072 | -| train/ | | -| approx_kl | 0.14287765 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 221480 | -| policy_gradient_loss | 0.0165 | -| std | 0.00642 | -| value_loss | 1.47e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22150 | -| time_elapsed | 119724 | -| total_timesteps | 2835200 | -| train/ | | -| approx_kl | 0.025670044 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | 0.00218 | -| n_updates | 221490 | -| policy_gradient_loss | -0.00373 | -| std | 0.00642 | -| value_loss | 0.00461 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22151 | -| time_elapsed | 119730 | -| total_timesteps | 2835328 | -| train/ | | -| approx_kl | 0.013447832 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | 0.00295 | -| n_updates | 221500 | -| policy_gradient_loss | 0.0253 | -| std | 0.00642 | -| value_loss | 0.00026 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22152 | -| time_elapsed | 119735 | -| total_timesteps | 2835456 | -| train/ | | -| approx_kl | 0.32804355 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 221510 | -| policy_gradient_loss | 0.183 | -| std | 0.00642 | -| value_loss | 5.12e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22153 | -| time_elapsed | 119740 | -| total_timesteps | 2835584 | -| train/ | | -| approx_kl | 0.21925318 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00395 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 221520 | -| policy_gradient_loss | 0.162 | -| std | 0.00642 | -| value_loss | 1.44e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22154 | -| time_elapsed | 119747 | -| total_timesteps | 2835712 | -| train/ | | -| approx_kl | 0.040975552 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 221530 | -| policy_gradient_loss | 0.0303 | -| std | 0.00642 | -| value_loss | 1.17e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22155 | -| time_elapsed | 119753 | -| total_timesteps | 2835840 | -| train/ | | -| approx_kl | 0.0006329729 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.00127 | -| n_updates | 221540 | -| policy_gradient_loss | 0.0245 | -| std | 0.00642 | -| value_loss | 1.29e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22156 | -| time_elapsed | 119758 | -| total_timesteps | 2835968 | -| train/ | | -| approx_kl | 0.51250744 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 221550 | -| policy_gradient_loss | 0.0598 | -| std | 0.00641 | -| value_loss | 3.02e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22157 | -| time_elapsed | 119764 | -| total_timesteps | 2836096 | -| train/ | | -| approx_kl | 0.05315511 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 221560 | -| policy_gradient_loss | 0.0109 | -| std | 0.00641 | -| value_loss | 2.2e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22158 | -| time_elapsed | 119775 | -| total_timesteps | 2836224 | -| train/ | | -| approx_kl | 0.04572148 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.781 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 221570 | -| policy_gradient_loss | -0.0144 | -| std | 0.00641 | -| value_loss | 0.00657 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22159 | -| time_elapsed | 119781 | -| total_timesteps | 2836352 | -| train/ | | -| approx_kl | 0.00011962 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.00254 | -| n_updates | 221580 | -| policy_gradient_loss | 0.0022 | -| std | 0.00641 | -| value_loss | 3.45e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22160 | -| time_elapsed | 119785 | -| total_timesteps | 2836480 | -| train/ | | -| approx_kl | 0.007396287 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | -0.00691 | -| n_updates | 221590 | -| policy_gradient_loss | 0.00615 | -| std | 0.00641 | -| value_loss | 2.26e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22161 | -| time_elapsed | 119790 | -| total_timesteps | 2836608 | -| train/ | | -| approx_kl | 0.08067915 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.991 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 221600 | -| policy_gradient_loss | 0.0156 | -| std | 0.00642 | -| value_loss | 9.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22162 | -| time_elapsed | 119794 | -| total_timesteps | 2836736 | -| train/ | | -| approx_kl | 0.046954155 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 221610 | -| policy_gradient_loss | 0.0147 | -| std | 0.00643 | -| value_loss | 4.6e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22163 | -| time_elapsed | 119799 | -| total_timesteps | 2836864 | -| train/ | | -| approx_kl | 0.0073896255 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0658 | -| learning_rate | 0.0003 | -| loss | -0.00658 | -| n_updates | 221620 | -| policy_gradient_loss | 0.00495 | -| std | 0.00643 | -| value_loss | 2.55e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 22164 | -| time_elapsed | 119803 | -| total_timesteps | 2836992 | -| train/ | | -| approx_kl | 0.04242703 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0638 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 221630 | -| policy_gradient_loss | 0.11 | -| std | 0.00643 | -| value_loss | 1.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22165 | -| time_elapsed | 119806 | -| total_timesteps | 2837120 | -| train/ | | -| approx_kl | 0.10228063 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 221640 | -| policy_gradient_loss | 0.115 | -| std | 0.00643 | -| value_loss | 1.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22166 | -| time_elapsed | 119820 | -| total_timesteps | 2837248 | -| train/ | | -| approx_kl | 0.17109844 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -8.73 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 221650 | -| policy_gradient_loss | 0.0472 | -| std | 0.00643 | -| value_loss | 0.00511 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22167 | -| time_elapsed | 119825 | -| total_timesteps | 2837376 | -| train/ | | -| approx_kl | 0.18365571 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 221660 | -| policy_gradient_loss | 0.116 | -| std | 0.00643 | -| value_loss | 4.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22168 | -| time_elapsed | 119830 | -| total_timesteps | 2837504 | -| train/ | | -| approx_kl | 0.042268537 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 221670 | -| policy_gradient_loss | 0.0378 | -| std | 0.00643 | -| value_loss | 6.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22169 | -| time_elapsed | 119835 | -| total_timesteps | 2837632 | -| train/ | | -| approx_kl | 0.16534725 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 221680 | -| policy_gradient_loss | 0.0155 | -| std | 0.00643 | -| value_loss | 3.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22170 | -| time_elapsed | 119839 | -| total_timesteps | 2837760 | -| train/ | | -| approx_kl | 0.018726928 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | -0.000149 | -| n_updates | 221690 | -| policy_gradient_loss | 0.0343 | -| std | 0.00643 | -| value_loss | 2.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22171 | -| time_elapsed | 119845 | -| total_timesteps | 2837888 | -| train/ | | -| approx_kl | 0.09804023 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 221700 | -| policy_gradient_loss | 0.0258 | -| std | 0.00643 | -| value_loss | 1.56e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22172 | -| time_elapsed | 119850 | -| total_timesteps | 2838016 | -| train/ | | -| approx_kl | 0.6095394 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0895 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 221710 | -| policy_gradient_loss | 0.0477 | -| std | 0.00643 | -| value_loss | 3.27e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22173 | -| time_elapsed | 119862 | -| total_timesteps | 2838144 | -| train/ | | -| approx_kl | 0.010473485 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0259 | -| n_updates | 221720 | -| policy_gradient_loss | -0.00621 | -| std | 0.00643 | -| value_loss | 0.00375 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22174 | -| time_elapsed | 119867 | -| total_timesteps | 2838272 | -| train/ | | -| approx_kl | 0.16716036 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.513 | -| learning_rate | 0.0003 | -| loss | 0.0897 | -| n_updates | 221730 | -| policy_gradient_loss | 0.0437 | -| std | 0.00643 | -| value_loss | 1.6e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22175 | -| time_elapsed | 119871 | -| total_timesteps | 2838400 | -| train/ | | -| approx_kl | 0.0012848424 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00418 | -| learning_rate | 0.0003 | -| loss | 0.000675 | -| n_updates | 221740 | -| policy_gradient_loss | 0.0132 | -| std | 0.00643 | -| value_loss | 1.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22176 | -| time_elapsed | 119878 | -| total_timesteps | 2838528 | -| train/ | | -| approx_kl | 0.053421974 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0922 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 221750 | -| policy_gradient_loss | 0.0348 | -| std | 0.00643 | -| value_loss | 9.91e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22177 | -| time_elapsed | 119884 | -| total_timesteps | 2838656 | -| train/ | | -| approx_kl | 0.843072 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.292 | -| n_updates | 221760 | -| policy_gradient_loss | 0.215 | -| std | 0.00644 | -| value_loss | 8.77e-07 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22178 | -| time_elapsed | 119889 | -| total_timesteps | 2838784 | -| train/ | | -| approx_kl | 0.06518773 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 221770 | -| policy_gradient_loss | 0.00828 | -| std | 0.00644 | -| value_loss | 5.39e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22179 | -| time_elapsed | 119895 | -| total_timesteps | 2838912 | -| train/ | | -| approx_kl | 0.5536895 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | 0.249 | -| n_updates | 221780 | -| policy_gradient_loss | 0.0782 | -| std | 0.00644 | -| value_loss | 2.98e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22180 | -| time_elapsed | 119900 | -| total_timesteps | 2839040 | -| train/ | | -| approx_kl | 0.0071341777 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0733 | -| learning_rate | 0.0003 | -| loss | -0.00641 | -| n_updates | 221790 | -| policy_gradient_loss | 0.00689 | -| std | 0.00643 | -| value_loss | 2.62e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22181 | -| time_elapsed | 119911 | -| total_timesteps | 2839168 | -| train/ | | -| approx_kl | 0.0013244222 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.943 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 221800 | -| policy_gradient_loss | 0.00287 | -| std | 0.00643 | -| value_loss | 0.000621 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22182 | -| time_elapsed | 119916 | -| total_timesteps | 2839296 | -| train/ | | -| approx_kl | 0.009187607 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 221810 | -| policy_gradient_loss | 0.00336 | -| std | 0.00643 | -| value_loss | 1.3e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22183 | -| time_elapsed | 119921 | -| total_timesteps | 2839424 | -| train/ | | -| approx_kl | 0.0010774354 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00988 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 221820 | -| policy_gradient_loss | 0.00909 | -| std | 0.00643 | -| value_loss | 1.32e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22184 | -| time_elapsed | 119926 | -| total_timesteps | 2839552 | -| train/ | | -| approx_kl | 6.9160014e-06 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.000793 | -| n_updates | 221830 | -| policy_gradient_loss | -0.00364 | -| std | 0.00643 | -| value_loss | 1.18e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22185 | -| time_elapsed | 119932 | -| total_timesteps | 2839680 | -| train/ | | -| approx_kl | 0.059672207 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 221840 | -| policy_gradient_loss | 0.0124 | -| std | 0.00643 | -| value_loss | 6.58e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22186 | -| time_elapsed | 119938 | -| total_timesteps | 2839808 | -| train/ | | -| approx_kl | 0.008460475 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0775 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 221850 | -| policy_gradient_loss | 0.00717 | -| std | 0.00643 | -| value_loss | 4.69e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22187 | -| time_elapsed | 119943 | -| total_timesteps | 2839936 | -| train/ | | -| approx_kl | 0.0025332654 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | -0.00311 | -| n_updates | 221860 | -| policy_gradient_loss | 0.006 | -| std | 0.00643 | -| value_loss | 3.32e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22188 | -| time_elapsed | 119949 | -| total_timesteps | 2840064 | -| train/ | | -| approx_kl | 0.04622225 | -| clip_fraction | 0.654 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | 0.0437 | -| n_updates | 221870 | -| policy_gradient_loss | 0.136 | -| std | 0.00643 | -| value_loss | 2.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22189 | -| time_elapsed | 119959 | -| total_timesteps | 2840192 | -| train/ | | -| approx_kl | 0.017376205 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 221880 | -| policy_gradient_loss | 0.0109 | -| std | 0.00643 | -| value_loss | 0.00209 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22190 | -| time_elapsed | 119965 | -| total_timesteps | 2840320 | -| train/ | | -| approx_kl | 0.139562 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 221890 | -| policy_gradient_loss | 0.0654 | -| std | 0.00643 | -| value_loss | 8.84e-06 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22191 | -| time_elapsed | 119970 | -| total_timesteps | 2840448 | -| train/ | | -| approx_kl | 1.5401281e-05 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00995 | -| learning_rate | 0.0003 | -| loss | -3.93e-05 | -| n_updates | 221900 | -| policy_gradient_loss | 0.0156 | -| std | 0.00644 | -| value_loss | 3.2e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22192 | -| time_elapsed | 119976 | -| total_timesteps | 2840576 | -| train/ | | -| approx_kl | 0.00063849427 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | 0.00133 | -| n_updates | 221910 | -| policy_gradient_loss | 0.0152 | -| std | 0.00644 | -| value_loss | 2.97e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22193 | -| time_elapsed | 119982 | -| total_timesteps | 2840704 | -| train/ | | -| approx_kl | 0.26641512 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 221920 | -| policy_gradient_loss | 0.0419 | -| std | 0.00644 | -| value_loss | 1.35e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22194 | -| time_elapsed | 119988 | -| total_timesteps | 2840832 | -| train/ | | -| approx_kl | 0.16291276 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | 0.0676 | -| n_updates | 221930 | -| policy_gradient_loss | 0.0207 | -| std | 0.00645 | -| value_loss | 8.94e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22195 | -| time_elapsed | 119992 | -| total_timesteps | 2840960 | -| train/ | | -| approx_kl | 0.019211084 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.091 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 221940 | -| policy_gradient_loss | 0.0105 | -| std | 0.00645 | -| value_loss | 6.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22196 | -| time_elapsed | 119996 | -| total_timesteps | 2841088 | -| train/ | | -| approx_kl | 0.115020365 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0743 | -| n_updates | 221950 | -| policy_gradient_loss | 0.0356 | -| std | 0.00644 | -| value_loss | 5.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22197 | -| time_elapsed | 120009 | -| total_timesteps | 2841216 | -| train/ | | -| approx_kl | 0.025053028 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 221960 | -| policy_gradient_loss | -0.0189 | -| std | 0.00644 | -| value_loss | 0.000225 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22198 | -| time_elapsed | 120014 | -| total_timesteps | 2841344 | -| train/ | | -| approx_kl | 0.015648356 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -2.5e-06 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 221970 | -| policy_gradient_loss | -0.00283 | -| std | 0.00644 | -| value_loss | 2.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22199 | -| time_elapsed | 120019 | -| total_timesteps | 2841472 | -| train/ | | -| approx_kl | 0.028423052 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00664 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 221980 | -| policy_gradient_loss | 0.036 | -| std | 0.00644 | -| value_loss | 4.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22200 | -| time_elapsed | 120025 | -| total_timesteps | 2841600 | -| train/ | | -| approx_kl | 0.32088628 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0701 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 221990 | -| policy_gradient_loss | 0.157 | -| std | 0.00644 | -| value_loss | 4.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22201 | -| time_elapsed | 120030 | -| total_timesteps | 2841728 | -| train/ | | -| approx_kl | 0.18940106 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 222000 | -| policy_gradient_loss | 0.132 | -| std | 0.00644 | -| value_loss | 3.63e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22202 | -| time_elapsed | 120035 | -| total_timesteps | 2841856 | -| train/ | | -| approx_kl | 0.17597337 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 222010 | -| policy_gradient_loss | 0.16 | -| std | 0.00644 | -| value_loss | 3.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22203 | -| time_elapsed | 120040 | -| total_timesteps | 2841984 | -| train/ | | -| approx_kl | 0.028818931 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -0.00471 | -| n_updates | 222020 | -| policy_gradient_loss | 0.0236 | -| std | 0.00644 | -| value_loss | 2.73e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22204 | -| time_elapsed | 120046 | -| total_timesteps | 2842112 | -| train/ | | -| approx_kl | 0.00040612463 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.00057 | -| n_updates | 222030 | -| policy_gradient_loss | 0.028 | -| std | 0.00644 | -| value_loss | 1.29e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22205 | -| time_elapsed | 120055 | -| total_timesteps | 2842240 | -| train/ | | -| approx_kl | 0.4609848 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.955 | -| learning_rate | 0.0003 | -| loss | 0.179 | -| n_updates | 222040 | -| policy_gradient_loss | 0.0644 | -| std | 0.00644 | -| value_loss | 0.000634 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22206 | -| time_elapsed | 120060 | -| total_timesteps | 2842368 | -| train/ | | -| approx_kl | 0.054303497 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 222050 | -| policy_gradient_loss | 0.00568 | -| std | 0.00644 | -| value_loss | 1.52e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22207 | -| time_elapsed | 120065 | -| total_timesteps | 2842496 | -| train/ | | -| approx_kl | 0.056936733 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0068 | -| learning_rate | 0.0003 | -| loss | 0.0339 | -| n_updates | 222060 | -| policy_gradient_loss | 0.0165 | -| std | 0.00644 | -| value_loss | 2.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22208 | -| time_elapsed | 120070 | -| total_timesteps | 2842624 | -| train/ | | -| approx_kl | 0.008970059 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.0012 | -| n_updates | 222070 | -| policy_gradient_loss | 0.0067 | -| std | 0.00643 | -| value_loss | 9.99e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22209 | -| time_elapsed | 120076 | -| total_timesteps | 2842752 | -| train/ | | -| approx_kl | 0.0624382 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0753 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 222080 | -| policy_gradient_loss | 0.00917 | -| std | 0.00643 | -| value_loss | 9.12e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22210 | -| time_elapsed | 120080 | -| total_timesteps | 2842880 | -| train/ | | -| approx_kl | 0.013917242 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 222090 | -| policy_gradient_loss | 0.00652 | -| std | 0.00643 | -| value_loss | 7.36e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22211 | -| time_elapsed | 120086 | -| total_timesteps | 2843008 | -| train/ | | -| approx_kl | 0.0028588786 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 222100 | -| policy_gradient_loss | 0.00751 | -| std | 0.00643 | -| value_loss | 3.83e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22212 | -| time_elapsed | 120098 | -| total_timesteps | 2843136 | -| train/ | | -| approx_kl | 0.0092180995 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 222110 | -| policy_gradient_loss | 0.0481 | -| std | 0.00643 | -| value_loss | 0.00299 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22213 | -| time_elapsed | 120102 | -| total_timesteps | 2843264 | -| train/ | | -| approx_kl | 0.13487443 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.473 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 222120 | -| policy_gradient_loss | 0.0604 | -| std | 0.00643 | -| value_loss | 3.33e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22214 | -| time_elapsed | 120106 | -| total_timesteps | 2843392 | -| train/ | | -| approx_kl | 0.10850766 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00138 | -| learning_rate | 0.0003 | -| loss | 0.0827 | -| n_updates | 222130 | -| policy_gradient_loss | 0.0991 | -| std | 0.00643 | -| value_loss | 1.73e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22215 | -| time_elapsed | 120111 | -| total_timesteps | 2843520 | -| train/ | | -| approx_kl | 0.02963909 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 222140 | -| policy_gradient_loss | 0.0305 | -| std | 0.00643 | -| value_loss | 1.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22216 | -| time_elapsed | 120117 | -| total_timesteps | 2843648 | -| train/ | | -| approx_kl | 0.18248102 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 222150 | -| policy_gradient_loss | 0.0159 | -| std | 0.00644 | -| value_loss | 8.94e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22217 | -| time_elapsed | 120124 | -| total_timesteps | 2843776 | -| train/ | | -| approx_kl | 0.018954985 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | -0.0228 | -| n_updates | 222160 | -| policy_gradient_loss | -0.0133 | -| std | 0.00644 | -| value_loss | 6.36e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22218 | -| time_elapsed | 120131 | -| total_timesteps | 2843904 | -| train/ | | -| approx_kl | 0.027391877 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 222170 | -| policy_gradient_loss | 0.0411 | -| std | 0.00643 | -| value_loss | 4.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22219 | -| time_elapsed | 120136 | -| total_timesteps | 2844032 | -| train/ | | -| approx_kl | 0.28020382 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | 0.195 | -| n_updates | 222180 | -| policy_gradient_loss | 0.137 | -| std | 0.00643 | -| value_loss | 3.66e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22220 | -| time_elapsed | 120149 | -| total_timesteps | 2844160 | -| train/ | | -| approx_kl | 0.51056933 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | 0.0897 | -| n_updates | 222190 | -| policy_gradient_loss | 0.0808 | -| std | 0.00643 | -| value_loss | 0.000713 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22221 | -| time_elapsed | 120154 | -| total_timesteps | 2844288 | -| train/ | | -| approx_kl | 0.34017262 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0053 | -| learning_rate | 0.0003 | -| loss | 0.251 | -| n_updates | 222200 | -| policy_gradient_loss | 0.199 | -| std | 0.00643 | -| value_loss | 2.4e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22222 | -| time_elapsed | 120159 | -| total_timesteps | 2844416 | -| train/ | | -| approx_kl | 0.046491463 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 222210 | -| policy_gradient_loss | 0.0207 | -| std | 0.00644 | -| value_loss | 1.03e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22223 | -| time_elapsed | 120164 | -| total_timesteps | 2844544 | -| train/ | | -| approx_kl | 0.734506 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.238 | -| n_updates | 222220 | -| policy_gradient_loss | 0.0649 | -| std | 0.00644 | -| value_loss | 5.75e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22224 | -| time_elapsed | 120170 | -| total_timesteps | 2844672 | -| train/ | | -| approx_kl | 0.043120004 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0153 | -| n_updates | 222230 | -| policy_gradient_loss | 0.00891 | -| std | 0.00644 | -| value_loss | 4.11e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22225 | -| time_elapsed | 120175 | -| total_timesteps | 2844800 | -| train/ | | -| approx_kl | 0.0077923024 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 222240 | -| policy_gradient_loss | 0.00778 | -| std | 0.00644 | -| value_loss | 2.3e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 22226 | -| time_elapsed | 120183 | -| total_timesteps | 2844928 | -| train/ | | -| approx_kl | 0.00240093 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0702 | -| learning_rate | 0.0003 | -| loss | -0.000651 | -| n_updates | 222250 | -| policy_gradient_loss | 0.0104 | -| std | 0.00644 | -| value_loss | 1.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22227 | -| time_elapsed | 120188 | -| total_timesteps | 2845056 | -| train/ | | -| approx_kl | 0.04866776 | -| clip_fraction | 0.653 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 222260 | -| policy_gradient_loss | 0.143 | -| std | 0.00643 | -| value_loss | 3.75e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22228 | -| time_elapsed | 120197 | -| total_timesteps | 2845184 | -| train/ | | -| approx_kl | 0.18697995 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 222270 | -| policy_gradient_loss | 0.0292 | -| std | 0.00643 | -| value_loss | 0.000923 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22229 | -| time_elapsed | 120202 | -| total_timesteps | 2845312 | -| train/ | | -| approx_kl | 0.27885595 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -192 | -| learning_rate | 0.0003 | -| loss | 0.0534 | -| n_updates | 222280 | -| policy_gradient_loss | 0.0346 | -| std | 0.00644 | -| value_loss | 4.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22230 | -| time_elapsed | 120207 | -| total_timesteps | 2845440 | -| train/ | | -| approx_kl | 0.046042804 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 222290 | -| policy_gradient_loss | 0.0231 | -| std | 0.00644 | -| value_loss | 6.86e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22231 | -| time_elapsed | 120212 | -| total_timesteps | 2845568 | -| train/ | | -| approx_kl | 0.64765364 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.68 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 222300 | -| policy_gradient_loss | 0.0438 | -| std | 0.00644 | -| value_loss | 2.29e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22232 | -| time_elapsed | 120217 | -| total_timesteps | 2845696 | -| train/ | | -| approx_kl | 0.012820674 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.178 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 222310 | -| policy_gradient_loss | 0.0034 | -| std | 0.00644 | -| value_loss | 1.46e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22233 | -| time_elapsed | 120223 | -| total_timesteps | 2845824 | -| train/ | | -| approx_kl | 0.0025603427 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.00369 | -| n_updates | 222320 | -| policy_gradient_loss | 0.0104 | -| std | 0.00644 | -| value_loss | 1.08e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22234 | -| time_elapsed | 120228 | -| total_timesteps | 2845952 | -| train/ | | -| approx_kl | 0.1024522 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 222330 | -| policy_gradient_loss | 0.00685 | -| std | 0.00644 | -| value_loss | 7.09e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22235 | -| time_elapsed | 120233 | -| total_timesteps | 2846080 | -| train/ | | -| approx_kl | 0.012898258 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0589 | -| learning_rate | 0.0003 | -| loss | -0.0064 | -| n_updates | 222340 | -| policy_gradient_loss | 0.00225 | -| std | 0.00645 | -| value_loss | 4.91e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22236 | -| time_elapsed | 120241 | -| total_timesteps | 2846208 | -| train/ | | -| approx_kl | 0.15198682 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 222350 | -| policy_gradient_loss | -0.00531 | -| std | 0.00645 | -| value_loss | 0.00331 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22237 | -| time_elapsed | 120249 | -| total_timesteps | 2846336 | -| train/ | | -| approx_kl | 0.15634528 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.346 | -| learning_rate | 0.0003 | -| loss | 0.0872 | -| n_updates | 222360 | -| policy_gradient_loss | 0.0243 | -| std | 0.00645 | -| value_loss | 0.0002 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22238 | -| time_elapsed | 120254 | -| total_timesteps | 2846464 | -| train/ | | -| approx_kl | 0.026321093 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | 0.0042 | -| n_updates | 222370 | -| policy_gradient_loss | 0.0298 | -| std | 0.00645 | -| value_loss | 2.77e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22239 | -| time_elapsed | 120260 | -| total_timesteps | 2846592 | -| train/ | | -| approx_kl | 0.14004122 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0772 | -| n_updates | 222380 | -| policy_gradient_loss | 0.037 | -| std | 0.00645 | -| value_loss | 1.48e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22240 | -| time_elapsed | 120265 | -| total_timesteps | 2846720 | -| train/ | | -| approx_kl | 0.14173475 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | 0.0769 | -| n_updates | 222390 | -| policy_gradient_loss | 0.0238 | -| std | 0.00644 | -| value_loss | 9.22e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22241 | -| time_elapsed | 120270 | -| total_timesteps | 2846848 | -| train/ | | -| approx_kl | 0.0125306705 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 222400 | -| policy_gradient_loss | -0.00109 | -| std | 0.00644 | -| value_loss | 5.66e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22242 | -| time_elapsed | 120276 | -| total_timesteps | 2846976 | -| train/ | | -| approx_kl | 0.03162839 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 222410 | -| policy_gradient_loss | 0.0347 | -| std | 0.00644 | -| value_loss | 4.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22243 | -| time_elapsed | 120281 | -| total_timesteps | 2847104 | -| train/ | | -| approx_kl | 0.107597366 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0478 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 222420 | -| policy_gradient_loss | 0.0188 | -| std | 0.00644 | -| value_loss | 3.8e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22244 | -| time_elapsed | 120292 | -| total_timesteps | 2847232 | -| train/ | | -| approx_kl | 0.07119676 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 222430 | -| policy_gradient_loss | 0.00995 | -| std | 0.00643 | -| value_loss | 0.00164 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22245 | -| time_elapsed | 120296 | -| total_timesteps | 2847360 | -| train/ | | -| approx_kl | 0.6593469 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00768 | -| learning_rate | 0.0003 | -| loss | 0.209 | -| n_updates | 222440 | -| policy_gradient_loss | 0.0739 | -| std | 0.00643 | -| value_loss | 6.31e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22246 | -| time_elapsed | 120301 | -| total_timesteps | 2847488 | -| train/ | | -| approx_kl | 0.049400367 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 222450 | -| policy_gradient_loss | 0.00204 | -| std | 0.00643 | -| value_loss | 3.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22247 | -| time_elapsed | 120306 | -| total_timesteps | 2847616 | -| train/ | | -| approx_kl | 0.06551259 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.0548 | -| n_updates | 222460 | -| policy_gradient_loss | 0.0637 | -| std | 0.00646 | -| value_loss | 0.000681 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22248 | -| time_elapsed | 120311 | -| total_timesteps | 2847744 | -| train/ | | -| approx_kl | 0.031839013 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 222470 | -| policy_gradient_loss | 0.0494 | -| std | 0.00647 | -| value_loss | 0.000511 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22249 | -| time_elapsed | 120317 | -| total_timesteps | 2847872 | -| train/ | | -| approx_kl | 0.9893336 | -| clip_fraction | 0.751 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.286 | -| n_updates | 222480 | -| policy_gradient_loss | 0.237 | -| std | 0.00647 | -| value_loss | 5.56e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22250 | -| time_elapsed | 120321 | -| total_timesteps | 2848000 | -| train/ | | -| approx_kl | 0.030538332 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 222490 | -| policy_gradient_loss | -0.0121 | -| std | 0.00648 | -| value_loss | 6.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22251 | -| time_elapsed | 120327 | -| total_timesteps | 2848128 | -| train/ | | -| approx_kl | 0.020307176 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.00922 | -| n_updates | 222500 | -| policy_gradient_loss | 0.00357 | -| std | 0.00648 | -| value_loss | 0.000126 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22252 | -| time_elapsed | 120342 | -| total_timesteps | 2848256 | -| train/ | | -| approx_kl | 0.0034214482 | -| clip_fraction | 0.0859 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.579 | -| learning_rate | 0.0003 | -| loss | -0.0283 | -| n_updates | 222510 | -| policy_gradient_loss | -0.011 | -| std | 0.00648 | -| value_loss | 0.00154 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22253 | -| time_elapsed | 120347 | -| total_timesteps | 2848384 | -| train/ | | -| approx_kl | 0.08538922 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 222520 | -| policy_gradient_loss | 0.06 | -| std | 0.00648 | -| value_loss | 2.52e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22254 | -| time_elapsed | 120353 | -| total_timesteps | 2848512 | -| train/ | | -| approx_kl | 0.19714655 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0905 | -| n_updates | 222530 | -| policy_gradient_loss | 0.0441 | -| std | 0.00648 | -| value_loss | 1.43e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22255 | -| time_elapsed | 120358 | -| total_timesteps | 2848640 | -| train/ | | -| approx_kl | 0.0032248944 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.00811 | -| n_updates | 222540 | -| policy_gradient_loss | 0.00499 | -| std | 0.00648 | -| value_loss | 1.26e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22256 | -| time_elapsed | 120364 | -| total_timesteps | 2848768 | -| train/ | | -| approx_kl | 0.09648125 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.00427 | -| n_updates | 222550 | -| policy_gradient_loss | 0.0612 | -| std | 0.00648 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22257 | -| time_elapsed | 120369 | -| total_timesteps | 2848896 | -| train/ | | -| approx_kl | 0.041987862 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 222560 | -| policy_gradient_loss | 0.0314 | -| std | 0.00648 | -| value_loss | 7.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22258 | -| time_elapsed | 120374 | -| total_timesteps | 2849024 | -| train/ | | -| approx_kl | 0.0008760905 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | -0.00324 | -| n_updates | 222570 | -| policy_gradient_loss | 0.0804 | -| std | 0.00648 | -| value_loss | 2.91e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22259 | -| time_elapsed | 120386 | -| total_timesteps | 2849152 | -| train/ | | -| approx_kl | 0.13216187 | -| clip_fraction | 0.674 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.714 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 222580 | -| policy_gradient_loss | 0.143 | -| std | 0.00648 | -| value_loss | 0.00748 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22260 | -| time_elapsed | 120391 | -| total_timesteps | 2849280 | -| train/ | | -| approx_kl | 0.10729303 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.387 | -| learning_rate | 0.0003 | -| loss | 0.0427 | -| n_updates | 222590 | -| policy_gradient_loss | 0.0369 | -| std | 0.00648 | -| value_loss | 6.42e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22261 | -| time_elapsed | 120396 | -| total_timesteps | 2849408 | -| train/ | | -| approx_kl | 0.33094552 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 222600 | -| policy_gradient_loss | 0.13 | -| std | 0.00648 | -| value_loss | 6.43e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22262 | -| time_elapsed | 120400 | -| total_timesteps | 2849536 | -| train/ | | -| approx_kl | 0.2439319 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 222610 | -| policy_gradient_loss | 0.144 | -| std | 0.00648 | -| value_loss | 6.34e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22263 | -| time_elapsed | 120405 | -| total_timesteps | 2849664 | -| train/ | | -| approx_kl | 0.16107872 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 222620 | -| policy_gradient_loss | 0.119 | -| std | 0.00648 | -| value_loss | 5.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22264 | -| time_elapsed | 120410 | -| total_timesteps | 2849792 | -| train/ | | -| approx_kl | 0.12342649 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.0882 | -| n_updates | 222630 | -| policy_gradient_loss | 0.115 | -| std | 0.00648 | -| value_loss | 3.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22265 | -| time_elapsed | 120415 | -| total_timesteps | 2849920 | -| train/ | | -| approx_kl | 0.14621201 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 222640 | -| policy_gradient_loss | 0.139 | -| std | 0.00648 | -| value_loss | 1.89e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22266 | -| time_elapsed | 120421 | -| total_timesteps | 2850048 | -| train/ | | -| approx_kl | 0.028993493 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | -0.0257 | -| n_updates | 222650 | -| policy_gradient_loss | 0.0233 | -| std | 0.00648 | -| value_loss | 1.91e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22267 | -| time_elapsed | 120433 | -| total_timesteps | 2850176 | -| train/ | | -| approx_kl | 0.0389121 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.607 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 222660 | -| policy_gradient_loss | -0.000752 | -| std | 0.00648 | -| value_loss | 0.00306 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22268 | -| time_elapsed | 120438 | -| total_timesteps | 2850304 | -| train/ | | -| approx_kl | 0.00232139 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -98.4 | -| learning_rate | 0.0003 | -| loss | -0.00487 | -| n_updates | 222670 | -| policy_gradient_loss | 0.032 | -| std | 0.00648 | -| value_loss | 4.14e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22269 | -| time_elapsed | 120444 | -| total_timesteps | 2850432 | -| train/ | | -| approx_kl | 1.2373792 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.318 | -| learning_rate | 0.0003 | -| loss | 0.226 | -| n_updates | 222680 | -| policy_gradient_loss | 0.178 | -| std | 0.00649 | -| value_loss | 9.06e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22270 | -| time_elapsed | 120451 | -| total_timesteps | 2850560 | -| train/ | | -| approx_kl | 0.036966957 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.326 | -| learning_rate | 0.0003 | -| loss | 0.0188 | -| n_updates | 222690 | -| policy_gradient_loss | 0.0157 | -| std | 0.00649 | -| value_loss | 9.04e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22271 | -| time_elapsed | 120455 | -| total_timesteps | 2850688 | -| train/ | | -| approx_kl | 0.13920951 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 222700 | -| policy_gradient_loss | 0.0612 | -| std | 0.00649 | -| value_loss | 1.55e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22272 | -| time_elapsed | 120460 | -| total_timesteps | 2850816 | -| train/ | | -| approx_kl | 0.031788904 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0947 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 222710 | -| policy_gradient_loss | 0.0546 | -| std | 0.00649 | -| value_loss | 2.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22273 | -| time_elapsed | 120465 | -| total_timesteps | 2850944 | -| train/ | | -| approx_kl | 0.016474284 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 222720 | -| policy_gradient_loss | 0.012 | -| std | 0.00649 | -| value_loss | 4.16e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22274 | -| time_elapsed | 120470 | -| total_timesteps | 2851072 | -| train/ | | -| approx_kl | 0.18261214 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 222730 | -| policy_gradient_loss | 0.0102 | -| std | 0.00649 | -| value_loss | 2.91e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22275 | -| time_elapsed | 120484 | -| total_timesteps | 2851200 | -| train/ | | -| approx_kl | 0.02409672 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 222740 | -| policy_gradient_loss | 0.00713 | -| std | 0.00649 | -| value_loss | 0.00328 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22276 | -| time_elapsed | 120490 | -| total_timesteps | 2851328 | -| train/ | | -| approx_kl | 0.030656971 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.368 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 222750 | -| policy_gradient_loss | 0.0294 | -| std | 0.00648 | -| value_loss | 0.000477 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22277 | -| time_elapsed | 120496 | -| total_timesteps | 2851456 | -| train/ | | -| approx_kl | 0.000265921 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0114 | -| learning_rate | 0.0003 | -| loss | 0.000779 | -| n_updates | 222760 | -| policy_gradient_loss | 0.0281 | -| std | 0.00648 | -| value_loss | 0.000621 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22278 | -| time_elapsed | 120502 | -| total_timesteps | 2851584 | -| train/ | | -| approx_kl | 0.17558032 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.546 | -| learning_rate | 0.0003 | -| loss | 0.073 | -| n_updates | 222770 | -| policy_gradient_loss | 0.016 | -| std | 0.00647 | -| value_loss | 0.00295 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22279 | -| time_elapsed | 120509 | -| total_timesteps | 2851712 | -| train/ | | -| approx_kl | 0.014358508 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | -0.00705 | -| n_updates | 222780 | -| policy_gradient_loss | 0.0221 | -| std | 0.00647 | -| value_loss | 0.000278 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22280 | -| time_elapsed | 120518 | -| total_timesteps | 2851840 | -| train/ | | -| approx_kl | 0.10185449 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00586 | -| learning_rate | 0.0003 | -| loss | 0.0513 | -| n_updates | 222790 | -| policy_gradient_loss | 0.0271 | -| std | 0.00648 | -| value_loss | 0.000151 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22281 | -| time_elapsed | 120526 | -| total_timesteps | 2851968 | -| train/ | | -| approx_kl | 0.62576187 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | 0.0895 | -| n_updates | 222800 | -| policy_gradient_loss | 0.0377 | -| std | 0.00648 | -| value_loss | 0.000112 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22282 | -| time_elapsed | 120531 | -| total_timesteps | 2852096 | -| train/ | | -| approx_kl | 0.04140181 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 222810 | -| policy_gradient_loss | 0.00184 | -| std | 0.00648 | -| value_loss | 9.33e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22283 | -| time_elapsed | 120546 | -| total_timesteps | 2852224 | -| train/ | | -| approx_kl | 0.007199788 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.865 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 222820 | -| policy_gradient_loss | 0.00486 | -| std | 0.00648 | -| value_loss | 0.00142 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22284 | -| time_elapsed | 120554 | -| total_timesteps | 2852352 | -| train/ | | -| approx_kl | 0.04110381 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.076 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 222830 | -| policy_gradient_loss | 0.0971 | -| std | 0.00648 | -| value_loss | 4.82e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22285 | -| time_elapsed | 120562 | -| total_timesteps | 2852480 | -| train/ | | -| approx_kl | 0.009603336 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 222840 | -| policy_gradient_loss | 0.0259 | -| std | 0.00648 | -| value_loss | 4.08e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22286 | -| time_elapsed | 120570 | -| total_timesteps | 2852608 | -| train/ | | -| approx_kl | 0.25491142 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 222850 | -| policy_gradient_loss | 0.0637 | -| std | 0.00649 | -| value_loss | 3.6e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22287 | -| time_elapsed | 120576 | -| total_timesteps | 2852736 | -| train/ | | -| approx_kl | 0.006464529 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 222860 | -| policy_gradient_loss | 0.00998 | -| std | 0.0065 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22288 | -| time_elapsed | 120583 | -| total_timesteps | 2852864 | -| train/ | | -| approx_kl | 0.056547917 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.00759 | -| n_updates | 222870 | -| policy_gradient_loss | 0.000979 | -| std | 0.0065 | -| value_loss | 6.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22289 | -| time_elapsed | 120590 | -| total_timesteps | 2852992 | -| train/ | | -| approx_kl | 0.013374883 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.00413 | -| n_updates | 222880 | -| policy_gradient_loss | 0.00717 | -| std | 0.0065 | -| value_loss | 4.61e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22290 | -| time_elapsed | 120596 | -| total_timesteps | 2853120 | -| train/ | | -| approx_kl | 0.0008272561 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.00324 | -| n_updates | 222890 | -| policy_gradient_loss | 0.0102 | -| std | 0.0065 | -| value_loss | 3.52e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22291 | -| time_elapsed | 120621 | -| total_timesteps | 2853248 | -| train/ | | -| approx_kl | 0.009385258 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 222900 | -| policy_gradient_loss | 0.00507 | -| std | 0.0065 | -| value_loss | 0.00383 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22292 | -| time_elapsed | 120628 | -| total_timesteps | 2853376 | -| train/ | | -| approx_kl | 0.018615166 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.000735 | -| n_updates | 222910 | -| policy_gradient_loss | 0.00621 | -| std | 0.00649 | -| value_loss | 0.00149 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22293 | -| time_elapsed | 120633 | -| total_timesteps | 2853504 | -| train/ | | -| approx_kl | 0.003028933 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00615 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 222920 | -| policy_gradient_loss | 0.0099 | -| std | 0.00649 | -| value_loss | 0.000231 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22294 | -| time_elapsed | 120642 | -| total_timesteps | 2853632 | -| train/ | | -| approx_kl | 2.0241365e-05 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.000637 | -| n_updates | 222930 | -| policy_gradient_loss | 0.0393 | -| std | 0.00649 | -| value_loss | 0.000136 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22295 | -| time_elapsed | 120649 | -| total_timesteps | 2853760 | -| train/ | | -| approx_kl | 0.8897589 | -| clip_fraction | 0.753 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | 0.353 | -| n_updates | 222940 | -| policy_gradient_loss | 0.154 | -| std | 0.00649 | -| value_loss | 0.000112 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22296 | -| time_elapsed | 120659 | -| total_timesteps | 2853888 | -| train/ | | -| approx_kl | 0.011513859 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 222950 | -| policy_gradient_loss | 0.024 | -| std | 0.00649 | -| value_loss | 9.18e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22297 | -| time_elapsed | 120667 | -| total_timesteps | 2854016 | -| train/ | | -| approx_kl | 0.1260591 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 222960 | -| policy_gradient_loss | 0.0352 | -| std | 0.00649 | -| value_loss | 6.94e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22298 | -| time_elapsed | 120685 | -| total_timesteps | 2854144 | -| train/ | | -| approx_kl | 0.19050695 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.248 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 222970 | -| policy_gradient_loss | -0.0093 | -| std | 0.00649 | -| value_loss | 0.00303 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22299 | -| time_elapsed | 120693 | -| total_timesteps | 2854272 | -| train/ | | -| approx_kl | 0.022712028 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.428 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 222980 | -| policy_gradient_loss | 0.0186 | -| std | 0.00649 | -| value_loss | 3.11e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22300 | -| time_elapsed | 120700 | -| total_timesteps | 2854400 | -| train/ | | -| approx_kl | 0.11379286 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00821 | -| learning_rate | 0.0003 | -| loss | 0.071 | -| n_updates | 222990 | -| policy_gradient_loss | 0.0365 | -| std | 0.00649 | -| value_loss | 1.42e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22301 | -| time_elapsed | 120705 | -| total_timesteps | 2854528 | -| train/ | | -| approx_kl | 6.1875675e-05 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | -0.000914 | -| n_updates | 223000 | -| policy_gradient_loss | 0.0338 | -| std | 0.00649 | -| value_loss | 1.15e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22302 | -| time_elapsed | 120711 | -| total_timesteps | 2854656 | -| train/ | | -| approx_kl | 0.00054489635 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.000887 | -| n_updates | 223010 | -| policy_gradient_loss | 0.0331 | -| std | 0.00649 | -| value_loss | 6.55e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22303 | -| time_elapsed | 120716 | -| total_timesteps | 2854784 | -| train/ | | -| approx_kl | 0.58739936 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0774 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 223020 | -| policy_gradient_loss | 0.0611 | -| std | 0.00649 | -| value_loss | 5.13e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 22304 | -| time_elapsed | 120722 | -| total_timesteps | 2854912 | -| train/ | | -| approx_kl | 0.0066799694 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 223030 | -| policy_gradient_loss | 0.0044 | -| std | 0.00649 | -| value_loss | 4.32e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22305 | -| time_elapsed | 120729 | -| total_timesteps | 2855040 | -| train/ | | -| approx_kl | 0.03659346 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 223040 | -| policy_gradient_loss | 0.0973 | -| std | 0.00649 | -| value_loss | 2.88e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22306 | -| time_elapsed | 120747 | -| total_timesteps | 2855168 | -| train/ | | -| approx_kl | 0.31399694 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.516 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 223050 | -| policy_gradient_loss | 0.025 | -| std | 0.00649 | -| value_loss | 0.0016 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22307 | -| time_elapsed | 120753 | -| total_timesteps | 2855296 | -| train/ | | -| approx_kl | 0.24188979 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -5.64 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 223060 | -| policy_gradient_loss | 0.0478 | -| std | 0.0065 | -| value_loss | 5.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22308 | -| time_elapsed | 120760 | -| total_timesteps | 2855424 | -| train/ | | -| approx_kl | 0.042211525 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -45.2 | -| learning_rate | 0.0003 | -| loss | -0.00999 | -| n_updates | 223070 | -| policy_gradient_loss | 0.0118 | -| std | 0.0065 | -| value_loss | 3.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22309 | -| time_elapsed | 120767 | -| total_timesteps | 2855552 | -| train/ | | -| approx_kl | 0.16197915 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0588 | -| learning_rate | 0.0003 | -| loss | 0.0797 | -| n_updates | 223080 | -| policy_gradient_loss | 0.0216 | -| std | 0.00651 | -| value_loss | 6.5e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22310 | -| time_elapsed | 120773 | -| total_timesteps | 2855680 | -| train/ | | -| approx_kl | 0.018568177 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.841 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 223090 | -| policy_gradient_loss | -0.00927 | -| std | 0.00652 | -| value_loss | 6.57e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22311 | -| time_elapsed | 120779 | -| total_timesteps | 2855808 | -| train/ | | -| approx_kl | 0.02338542 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.00783 | -| n_updates | 223100 | -| policy_gradient_loss | 0.0245 | -| std | 0.00652 | -| value_loss | 3.85e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22312 | -| time_elapsed | 120786 | -| total_timesteps | 2855936 | -| train/ | | -| approx_kl | 0.13194457 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.61 | -| explained_variance | -0.0805 | -| learning_rate | 0.0003 | -| loss | 0.0984 | -| n_updates | 223110 | -| policy_gradient_loss | 0.0476 | -| std | 0.0065 | -| value_loss | 1.22e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22313 | -| time_elapsed | 120797 | -| total_timesteps | 2856064 | -| train/ | | -| approx_kl | 0.12789838 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.551 | -| learning_rate | 0.0003 | -| loss | 0.071 | -| n_updates | 223120 | -| policy_gradient_loss | 0.024 | -| std | 0.00649 | -| value_loss | 2.17e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22314 | -| time_elapsed | 120818 | -| total_timesteps | 2856192 | -| train/ | | -| approx_kl | 0.013237705 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.691 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 223130 | -| policy_gradient_loss | -0.0132 | -| std | 0.00648 | -| value_loss | 0.00138 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22315 | -| time_elapsed | 120825 | -| total_timesteps | 2856320 | -| train/ | | -| approx_kl | 0.037152052 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.52 | -| learning_rate | 0.0003 | -| loss | -0.00493 | -| n_updates | 223140 | -| policy_gradient_loss | -0.00923 | -| std | 0.00648 | -| value_loss | 6.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22316 | -| time_elapsed | 120830 | -| total_timesteps | 2856448 | -| train/ | | -| approx_kl | 0.01930256 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.00871 | -| n_updates | 223150 | -| policy_gradient_loss | 0.00298 | -| std | 0.00648 | -| value_loss | 5.61e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22317 | -| time_elapsed | 120840 | -| total_timesteps | 2856576 | -| train/ | | -| approx_kl | 0.025479104 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 223160 | -| policy_gradient_loss | 0.0325 | -| std | 0.00648 | -| value_loss | 2.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22318 | -| time_elapsed | 120844 | -| total_timesteps | 2856704 | -| train/ | | -| approx_kl | 0.12163649 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 223170 | -| policy_gradient_loss | 0.0297 | -| std | 0.00648 | -| value_loss | 1.91e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22319 | -| time_elapsed | 120850 | -| total_timesteps | 2856832 | -| train/ | | -| approx_kl | 0.18939641 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | 0.0944 | -| n_updates | 223180 | -| policy_gradient_loss | 0.0334 | -| std | 0.00648 | -| value_loss | 1.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 22320 | -| time_elapsed | 120856 | -| total_timesteps | 2856960 | -| train/ | | -| approx_kl | 0.025974112 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.000211 | -| n_updates | 223190 | -| policy_gradient_loss | 0.0267 | -| std | 0.00648 | -| value_loss | 1.22e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22321 | -| time_elapsed | 120861 | -| total_timesteps | 2857088 | -| train/ | | -| approx_kl | 0.15184912 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.0722 | -| n_updates | 223200 | -| policy_gradient_loss | 0.0363 | -| std | 0.00648 | -| value_loss | 9.39e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22322 | -| time_elapsed | 120874 | -| total_timesteps | 2857216 | -| train/ | | -| approx_kl | 0.032275856 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 223210 | -| policy_gradient_loss | -0.018 | -| std | 0.00648 | -| value_loss | 0.00346 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22323 | -| time_elapsed | 120879 | -| total_timesteps | 2857344 | -| train/ | | -| approx_kl | 0.1581664 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.89 | -| learning_rate | 0.0003 | -| loss | 0.0373 | -| n_updates | 223220 | -| policy_gradient_loss | 0.0171 | -| std | 0.00648 | -| value_loss | 6.26e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22324 | -| time_elapsed | 120887 | -| total_timesteps | 2857472 | -| train/ | | -| approx_kl | 0.10142352 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00204 | -| learning_rate | 0.0003 | -| loss | 0.0516 | -| n_updates | 223230 | -| policy_gradient_loss | 0.0396 | -| std | 0.00648 | -| value_loss | 9.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22325 | -| time_elapsed | 120893 | -| total_timesteps | 2857600 | -| train/ | | -| approx_kl | 0.43087777 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 223240 | -| policy_gradient_loss | 0.158 | -| std | 0.00648 | -| value_loss | 4.05e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22326 | -| time_elapsed | 120902 | -| total_timesteps | 2857728 | -| train/ | | -| approx_kl | 0.22543533 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | 0.26 | -| n_updates | 223250 | -| policy_gradient_loss | 0.159 | -| std | 0.00648 | -| value_loss | 3.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22327 | -| time_elapsed | 120908 | -| total_timesteps | 2857856 | -| train/ | | -| approx_kl | 0.040827304 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 223260 | -| policy_gradient_loss | 0.023 | -| std | 0.00648 | -| value_loss | 2.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 22328 | -| time_elapsed | 120914 | -| total_timesteps | 2857984 | -| train/ | | -| approx_kl | 0.61330235 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 223270 | -| policy_gradient_loss | 0.0541 | -| std | 0.00648 | -| value_loss | 2.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22329 | -| time_elapsed | 120921 | -| total_timesteps | 2858112 | -| train/ | | -| approx_kl | 0.046294227 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | -0.00434 | -| n_updates | 223280 | -| policy_gradient_loss | -0.00012 | -| std | 0.00648 | -| value_loss | 1.88e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22330 | -| time_elapsed | 120948 | -| total_timesteps | 2858240 | -| train/ | | -| approx_kl | 0.011573269 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 223290 | -| policy_gradient_loss | -0.00511 | -| std | 0.00648 | -| value_loss | 0.00213 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22331 | -| time_elapsed | 120961 | -| total_timesteps | 2858368 | -| train/ | | -| approx_kl | 0.041892268 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | -0.00829 | -| n_updates | 223300 | -| policy_gradient_loss | -0.003 | -| std | 0.00649 | -| value_loss | 1.14e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22332 | -| time_elapsed | 120969 | -| total_timesteps | 2858496 | -| train/ | | -| approx_kl | 0.032307565 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 223310 | -| policy_gradient_loss | 0.0148 | -| std | 0.00649 | -| value_loss | 4.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22333 | -| time_elapsed | 120975 | -| total_timesteps | 2858624 | -| train/ | | -| approx_kl | 0.0014186734 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.098 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 223320 | -| policy_gradient_loss | 0.0112 | -| std | 0.00649 | -| value_loss | 1.27e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22334 | -| time_elapsed | 120980 | -| total_timesteps | 2858752 | -| train/ | | -| approx_kl | 0.049917776 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00167 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 223330 | -| policy_gradient_loss | 0.129 | -| std | 0.00649 | -| value_loss | 2.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 22335 | -| time_elapsed | 120985 | -| total_timesteps | 2858880 | -| train/ | | -| approx_kl | 0.011261486 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 223340 | -| policy_gradient_loss | 0.0294 | -| std | 0.00649 | -| value_loss | 2.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22336 | -| time_elapsed | 120989 | -| total_timesteps | 2859008 | -| train/ | | -| approx_kl | 0.24990726 | -| clip_fraction | 0.524 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 223350 | -| policy_gradient_loss | 0.0719 | -| std | 0.00649 | -| value_loss | 1.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22337 | -| time_elapsed | 121007 | -| total_timesteps | 2859136 | -| train/ | | -| approx_kl | 0.17714563 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | 0.00471 | -| n_updates | 223360 | -| policy_gradient_loss | -0.00716 | -| std | 0.00649 | -| value_loss | 0.00037 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22338 | -| time_elapsed | 121013 | -| total_timesteps | 2859264 | -| train/ | | -| approx_kl | 0.17739052 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.851 | -| learning_rate | 0.0003 | -| loss | 0.041 | -| n_updates | 223370 | -| policy_gradient_loss | 0.0088 | -| std | 0.00648 | -| value_loss | 3.18e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22339 | -| time_elapsed | 121019 | -| total_timesteps | 2859392 | -| train/ | | -| approx_kl | 0.0015817331 | -| clip_fraction | 0.0398 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 223380 | -| policy_gradient_loss | 0.000444 | -| std | 0.00648 | -| value_loss | 1.73e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22340 | -| time_elapsed | 121024 | -| total_timesteps | 2859520 | -| train/ | | -| approx_kl | 0.08288122 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 223390 | -| policy_gradient_loss | 0.0105 | -| std | 0.00648 | -| value_loss | 3.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22341 | -| time_elapsed | 121030 | -| total_timesteps | 2859648 | -| train/ | | -| approx_kl | 0.11891919 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -15.8 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 223400 | -| policy_gradient_loss | 0.00947 | -| std | 0.00647 | -| value_loss | 5.45e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22342 | -| time_elapsed | 121037 | -| total_timesteps | 2859776 | -| train/ | | -| approx_kl | 0.041995037 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00806 | -| learning_rate | 0.0003 | -| loss | 1.23e-05 | -| n_updates | 223410 | -| policy_gradient_loss | 0.0195 | -| std | 0.00647 | -| value_loss | 4.56e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 22343 | -| time_elapsed | 121043 | -| total_timesteps | 2859904 | -| train/ | | -| approx_kl | 0.003032689 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 223420 | -| policy_gradient_loss | 0.0323 | -| std | 0.00647 | -| value_loss | 3.94e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22344 | -| time_elapsed | 121048 | -| total_timesteps | 2860032 | -| train/ | | -| approx_kl | 0.08038741 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.035 | -| n_updates | 223430 | -| policy_gradient_loss | 0.027 | -| std | 0.00647 | -| value_loss | 2.21e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22345 | -| time_elapsed | 121059 | -| total_timesteps | 2860160 | -| train/ | | -| approx_kl | 0.014781566 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.112 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 223440 | -| policy_gradient_loss | -0.0207 | -| std | 0.00646 | -| value_loss | 0.00238 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22346 | -| time_elapsed | 121065 | -| total_timesteps | 2860288 | -| train/ | | -| approx_kl | 0.12265767 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.00638 | -| learning_rate | 0.0003 | -| loss | 0.0591 | -| n_updates | 223450 | -| policy_gradient_loss | 0.0214 | -| std | 0.00646 | -| value_loss | 0.000257 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22347 | -| time_elapsed | 121070 | -| total_timesteps | 2860416 | -| train/ | | -| approx_kl | 0.06368504 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0982 | -| learning_rate | 0.0003 | -| loss | 0.0448 | -| n_updates | 223460 | -| policy_gradient_loss | 0.0468 | -| std | 0.00646 | -| value_loss | 7.42e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22348 | -| time_elapsed | 121076 | -| total_timesteps | 2860544 | -| train/ | | -| approx_kl | 0.42957875 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.00676 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 223470 | -| policy_gradient_loss | 0.141 | -| std | 0.00646 | -| value_loss | 1.61e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22349 | -| time_elapsed | 121079 | -| total_timesteps | 2860672 | -| train/ | | -| approx_kl | 0.07996269 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.0449 | -| n_updates | 223480 | -| policy_gradient_loss | 0.0269 | -| std | 0.00646 | -| value_loss | 1.14e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22350 | -| time_elapsed | 121085 | -| total_timesteps | 2860800 | -| train/ | | -| approx_kl | 2.0419247e-06 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0767 | -| learning_rate | 0.0003 | -| loss | -0.000134 | -| n_updates | 223490 | -| policy_gradient_loss | 0.0248 | -| std | 0.00646 | -| value_loss | 9.9e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 22351 | -| time_elapsed | 121092 | -| total_timesteps | 2860928 | -| train/ | | -| approx_kl | 8.826563e-05 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 8.62e-05 | -| n_updates | 223500 | -| policy_gradient_loss | 0.0285 | -| std | 0.00646 | -| value_loss | 5.25e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22352 | -| time_elapsed | 121097 | -| total_timesteps | 2861056 | -| train/ | | -| approx_kl | 7.9602e-05 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0808 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 223510 | -| policy_gradient_loss | 0.0326 | -| std | 0.00646 | -| value_loss | 3.64e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22353 | -| time_elapsed | 121109 | -| total_timesteps | 2861184 | -| train/ | | -| approx_kl | 0.025863793 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 223520 | -| policy_gradient_loss | -0.00144 | -| std | 0.00646 | -| value_loss | 1.41e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22354 | -| time_elapsed | 121115 | -| total_timesteps | 2861312 | -| train/ | | -| approx_kl | 0.006886265 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 223530 | -| policy_gradient_loss | 0.0293 | -| std | 0.00646 | -| value_loss | 2.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22355 | -| time_elapsed | 121123 | -| total_timesteps | 2861440 | -| train/ | | -| approx_kl | 0.23827711 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 223540 | -| policy_gradient_loss | 0.0462 | -| std | 0.00646 | -| value_loss | 1.27e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22356 | -| time_elapsed | 121129 | -| total_timesteps | 2861568 | -| train/ | | -| approx_kl | 0.04584579 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0774 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 223550 | -| policy_gradient_loss | 0.0765 | -| std | 0.00645 | -| value_loss | 7.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22357 | -| time_elapsed | 121136 | -| total_timesteps | 2861696 | -| train/ | | -| approx_kl | 0.013382724 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.085 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 223560 | -| policy_gradient_loss | 0.139 | -| std | 0.00645 | -| value_loss | 7.09e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22358 | -| time_elapsed | 121142 | -| total_timesteps | 2861824 | -| train/ | | -| approx_kl | 0.019831643 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.000813 | -| n_updates | 223570 | -| policy_gradient_loss | 0.0244 | -| std | 0.00645 | -| value_loss | 4.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 22359 | -| time_elapsed | 121147 | -| total_timesteps | 2861952 | -| train/ | | -| approx_kl | 0.036811013 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 223580 | -| policy_gradient_loss | 0.0756 | -| std | 0.00645 | -| value_loss | 3.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22360 | -| time_elapsed | 121155 | -| total_timesteps | 2862080 | -| train/ | | -| approx_kl | 0.22142269 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 223590 | -| policy_gradient_loss | 0.0521 | -| std | 0.00645 | -| value_loss | 2.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22361 | -| time_elapsed | 121168 | -| total_timesteps | 2862208 | -| train/ | | -| approx_kl | 0.005731088 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.00816 | -| n_updates | 223600 | -| policy_gradient_loss | 0.0742 | -| std | 0.00645 | -| value_loss | 0.000357 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22362 | -| time_elapsed | 121177 | -| total_timesteps | 2862336 | -| train/ | | -| approx_kl | 0.23826125 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0965 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 223610 | -| policy_gradient_loss | 0.218 | -| std | 0.00645 | -| value_loss | 1.96e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22363 | -| time_elapsed | 121183 | -| total_timesteps | 2862464 | -| train/ | | -| approx_kl | 0.06406868 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | 0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 223620 | -| policy_gradient_loss | 0.0441 | -| std | 0.00645 | -| value_loss | 1.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22364 | -| time_elapsed | 121190 | -| total_timesteps | 2862592 | -| train/ | | -| approx_kl | 0.12590982 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0734 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 223630 | -| policy_gradient_loss | 0.0254 | -| std | 0.00646 | -| value_loss | 1.33e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22365 | -| time_elapsed | 121196 | -| total_timesteps | 2862720 | -| train/ | | -| approx_kl | 0.014167442 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.62 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.00421 | -| n_updates | 223640 | -| policy_gradient_loss | 0.0329 | -| std | 0.00644 | -| value_loss | 4.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22366 | -| time_elapsed | 121202 | -| total_timesteps | 2862848 | -| train/ | | -| approx_kl | 0.030891115 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.725 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 223650 | -| policy_gradient_loss | 0.0273 | -| std | 0.00644 | -| value_loss | 1.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 22367 | -| time_elapsed | 121207 | -| total_timesteps | 2862976 | -| train/ | | -| approx_kl | 0.53244805 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.829 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 223660 | -| policy_gradient_loss | 0.0485 | -| std | 0.00644 | -| value_loss | 6.6e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22368 | -| time_elapsed | 121215 | -| total_timesteps | 2863104 | -| train/ | | -| approx_kl | 0.007857064 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | -0.00657 | -| n_updates | 223670 | -| policy_gradient_loss | 0.00583 | -| std | 0.00644 | -| value_loss | 2.31e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22369 | -| time_elapsed | 121227 | -| total_timesteps | 2863232 | -| train/ | | -| approx_kl | 0.019042185 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.812 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 223680 | -| policy_gradient_loss | -0.0181 | -| std | 0.00643 | -| value_loss | 0.000779 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22370 | -| time_elapsed | 121232 | -| total_timesteps | 2863360 | -| train/ | | -| approx_kl | 0.02043799 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 223690 | -| policy_gradient_loss | 0.0275 | -| std | 0.00643 | -| value_loss | 2.43e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22371 | -| time_elapsed | 121237 | -| total_timesteps | 2863488 | -| train/ | | -| approx_kl | 1.5519577 | -| clip_fraction | 0.79 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.577 | -| n_updates | 223700 | -| policy_gradient_loss | 0.215 | -| std | 0.00643 | -| value_loss | 3.42e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22372 | -| time_elapsed | 121241 | -| total_timesteps | 2863616 | -| train/ | | -| approx_kl | 0.019186027 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 223710 | -| policy_gradient_loss | 0.0151 | -| std | 0.00642 | -| value_loss | 1.42e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22373 | -| time_elapsed | 121247 | -| total_timesteps | 2863744 | -| train/ | | -| approx_kl | 0.0911107 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 223720 | -| policy_gradient_loss | 0.0227 | -| std | 0.00641 | -| value_loss | 6.38e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22374 | -| time_elapsed | 121254 | -| total_timesteps | 2863872 | -| train/ | | -| approx_kl | 0.0040878477 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 223730 | -| policy_gradient_loss | 0.0553 | -| std | 0.00638 | -| value_loss | 1.74e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22375 | -| time_elapsed | 121261 | -| total_timesteps | 2864000 | -| train/ | | -| approx_kl | 0.08496147 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -12 | -| learning_rate | 0.0003 | -| loss | -0.00589 | -| n_updates | 223740 | -| policy_gradient_loss | 0.0164 | -| std | 0.00637 | -| value_loss | 6.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22376 | -| time_elapsed | 121267 | -| total_timesteps | 2864128 | -| train/ | | -| approx_kl | 0.36775964 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0918 | -| n_updates | 223750 | -| policy_gradient_loss | 0.0202 | -| std | 0.00637 | -| value_loss | 3.41e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22377 | -| time_elapsed | 121278 | -| total_timesteps | 2864256 | -| train/ | | -| approx_kl | 0.24583943 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 223760 | -| policy_gradient_loss | -0.0122 | -| std | 0.00637 | -| value_loss | 5.99e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22378 | -| time_elapsed | 121284 | -| total_timesteps | 2864384 | -| train/ | | -| approx_kl | 0.009880637 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 223770 | -| policy_gradient_loss | 0.018 | -| std | 0.00637 | -| value_loss | 4.78e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22379 | -| time_elapsed | 121290 | -| total_timesteps | 2864512 | -| train/ | | -| approx_kl | 0.011891833 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 223780 | -| policy_gradient_loss | 0.0356 | -| std | 0.00637 | -| value_loss | 1.94e-09 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22380 | -| time_elapsed | 121296 | -| total_timesteps | 2864640 | -| train/ | | -| approx_kl | 0.68958 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | 0.199 | -| n_updates | 223790 | -| policy_gradient_loss | 0.0682 | -| std | 0.00637 | -| value_loss | 1.22e-09 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22381 | -| time_elapsed | 121301 | -| total_timesteps | 2864768 | -| train/ | | -| approx_kl | 0.012198903 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00218 | -| n_updates | 223800 | -| policy_gradient_loss | 0.00702 | -| std | 0.00637 | -| value_loss | 4.04e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.979 | -| time/ | | -| fps | 23 | -| iterations | 22382 | -| time_elapsed | 121307 | -| total_timesteps | 2864896 | -| train/ | | -| approx_kl | 0.06939576 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0515 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 223810 | -| policy_gradient_loss | 0.0118 | -| std | 0.00637 | -| value_loss | 3.59e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22383 | -| time_elapsed | 121314 | -| total_timesteps | 2865024 | -| train/ | | -| approx_kl | 0.062233284 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 223820 | -| policy_gradient_loss | 0.0153 | -| std | 0.00637 | -| value_loss | 2.73e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22384 | -| time_elapsed | 121327 | -| total_timesteps | 2865152 | -| train/ | | -| approx_kl | 0.02288942 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | 0.00233 | -| n_updates | 223830 | -| policy_gradient_loss | 0.018 | -| std | 0.00636 | -| value_loss | 0.000185 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22385 | -| time_elapsed | 121333 | -| total_timesteps | 2865280 | -| train/ | | -| approx_kl | 0.021669231 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.953 | -| learning_rate | 0.0003 | -| loss | 0.00412 | -| n_updates | 223840 | -| policy_gradient_loss | 0.0345 | -| std | 0.00636 | -| value_loss | 1.53e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22386 | -| time_elapsed | 121339 | -| total_timesteps | 2865408 | -| train/ | | -| approx_kl | 0.2514644 | -| clip_fraction | 0.563 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 223850 | -| policy_gradient_loss | 0.0853 | -| std | 0.00637 | -| value_loss | 4.21e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22387 | -| time_elapsed | 121342 | -| total_timesteps | 2865536 | -| train/ | | -| approx_kl | 0.052835543 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 223860 | -| policy_gradient_loss | 0.0532 | -| std | 0.00637 | -| value_loss | 2.88e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22388 | -| time_elapsed | 121348 | -| total_timesteps | 2865664 | -| train/ | | -| approx_kl | 1.00042 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.348 | -| n_updates | 223870 | -| policy_gradient_loss | 0.146 | -| std | 0.00637 | -| value_loss | 2.18e-07 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22389 | -| time_elapsed | 121353 | -| total_timesteps | 2865792 | -| train/ | | -| approx_kl | 0.04665512 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 223880 | -| policy_gradient_loss | 0.00574 | -| std | 0.00637 | -| value_loss | 1.24e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22390 | -| time_elapsed | 121358 | -| total_timesteps | 2865920 | -| train/ | | -| approx_kl | 0.58155215 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 223890 | -| policy_gradient_loss | 0.0631 | -| std | 0.00637 | -| value_loss | 7.18e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22391 | -| time_elapsed | 121363 | -| total_timesteps | 2866048 | -| train/ | | -| approx_kl | 0.08195163 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.0353 | -| n_updates | 223900 | -| policy_gradient_loss | 0.0156 | -| std | 0.00637 | -| value_loss | 5.83e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22392 | -| time_elapsed | 121374 | -| total_timesteps | 2866176 | -| train/ | | -| approx_kl | 0.015597655 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 223910 | -| policy_gradient_loss | -0.0121 | -| std | 0.00637 | -| value_loss | 0.00108 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22393 | -| time_elapsed | 121378 | -| total_timesteps | 2866304 | -| train/ | | -| approx_kl | 0.0066886963 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | 0.00919 | -| n_updates | 223920 | -| policy_gradient_loss | 0.00709 | -| std | 0.00637 | -| value_loss | 6.37e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22394 | -| time_elapsed | 121382 | -| total_timesteps | 2866432 | -| train/ | | -| approx_kl | 0.012919357 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -9.71 | -| learning_rate | 0.0003 | -| loss | -0.000239 | -| n_updates | 223930 | -| policy_gradient_loss | 0.0146 | -| std | 0.00637 | -| value_loss | 8.74e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22395 | -| time_elapsed | 121387 | -| total_timesteps | 2866560 | -| train/ | | -| approx_kl | 0.14610915 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.456 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 223940 | -| policy_gradient_loss | 0.0405 | -| std | 0.00637 | -| value_loss | 4.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22396 | -| time_elapsed | 121392 | -| total_timesteps | 2866688 | -| train/ | | -| approx_kl | 0.12659627 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.741 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 223950 | -| policy_gradient_loss | -0.0198 | -| std | 0.00637 | -| value_loss | 1.81e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22397 | -| time_elapsed | 121397 | -| total_timesteps | 2866816 | -| train/ | | -| approx_kl | 0.01891607 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0993 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 223960 | -| policy_gradient_loss | 0.014 | -| std | 0.00637 | -| value_loss | 1.47e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.984 | -| time/ | | -| fps | 23 | -| iterations | 22398 | -| time_elapsed | 121402 | -| total_timesteps | 2866944 | -| train/ | | -| approx_kl | 0.0003528013 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.00326 | -| n_updates | 223970 | -| policy_gradient_loss | 0.0043 | -| std | 0.00637 | -| value_loss | 9.93e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22399 | -| time_elapsed | 121407 | -| total_timesteps | 2867072 | -| train/ | | -| approx_kl | 2.3007859e-05 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.00145 | -| n_updates | 223980 | -| policy_gradient_loss | -0.00346 | -| std | 0.00637 | -| value_loss | 6.65e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22400 | -| time_elapsed | 121415 | -| total_timesteps | 2867200 | -| train/ | | -| approx_kl | 0.015308192 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | 0.0033 | -| n_updates | 223990 | -| policy_gradient_loss | 0.00947 | -| std | 0.00637 | -| value_loss | 1.47e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22401 | -| time_elapsed | 121420 | -| total_timesteps | 2867328 | -| train/ | | -| approx_kl | 0.44325083 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.815 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 224000 | -| policy_gradient_loss | 0.043 | -| std | 0.00637 | -| value_loss | 1.62e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22402 | -| time_elapsed | 121427 | -| total_timesteps | 2867456 | -| train/ | | -| approx_kl | 0.07602913 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -4.87 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 224010 | -| policy_gradient_loss | 0.00529 | -| std | 0.00636 | -| value_loss | 1.75e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22403 | -| time_elapsed | 121433 | -| total_timesteps | 2867584 | -| train/ | | -| approx_kl | 0.055435196 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 224020 | -| policy_gradient_loss | 0.0105 | -| std | 0.00636 | -| value_loss | 3.82e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22404 | -| time_elapsed | 121439 | -| total_timesteps | 2867712 | -| train/ | | -| approx_kl | 0.009339293 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 224030 | -| policy_gradient_loss | 0.00743 | -| std | 0.00637 | -| value_loss | 2.29e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22405 | -| time_elapsed | 121444 | -| total_timesteps | 2867840 | -| train/ | | -| approx_kl | 0.08346656 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0486 | -| n_updates | 224040 | -| policy_gradient_loss | 0.0195 | -| std | 0.00637 | -| value_loss | 1.4e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 22406 | -| time_elapsed | 121449 | -| total_timesteps | 2867968 | -| train/ | | -| approx_kl | 0.046946656 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.00472 | -| n_updates | 224050 | -| policy_gradient_loss | 0.00517 | -| std | 0.00637 | -| value_loss | 1.11e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22407 | -| time_elapsed | 121455 | -| total_timesteps | 2868096 | -| train/ | | -| approx_kl | 0.07588067 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 224060 | -| policy_gradient_loss | -0.00676 | -| std | 0.00637 | -| value_loss | 1.01e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22408 | -| time_elapsed | 121465 | -| total_timesteps | 2868224 | -| train/ | | -| approx_kl | 0.027913082 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 224070 | -| policy_gradient_loss | -0.00195 | -| std | 0.00637 | -| value_loss | 0.00025 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22409 | -| time_elapsed | 121470 | -| total_timesteps | 2868352 | -| train/ | | -| approx_kl | 0.00024226727 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 224080 | -| policy_gradient_loss | 0.104 | -| std | 0.00637 | -| value_loss | 3.72e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22410 | -| time_elapsed | 121475 | -| total_timesteps | 2868480 | -| train/ | | -| approx_kl | 0.17693214 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 224090 | -| policy_gradient_loss | 0.153 | -| std | 0.00637 | -| value_loss | 1.04e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22411 | -| time_elapsed | 121480 | -| total_timesteps | 2868608 | -| train/ | | -| approx_kl | 0.09088904 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.229 | -| learning_rate | 0.0003 | -| loss | 0.0294 | -| n_updates | 224100 | -| policy_gradient_loss | 0.0299 | -| std | 0.00637 | -| value_loss | 4.42e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22412 | -| time_elapsed | 121485 | -| total_timesteps | 2868736 | -| train/ | | -| approx_kl | 0.33363146 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 224110 | -| policy_gradient_loss | 0.136 | -| std | 0.00637 | -| value_loss | 3.2e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22413 | -| time_elapsed | 121490 | -| total_timesteps | 2868864 | -| train/ | | -| approx_kl | 0.06433267 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 224120 | -| policy_gradient_loss | 0.0312 | -| std | 0.00637 | -| value_loss | 2.15e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 22414 | -| time_elapsed | 121495 | -| total_timesteps | 2868992 | -| train/ | | -| approx_kl | 0.90211546 | -| clip_fraction | 0.524 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 224130 | -| policy_gradient_loss | 0.0567 | -| std | 0.00637 | -| value_loss | 1.69e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22415 | -| time_elapsed | 121501 | -| total_timesteps | 2869120 | -| train/ | | -| approx_kl | 0.04929942 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 224140 | -| policy_gradient_loss | -0.00281 | -| std | 0.00637 | -| value_loss | 9.16e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22416 | -| time_elapsed | 121512 | -| total_timesteps | 2869248 | -| train/ | | -| approx_kl | 0.015986426 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.21 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 224150 | -| policy_gradient_loss | -0.0101 | -| std | 0.00637 | -| value_loss | 0.00183 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22417 | -| time_elapsed | 121517 | -| total_timesteps | 2869376 | -| train/ | | -| approx_kl | 3.9755367e-05 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | -0.00135 | -| n_updates | 224160 | -| policy_gradient_loss | 0.0332 | -| std | 0.00637 | -| value_loss | 2.53e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22418 | -| time_elapsed | 121523 | -| total_timesteps | 2869504 | -| train/ | | -| approx_kl | 0.5718815 | -| clip_fraction | 0.539 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.00869 | -| learning_rate | 0.0003 | -| loss | 0.0832 | -| n_updates | 224170 | -| policy_gradient_loss | 0.0328 | -| std | 0.00637 | -| value_loss | 2.36e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22419 | -| time_elapsed | 121528 | -| total_timesteps | 2869632 | -| train/ | | -| approx_kl | 0.015577376 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.00401 | -| n_updates | 224180 | -| policy_gradient_loss | 0.00986 | -| std | 0.00637 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22420 | -| time_elapsed | 121533 | -| total_timesteps | 2869760 | -| train/ | | -| approx_kl | 0.07617054 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0818 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 224190 | -| policy_gradient_loss | 0.0109 | -| std | 0.00637 | -| value_loss | 9.73e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 22421 | -| time_elapsed | 121538 | -| total_timesteps | 2869888 | -| train/ | | -| approx_kl | 0.12643768 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0877 | -| n_updates | 224200 | -| policy_gradient_loss | 0.0305 | -| std | 0.00636 | -| value_loss | 4.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22422 | -| time_elapsed | 121542 | -| total_timesteps | 2870016 | -| train/ | | -| approx_kl | 0.020790936 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0845 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 224210 | -| policy_gradient_loss | 0.0318 | -| std | 0.00635 | -| value_loss | 6.27e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22423 | -| time_elapsed | 121553 | -| total_timesteps | 2870144 | -| train/ | | -| approx_kl | 0.0038291458 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.00988 | -| n_updates | 224220 | -| policy_gradient_loss | -0.00451 | -| std | 0.00635 | -| value_loss | 0.000523 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22424 | -| time_elapsed | 121558 | -| total_timesteps | 2870272 | -| train/ | | -| approx_kl | 0.00174144 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.00911 | -| learning_rate | 0.0003 | -| loss | -0.00149 | -| n_updates | 224230 | -| policy_gradient_loss | 0.0227 | -| std | 0.00635 | -| value_loss | 7.38e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22425 | -| time_elapsed | 121563 | -| total_timesteps | 2870400 | -| train/ | | -| approx_kl | 3.3442857 | -| clip_fraction | 0.863 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.135 | -| learning_rate | 0.0003 | -| loss | 0.237 | -| n_updates | 224240 | -| policy_gradient_loss | 0.212 | -| std | 0.00635 | -| value_loss | 3.69e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22426 | -| time_elapsed | 121567 | -| total_timesteps | 2870528 | -| train/ | | -| approx_kl | 0.01613758 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 224250 | -| policy_gradient_loss | 0.0453 | -| std | 0.00636 | -| value_loss | 6.07e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22427 | -| time_elapsed | 121572 | -| total_timesteps | 2870656 | -| train/ | | -| approx_kl | 0.41018224 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.00468 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 224260 | -| policy_gradient_loss | 0.119 | -| std | 0.00636 | -| value_loss | 1.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22428 | -| time_elapsed | 121576 | -| total_timesteps | 2870784 | -| train/ | | -| approx_kl | 0.09957723 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 224270 | -| policy_gradient_loss | 0.0433 | -| std | 0.00637 | -| value_loss | 1.07e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22429 | -| time_elapsed | 121580 | -| total_timesteps | 2870912 | -| train/ | | -| approx_kl | 0.5927375 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0621 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 224280 | -| policy_gradient_loss | 0.0607 | -| std | 0.00637 | -| value_loss | 9.08e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22430 | -| time_elapsed | 121584 | -| total_timesteps | 2871040 | -| train/ | | -| approx_kl | 0.046060376 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.0073 | -| n_updates | 224290 | -| policy_gradient_loss | 0.00628 | -| std | 0.00637 | -| value_loss | 6.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22431 | -| time_elapsed | 121594 | -| total_timesteps | 2871168 | -| train/ | | -| approx_kl | 0.024590222 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -2.7 | -| learning_rate | 0.0003 | -| loss | -0.0222 | -| n_updates | 224300 | -| policy_gradient_loss | -0.00943 | -| std | 0.00637 | -| value_loss | 0.00338 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22432 | -| time_elapsed | 121599 | -| total_timesteps | 2871296 | -| train/ | | -| approx_kl | 0.7833711 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.077 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 224310 | -| policy_gradient_loss | 0.061 | -| std | 0.00637 | -| value_loss | 6.34e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22433 | -| time_elapsed | 121604 | -| total_timesteps | 2871424 | -| train/ | | -| approx_kl | 0.054577284 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.0348 | -| n_updates | 224320 | -| policy_gradient_loss | 0.0181 | -| std | 0.00637 | -| value_loss | 1.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22434 | -| time_elapsed | 121610 | -| total_timesteps | 2871552 | -| train/ | | -| approx_kl | 0.08013541 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.047 | -| n_updates | 224330 | -| policy_gradient_loss | 0.0204 | -| std | 0.00637 | -| value_loss | 6.56e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22435 | -| time_elapsed | 121614 | -| total_timesteps | 2871680 | -| train/ | | -| approx_kl | 0.030167323 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 224340 | -| policy_gradient_loss | 0.0194 | -| std | 0.00637 | -| value_loss | 3.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22436 | -| time_elapsed | 121618 | -| total_timesteps | 2871808 | -| train/ | | -| approx_kl | 0.27632177 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 224350 | -| policy_gradient_loss | 0.0517 | -| std | 0.00636 | -| value_loss | 2.9e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22437 | -| time_elapsed | 121623 | -| total_timesteps | 2871936 | -| train/ | | -| approx_kl | 0.00010768324 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 224360 | -| policy_gradient_loss | 0.0435 | -| std | 0.00635 | -| value_loss | 1.53e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22438 | -| time_elapsed | 121629 | -| total_timesteps | 2872064 | -| train/ | | -| approx_kl | 0.078954116 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 224370 | -| policy_gradient_loss | 0.0245 | -| std | 0.00638 | -| value_loss | 2.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22439 | -| time_elapsed | 121638 | -| total_timesteps | 2872192 | -| train/ | | -| approx_kl | 0.067000724 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.855 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 224380 | -| policy_gradient_loss | -0.00966 | -| std | 0.00639 | -| value_loss | 0.00288 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22440 | -| time_elapsed | 121644 | -| total_timesteps | 2872320 | -| train/ | | -| approx_kl | 0.014089424 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 224390 | -| policy_gradient_loss | 0.0268 | -| std | 0.00639 | -| value_loss | 2.27e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22441 | -| time_elapsed | 121649 | -| total_timesteps | 2872448 | -| train/ | | -| approx_kl | 0.4594354 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00958 | -| learning_rate | 0.0003 | -| loss | 0.247 | -| n_updates | 224400 | -| policy_gradient_loss | 0.221 | -| std | 0.00639 | -| value_loss | 4.04e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22442 | -| time_elapsed | 121654 | -| total_timesteps | 2872576 | -| train/ | | -| approx_kl | 0.060452487 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0169 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 224410 | -| policy_gradient_loss | 0.0325 | -| std | 0.0064 | -| value_loss | 2.88e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22443 | -| time_elapsed | 121661 | -| total_timesteps | 2872704 | -| train/ | | -| approx_kl | 0.0008882289 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.00254 | -| n_updates | 224420 | -| policy_gradient_loss | 0.0298 | -| std | 0.0064 | -| value_loss | 2.03e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22444 | -| time_elapsed | 121666 | -| total_timesteps | 2872832 | -| train/ | | -| approx_kl | 0.6771706 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 224430 | -| policy_gradient_loss | 0.0678 | -| std | 0.0064 | -| value_loss | 1.4e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22445 | -| time_elapsed | 121672 | -| total_timesteps | 2872960 | -| train/ | | -| approx_kl | 0.058132555 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 224440 | -| policy_gradient_loss | 0.0142 | -| std | 0.0064 | -| value_loss | 8.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22446 | -| time_elapsed | 121677 | -| total_timesteps | 2873088 | -| train/ | | -| approx_kl | 0.015094468 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0653 | -| learning_rate | 0.0003 | -| loss | -0.00494 | -| n_updates | 224450 | -| policy_gradient_loss | 0.00739 | -| std | 0.00639 | -| value_loss | 6.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22447 | -| time_elapsed | 121687 | -| total_timesteps | 2873216 | -| train/ | | -| approx_kl | 0.016356334 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.952 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 224460 | -| policy_gradient_loss | 0.00337 | -| std | 0.0064 | -| value_loss | 0.00355 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22448 | -| time_elapsed | 121692 | -| total_timesteps | 2873344 | -| train/ | | -| approx_kl | 1.1682642 | -| clip_fraction | 0.791 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.385 | -| n_updates | 224470 | -| policy_gradient_loss | 0.222 | -| std | 0.0064 | -| value_loss | 3.59e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22449 | -| time_elapsed | 121697 | -| total_timesteps | 2873472 | -| train/ | | -| approx_kl | 0.010400008 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 224480 | -| policy_gradient_loss | 0.0354 | -| std | 0.0064 | -| value_loss | 3.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22450 | -| time_elapsed | 121702 | -| total_timesteps | 2873600 | -| train/ | | -| approx_kl | 0.110745266 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.0558 | -| n_updates | 224490 | -| policy_gradient_loss | 0.0283 | -| std | 0.00641 | -| value_loss | 1.93e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22451 | -| time_elapsed | 121707 | -| total_timesteps | 2873728 | -| train/ | | -| approx_kl | 0.17051572 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.077 | -| n_updates | 224500 | -| policy_gradient_loss | 0.0235 | -| std | 0.00641 | -| value_loss | 1.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22452 | -| time_elapsed | 121714 | -| total_timesteps | 2873856 | -| train/ | | -| approx_kl | 0.009687094 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 224510 | -| policy_gradient_loss | 0.00143 | -| std | 0.00641 | -| value_loss | 8.24e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22453 | -| time_elapsed | 121719 | -| total_timesteps | 2873984 | -| train/ | | -| approx_kl | 0.013913697 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0835 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 224520 | -| policy_gradient_loss | -0.00824 | -| std | 0.00642 | -| value_loss | 2.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22454 | -| time_elapsed | 121723 | -| total_timesteps | 2874112 | -| train/ | | -| approx_kl | 0.21526435 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 224530 | -| policy_gradient_loss | 0.00644 | -| std | 0.00642 | -| value_loss | 2.05e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22455 | -| time_elapsed | 121737 | -| total_timesteps | 2874240 | -| train/ | | -| approx_kl | 0.3421907 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -6.38 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 224540 | -| policy_gradient_loss | -0.00478 | -| std | 0.00641 | -| value_loss | 0.00385 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22456 | -| time_elapsed | 121742 | -| total_timesteps | 2874368 | -| train/ | | -| approx_kl | 0.014226021 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 224550 | -| policy_gradient_loss | 0.0619 | -| std | 0.00641 | -| value_loss | 4.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22457 | -| time_elapsed | 121747 | -| total_timesteps | 2874496 | -| train/ | | -| approx_kl | 0.19289216 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0048 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 224560 | -| policy_gradient_loss | 0.0626 | -| std | 0.00641 | -| value_loss | 3.23e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22458 | -| time_elapsed | 121752 | -| total_timesteps | 2874624 | -| train/ | | -| approx_kl | 0.0058179013 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | -0.00319 | -| n_updates | 224570 | -| policy_gradient_loss | 0.0149 | -| std | 0.00641 | -| value_loss | 2.32e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22459 | -| time_elapsed | 121757 | -| total_timesteps | 2874752 | -| train/ | | -| approx_kl | 0.019073023 | -| clip_fraction | 0.6 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.00228 | -| n_updates | 224580 | -| policy_gradient_loss | 0.0945 | -| std | 0.00641 | -| value_loss | 1.72e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22460 | -| time_elapsed | 121761 | -| total_timesteps | 2874880 | -| train/ | | -| approx_kl | 0.2793241 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.0891 | -| n_updates | 224590 | -| policy_gradient_loss | 0.027 | -| std | 0.00641 | -| value_loss | 1.02e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22461 | -| time_elapsed | 121766 | -| total_timesteps | 2875008 | -| train/ | | -| approx_kl | 0.00015690364 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0564 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 224600 | -| policy_gradient_loss | -0.000338 | -| std | 0.00641 | -| value_loss | 1.64e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22462 | -| time_elapsed | 121778 | -| total_timesteps | 2875136 | -| train/ | | -| approx_kl | 0.0080276 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.869 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 224610 | -| policy_gradient_loss | 0.0189 | -| std | 0.00641 | -| value_loss | 0.00233 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22463 | -| time_elapsed | 121783 | -| total_timesteps | 2875264 | -| train/ | | -| approx_kl | 0.013839545 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.475 | -| learning_rate | 0.0003 | -| loss | 0.00918 | -| n_updates | 224620 | -| policy_gradient_loss | 0.018 | -| std | 0.00641 | -| value_loss | 2.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22464 | -| time_elapsed | 121787 | -| total_timesteps | 2875392 | -| train/ | | -| approx_kl | 0.52883095 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.251 | -| n_updates | 224630 | -| policy_gradient_loss | 0.192 | -| std | 0.00641 | -| value_loss | 2.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22465 | -| time_elapsed | 121792 | -| total_timesteps | 2875520 | -| train/ | | -| approx_kl | 0.07668423 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 224640 | -| policy_gradient_loss | 0.026 | -| std | 0.00641 | -| value_loss | 1.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22466 | -| time_elapsed | 121798 | -| total_timesteps | 2875648 | -| train/ | | -| approx_kl | 0.81136495 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.209 | -| n_updates | 224650 | -| policy_gradient_loss | 0.0651 | -| std | 0.00641 | -| value_loss | 1.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22467 | -| time_elapsed | 121803 | -| total_timesteps | 2875776 | -| train/ | | -| approx_kl | 0.012329055 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.00317 | -| n_updates | 224660 | -| policy_gradient_loss | 0.0104 | -| std | 0.00641 | -| value_loss | 7.29e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22468 | -| time_elapsed | 121807 | -| total_timesteps | 2875904 | -| train/ | | -| approx_kl | 0.0028562462 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 224670 | -| policy_gradient_loss | 0.0106 | -| std | 0.00641 | -| value_loss | 4.44e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22469 | -| time_elapsed | 121811 | -| total_timesteps | 2876032 | -| train/ | | -| approx_kl | 1.1981465e-06 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | -9.62e-05 | -| n_updates | 224680 | -| policy_gradient_loss | 0.04 | -| std | 0.00641 | -| value_loss | 3.6e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22470 | -| time_elapsed | 121823 | -| total_timesteps | 2876160 | -| train/ | | -| approx_kl | 0.21782008 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.899 | -| learning_rate | 0.0003 | -| loss | 0.0636 | -| n_updates | 224690 | -| policy_gradient_loss | 0.0376 | -| std | 0.00641 | -| value_loss | 0.000674 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22471 | -| time_elapsed | 121828 | -| total_timesteps | 2876288 | -| train/ | | -| approx_kl | 0.05466295 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.776 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 224700 | -| policy_gradient_loss | 0.0342 | -| std | 0.00641 | -| value_loss | 1.99e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22472 | -| time_elapsed | 121834 | -| total_timesteps | 2876416 | -| train/ | | -| approx_kl | 0.7659836 | -| clip_fraction | 0.742 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 224710 | -| policy_gradient_loss | 0.148 | -| std | 0.00641 | -| value_loss | 4.45e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22473 | -| time_elapsed | 121840 | -| total_timesteps | 2876544 | -| train/ | | -| approx_kl | 0.023456383 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 224720 | -| policy_gradient_loss | 0.017 | -| std | 0.00641 | -| value_loss | 3.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22474 | -| time_elapsed | 121844 | -| total_timesteps | 2876672 | -| train/ | | -| approx_kl | 0.08760685 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.0159 | -| n_updates | 224730 | -| policy_gradient_loss | 0.0223 | -| std | 0.00641 | -| value_loss | 5.73e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22475 | -| time_elapsed | 121849 | -| total_timesteps | 2876800 | -| train/ | | -| approx_kl | 0.18412027 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00316 | -| learning_rate | 0.0003 | -| loss | 0.0972 | -| n_updates | 224740 | -| policy_gradient_loss | 0.0288 | -| std | 0.00641 | -| value_loss | 1.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 22476 | -| time_elapsed | 121854 | -| total_timesteps | 2876928 | -| train/ | | -| approx_kl | 0.026694112 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 224750 | -| policy_gradient_loss | 0.0364 | -| std | 0.00641 | -| value_loss | 1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22477 | -| time_elapsed | 121859 | -| total_timesteps | 2877056 | -| train/ | | -| approx_kl | 0.39432755 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 224760 | -| policy_gradient_loss | 0.142 | -| std | 0.00641 | -| value_loss | 6.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22478 | -| time_elapsed | 121867 | -| total_timesteps | 2877184 | -| train/ | | -| approx_kl | 0.052357413 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.635 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 224770 | -| policy_gradient_loss | -0.013 | -| std | 0.00642 | -| value_loss | 0.00225 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22479 | -| time_elapsed | 121872 | -| total_timesteps | 2877312 | -| train/ | | -| approx_kl | 0.10344401 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -5.09 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 224780 | -| policy_gradient_loss | 0.00851 | -| std | 0.00642 | -| value_loss | 1.51e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22480 | -| time_elapsed | 121877 | -| total_timesteps | 2877440 | -| train/ | | -| approx_kl | 0.06177669 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0754 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 224790 | -| policy_gradient_loss | 0.0167 | -| std | 0.00642 | -| value_loss | 3.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22481 | -| time_elapsed | 121881 | -| total_timesteps | 2877568 | -| train/ | | -| approx_kl | 0.046704594 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 224800 | -| policy_gradient_loss | 0.0158 | -| std | 0.00642 | -| value_loss | 2.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22482 | -| time_elapsed | 121886 | -| total_timesteps | 2877696 | -| train/ | | -| approx_kl | 0.06622426 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 224810 | -| policy_gradient_loss | 0.00611 | -| std | 0.00642 | -| value_loss | 1.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22483 | -| time_elapsed | 121889 | -| total_timesteps | 2877824 | -| train/ | | -| approx_kl | 0.012616402 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.00273 | -| n_updates | 224820 | -| policy_gradient_loss | 0.0107 | -| std | 0.00642 | -| value_loss | 1.34e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 22484 | -| time_elapsed | 121893 | -| total_timesteps | 2877952 | -| train/ | | -| approx_kl | 0.0028762044 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | -0.000773 | -| n_updates | 224830 | -| policy_gradient_loss | 0.00671 | -| std | 0.00642 | -| value_loss | 1.18e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22485 | -| time_elapsed | 121897 | -| total_timesteps | 2878080 | -| train/ | | -| approx_kl | 0.05565739 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.0809 | -| n_updates | 224840 | -| policy_gradient_loss | 0.173 | -| std | 0.00642 | -| value_loss | 1.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22486 | -| time_elapsed | 121905 | -| total_timesteps | 2878208 | -| train/ | | -| approx_kl | 0.053950243 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.938 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 224850 | -| policy_gradient_loss | 0.0122 | -| std | 0.00642 | -| value_loss | 0.000755 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22487 | -| time_elapsed | 121910 | -| total_timesteps | 2878336 | -| train/ | | -| approx_kl | 0.1921212 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.829 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 224860 | -| policy_gradient_loss | 0.0681 | -| std | 0.00642 | -| value_loss | 7.38e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22488 | -| time_elapsed | 121915 | -| total_timesteps | 2878464 | -| train/ | | -| approx_kl | 0.04513205 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 224870 | -| policy_gradient_loss | 0.0547 | -| std | 0.00642 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22489 | -| time_elapsed | 121920 | -| total_timesteps | 2878592 | -| train/ | | -| approx_kl | 0.19163132 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.000732 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 224880 | -| policy_gradient_loss | 0.0643 | -| std | 0.00642 | -| value_loss | 4.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22490 | -| time_elapsed | 121925 | -| total_timesteps | 2878720 | -| train/ | | -| approx_kl | 0.046219163 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 224890 | -| policy_gradient_loss | 0.0432 | -| std | 0.00642 | -| value_loss | 3.63e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22491 | -| time_elapsed | 121930 | -| total_timesteps | 2878848 | -| train/ | | -| approx_kl | 1.1710646 | -| clip_fraction | 0.757 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.358 | -| n_updates | 224900 | -| policy_gradient_loss | 0.191 | -| std | 0.00642 | -| value_loss | 2.51e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22492 | -| time_elapsed | 121936 | -| total_timesteps | 2878976 | -| train/ | | -| approx_kl | 0.036519695 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | -0.00335 | -| n_updates | 224910 | -| policy_gradient_loss | -0.00789 | -| std | 0.00642 | -| value_loss | 1.67e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22493 | -| time_elapsed | 121941 | -| total_timesteps | 2879104 | -| train/ | | -| approx_kl | 0.027237695 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | -0.00182 | -| n_updates | 224920 | -| policy_gradient_loss | -0.00372 | -| std | 0.00642 | -| value_loss | 1.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22494 | -| time_elapsed | 121952 | -| total_timesteps | 2879232 | -| train/ | | -| approx_kl | 0.04684883 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 224930 | -| policy_gradient_loss | 0.0278 | -| std | 0.00642 | -| value_loss | 0.00303 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22495 | -| time_elapsed | 121959 | -| total_timesteps | 2879360 | -| train/ | | -| approx_kl | 0.13742563 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0665 | -| n_updates | 224940 | -| policy_gradient_loss | 0.0295 | -| std | 0.00642 | -| value_loss | 1.7e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22496 | -| time_elapsed | 121964 | -| total_timesteps | 2879488 | -| train/ | | -| approx_kl | 0.00047264807 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 224950 | -| policy_gradient_loss | 0.0309 | -| std | 0.00642 | -| value_loss | 1.48e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22497 | -| time_elapsed | 121967 | -| total_timesteps | 2879616 | -| train/ | | -| approx_kl | 0.22307354 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | 0.0685 | -| n_updates | 224960 | -| policy_gradient_loss | 0.0214 | -| std | 0.00643 | -| value_loss | 1.43e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22498 | -| time_elapsed | 121973 | -| total_timesteps | 2879744 | -| train/ | | -| approx_kl | 0.021181447 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 224970 | -| policy_gradient_loss | -0.00642 | -| std | 0.00643 | -| value_loss | 9.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 22499 | -| time_elapsed | 121978 | -| total_timesteps | 2879872 | -| train/ | | -| approx_kl | 0.016725738 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.00593 | -| n_updates | 224980 | -| policy_gradient_loss | -0.0035 | -| std | 0.00643 | -| value_loss | 6.52e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22500 | -| time_elapsed | 121984 | -| total_timesteps | 2880000 | -| train/ | | -| approx_kl | 0.01700296 | -| clip_fraction | 0.143 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 224990 | -| policy_gradient_loss | -0.0065 | -| std | 0.00643 | -| value_loss | 4.92e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22501 | -| time_elapsed | 121988 | -| total_timesteps | 2880128 | -| train/ | | -| approx_kl | 0.027296014 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00436 | -| learning_rate | 0.0003 | -| loss | 0.0057 | -| n_updates | 225000 | -| policy_gradient_loss | 0.0302 | -| std | 0.00643 | -| value_loss | 2.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22502 | -| time_elapsed | 121998 | -| total_timesteps | 2880256 | -| train/ | | -| approx_kl | 0.109671876 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.57 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 225010 | -| policy_gradient_loss | 0.000418 | -| std | 0.00643 | -| value_loss | 0.00261 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22503 | -| time_elapsed | 122003 | -| total_timesteps | 2880384 | -| train/ | | -| approx_kl | 0.014878 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -1.02 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 225020 | -| policy_gradient_loss | -0.00186 | -| std | 0.00643 | -| value_loss | 1.19e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22504 | -| time_elapsed | 122007 | -| total_timesteps | 2880512 | -| train/ | | -| approx_kl | 0.011596942 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00138 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 225030 | -| policy_gradient_loss | -0.00329 | -| std | 0.00643 | -| value_loss | 6.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22505 | -| time_elapsed | 122012 | -| total_timesteps | 2880640 | -| train/ | | -| approx_kl | 0.028317677 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 225040 | -| policy_gradient_loss | 0.0492 | -| std | 0.00643 | -| value_loss | 9.32e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22506 | -| time_elapsed | 122017 | -| total_timesteps | 2880768 | -| train/ | | -| approx_kl | 0.1275168 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00229 | -| learning_rate | 0.0003 | -| loss | -0.000277 | -| n_updates | 225050 | -| policy_gradient_loss | 0.00706 | -| std | 0.00643 | -| value_loss | 5.22e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 22507 | -| time_elapsed | 122022 | -| total_timesteps | 2880896 | -| train/ | | -| approx_kl | 0.14876369 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0636 | -| n_updates | 225060 | -| policy_gradient_loss | 0.0262 | -| std | 0.00643 | -| value_loss | 3.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22508 | -| time_elapsed | 122028 | -| total_timesteps | 2881024 | -| train/ | | -| approx_kl | 0.030429916 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.00608 | -| n_updates | 225070 | -| policy_gradient_loss | 0.0236 | -| std | 0.00643 | -| value_loss | 1.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22509 | -| time_elapsed | 122040 | -| total_timesteps | 2881152 | -| train/ | | -| approx_kl | 0.122043654 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.798 | -| learning_rate | 0.0003 | -| loss | 0.0987 | -| n_updates | 225080 | -| policy_gradient_loss | 0.0733 | -| std | 0.00643 | -| value_loss | 0.00434 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22510 | -| time_elapsed | 122045 | -| total_timesteps | 2881280 | -| train/ | | -| approx_kl | 0.04509085 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0843 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 225090 | -| policy_gradient_loss | 0.0219 | -| std | 0.00644 | -| value_loss | 1.02e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22511 | -| time_elapsed | 122049 | -| total_timesteps | 2881408 | -| train/ | | -| approx_kl | 0.00040932186 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.000717 | -| n_updates | 225100 | -| policy_gradient_loss | 0.0287 | -| std | 0.00644 | -| value_loss | 2.56e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22512 | -| time_elapsed | 122054 | -| total_timesteps | 2881536 | -| train/ | | -| approx_kl | 0.0014169859 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 225110 | -| policy_gradient_loss | 0.0311 | -| std | 0.00644 | -| value_loss | 6.32e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22513 | -| time_elapsed | 122058 | -| total_timesteps | 2881664 | -| train/ | | -| approx_kl | 0.0008587828 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 225120 | -| policy_gradient_loss | 0.0363 | -| std | 0.00644 | -| value_loss | 2.37e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22514 | -| time_elapsed | 122063 | -| total_timesteps | 2881792 | -| train/ | | -| approx_kl | 0.67177474 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.27 | -| n_updates | 225130 | -| policy_gradient_loss | 0.081 | -| std | 0.00644 | -| value_loss | 1.88e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 22515 | -| time_elapsed | 122068 | -| total_timesteps | 2881920 | -| train/ | | -| approx_kl | 0.07578747 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 225140 | -| policy_gradient_loss | 0.0207 | -| std | 0.00644 | -| value_loss | 1.25e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22516 | -| time_elapsed | 122073 | -| total_timesteps | 2882048 | -| train/ | | -| approx_kl | 0.051534105 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 225150 | -| policy_gradient_loss | 0.00697 | -| std | 0.00644 | -| value_loss | 8.78e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22517 | -| time_elapsed | 122081 | -| total_timesteps | 2882176 | -| train/ | | -| approx_kl | 0.005460304 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 225160 | -| policy_gradient_loss | 0.0144 | -| std | 0.00644 | -| value_loss | 0.00164 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22518 | -| time_elapsed | 122086 | -| total_timesteps | 2882304 | -| train/ | | -| approx_kl | 1.1692698 | -| clip_fraction | 0.743 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0902 | -| learning_rate | 0.0003 | -| loss | 0.374 | -| n_updates | 225170 | -| policy_gradient_loss | 0.225 | -| std | 0.00644 | -| value_loss | 1.03e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22519 | -| time_elapsed | 122090 | -| total_timesteps | 2882432 | -| train/ | | -| approx_kl | 0.007371089 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00499 | -| n_updates | 225180 | -| policy_gradient_loss | 0.0358 | -| std | 0.00644 | -| value_loss | 2.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22520 | -| time_elapsed | 122096 | -| total_timesteps | 2882560 | -| train/ | | -| approx_kl | 0.116836935 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.00367 | -| learning_rate | 0.0003 | -| loss | 0.049 | -| n_updates | 225190 | -| policy_gradient_loss | 0.0308 | -| std | 0.00644 | -| value_loss | 1.46e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22521 | -| time_elapsed | 122101 | -| total_timesteps | 2882688 | -| train/ | | -| approx_kl | 0.78043586 | -| clip_fraction | 0.551 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 225200 | -| policy_gradient_loss | 0.0589 | -| std | 0.00644 | -| value_loss | 1.15e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22522 | -| time_elapsed | 122106 | -| total_timesteps | 2882816 | -| train/ | | -| approx_kl | 0.018916966 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.0035 | -| n_updates | 225210 | -| policy_gradient_loss | 0.00959 | -| std | 0.00644 | -| value_loss | 7.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22523 | -| time_elapsed | 122111 | -| total_timesteps | 2882944 | -| train/ | | -| approx_kl | 0.081563406 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 225220 | -| policy_gradient_loss | 0.0203 | -| std | 0.00644 | -| value_loss | 4.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22524 | -| time_elapsed | 122115 | -| total_timesteps | 2883072 | -| train/ | | -| approx_kl | 0.04895167 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 225230 | -| policy_gradient_loss | 0.0128 | -| std | 0.00644 | -| value_loss | 2.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22525 | -| time_elapsed | 122124 | -| total_timesteps | 2883200 | -| train/ | | -| approx_kl | 0.009380405 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.795 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 225240 | -| policy_gradient_loss | 0.000608 | -| std | 0.00644 | -| value_loss | 0.00466 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22526 | -| time_elapsed | 122131 | -| total_timesteps | 2883328 | -| train/ | | -| approx_kl | 0.76517963 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | 0.306 | -| n_updates | 225250 | -| policy_gradient_loss | 0.137 | -| std | 0.00644 | -| value_loss | 1.82e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22527 | -| time_elapsed | 122137 | -| total_timesteps | 2883456 | -| train/ | | -| approx_kl | 0.027363503 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0119 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 225260 | -| policy_gradient_loss | -0.0119 | -| std | 0.00644 | -| value_loss | 2.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22528 | -| time_elapsed | 122142 | -| total_timesteps | 2883584 | -| train/ | | -| approx_kl | 0.020327678 | -| clip_fraction | 0.135 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 225270 | -| policy_gradient_loss | -0.00783 | -| std | 0.00644 | -| value_loss | 1.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22529 | -| time_elapsed | 122148 | -| total_timesteps | 2883712 | -| train/ | | -| approx_kl | 0.025388468 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 225280 | -| policy_gradient_loss | 0.0275 | -| std | 0.00644 | -| value_loss | 1.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22530 | -| time_elapsed | 122154 | -| total_timesteps | 2883840 | -| train/ | | -| approx_kl | 0.30043435 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0314 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 225290 | -| policy_gradient_loss | 0.142 | -| std | 0.00644 | -| value_loss | 7.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22531 | -| time_elapsed | 122158 | -| total_timesteps | 2883968 | -| train/ | | -| approx_kl | 0.050311632 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 225300 | -| policy_gradient_loss | 0.0267 | -| std | 0.00644 | -| value_loss | 5.93e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22532 | -| time_elapsed | 122162 | -| total_timesteps | 2884096 | -| train/ | | -| approx_kl | 0.0006717667 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0292 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 225310 | -| policy_gradient_loss | 0.0332 | -| std | 0.00644 | -| value_loss | 3.98e-07 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22533 | -| time_elapsed | 122175 | -| total_timesteps | 2884224 | -| train/ | | -| approx_kl | 0.313469 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 225320 | -| policy_gradient_loss | 0.039 | -| std | 0.00644 | -| value_loss | 0.00425 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22534 | -| time_elapsed | 122179 | -| total_timesteps | 2884352 | -| train/ | | -| approx_kl | 0.010010777 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.00168 | -| n_updates | 225330 | -| policy_gradient_loss | 0.00702 | -| std | 0.00644 | -| value_loss | 4.82e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22535 | -| time_elapsed | 122184 | -| total_timesteps | 2884480 | -| train/ | | -| approx_kl | 0.072169766 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00809 | -| learning_rate | 0.0003 | -| loss | 0.0516 | -| n_updates | 225340 | -| policy_gradient_loss | 0.0219 | -| std | 0.00642 | -| value_loss | 6.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22536 | -| time_elapsed | 122188 | -| total_timesteps | 2884608 | -| train/ | | -| approx_kl | 0.01052729 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 225350 | -| policy_gradient_loss | 0.00481 | -| std | 0.00641 | -| value_loss | 6.48e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22537 | -| time_elapsed | 122193 | -| total_timesteps | 2884736 | -| train/ | | -| approx_kl | 0.088497624 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 225360 | -| policy_gradient_loss | 0.00465 | -| std | 0.0064 | -| value_loss | 9.76e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22538 | -| time_elapsed | 122199 | -| total_timesteps | 2884864 | -| train/ | | -| approx_kl | 0.042807937 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 225370 | -| policy_gradient_loss | 0.00745 | -| std | 0.0064 | -| value_loss | 7.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 22539 | -| time_elapsed | 122205 | -| total_timesteps | 2884992 | -| train/ | | -| approx_kl | 0.008672003 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.00496 | -| n_updates | 225380 | -| policy_gradient_loss | 0.0053 | -| std | 0.0064 | -| value_loss | 4.89e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22540 | -| time_elapsed | 122212 | -| total_timesteps | 2885120 | -| train/ | | -| approx_kl | 0.002726337 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.00172 | -| n_updates | 225390 | -| policy_gradient_loss | 0.00893 | -| std | 0.0064 | -| value_loss | 2.87e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22541 | -| time_elapsed | 122227 | -| total_timesteps | 2885248 | -| train/ | | -| approx_kl | 0.07557596 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 225400 | -| policy_gradient_loss | 0.00315 | -| std | 0.0064 | -| value_loss | 0.00159 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22542 | -| time_elapsed | 122232 | -| total_timesteps | 2885376 | -| train/ | | -| approx_kl | 0.10949913 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00882 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 225410 | -| policy_gradient_loss | 0.00626 | -| std | 0.0064 | -| value_loss | 3.46e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22543 | -| time_elapsed | 122238 | -| total_timesteps | 2885504 | -| train/ | | -| approx_kl | 0.043842934 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 225420 | -| policy_gradient_loss | 0.00271 | -| std | 0.0064 | -| value_loss | 5.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22544 | -| time_elapsed | 122242 | -| total_timesteps | 2885632 | -| train/ | | -| approx_kl | 0.008984449 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 225430 | -| policy_gradient_loss | 0.00357 | -| std | 0.00639 | -| value_loss | 8.79e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22545 | -| time_elapsed | 122249 | -| total_timesteps | 2885760 | -| train/ | | -| approx_kl | 0.087641664 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.412 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 225440 | -| policy_gradient_loss | 0.00819 | -| std | 0.00638 | -| value_loss | 1.61e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22546 | -| time_elapsed | 122253 | -| total_timesteps | 2885888 | -| train/ | | -| approx_kl | 0.0450524 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -1.98 | -| learning_rate | 0.0003 | -| loss | -0.00245 | -| n_updates | 225450 | -| policy_gradient_loss | 0.0137 | -| std | 0.00637 | -| value_loss | 1.35e-07 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22547 | -| time_elapsed | 122258 | -| total_timesteps | 2886016 | -| train/ | | -| approx_kl | 0.130214 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0745 | -| learning_rate | 0.0003 | -| loss | 0.0757 | -| n_updates | 225460 | -| policy_gradient_loss | 0.055 | -| std | 0.00637 | -| value_loss | 6.53e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22548 | -| time_elapsed | 122275 | -| total_timesteps | 2886144 | -| train/ | | -| approx_kl | 0.083696574 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -2.42 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 225470 | -| policy_gradient_loss | -0.00832 | -| std | 0.00637 | -| value_loss | 0.003 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22549 | -| time_elapsed | 122280 | -| total_timesteps | 2886272 | -| train/ | | -| approx_kl | 0.12452909 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.143 | -| learning_rate | 0.0003 | -| loss | 0.0717 | -| n_updates | 225480 | -| policy_gradient_loss | 0.0283 | -| std | 0.00636 | -| value_loss | 4.01e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22550 | -| time_elapsed | 122285 | -| total_timesteps | 2886400 | -| train/ | | -| approx_kl | 0.009240082 | -| clip_fraction | 0.0781 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | -0.00873 | -| n_updates | 225490 | -| policy_gradient_loss | -0.00361 | -| std | 0.00636 | -| value_loss | 1.98e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22551 | -| time_elapsed | 122291 | -| total_timesteps | 2886528 | -| train/ | | -| approx_kl | 0.0850104 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0749 | -| n_updates | 225500 | -| policy_gradient_loss | 0.0249 | -| std | 0.00636 | -| value_loss | 1.67e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22552 | -| time_elapsed | 122297 | -| total_timesteps | 2886656 | -| train/ | | -| approx_kl | 0.008637028 | -| clip_fraction | 0.0844 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | 0.000572 | -| n_updates | 225510 | -| policy_gradient_loss | 0.00115 | -| std | 0.00637 | -| value_loss | 1.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22553 | -| time_elapsed | 122303 | -| total_timesteps | 2886784 | -| train/ | | -| approx_kl | 0.012481747 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.000377 | -| n_updates | 225520 | -| policy_gradient_loss | 0.000248 | -| std | 0.00639 | -| value_loss | 1.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 22554 | -| time_elapsed | 122308 | -| total_timesteps | 2886912 | -| train/ | | -| approx_kl | 0.013513925 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.00335 | -| learning_rate | 0.0003 | -| loss | 0.00256 | -| n_updates | 225530 | -| policy_gradient_loss | 0.00135 | -| std | 0.0064 | -| value_loss | 1.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22555 | -| time_elapsed | 122312 | -| total_timesteps | 2887040 | -| train/ | | -| approx_kl | 0.01452592 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0827 | -| learning_rate | 0.0003 | -| loss | -0.002 | -| n_updates | 225540 | -| policy_gradient_loss | -0.000832 | -| std | 0.00641 | -| value_loss | 1.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22556 | -| time_elapsed | 122325 | -| total_timesteps | 2887168 | -| train/ | | -| approx_kl | 0.029733812 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.435 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 225550 | -| policy_gradient_loss | -0.00122 | -| std | 0.00641 | -| value_loss | 0.00126 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22557 | -| time_elapsed | 122331 | -| total_timesteps | 2887296 | -| train/ | | -| approx_kl | 0.1314745 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.021 | -| learning_rate | 0.0003 | -| loss | 0.0857 | -| n_updates | 225560 | -| policy_gradient_loss | 0.0412 | -| std | 0.00641 | -| value_loss | 1.79e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22558 | -| time_elapsed | 122336 | -| total_timesteps | 2887424 | -| train/ | | -| approx_kl | 0.00014314102 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 225570 | -| policy_gradient_loss | 0.021 | -| std | 0.00641 | -| value_loss | 4.76e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22559 | -| time_elapsed | 122341 | -| total_timesteps | 2887552 | -| train/ | | -| approx_kl | 0.5183863 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0499 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 225580 | -| policy_gradient_loss | 0.0428 | -| std | 0.00641 | -| value_loss | 3.96e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22560 | -| time_elapsed | 122346 | -| total_timesteps | 2887680 | -| train/ | | -| approx_kl | 0.013082763 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 225590 | -| policy_gradient_loss | 0.0052 | -| std | 0.00642 | -| value_loss | 2.91e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22561 | -| time_elapsed | 122352 | -| total_timesteps | 2887808 | -| train/ | | -| approx_kl | 0.07149668 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 225600 | -| policy_gradient_loss | 0.0138 | -| std | 0.00642 | -| value_loss | 1.81e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22562 | -| time_elapsed | 122357 | -| total_timesteps | 2887936 | -| train/ | | -| approx_kl | 0.042706817 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 225610 | -| policy_gradient_loss | 0.0061 | -| std | 0.00642 | -| value_loss | 1.31e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22563 | -| time_elapsed | 122362 | -| total_timesteps | 2888064 | -| train/ | | -| approx_kl | 0.0037338398 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -1.87e-05 | -| n_updates | 225620 | -| policy_gradient_loss | 0.0112 | -| std | 0.0064 | -| value_loss | 2.02e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22564 | -| time_elapsed | 122371 | -| total_timesteps | 2888192 | -| train/ | | -| approx_kl | 0.01969283 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | 0.733 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 225630 | -| policy_gradient_loss | -0.00867 | -| std | 0.00639 | -| value_loss | 0.0075 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22565 | -| time_elapsed | 122376 | -| total_timesteps | 2888320 | -| train/ | | -| approx_kl | 0.08231078 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.63 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.059 | -| n_updates | 225640 | -| policy_gradient_loss | 0.0249 | -| std | 0.00638 | -| value_loss | 3.51e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22566 | -| time_elapsed | 122382 | -| total_timesteps | 2888448 | -| train/ | | -| approx_kl | 0.008933957 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0037 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 225650 | -| policy_gradient_loss | 0.00126 | -| std | 0.00638 | -| value_loss | 6.88e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22567 | -| time_elapsed | 122385 | -| total_timesteps | 2888576 | -| train/ | | -| approx_kl | 0.03532806 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.0458 | -| n_updates | 225660 | -| policy_gradient_loss | 0.102 | -| std | 0.00638 | -| value_loss | 5.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22568 | -| time_elapsed | 122388 | -| total_timesteps | 2888704 | -| train/ | | -| approx_kl | 0.096241914 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0573 | -| n_updates | 225670 | -| policy_gradient_loss | 0.113 | -| std | 0.00638 | -| value_loss | 1.05e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22569 | -| time_elapsed | 122393 | -| total_timesteps | 2888832 | -| train/ | | -| approx_kl | 0.13027905 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.0978 | -| n_updates | 225680 | -| policy_gradient_loss | 0.16 | -| std | 0.00638 | -| value_loss | 8.3e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22570 | -| time_elapsed | 122397 | -| total_timesteps | 2888960 | -| train/ | | -| approx_kl | 0.02410782 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 225690 | -| policy_gradient_loss | 0.0294 | -| std | 0.00637 | -| value_loss | 1.1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22571 | -| time_elapsed | 122402 | -| total_timesteps | 2889088 | -| train/ | | -| approx_kl | 0.69185454 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | 0.36 | -| n_updates | 225700 | -| policy_gradient_loss | 0.0905 | -| std | 0.00636 | -| value_loss | 1.83e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22572 | -| time_elapsed | 122412 | -| total_timesteps | 2889216 | -| train/ | | -| approx_kl | 0.004683198 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.771 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 225710 | -| policy_gradient_loss | -0.0048 | -| std | 0.00636 | -| value_loss | 0.00592 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22573 | -| time_elapsed | 122416 | -| total_timesteps | 2889344 | -| train/ | | -| approx_kl | 0.026450308 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0826 | -| learning_rate | 0.0003 | -| loss | 0.00261 | -| n_updates | 225720 | -| policy_gradient_loss | 0.0071 | -| std | 0.00636 | -| value_loss | 2.4e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22574 | -| time_elapsed | 122420 | -| total_timesteps | 2889472 | -| train/ | | -| approx_kl | 0.06933775 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.0577 | -| n_updates | 225730 | -| policy_gradient_loss | 0.0254 | -| std | 0.00637 | -| value_loss | 0.000106 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22575 | -| time_elapsed | 122426 | -| total_timesteps | 2889600 | -| train/ | | -| approx_kl | 0.08602301 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -3.11 | -| learning_rate | 0.0003 | -| loss | 0.0583 | -| n_updates | 225740 | -| policy_gradient_loss | 0.0244 | -| std | 0.00636 | -| value_loss | 0.00133 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22576 | -| time_elapsed | 122431 | -| total_timesteps | 2889728 | -| train/ | | -| approx_kl | 0.031201521 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0935 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 225750 | -| policy_gradient_loss | 0.00792 | -| std | 0.00636 | -| value_loss | 0.000835 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22577 | -| time_elapsed | 122436 | -| total_timesteps | 2889856 | -| train/ | | -| approx_kl | 0.07414925 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -2.35 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 225760 | -| policy_gradient_loss | 0.0171 | -| std | 0.00636 | -| value_loss | 4.99e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22578 | -| time_elapsed | 122441 | -| total_timesteps | 2889984 | -| train/ | | -| approx_kl | 0.043135993 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.0011 | -| n_updates | 225770 | -| policy_gradient_loss | 0.00142 | -| std | 0.00636 | -| value_loss | 2.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22579 | -| time_elapsed | 122446 | -| total_timesteps | 2890112 | -| train/ | | -| approx_kl | 0.050250176 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 225780 | -| policy_gradient_loss | 0.0127 | -| std | 0.00635 | -| value_loss | 1.69e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22580 | -| time_elapsed | 122459 | -| total_timesteps | 2890240 | -| train/ | | -| approx_kl | 0.023944113 | -| clip_fraction | 0.158 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.957 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 225790 | -| policy_gradient_loss | -0.00145 | -| std | 0.00635 | -| value_loss | 0.000461 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22581 | -| time_elapsed | 122464 | -| total_timesteps | 2890368 | -| train/ | | -| approx_kl | 0.046944097 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.0197 | -| n_updates | 225800 | -| policy_gradient_loss | 0.00882 | -| std | 0.00635 | -| value_loss | 6.66e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22582 | -| time_elapsed | 122470 | -| total_timesteps | 2890496 | -| train/ | | -| approx_kl | 0.00957983 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.00347 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 225810 | -| policy_gradient_loss | 0.00592 | -| std | 0.00635 | -| value_loss | 1.83e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22583 | -| time_elapsed | 122474 | -| total_timesteps | 2890624 | -| train/ | | -| approx_kl | 0.0012978059 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00708 | -| n_updates | 225820 | -| policy_gradient_loss | 0.00589 | -| std | 0.00634 | -| value_loss | 1.63e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22584 | -| time_elapsed | 122479 | -| total_timesteps | 2890752 | -| train/ | | -| approx_kl | 0.053731013 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 225830 | -| policy_gradient_loss | 0.0173 | -| std | 0.00634 | -| value_loss | 8.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 22585 | -| time_elapsed | 122483 | -| total_timesteps | 2890880 | -| train/ | | -| approx_kl | 0.010918642 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 225840 | -| policy_gradient_loss | 0.00927 | -| std | 0.00634 | -| value_loss | 6.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22586 | -| time_elapsed | 122489 | -| total_timesteps | 2891008 | -| train/ | | -| approx_kl | 0.094959944 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0518 | -| n_updates | 225850 | -| policy_gradient_loss | 0.0205 | -| std | 0.00634 | -| value_loss | 5.38e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22587 | -| time_elapsed | 122501 | -| total_timesteps | 2891136 | -| train/ | | -| approx_kl | 0.00063987914 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 225860 | -| policy_gradient_loss | -0.00244 | -| std | 0.00634 | -| value_loss | 0.00408 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22588 | -| time_elapsed | 122505 | -| total_timesteps | 2891264 | -| train/ | | -| approx_kl | 0.017176785 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.446 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 225870 | -| policy_gradient_loss | 0.0031 | -| std | 0.00634 | -| value_loss | 2.96e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22589 | -| time_elapsed | 122508 | -| total_timesteps | 2891392 | -| train/ | | -| approx_kl | 0.072747916 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0085 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 225880 | -| policy_gradient_loss | 0.0156 | -| std | 0.00634 | -| value_loss | 1.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22590 | -| time_elapsed | 122512 | -| total_timesteps | 2891520 | -| train/ | | -| approx_kl | 0.046218567 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 225890 | -| policy_gradient_loss | 0.00431 | -| std | 0.00634 | -| value_loss | 1.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22591 | -| time_elapsed | 122517 | -| total_timesteps | 2891648 | -| train/ | | -| approx_kl | 0.06307932 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 225900 | -| policy_gradient_loss | 0.0132 | -| std | 0.00634 | -| value_loss | 8.36e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22592 | -| time_elapsed | 122522 | -| total_timesteps | 2891776 | -| train/ | | -| approx_kl | 0.012659986 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00485 | -| n_updates | 225910 | -| policy_gradient_loss | 0.0128 | -| std | 0.00634 | -| value_loss | 6.94e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 22593 | -| time_elapsed | 122527 | -| total_timesteps | 2891904 | -| train/ | | -| approx_kl | 0.07811582 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0471 | -| n_updates | 225920 | -| policy_gradient_loss | 0.0198 | -| std | 0.00633 | -| value_loss | 3.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22594 | -| time_elapsed | 122531 | -| total_timesteps | 2892032 | -| train/ | | -| approx_kl | 0.011464499 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0711 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 225930 | -| policy_gradient_loss | 0.00568 | -| std | 0.00632 | -| value_loss | 3.39e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22595 | -| time_elapsed | 122540 | -| total_timesteps | 2892160 | -| train/ | | -| approx_kl | 0.10427123 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.00779 | -| n_updates | 225940 | -| policy_gradient_loss | -0.0125 | -| std | 0.00631 | -| value_loss | 4.99e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22596 | -| time_elapsed | 122545 | -| total_timesteps | 2892288 | -| train/ | | -| approx_kl | 0.033756506 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0328 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 225950 | -| policy_gradient_loss | 0.00846 | -| std | 0.0063 | -| value_loss | 3.97e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22597 | -| time_elapsed | 122551 | -| total_timesteps | 2892416 | -| train/ | | -| approx_kl | 0.0629163 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 225960 | -| policy_gradient_loss | 0.0116 | -| std | 0.00629 | -| value_loss | 2.92e-07 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22598 | -| time_elapsed | 122556 | -| total_timesteps | 2892544 | -| train/ | | -| approx_kl | 0.009792 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00766 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 225970 | -| policy_gradient_loss | 0.00317 | -| std | 0.00629 | -| value_loss | 1.49e-07 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22599 | -| time_elapsed | 122561 | -| total_timesteps | 2892672 | -| train/ | | -| approx_kl | 0.00092152925 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.00459 | -| n_updates | 225980 | -| policy_gradient_loss | 0.00618 | -| std | 0.00629 | -| value_loss | 9.47e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22600 | -| time_elapsed | 122567 | -| total_timesteps | 2892800 | -| train/ | | -| approx_kl | 0.0060005947 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00165 | -| n_updates | 225990 | -| policy_gradient_loss | 0.00608 | -| std | 0.00628 | -| value_loss | 6.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 22601 | -| time_elapsed | 122571 | -| total_timesteps | 2892928 | -| train/ | | -| approx_kl | 0.0019706595 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | -0.000564 | -| n_updates | 226000 | -| policy_gradient_loss | 0.0103 | -| std | 0.00627 | -| value_loss | 3.51e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22602 | -| time_elapsed | 122580 | -| total_timesteps | 2893056 | -| train/ | | -| approx_kl | 0.026998404 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 226010 | -| policy_gradient_loss | 0.0184 | -| std | 0.00625 | -| value_loss | 3.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22603 | -| time_elapsed | 122586 | -| total_timesteps | 2893184 | -| train/ | | -| approx_kl | 0.0072523113 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.985 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 226020 | -| policy_gradient_loss | 0.00317 | -| std | 0.00624 | -| value_loss | 0.000142 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22604 | -| time_elapsed | 122590 | -| total_timesteps | 2893312 | -| train/ | | -| approx_kl | 0.00013935706 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00794 | -| learning_rate | 0.0003 | -| loss | -0.00108 | -| n_updates | 226030 | -| policy_gradient_loss | 0.0304 | -| std | 0.00623 | -| value_loss | 3.18e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22605 | -| time_elapsed | 122595 | -| total_timesteps | 2893440 | -| train/ | | -| approx_kl | 0.18720502 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0827 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 226040 | -| policy_gradient_loss | 0.0331 | -| std | 0.00622 | -| value_loss | 0.00215 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22606 | -| time_elapsed | 122600 | -| total_timesteps | 2893568 | -| train/ | | -| approx_kl | 0.030965623 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.00847 | -| n_updates | 226050 | -| policy_gradient_loss | 0.0347 | -| std | 0.00621 | -| value_loss | 0.000357 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22607 | -| time_elapsed | 122605 | -| total_timesteps | 2893696 | -| train/ | | -| approx_kl | 0.09492671 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 226060 | -| policy_gradient_loss | 0.0202 | -| std | 0.00621 | -| value_loss | 0.000135 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22608 | -| time_elapsed | 122609 | -| total_timesteps | 2893824 | -| train/ | | -| approx_kl | 0.1508964 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0797 | -| n_updates | 226070 | -| policy_gradient_loss | 0.0268 | -| std | 0.00621 | -| value_loss | 8.08e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 22609 | -| time_elapsed | 122613 | -| total_timesteps | 2893952 | -| train/ | | -| approx_kl | 0.13367747 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.0967 | -| n_updates | 226080 | -| policy_gradient_loss | 0.0132 | -| std | 0.00619 | -| value_loss | 0.000153 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22610 | -| time_elapsed | 122619 | -| total_timesteps | 2894080 | -| train/ | | -| approx_kl | 0.62560314 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.19 | -| n_updates | 226090 | -| policy_gradient_loss | 0.0714 | -| std | 0.00616 | -| value_loss | 4.5e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22611 | -| time_elapsed | 122629 | -| total_timesteps | 2894208 | -| train/ | | -| approx_kl | 0.0062115625 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | -0.00957 | -| n_updates | 226100 | -| policy_gradient_loss | -0.00562 | -| std | 0.00615 | -| value_loss | 0.00461 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22612 | -| time_elapsed | 122634 | -| total_timesteps | 2894336 | -| train/ | | -| approx_kl | 0.008502737 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00945 | -| n_updates | 226110 | -| policy_gradient_loss | 0.0109 | -| std | 0.00615 | -| value_loss | 6.56e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22613 | -| time_elapsed | 122640 | -| total_timesteps | 2894464 | -| train/ | | -| approx_kl | 0.0014261375 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.00712 | -| n_updates | 226120 | -| policy_gradient_loss | 0.00474 | -| std | 0.00615 | -| value_loss | 3.6e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22614 | -| time_elapsed | 122646 | -| total_timesteps | 2894592 | -| train/ | | -| approx_kl | 0.061323468 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 226130 | -| policy_gradient_loss | 0.00286 | -| std | 0.00614 | -| value_loss | 3.06e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22615 | -| time_elapsed | 122649 | -| total_timesteps | 2894720 | -| train/ | | -| approx_kl | 9.741308e-05 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 226140 | -| policy_gradient_loss | 0.0386 | -| std | 0.00618 | -| value_loss | 0.00319 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22616 | -| time_elapsed | 122654 | -| total_timesteps | 2894848 | -| train/ | | -| approx_kl | 0.5786742 | -| clip_fraction | 0.778 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -3.62 | -| learning_rate | 0.0003 | -| loss | 0.0995 | -| n_updates | 226150 | -| policy_gradient_loss | 0.0753 | -| std | 0.0062 | -| value_loss | 0.00509 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 22617 | -| time_elapsed | 122659 | -| total_timesteps | 2894976 | -| train/ | | -| approx_kl | 0.02613189 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.781 | -| learning_rate | 0.0003 | -| loss | 0.00187 | -| n_updates | 226160 | -| policy_gradient_loss | -0.00296 | -| std | 0.0062 | -| value_loss | 0.000425 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22618 | -| time_elapsed | 122664 | -| total_timesteps | 2895104 | -| train/ | | -| approx_kl | 0.03234771 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 226170 | -| policy_gradient_loss | 0.0434 | -| std | 0.00621 | -| value_loss | 0.000207 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22619 | -| time_elapsed | 122676 | -| total_timesteps | 2895232 | -| train/ | | -| approx_kl | 0.009431021 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.452 | -| learning_rate | 0.0003 | -| loss | -0.00522 | -| n_updates | 226180 | -| policy_gradient_loss | 0.0431 | -| std | 0.00621 | -| value_loss | 0.00193 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22620 | -| time_elapsed | 122681 | -| total_timesteps | 2895360 | -| train/ | | -| approx_kl | 0.009163974 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 226190 | -| policy_gradient_loss | 0.0908 | -| std | 0.00621 | -| value_loss | 8.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22621 | -| time_elapsed | 122684 | -| total_timesteps | 2895488 | -| train/ | | -| approx_kl | 0.018343817 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.00383 | -| n_updates | 226200 | -| policy_gradient_loss | 0.0293 | -| std | 0.00621 | -| value_loss | 6.17e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22622 | -| time_elapsed | 122689 | -| total_timesteps | 2895616 | -| train/ | | -| approx_kl | 0.0077588595 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 226210 | -| policy_gradient_loss | 0.00856 | -| std | 0.00621 | -| value_loss | 6.05e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22623 | -| time_elapsed | 122692 | -| total_timesteps | 2895744 | -| train/ | | -| approx_kl | 0.07040077 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 226220 | -| policy_gradient_loss | 0.0321 | -| std | 0.00621 | -| value_loss | 0.000165 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 22624 | -| time_elapsed | 122695 | -| total_timesteps | 2895872 | -| train/ | | -| approx_kl | 0.33797586 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.23 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 226230 | -| policy_gradient_loss | 0.0976 | -| std | 0.0062 | -| value_loss | 1.25e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22625 | -| time_elapsed | 122700 | -| total_timesteps | 2896000 | -| train/ | | -| approx_kl | 0.04721495 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 226240 | -| policy_gradient_loss | 0.02 | -| std | 0.0062 | -| value_loss | 1.81e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22626 | -| time_elapsed | 122704 | -| total_timesteps | 2896128 | -| train/ | | -| approx_kl | 0.18361148 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00824 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 226250 | -| policy_gradient_loss | 0.0123 | -| std | 0.00621 | -| value_loss | 1.01e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22627 | -| time_elapsed | 122714 | -| total_timesteps | 2896256 | -| train/ | | -| approx_kl | 0.047806267 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -5.58 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 226260 | -| policy_gradient_loss | -0.0101 | -| std | 0.00621 | -| value_loss | 0.00363 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22628 | -| time_elapsed | 122719 | -| total_timesteps | 2896384 | -| train/ | | -| approx_kl | 0.09841767 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.0694 | -| n_updates | 226270 | -| policy_gradient_loss | 0.0306 | -| std | 0.00621 | -| value_loss | 4.54e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22629 | -| time_elapsed | 122725 | -| total_timesteps | 2896512 | -| train/ | | -| approx_kl | 0.5218013 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -25.2 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 226280 | -| policy_gradient_loss | 0.0445 | -| std | 0.00621 | -| value_loss | 4.86e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22630 | -| time_elapsed | 122730 | -| total_timesteps | 2896640 | -| train/ | | -| approx_kl | 0.052085448 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.43 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 226290 | -| policy_gradient_loss | 0.0442 | -| std | 0.00621 | -| value_loss | 3.96e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22631 | -| time_elapsed | 122736 | -| total_timesteps | 2896768 | -| train/ | | -| approx_kl | 0.25003394 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 226300 | -| policy_gradient_loss | 0.0484 | -| std | 0.00621 | -| value_loss | 1.26e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 22632 | -| time_elapsed | 122742 | -| total_timesteps | 2896896 | -| train/ | | -| approx_kl | 0.07091288 | -| clip_fraction | 0.603 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 226310 | -| policy_gradient_loss | 0.0921 | -| std | 0.00621 | -| value_loss | 9.48e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22633 | -| time_elapsed | 122747 | -| total_timesteps | 2897024 | -| train/ | | -| approx_kl | 0.26838195 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 226320 | -| policy_gradient_loss | 0.0495 | -| std | 0.00621 | -| value_loss | 7.69e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22634 | -| time_elapsed | 122757 | -| total_timesteps | 2897152 | -| train/ | | -| approx_kl | 0.00047590397 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.008 | -| n_updates | 226330 | -| policy_gradient_loss | -0.00462 | -| std | 0.00621 | -| value_loss | 0.000225 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22635 | -| time_elapsed | 122763 | -| total_timesteps | 2897280 | -| train/ | | -| approx_kl | 0.084586635 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0171 | -| learning_rate | 0.0003 | -| loss | 0.00874 | -| n_updates | 226340 | -| policy_gradient_loss | 0.07 | -| std | 0.00621 | -| value_loss | 0.000911 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22636 | -| time_elapsed | 122768 | -| total_timesteps | 2897408 | -| train/ | | -| approx_kl | 0.00011579646 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | 0.00014 | -| n_updates | 226350 | -| policy_gradient_loss | 0.0842 | -| std | 0.00621 | -| value_loss | 1.58e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22637 | -| time_elapsed | 122772 | -| total_timesteps | 2897536 | -| train/ | | -| approx_kl | 0.03929264 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 226360 | -| policy_gradient_loss | 0.0256 | -| std | 0.00621 | -| value_loss | 2.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22638 | -| time_elapsed | 122777 | -| total_timesteps | 2897664 | -| train/ | | -| approx_kl | 0.039880842 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.00626 | -| n_updates | 226370 | -| policy_gradient_loss | 0.0241 | -| std | 0.00621 | -| value_loss | 1.78e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22639 | -| time_elapsed | 122783 | -| total_timesteps | 2897792 | -| train/ | | -| approx_kl | 0.13063228 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.0727 | -| n_updates | 226380 | -| policy_gradient_loss | 0.0344 | -| std | 0.00621 | -| value_loss | 1.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.967 | -| time/ | | -| fps | 23 | -| iterations | 22640 | -| time_elapsed | 122789 | -| total_timesteps | 2897920 | -| train/ | | -| approx_kl | 0.006851392 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 226390 | -| policy_gradient_loss | 0.0233 | -| std | 0.00621 | -| value_loss | 8.74e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22641 | -| time_elapsed | 122794 | -| total_timesteps | 2898048 | -| train/ | | -| approx_kl | 0.53144515 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 226400 | -| policy_gradient_loss | 0.0694 | -| std | 0.00621 | -| value_loss | 5.92e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22642 | -| time_elapsed | 122804 | -| total_timesteps | 2898176 | -| train/ | | -| approx_kl | 0.010074611 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.791 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 226410 | -| policy_gradient_loss | -0.00803 | -| std | 0.0062 | -| value_loss | 0.00504 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22643 | -| time_elapsed | 122808 | -| total_timesteps | 2898304 | -| train/ | | -| approx_kl | 0.21728998 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 226420 | -| policy_gradient_loss | 0.036 | -| std | 0.0062 | -| value_loss | 1.55e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22644 | -| time_elapsed | 122813 | -| total_timesteps | 2898432 | -| train/ | | -| approx_kl | 0.00084908307 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00941 | -| learning_rate | 0.0003 | -| loss | 0.0012 | -| n_updates | 226430 | -| policy_gradient_loss | 0.0335 | -| std | 0.0062 | -| value_loss | 2.04e-06 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22645 | -| time_elapsed | 122818 | -| total_timesteps | 2898560 | -| train/ | | -| approx_kl | 0.266728 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 226440 | -| policy_gradient_loss | 0.0251 | -| std | 0.0062 | -| value_loss | 1.2e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22646 | -| time_elapsed | 122822 | -| total_timesteps | 2898688 | -| train/ | | -| approx_kl | 0.023843743 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 226450 | -| policy_gradient_loss | 0.00487 | -| std | 0.0062 | -| value_loss | 7.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22647 | -| time_elapsed | 122827 | -| total_timesteps | 2898816 | -| train/ | | -| approx_kl | 0.029993739 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.069 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 226460 | -| policy_gradient_loss | 0.0394 | -| std | 0.0062 | -| value_loss | 4.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22648 | -| time_elapsed | 122832 | -| total_timesteps | 2898944 | -| train/ | | -| approx_kl | 0.36033744 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 226470 | -| policy_gradient_loss | 0.154 | -| std | 0.0062 | -| value_loss | 4.9e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22649 | -| time_elapsed | 122837 | -| total_timesteps | 2899072 | -| train/ | | -| approx_kl | 0.07151719 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 226480 | -| policy_gradient_loss | 0.0377 | -| std | 0.0062 | -| value_loss | 3.72e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22650 | -| time_elapsed | 122846 | -| total_timesteps | 2899200 | -| train/ | | -| approx_kl | 0.47087973 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.39 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 226490 | -| policy_gradient_loss | 0.00807 | -| std | 0.0062 | -| value_loss | 0.0026 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22651 | -| time_elapsed | 122851 | -| total_timesteps | 2899328 | -| train/ | | -| approx_kl | 0.10912879 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -24.5 | -| learning_rate | 0.0003 | -| loss | -0.00705 | -| n_updates | 226500 | -| policy_gradient_loss | -0.00873 | -| std | 0.0062 | -| value_loss | 4.5e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22652 | -| time_elapsed | 122855 | -| total_timesteps | 2899456 | -| train/ | | -| approx_kl | 0.03935572 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.355 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 226510 | -| policy_gradient_loss | 0.00867 | -| std | 0.0062 | -| value_loss | 1.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22653 | -| time_elapsed | 122859 | -| total_timesteps | 2899584 | -| train/ | | -| approx_kl | 0.0067380453 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 226520 | -| policy_gradient_loss | 0.00831 | -| std | 0.0062 | -| value_loss | 8.54e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22654 | -| time_elapsed | 122863 | -| total_timesteps | 2899712 | -| train/ | | -| approx_kl | 0.0013237968 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 226530 | -| policy_gradient_loss | 0.00435 | -| std | 0.0062 | -| value_loss | 7.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22655 | -| time_elapsed | 122867 | -| total_timesteps | 2899840 | -| train/ | | -| approx_kl | 0.0067190854 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 226540 | -| policy_gradient_loss | 0.00818 | -| std | 0.0062 | -| value_loss | 5.77e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 22656 | -| time_elapsed | 122872 | -| total_timesteps | 2899968 | -| train/ | | -| approx_kl | 9.902427e-05 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.000178 | -| n_updates | 226550 | -| policy_gradient_loss | 0.0223 | -| std | 0.0062 | -| value_loss | 3.05e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22657 | -| time_elapsed | 122877 | -| total_timesteps | 2900096 | -| train/ | | -| approx_kl | 0.67351615 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.06 | -| learning_rate | 0.0003 | -| loss | 0.366 | -| n_updates | 226560 | -| policy_gradient_loss | 0.137 | -| std | 0.0062 | -| value_loss | 2.81e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22658 | -| time_elapsed | 122890 | -| total_timesteps | 2900224 | -| train/ | | -| approx_kl | 0.22388273 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 226570 | -| policy_gradient_loss | 0.012 | -| std | 0.0062 | -| value_loss | 2.46e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22659 | -| time_elapsed | 122896 | -| total_timesteps | 2900352 | -| train/ | | -| approx_kl | 0.020915497 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -8.12 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 226580 | -| policy_gradient_loss | -0.00519 | -| std | 0.0062 | -| value_loss | 1.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22660 | -| time_elapsed | 122902 | -| total_timesteps | 2900480 | -| train/ | | -| approx_kl | 0.015956318 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.29 | -| learning_rate | 0.0003 | -| loss | 0.00427 | -| n_updates | 226590 | -| policy_gradient_loss | 0.00199 | -| std | 0.00621 | -| value_loss | 1.29e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22661 | -| time_elapsed | 122907 | -| total_timesteps | 2900608 | -| train/ | | -| approx_kl | 0.034898397 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.00553 | -| n_updates | 226600 | -| policy_gradient_loss | 0.0331 | -| std | 0.00621 | -| value_loss | 4.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22662 | -| time_elapsed | 122912 | -| total_timesteps | 2900736 | -| train/ | | -| approx_kl | 0.114445314 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00753 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 226610 | -| policy_gradient_loss | 0.0302 | -| std | 0.00621 | -| value_loss | 2.37e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22663 | -| time_elapsed | 122917 | -| total_timesteps | 2900864 | -| train/ | | -| approx_kl | 0.0003393814 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 226620 | -| policy_gradient_loss | 0.0364 | -| std | 0.00621 | -| value_loss | 1.8e-09 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.963 | -| time/ | | -| fps | 23 | -| iterations | 22664 | -| time_elapsed | 122922 | -| total_timesteps | 2900992 | -| train/ | | -| approx_kl | 0.8646504 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.348 | -| n_updates | 226630 | -| policy_gradient_loss | 0.0852 | -| std | 0.0062 | -| value_loss | 1.58e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22665 | -| time_elapsed | 122928 | -| total_timesteps | 2901120 | -| train/ | | -| approx_kl | 0.011153776 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.027 | -| learning_rate | 0.0003 | -| loss | 0.00503 | -| n_updates | 226640 | -| policy_gradient_loss | 0.00793 | -| std | 0.0062 | -| value_loss | 7.17e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22666 | -| time_elapsed | 122940 | -| total_timesteps | 2901248 | -| train/ | | -| approx_kl | 0.025292646 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.996 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 226650 | -| policy_gradient_loss | 0.018 | -| std | 0.0062 | -| value_loss | 2.88e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22667 | -| time_elapsed | 122943 | -| total_timesteps | 2901376 | -| train/ | | -| approx_kl | 0.020956464 | -| clip_fraction | 0.175 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | -0.0162 | -| n_updates | 226660 | -| policy_gradient_loss | -0.00956 | -| std | 0.0062 | -| value_loss | 6.55e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22668 | -| time_elapsed | 122947 | -| total_timesteps | 2901504 | -| train/ | | -| approx_kl | 0.023234304 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | 0.00405 | -| n_updates | 226670 | -| policy_gradient_loss | 0.0269 | -| std | 0.0062 | -| value_loss | 2.6e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22669 | -| time_elapsed | 122953 | -| total_timesteps | 2901632 | -| train/ | | -| approx_kl | 0.43055493 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.000415 | -| learning_rate | 0.0003 | -| loss | 0.297 | -| n_updates | 226680 | -| policy_gradient_loss | 0.184 | -| std | 0.0062 | -| value_loss | 1.83e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22670 | -| time_elapsed | 122958 | -| total_timesteps | 2901760 | -| train/ | | -| approx_kl | 0.2344611 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0103 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 226690 | -| policy_gradient_loss | 0.161 | -| std | 0.0062 | -| value_loss | 1.56e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22671 | -| time_elapsed | 122965 | -| total_timesteps | 2901888 | -| train/ | | -| approx_kl | 0.15151241 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.0881 | -| n_updates | 226700 | -| policy_gradient_loss | 0.121 | -| std | 0.0062 | -| value_loss | 1.29e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22672 | -| time_elapsed | 122971 | -| total_timesteps | 2902016 | -| train/ | | -| approx_kl | 0.13817647 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0162 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 226710 | -| policy_gradient_loss | 0.111 | -| std | 0.0062 | -| value_loss | 1.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22673 | -| time_elapsed | 122984 | -| total_timesteps | 2902144 | -| train/ | | -| approx_kl | 0.0032060645 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.764 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 226720 | -| policy_gradient_loss | 0.0171 | -| std | 0.0062 | -| value_loss | 0.00138 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22674 | -| time_elapsed | 122990 | -| total_timesteps | 2902272 | -| train/ | | -| approx_kl | 0.1802514 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0191 | -| learning_rate | 0.0003 | -| loss | 0.0807 | -| n_updates | 226730 | -| policy_gradient_loss | 0.0472 | -| std | 0.0062 | -| value_loss | 0.000538 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22675 | -| time_elapsed | 122993 | -| total_timesteps | 2902400 | -| train/ | | -| approx_kl | 0.013746886 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00901 | -| learning_rate | 0.0003 | -| loss | 0.00616 | -| n_updates | 226740 | -| policy_gradient_loss | 0.0135 | -| std | 0.0062 | -| value_loss | 1.93e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22676 | -| time_elapsed | 122997 | -| total_timesteps | 2902528 | -| train/ | | -| approx_kl | 0.08534814 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0348 | -| n_updates | 226750 | -| policy_gradient_loss | 0.0123 | -| std | 0.0062 | -| value_loss | 7.48e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22677 | -| time_elapsed | 123004 | -| total_timesteps | 2902656 | -| train/ | | -| approx_kl | 0.015047198 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 226760 | -| policy_gradient_loss | 0.00726 | -| std | 0.0062 | -| value_loss | 7.4e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22678 | -| time_elapsed | 123010 | -| total_timesteps | 2902784 | -| train/ | | -| approx_kl | 0.08275997 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 226770 | -| policy_gradient_loss | 0.0219 | -| std | 0.0062 | -| value_loss | 5.67e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 22679 | -| time_elapsed | 123014 | -| total_timesteps | 2902912 | -| train/ | | -| approx_kl | 0.052430257 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0297 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 226780 | -| policy_gradient_loss | 0.0174 | -| std | 0.0062 | -| value_loss | 3.87e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22680 | -| time_elapsed | 123020 | -| total_timesteps | 2903040 | -| train/ | | -| approx_kl | 0.06406193 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 226790 | -| policy_gradient_loss | 0.0171 | -| std | 0.0062 | -| value_loss | 2.31e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22681 | -| time_elapsed | 123031 | -| total_timesteps | 2903168 | -| train/ | | -| approx_kl | 0.026745196 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 226800 | -| policy_gradient_loss | -0.00885 | -| std | 0.0062 | -| value_loss | 0.000258 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22682 | -| time_elapsed | 123035 | -| total_timesteps | 2903296 | -| train/ | | -| approx_kl | 0.0121703185 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00625 | -| learning_rate | 0.0003 | -| loss | 0.000339 | -| n_updates | 226810 | -| policy_gradient_loss | 0.0329 | -| std | 0.00621 | -| value_loss | 1.56e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22683 | -| time_elapsed | 123039 | -| total_timesteps | 2903424 | -| train/ | | -| approx_kl | 0.93820596 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 226820 | -| policy_gradient_loss | 0.0645 | -| std | 0.00621 | -| value_loss | 7.6e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22684 | -| time_elapsed | 123043 | -| total_timesteps | 2903552 | -| train/ | | -| approx_kl | 0.05056967 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.006 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 226830 | -| policy_gradient_loss | 0.0113 | -| std | 0.00621 | -| value_loss | 3.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22685 | -| time_elapsed | 123048 | -| total_timesteps | 2903680 | -| train/ | | -| approx_kl | 0.060148343 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 226840 | -| policy_gradient_loss | -0.00141 | -| std | 0.00621 | -| value_loss | 2.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22686 | -| time_elapsed | 123052 | -| total_timesteps | 2903808 | -| train/ | | -| approx_kl | 0.12913245 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | 0.0893 | -| n_updates | 226850 | -| policy_gradient_loss | 0.0755 | -| std | 0.00622 | -| value_loss | 4.8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22687 | -| time_elapsed | 123057 | -| total_timesteps | 2903936 | -| train/ | | -| approx_kl | 0.03964121 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -64.9 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 226860 | -| policy_gradient_loss | 0.0133 | -| std | 0.00623 | -| value_loss | 8.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22688 | -| time_elapsed | 123062 | -| total_timesteps | 2904064 | -| train/ | | -| approx_kl | 0.013694568 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -9.91 | -| learning_rate | 0.0003 | -| loss | -0.000504 | -| n_updates | 226870 | -| policy_gradient_loss | 0.0536 | -| std | 0.00623 | -| value_loss | 2.45e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22689 | -| time_elapsed | 123068 | -| total_timesteps | 2904192 | -| train/ | | -| approx_kl | 0.17058055 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 226880 | -| policy_gradient_loss | 0.156 | -| std | 0.00623 | -| value_loss | 0.000282 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22690 | -| time_elapsed | 123072 | -| total_timesteps | 2904320 | -| train/ | | -| approx_kl | 0.06162812 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.392 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 226890 | -| policy_gradient_loss | 0.0305 | -| std | 0.00624 | -| value_loss | 2.34e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22691 | -| time_elapsed | 123076 | -| total_timesteps | 2904448 | -| train/ | | -| approx_kl | 0.0010926393 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 226900 | -| policy_gradient_loss | 0.0295 | -| std | 0.00624 | -| value_loss | 5.57e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22692 | -| time_elapsed | 123081 | -| total_timesteps | 2904576 | -| train/ | | -| approx_kl | 0.6322923 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00373 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 226910 | -| policy_gradient_loss | 0.0607 | -| std | 0.00624 | -| value_loss | 2.37e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22693 | -| time_elapsed | 123086 | -| total_timesteps | 2904704 | -| train/ | | -| approx_kl | 0.010517733 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 226920 | -| policy_gradient_loss | 0.0049 | -| std | 0.00624 | -| value_loss | 2.22e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22694 | -| time_elapsed | 123092 | -| total_timesteps | 2904832 | -| train/ | | -| approx_kl | 0.07773416 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 226930 | -| policy_gradient_loss | 0.0122 | -| std | 0.00624 | -| value_loss | 1.66e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22695 | -| time_elapsed | 123097 | -| total_timesteps | 2904960 | -| train/ | | -| approx_kl | 0.046862394 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 226940 | -| policy_gradient_loss | 0.0152 | -| std | 0.00624 | -| value_loss | 1.14e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22696 | -| time_elapsed | 123103 | -| total_timesteps | 2905088 | -| train/ | | -| approx_kl | 0.009069376 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | -0.00802 | -| n_updates | 226950 | -| policy_gradient_loss | 0.00627 | -| std | 0.00624 | -| value_loss | 8.4e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22697 | -| time_elapsed | 123112 | -| total_timesteps | 2905216 | -| train/ | | -| approx_kl | 0.0432102 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.154 | -| learning_rate | 0.0003 | -| loss | -0.0257 | -| n_updates | 226960 | -| policy_gradient_loss | -0.0159 | -| std | 0.00624 | -| value_loss | 0.00158 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22698 | -| time_elapsed | 123118 | -| total_timesteps | 2905344 | -| train/ | | -| approx_kl | 0.00027536973 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | 0.00303 | -| n_updates | 226970 | -| policy_gradient_loss | 0.00696 | -| std | 0.00624 | -| value_loss | 2.53e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22699 | -| time_elapsed | 123124 | -| total_timesteps | 2905472 | -| train/ | | -| approx_kl | 0.0687344 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00795 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 226980 | -| policy_gradient_loss | 0.0173 | -| std | 0.00624 | -| value_loss | 8.06e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22700 | -| time_elapsed | 123128 | -| total_timesteps | 2905600 | -| train/ | | -| approx_kl | 0.014028616 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00563 | -| learning_rate | 0.0003 | -| loss | -0.00913 | -| n_updates | 226990 | -| policy_gradient_loss | 0.0139 | -| std | 0.00624 | -| value_loss | 5.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22701 | -| time_elapsed | 123133 | -| total_timesteps | 2905728 | -| train/ | | -| approx_kl | 0.08494887 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 227000 | -| policy_gradient_loss | 0.00222 | -| std | 0.00624 | -| value_loss | 4.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22702 | -| time_elapsed | 123141 | -| total_timesteps | 2905856 | -| train/ | | -| approx_kl | 0.014479422 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 227010 | -| policy_gradient_loss | 0.00476 | -| std | 0.00624 | -| value_loss | 3.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22703 | -| time_elapsed | 123146 | -| total_timesteps | 2905984 | -| train/ | | -| approx_kl | 0.0037039965 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 227020 | -| policy_gradient_loss | 0.0095 | -| std | 0.00624 | -| value_loss | 2.36e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22704 | -| time_elapsed | 123153 | -| total_timesteps | 2906112 | -| train/ | | -| approx_kl | 3.5970937e-05 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.000503 | -| n_updates | 227030 | -| policy_gradient_loss | 0.0684 | -| std | 0.00624 | -| value_loss | 1.96e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22705 | -| time_elapsed | 123164 | -| total_timesteps | 2906240 | -| train/ | | -| approx_kl | 0.6034864 | -| clip_fraction | 0.752 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.858 | -| learning_rate | 0.0003 | -| loss | 0.194 | -| n_updates | 227040 | -| policy_gradient_loss | 0.099 | -| std | 0.00624 | -| value_loss | 0.00255 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22706 | -| time_elapsed | 123169 | -| total_timesteps | 2906368 | -| train/ | | -| approx_kl | 0.239291 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -11.3 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 227050 | -| policy_gradient_loss | 0.00227 | -| std | 0.00624 | -| value_loss | 1.16e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22707 | -| time_elapsed | 123174 | -| total_timesteps | 2906496 | -| train/ | | -| approx_kl | 0.15220557 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.86 | -| learning_rate | 0.0003 | -| loss | 0.0724 | -| n_updates | 227060 | -| policy_gradient_loss | 0.0489 | -| std | 0.00624 | -| value_loss | 9.4e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22708 | -| time_elapsed | 123179 | -| total_timesteps | 2906624 | -| train/ | | -| approx_kl | 0.00021320675 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 227070 | -| policy_gradient_loss | 0.0274 | -| std | 0.00624 | -| value_loss | 7.54e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22709 | -| time_elapsed | 123184 | -| total_timesteps | 2906752 | -| train/ | | -| approx_kl | 0.065873794 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | 0.0341 | -| n_updates | 227080 | -| policy_gradient_loss | 0.0315 | -| std | 0.00624 | -| value_loss | 4.87e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22710 | -| time_elapsed | 123188 | -| total_timesteps | 2906880 | -| train/ | | -| approx_kl | 0.3363508 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 227090 | -| policy_gradient_loss | 0.123 | -| std | 0.00624 | -| value_loss | 4.11e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22711 | -| time_elapsed | 123192 | -| total_timesteps | 2907008 | -| train/ | | -| approx_kl | 0.058758873 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | 0.0296 | -| n_updates | 227100 | -| policy_gradient_loss | 0.0273 | -| std | 0.00624 | -| value_loss | 3.45e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22712 | -| time_elapsed | 123205 | -| total_timesteps | 2907136 | -| train/ | | -| approx_kl | 0.051274788 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.75 | -| learning_rate | 0.0003 | -| loss | -0.0275 | -| n_updates | 227110 | -| policy_gradient_loss | -0.00175 | -| std | 0.00624 | -| value_loss | 0.00076 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22713 | -| time_elapsed | 123211 | -| total_timesteps | 2907264 | -| train/ | | -| approx_kl | 0.0034041232 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.682 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 227120 | -| policy_gradient_loss | 0.0102 | -| std | 0.00624 | -| value_loss | 6.21e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22714 | -| time_elapsed | 123218 | -| total_timesteps | 2907392 | -| train/ | | -| approx_kl | 0.08630959 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00513 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 227130 | -| policy_gradient_loss | 0.0036 | -| std | 0.00623 | -| value_loss | 4.16e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22715 | -| time_elapsed | 123223 | -| total_timesteps | 2907520 | -| train/ | | -| approx_kl | 0.05055306 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 227140 | -| policy_gradient_loss | 0.00437 | -| std | 0.00623 | -| value_loss | 1.85e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22716 | -| time_elapsed | 123227 | -| total_timesteps | 2907648 | -| train/ | | -| approx_kl | 0.060132533 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.00215 | -| n_updates | 227150 | -| policy_gradient_loss | -5.35e-05 | -| std | 0.00623 | -| value_loss | 1.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22717 | -| time_elapsed | 123232 | -| total_timesteps | 2907776 | -| train/ | | -| approx_kl | 0.012865027 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 227160 | -| policy_gradient_loss | 0.00602 | -| std | 0.00623 | -| value_loss | 1.77e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22718 | -| time_elapsed | 123237 | -| total_timesteps | 2907904 | -| train/ | | -| approx_kl | 0.0880084 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 227170 | -| policy_gradient_loss | 0.00795 | -| std | 0.00623 | -| value_loss | 1.45e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22719 | -| time_elapsed | 123242 | -| total_timesteps | 2908032 | -| train/ | | -| approx_kl | 0.05279776 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 227180 | -| policy_gradient_loss | 0.0119 | -| std | 0.00624 | -| value_loss | 9.86e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22720 | -| time_elapsed | 123252 | -| total_timesteps | 2908160 | -| train/ | | -| approx_kl | 0.010336406 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 227190 | -| policy_gradient_loss | 0.00622 | -| std | 0.00624 | -| value_loss | 0.000128 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22721 | -| time_elapsed | 123257 | -| total_timesteps | 2908288 | -| train/ | | -| approx_kl | 0.0047311364 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.63 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 227200 | -| policy_gradient_loss | 0.00888 | -| std | 0.00623 | -| value_loss | 5.92e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22722 | -| time_elapsed | 123261 | -| total_timesteps | 2908416 | -| train/ | | -| approx_kl | 0.033682898 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 227210 | -| policy_gradient_loss | 0.0142 | -| std | 0.00622 | -| value_loss | 4.53e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22723 | -| time_elapsed | 123267 | -| total_timesteps | 2908544 | -| train/ | | -| approx_kl | 0.08003806 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.317 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 227220 | -| policy_gradient_loss | 0.0084 | -| std | 0.00622 | -| value_loss | 3.26e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22724 | -| time_elapsed | 123271 | -| total_timesteps | 2908672 | -| train/ | | -| approx_kl | 0.008357728 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00408 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 227230 | -| policy_gradient_loss | 0.00267 | -| std | 0.00622 | -| value_loss | 9.89e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22725 | -| time_elapsed | 123276 | -| total_timesteps | 2908800 | -| train/ | | -| approx_kl | 0.08978841 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0235 | -| n_updates | 227240 | -| policy_gradient_loss | 0.00604 | -| std | 0.00622 | -| value_loss | 4.99e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22726 | -| time_elapsed | 123280 | -| total_timesteps | 2908928 | -| train/ | | -| approx_kl | 0.056754384 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.00593 | -| n_updates | 227250 | -| policy_gradient_loss | 0.00479 | -| std | 0.00622 | -| value_loss | 4.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22727 | -| time_elapsed | 123285 | -| total_timesteps | 2909056 | -| train/ | | -| approx_kl | 0.057631224 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 227260 | -| policy_gradient_loss | 0.00755 | -| std | 0.00623 | -| value_loss | 3.62e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22728 | -| time_elapsed | 123295 | -| total_timesteps | 2909184 | -| train/ | | -| approx_kl | 0.0072450307 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | -0.0231 | -| n_updates | 227270 | -| policy_gradient_loss | -0.0123 | -| std | 0.00623 | -| value_loss | 0.00287 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22729 | -| time_elapsed | 123300 | -| total_timesteps | 2909312 | -| train/ | | -| approx_kl | 0.003572958 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -61 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 227280 | -| policy_gradient_loss | 0.0213 | -| std | 0.00623 | -| value_loss | 1.63e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22730 | -| time_elapsed | 123305 | -| total_timesteps | 2909440 | -| train/ | | -| approx_kl | 0.84378374 | -| clip_fraction | 0.773 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | 0.301 | -| n_updates | 227290 | -| policy_gradient_loss | 0.239 | -| std | 0.00623 | -| value_loss | 4.71e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22731 | -| time_elapsed | 123310 | -| total_timesteps | 2909568 | -| train/ | | -| approx_kl | 0.022250783 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 227300 | -| policy_gradient_loss | -0.00264 | -| std | 0.00623 | -| value_loss | 2.98e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22732 | -| time_elapsed | 123315 | -| total_timesteps | 2909696 | -| train/ | | -| approx_kl | 0.028050514 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.000535 | -| n_updates | 227310 | -| policy_gradient_loss | 0.0327 | -| std | 0.00623 | -| value_loss | 2.21e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22733 | -| time_elapsed | 123319 | -| total_timesteps | 2909824 | -| train/ | | -| approx_kl | 0.11262415 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0657 | -| n_updates | 227320 | -| policy_gradient_loss | 0.0322 | -| std | 0.00623 | -| value_loss | 1.52e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 22734 | -| time_elapsed | 123325 | -| total_timesteps | 2909952 | -| train/ | | -| approx_kl | 0.1597297 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 227330 | -| policy_gradient_loss | 0.025 | -| std | 0.00623 | -| value_loss | 1.13e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22735 | -| time_elapsed | 123329 | -| total_timesteps | 2910080 | -| train/ | | -| approx_kl | 0.029781256 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.0077 | -| n_updates | 227340 | -| policy_gradient_loss | 0.0294 | -| std | 0.00623 | -| value_loss | 1.03e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22736 | -| time_elapsed | 123337 | -| total_timesteps | 2910208 | -| train/ | | -| approx_kl | 0.37735277 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 227350 | -| policy_gradient_loss | 0.0853 | -| std | 0.00623 | -| value_loss | 0.000449 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22737 | -| time_elapsed | 123344 | -| total_timesteps | 2910336 | -| train/ | | -| approx_kl | 0.12659545 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00922 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 227360 | -| policy_gradient_loss | 0.0382 | -| std | 0.00623 | -| value_loss | 6.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22738 | -| time_elapsed | 123349 | -| total_timesteps | 2910464 | -| train/ | | -| approx_kl | 0.16006935 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00744 | -| learning_rate | 0.0003 | -| loss | 0.0508 | -| n_updates | 227370 | -| policy_gradient_loss | 0.0242 | -| std | 0.00623 | -| value_loss | 1.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22739 | -| time_elapsed | 123355 | -| total_timesteps | 2910592 | -| train/ | | -| approx_kl | 0.03518717 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | 0.00587 | -| n_updates | 227380 | -| policy_gradient_loss | 0.0297 | -| std | 0.00623 | -| value_loss | 1.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22740 | -| time_elapsed | 123360 | -| total_timesteps | 2910720 | -| train/ | | -| approx_kl | 0.17268966 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 227390 | -| policy_gradient_loss | 0.0496 | -| std | 0.00623 | -| value_loss | 6.33e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22741 | -| time_elapsed | 123365 | -| total_timesteps | 2910848 | -| train/ | | -| approx_kl | 0.14440028 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 227400 | -| policy_gradient_loss | 0.0266 | -| std | 0.00624 | -| value_loss | 4.96e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.94 | -| time/ | | -| fps | 23 | -| iterations | 22742 | -| time_elapsed | 123371 | -| total_timesteps | 2910976 | -| train/ | | -| approx_kl | 0.035790738 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 227410 | -| policy_gradient_loss | 0.0406 | -| std | 0.00623 | -| value_loss | 3.72e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22743 | -| time_elapsed | 123375 | -| total_timesteps | 2911104 | -| train/ | | -| approx_kl | 0.35547435 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 227420 | -| policy_gradient_loss | 0.144 | -| std | 0.00624 | -| value_loss | 1.34e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22744 | -| time_elapsed | 123386 | -| total_timesteps | 2911232 | -| train/ | | -| approx_kl | 0.22795889 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 227430 | -| policy_gradient_loss | 0.0867 | -| std | 0.00624 | -| value_loss | 9.58e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22745 | -| time_elapsed | 123391 | -| total_timesteps | 2911360 | -| train/ | | -| approx_kl | 0.24322592 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.000619 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 227440 | -| policy_gradient_loss | 0.141 | -| std | 0.00624 | -| value_loss | 2.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22746 | -| time_elapsed | 123395 | -| total_timesteps | 2911488 | -| train/ | | -| approx_kl | 0.060630318 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 227450 | -| policy_gradient_loss | 0.0297 | -| std | 0.00624 | -| value_loss | 5.72e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22747 | -| time_elapsed | 123400 | -| total_timesteps | 2911616 | -| train/ | | -| approx_kl | 0.6075544 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 227460 | -| policy_gradient_loss | 0.0545 | -| std | 0.00624 | -| value_loss | 4.27e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22748 | -| time_elapsed | 123405 | -| total_timesteps | 2911744 | -| train/ | | -| approx_kl | 0.016629418 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.00992 | -| n_updates | 227470 | -| policy_gradient_loss | 0.0119 | -| std | 0.00623 | -| value_loss | 6.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22749 | -| time_elapsed | 123410 | -| total_timesteps | 2911872 | -| train/ | | -| approx_kl | 0.003551663 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | -0.00068 | -| n_updates | 227480 | -| policy_gradient_loss | 0.00797 | -| std | 0.00623 | -| value_loss | 7.73e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22750 | -| time_elapsed | 123416 | -| total_timesteps | 2912000 | -| train/ | | -| approx_kl | 0.08881026 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0581 | -| n_updates | 227490 | -| policy_gradient_loss | 0.0248 | -| std | 0.00622 | -| value_loss | 4.62e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22751 | -| time_elapsed | 123421 | -| total_timesteps | 2912128 | -| train/ | | -| approx_kl | 0.009017038 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0045 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 227500 | -| policy_gradient_loss | 0.00703 | -| std | 0.00622 | -| value_loss | 6.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22752 | -| time_elapsed | 123435 | -| total_timesteps | 2912256 | -| train/ | | -| approx_kl | 0.083989225 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | -0.00136 | -| n_updates | 227510 | -| policy_gradient_loss | -0.0102 | -| std | 0.00622 | -| value_loss | 0.000163 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22753 | -| time_elapsed | 123440 | -| total_timesteps | 2912384 | -| train/ | | -| approx_kl | 0.00924194 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.00073 | -| n_updates | 227520 | -| policy_gradient_loss | 0.0365 | -| std | 0.00622 | -| value_loss | 2.01e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22754 | -| time_elapsed | 123446 | -| total_timesteps | 2912512 | -| train/ | | -| approx_kl | 0.36562023 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | 0.269 | -| n_updates | 227530 | -| policy_gradient_loss | 0.169 | -| std | 0.00622 | -| value_loss | 1.23e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22755 | -| time_elapsed | 123452 | -| total_timesteps | 2912640 | -| train/ | | -| approx_kl | 0.05956117 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00546 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 227540 | -| policy_gradient_loss | 0.0315 | -| std | 0.00622 | -| value_loss | 5.92e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22756 | -| time_elapsed | 123457 | -| total_timesteps | 2912768 | -| train/ | | -| approx_kl | 0.73834777 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.214 | -| n_updates | 227550 | -| policy_gradient_loss | 0.0707 | -| std | 0.00622 | -| value_loss | 4.82e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22757 | -| time_elapsed | 123461 | -| total_timesteps | 2912896 | -| train/ | | -| approx_kl | 0.011704583 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.0245 | -| n_updates | 227560 | -| policy_gradient_loss | 5.49e-05 | -| std | 0.00622 | -| value_loss | 3.84e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22758 | -| time_elapsed | 123466 | -| total_timesteps | 2913024 | -| train/ | | -| approx_kl | 0.0031603575 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 227570 | -| policy_gradient_loss | 0.0113 | -| std | 0.00622 | -| value_loss | 1.74e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22759 | -| time_elapsed | 123477 | -| total_timesteps | 2913152 | -| train/ | | -| approx_kl | 0.004427508 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 227580 | -| policy_gradient_loss | -0.000726 | -| std | 0.00622 | -| value_loss | 0.000331 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22760 | -| time_elapsed | 123482 | -| total_timesteps | 2913280 | -| train/ | | -| approx_kl | 0.05338919 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 227590 | -| policy_gradient_loss | 0.000447 | -| std | 0.00622 | -| value_loss | 4.73e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22761 | -| time_elapsed | 123488 | -| total_timesteps | 2913408 | -| train/ | | -| approx_kl | 0.008914072 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00626 | -| learning_rate | 0.0003 | -| loss | 0.000241 | -| n_updates | 227600 | -| policy_gradient_loss | 0.00805 | -| std | 0.00621 | -| value_loss | 6.3e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22762 | -| time_elapsed | 123493 | -| total_timesteps | 2913536 | -| train/ | | -| approx_kl | 0.0891688 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.0597 | -| n_updates | 227610 | -| policy_gradient_loss | 0.0247 | -| std | 0.00622 | -| value_loss | 2.77e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22763 | -| time_elapsed | 123497 | -| total_timesteps | 2913664 | -| train/ | | -| approx_kl | 0.011009388 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | 0.00419 | -| n_updates | 227620 | -| policy_gradient_loss | 0.00711 | -| std | 0.00622 | -| value_loss | 2.56e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22764 | -| time_elapsed | 123501 | -| total_timesteps | 2913792 | -| train/ | | -| approx_kl | 0.0632723 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -3.27 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 227630 | -| policy_gradient_loss | 0.00621 | -| std | 0.00622 | -| value_loss | 5.03e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 22765 | -| time_elapsed | 123506 | -| total_timesteps | 2913920 | -| train/ | | -| approx_kl | 0.06456579 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00297 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 227640 | -| policy_gradient_loss | 0.0163 | -| std | 0.00623 | -| value_loss | 6.03e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22766 | -| time_elapsed | 123510 | -| total_timesteps | 2914048 | -| train/ | | -| approx_kl | 0.035570066 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.008 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 227650 | -| policy_gradient_loss | 0.00698 | -| std | 0.00623 | -| value_loss | 2.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22767 | -| time_elapsed | 123520 | -| total_timesteps | 2914176 | -| train/ | | -| approx_kl | 0.03011877 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -6.55 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 227660 | -| policy_gradient_loss | -0.0156 | -| std | 0.00623 | -| value_loss | 0.00371 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22768 | -| time_elapsed | 123525 | -| total_timesteps | 2914304 | -| train/ | | -| approx_kl | 0.022790868 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.297 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 227670 | -| policy_gradient_loss | 0.0448 | -| std | 0.00623 | -| value_loss | 6.76e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22769 | -| time_elapsed | 123531 | -| total_timesteps | 2914432 | -| train/ | | -| approx_kl | 0.16930054 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00345 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 227680 | -| policy_gradient_loss | 0.0728 | -| std | 0.00623 | -| value_loss | 5.11e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22770 | -| time_elapsed | 123536 | -| total_timesteps | 2914560 | -| train/ | | -| approx_kl | 0.044755712 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.00846 | -| n_updates | 227690 | -| policy_gradient_loss | 0.0252 | -| std | 0.00623 | -| value_loss | 4.45e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22771 | -| time_elapsed | 123539 | -| total_timesteps | 2914688 | -| train/ | | -| approx_kl | 0.8689839 | -| clip_fraction | 0.751 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.288 | -| n_updates | 227700 | -| policy_gradient_loss | 0.179 | -| std | 0.00623 | -| value_loss | 3.66e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22772 | -| time_elapsed | 123543 | -| total_timesteps | 2914816 | -| train/ | | -| approx_kl | 0.033986036 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | -0.00231 | -| n_updates | 227710 | -| policy_gradient_loss | -0.00581 | -| std | 0.00623 | -| value_loss | 2.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 22773 | -| time_elapsed | 123547 | -| total_timesteps | 2914944 | -| train/ | | -| approx_kl | 0.021973254 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.00843 | -| n_updates | 227720 | -| policy_gradient_loss | 0.00295 | -| std | 0.00623 | -| value_loss | 1.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22774 | -| time_elapsed | 123552 | -| total_timesteps | 2915072 | -| train/ | | -| approx_kl | 0.02449039 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 227730 | -| policy_gradient_loss | 0.042 | -| std | 0.00623 | -| value_loss | 2.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22775 | -| time_elapsed | 123561 | -| total_timesteps | 2915200 | -| train/ | | -| approx_kl | 0.009682108 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 227740 | -| policy_gradient_loss | -0.00848 | -| std | 0.00623 | -| value_loss | 0.00162 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22776 | -| time_elapsed | 123567 | -| total_timesteps | 2915328 | -| train/ | | -| approx_kl | 0.4817762 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.98 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 227750 | -| policy_gradient_loss | 0.0352 | -| std | 0.00623 | -| value_loss | 3.61e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22777 | -| time_elapsed | 123571 | -| total_timesteps | 2915456 | -| train/ | | -| approx_kl | 0.006837168 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.82 | -| learning_rate | 0.0003 | -| loss | -0.00277 | -| n_updates | 227760 | -| policy_gradient_loss | 0.00727 | -| std | 0.00623 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22778 | -| time_elapsed | 123576 | -| total_timesteps | 2915584 | -| train/ | | -| approx_kl | 0.0016041873 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00257 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 227770 | -| policy_gradient_loss | 0.0103 | -| std | 0.00623 | -| value_loss | 2.28e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22779 | -| time_elapsed | 123582 | -| total_timesteps | 2915712 | -| train/ | | -| approx_kl | 0.10241451 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 227780 | -| policy_gradient_loss | 0.00301 | -| std | 0.00623 | -| value_loss | 1.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22780 | -| time_elapsed | 123587 | -| total_timesteps | 2915840 | -| train/ | | -| approx_kl | 0.011320468 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.00384 | -| n_updates | 227790 | -| policy_gradient_loss | 0.0125 | -| std | 0.00623 | -| value_loss | 2.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 22781 | -| time_elapsed | 123592 | -| total_timesteps | 2915968 | -| train/ | | -| approx_kl | 0.094739035 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 227800 | -| policy_gradient_loss | 0.0106 | -| std | 0.00623 | -| value_loss | 1.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22782 | -| time_elapsed | 123598 | -| total_timesteps | 2916096 | -| train/ | | -| approx_kl | 0.010059748 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | -0.00964 | -| n_updates | 227810 | -| policy_gradient_loss | 0.00258 | -| std | 0.00623 | -| value_loss | 2.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22783 | -| time_elapsed | 123609 | -| total_timesteps | 2916224 | -| train/ | | -| approx_kl | 0.012760568 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.761 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 227820 | -| policy_gradient_loss | -0.000873 | -| std | 0.00623 | -| value_loss | 0.00596 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22784 | -| time_elapsed | 123614 | -| total_timesteps | 2916352 | -| train/ | | -| approx_kl | 0.0776155 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.0935 | -| n_updates | 227830 | -| policy_gradient_loss | 0.126 | -| std | 0.00623 | -| value_loss | 3.13e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22785 | -| time_elapsed | 123619 | -| total_timesteps | 2916480 | -| train/ | | -| approx_kl | 0.017256219 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0035 | -| learning_rate | 0.0003 | -| loss | 0.00508 | -| n_updates | 227840 | -| policy_gradient_loss | 0.0235 | -| std | 0.00623 | -| value_loss | 2.71e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22786 | -| time_elapsed | 123624 | -| total_timesteps | 2916608 | -| train/ | | -| approx_kl | 0.19069682 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | 0.0519 | -| n_updates | 227850 | -| policy_gradient_loss | 0.0145 | -| std | 0.00623 | -| value_loss | 1.76e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22787 | -| time_elapsed | 123629 | -| total_timesteps | 2916736 | -| train/ | | -| approx_kl | 0.0183043 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.00798 | -| n_updates | 227860 | -| policy_gradient_loss | 0.00326 | -| std | 0.00623 | -| value_loss | 1.08e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22788 | -| time_elapsed | 123633 | -| total_timesteps | 2916864 | -| train/ | | -| approx_kl | 0.015294126 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0777 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 227870 | -| policy_gradient_loss | -0.00779 | -| std | 0.00623 | -| value_loss | 8.31e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22789 | -| time_elapsed | 123639 | -| total_timesteps | 2916992 | -| train/ | | -| approx_kl | 0.012840984 | -| clip_fraction | 0.113 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 0.00372 | -| n_updates | 227880 | -| policy_gradient_loss | 0.00238 | -| std | 0.00622 | -| value_loss | 6.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22790 | -| time_elapsed | 123645 | -| total_timesteps | 2917120 | -| train/ | | -| approx_kl | 0.012217626 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0837 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 227890 | -| policy_gradient_loss | -0.00175 | -| std | 0.00622 | -| value_loss | 1.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22791 | -| time_elapsed | 123658 | -| total_timesteps | 2917248 | -| train/ | | -| approx_kl | 0.029995086 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 227900 | -| policy_gradient_loss | 0.0137 | -| std | 0.00621 | -| value_loss | 0.00618 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22792 | -| time_elapsed | 123663 | -| total_timesteps | 2917376 | -| train/ | | -| approx_kl | 0.3762269 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.213 | -| n_updates | 227910 | -| policy_gradient_loss | 0.16 | -| std | 0.00621 | -| value_loss | 1.8e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22793 | -| time_elapsed | 123668 | -| total_timesteps | 2917504 | -| train/ | | -| approx_kl | 0.06259421 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0227 | -| n_updates | 227920 | -| policy_gradient_loss | 0.0261 | -| std | 0.00621 | -| value_loss | 8.17e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22794 | -| time_elapsed | 123673 | -| total_timesteps | 2917632 | -| train/ | | -| approx_kl | 0.16508928 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00397 | -| learning_rate | 0.0003 | -| loss | 0.063 | -| n_updates | 227930 | -| policy_gradient_loss | 0.022 | -| std | 0.00621 | -| value_loss | 4.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22795 | -| time_elapsed | 123679 | -| total_timesteps | 2917760 | -| train/ | | -| approx_kl | 0.016355488 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.00908 | -| n_updates | 227940 | -| policy_gradient_loss | 0.00436 | -| std | 0.00621 | -| value_loss | 2.19e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 22796 | -| time_elapsed | 123684 | -| total_timesteps | 2917888 | -| train/ | | -| approx_kl | 0.016338527 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0898 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 227950 | -| policy_gradient_loss | -0.000768 | -| std | 0.00621 | -| value_loss | 1.54e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22797 | -| time_elapsed | 123689 | -| total_timesteps | 2918016 | -| train/ | | -| approx_kl | 0.02282422 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 227960 | -| policy_gradient_loss | 0.0212 | -| std | 0.00621 | -| value_loss | 1.25e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22798 | -| time_elapsed | 123698 | -| total_timesteps | 2918144 | -| train/ | | -| approx_kl | 0.13746119 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 227970 | -| policy_gradient_loss | 0.0083 | -| std | 0.00621 | -| value_loss | 0.00342 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22799 | -| time_elapsed | 123703 | -| total_timesteps | 2918272 | -| train/ | | -| approx_kl | 0.0017102733 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 227980 | -| policy_gradient_loss | 0.0308 | -| std | 0.00621 | -| value_loss | 0.000292 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22800 | -| time_elapsed | 123707 | -| total_timesteps | 2918400 | -| train/ | | -| approx_kl | 0.56340444 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00686 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 227990 | -| policy_gradient_loss | 0.0542 | -| std | 0.00621 | -| value_loss | 1.76e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22801 | -| time_elapsed | 123710 | -| total_timesteps | 2918528 | -| train/ | | -| approx_kl | 0.053412702 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00778 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 228000 | -| policy_gradient_loss | 0.0136 | -| std | 0.00621 | -| value_loss | 7.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22802 | -| time_elapsed | 123715 | -| total_timesteps | 2918656 | -| train/ | | -| approx_kl | 0.047198307 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 228010 | -| policy_gradient_loss | -0.00295 | -| std | 0.00621 | -| value_loss | 5.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22803 | -| time_elapsed | 123721 | -| total_timesteps | 2918784 | -| train/ | | -| approx_kl | 0.009569138 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 228020 | -| policy_gradient_loss | 0.00798 | -| std | 0.0062 | -| value_loss | 3.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.943 | -| time/ | | -| fps | 23 | -| iterations | 22804 | -| time_elapsed | 123726 | -| total_timesteps | 2918912 | -| train/ | | -| approx_kl | 0.069218785 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 228030 | -| policy_gradient_loss | 0.00781 | -| std | 0.0062 | -| value_loss | 2.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22805 | -| time_elapsed | 123731 | -| total_timesteps | 2919040 | -| train/ | | -| approx_kl | 0.05124817 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 228040 | -| policy_gradient_loss | 0.0121 | -| std | 0.0062 | -| value_loss | 1.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22806 | -| time_elapsed | 123741 | -| total_timesteps | 2919168 | -| train/ | | -| approx_kl | 0.03501439 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.621 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 228050 | -| policy_gradient_loss | -0.00339 | -| std | 0.0062 | -| value_loss | 0.0145 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22807 | -| time_elapsed | 123747 | -| total_timesteps | 2919296 | -| train/ | | -| approx_kl | 0.061001074 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.038 | -| n_updates | 228060 | -| policy_gradient_loss | 0.0161 | -| std | 0.0062 | -| value_loss | 5.67e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22808 | -| time_elapsed | 123752 | -| total_timesteps | 2919424 | -| train/ | | -| approx_kl | 0.05921557 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 228070 | -| policy_gradient_loss | 0.0119 | -| std | 0.0062 | -| value_loss | 5.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22809 | -| time_elapsed | 123757 | -| total_timesteps | 2919552 | -| train/ | | -| approx_kl | 0.069543555 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0512 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 228080 | -| policy_gradient_loss | 0.0109 | -| std | 0.0062 | -| value_loss | 5.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22810 | -| time_elapsed | 123762 | -| total_timesteps | 2919680 | -| train/ | | -| approx_kl | 0.05122155 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 228090 | -| policy_gradient_loss | 0.0165 | -| std | 0.0062 | -| value_loss | 3.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22811 | -| time_elapsed | 123766 | -| total_timesteps | 2919808 | -| train/ | | -| approx_kl | 0.055951994 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0841 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 228100 | -| policy_gradient_loss | 0.00757 | -| std | 0.0062 | -| value_loss | 2.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 22812 | -| time_elapsed | 123771 | -| total_timesteps | 2919936 | -| train/ | | -| approx_kl | 0.011468265 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | -0.00111 | -| n_updates | 228110 | -| policy_gradient_loss | 0.00931 | -| std | 0.0062 | -| value_loss | 1.83e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22813 | -| time_elapsed | 123777 | -| total_timesteps | 2920064 | -| train/ | | -| approx_kl | 0.06496422 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 228120 | -| policy_gradient_loss | 0.00856 | -| std | 0.0062 | -| value_loss | 1.43e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22814 | -| time_elapsed | 123787 | -| total_timesteps | 2920192 | -| train/ | | -| approx_kl | 0.008160067 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 228130 | -| policy_gradient_loss | -0.0053 | -| std | 0.0062 | -| value_loss | 0.00393 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22815 | -| time_elapsed | 123792 | -| total_timesteps | 2920320 | -| train/ | | -| approx_kl | 0.0774477 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.00375 | -| n_updates | 228140 | -| policy_gradient_loss | -0.00337 | -| std | 0.0062 | -| value_loss | 4.61e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22816 | -| time_elapsed | 123796 | -| total_timesteps | 2920448 | -| train/ | | -| approx_kl | 0.01171013 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 228150 | -| policy_gradient_loss | 0.00649 | -| std | 0.0062 | -| value_loss | 1.09e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22817 | -| time_elapsed | 123800 | -| total_timesteps | 2920576 | -| train/ | | -| approx_kl | 0.061740838 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 228160 | -| policy_gradient_loss | 0.00845 | -| std | 0.0062 | -| value_loss | 5.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22818 | -| time_elapsed | 123804 | -| total_timesteps | 2920704 | -| train/ | | -| approx_kl | 0.011004724 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.00235 | -| n_updates | 228170 | -| policy_gradient_loss | 0.00605 | -| std | 0.0062 | -| value_loss | 3.67e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22819 | -| time_elapsed | 123811 | -| total_timesteps | 2920832 | -| train/ | | -| approx_kl | 0.08828676 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 228180 | -| policy_gradient_loss | 0.0142 | -| std | 0.0062 | -| value_loss | 3.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22820 | -| time_elapsed | 123816 | -| total_timesteps | 2920960 | -| train/ | | -| approx_kl | 0.062029995 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 228190 | -| policy_gradient_loss | 0.0117 | -| std | 0.0062 | -| value_loss | 2.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22821 | -| time_elapsed | 123821 | -| total_timesteps | 2921088 | -| train/ | | -| approx_kl | 0.051733032 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 228200 | -| policy_gradient_loss | 0.0164 | -| std | 0.00619 | -| value_loss | 1.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22822 | -| time_elapsed | 123832 | -| total_timesteps | 2921216 | -| train/ | | -| approx_kl | 0.01662094 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.673 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 228210 | -| policy_gradient_loss | -0.0142 | -| std | 0.00619 | -| value_loss | 0.000998 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22823 | -| time_elapsed | 123836 | -| total_timesteps | 2921344 | -| train/ | | -| approx_kl | 0.09288042 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | 0.0159 | -| n_updates | 228220 | -| policy_gradient_loss | 0.00837 | -| std | 0.00619 | -| value_loss | 7.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22824 | -| time_elapsed | 123841 | -| total_timesteps | 2921472 | -| train/ | | -| approx_kl | 0.009181757 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0053 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 228230 | -| policy_gradient_loss | 0.0135 | -| std | 0.00619 | -| value_loss | 6.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22825 | -| time_elapsed | 123846 | -| total_timesteps | 2921600 | -| train/ | | -| approx_kl | 0.004445378 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.000895 | -| n_updates | 228240 | -| policy_gradient_loss | 0.00905 | -| std | 0.00619 | -| value_loss | 3.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22826 | -| time_elapsed | 123850 | -| total_timesteps | 2921728 | -| train/ | | -| approx_kl | 0.078141615 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 228250 | -| policy_gradient_loss | 0.00593 | -| std | 0.00619 | -| value_loss | 3.03e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22827 | -| time_elapsed | 123856 | -| total_timesteps | 2921856 | -| train/ | | -| approx_kl | 0.05160502 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 228260 | -| policy_gradient_loss | 0.0147 | -| std | 0.00619 | -| value_loss | 1.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 22828 | -| time_elapsed | 123861 | -| total_timesteps | 2921984 | -| train/ | | -| approx_kl | 0.008124936 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 228270 | -| policy_gradient_loss | 0.00911 | -| std | 0.0062 | -| value_loss | 1.07e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22829 | -| time_elapsed | 123866 | -| total_timesteps | 2922112 | -| train/ | | -| approx_kl | 0.0012458288 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.00959 | -| n_updates | 228280 | -| policy_gradient_loss | 0.00165 | -| std | 0.0062 | -| value_loss | 1.03e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22830 | -| time_elapsed | 123877 | -| total_timesteps | 2922240 | -| train/ | | -| approx_kl | 0.05240561 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | 0.00723 | -| n_updates | 228290 | -| policy_gradient_loss | 0.00466 | -| std | 0.0062 | -| value_loss | 0.00117 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22831 | -| time_elapsed | 123883 | -| total_timesteps | 2922368 | -| train/ | | -| approx_kl | 0.005255333 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0916 | -| learning_rate | 0.0003 | -| loss | -0.00635 | -| n_updates | 228300 | -| policy_gradient_loss | 0.00677 | -| std | 0.0062 | -| value_loss | 1.01e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22832 | -| time_elapsed | 123888 | -| total_timesteps | 2922496 | -| train/ | | -| approx_kl | 0.037768167 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00863 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 228310 | -| policy_gradient_loss | 0.107 | -| std | 0.0062 | -| value_loss | 1.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22833 | -| time_elapsed | 123892 | -| total_timesteps | 2922624 | -| train/ | | -| approx_kl | 0.011710782 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.00524 | -| n_updates | 228320 | -| policy_gradient_loss | 0.029 | -| std | 0.0062 | -| value_loss | 7.45e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22834 | -| time_elapsed | 123898 | -| total_timesteps | 2922752 | -| train/ | | -| approx_kl | 0.6417997 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 228330 | -| policy_gradient_loss | 0.0548 | -| std | 0.0062 | -| value_loss | 4.14e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 22835 | -| time_elapsed | 123903 | -| total_timesteps | 2922880 | -| train/ | | -| approx_kl | 0.049849045 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | -0.0009 | -| n_updates | 228340 | -| policy_gradient_loss | -0.000146 | -| std | 0.0062 | -| value_loss | 3.99e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22836 | -| time_elapsed | 123908 | -| total_timesteps | 2923008 | -| train/ | | -| approx_kl | 0.04886242 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 228350 | -| policy_gradient_loss | 0.00702 | -| std | 0.0062 | -| value_loss | 2.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22837 | -| time_elapsed | 123918 | -| total_timesteps | 2923136 | -| train/ | | -| approx_kl | 0.009599589 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.0256 | -| n_updates | 228360 | -| policy_gradient_loss | -0.0132 | -| std | 0.0062 | -| value_loss | 3.63e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22838 | -| time_elapsed | 123922 | -| total_timesteps | 2923264 | -| train/ | | -| approx_kl | 0.20113875 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.627 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 228370 | -| policy_gradient_loss | 0.0242 | -| std | 0.0062 | -| value_loss | 7.89e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22839 | -| time_elapsed | 123928 | -| total_timesteps | 2923392 | -| train/ | | -| approx_kl | 0.0015251879 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0696 | -| learning_rate | 0.0003 | -| loss | 0.000488 | -| n_updates | 228380 | -| policy_gradient_loss | 0.0251 | -| std | 0.0062 | -| value_loss | 7.11e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22840 | -| time_elapsed | 123932 | -| total_timesteps | 2923520 | -| train/ | | -| approx_kl | 0.0005835369 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | -0.00143 | -| n_updates | 228390 | -| policy_gradient_loss | 0.0328 | -| std | 0.0062 | -| value_loss | 2.81e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22841 | -| time_elapsed | 123938 | -| total_timesteps | 2923648 | -| train/ | | -| approx_kl | 0.48636904 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.21 | -| n_updates | 228400 | -| policy_gradient_loss | 0.0676 | -| std | 0.0062 | -| value_loss | 2.09e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22842 | -| time_elapsed | 123942 | -| total_timesteps | 2923776 | -| train/ | | -| approx_kl | 0.05207189 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 228410 | -| policy_gradient_loss | 0.0106 | -| std | 0.0062 | -| value_loss | 1.86e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22843 | -| time_elapsed | 123948 | -| total_timesteps | 2923904 | -| train/ | | -| approx_kl | 0.012235428 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 228420 | -| policy_gradient_loss | 0.0117 | -| std | 0.0062 | -| value_loss | 1.38e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22844 | -| time_elapsed | 123952 | -| total_timesteps | 2924032 | -| train/ | | -| approx_kl | 0.0008637798 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.00992 | -| n_updates | 228430 | -| policy_gradient_loss | -0.00293 | -| std | 0.0062 | -| value_loss | 1.08e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22845 | -| time_elapsed | 123962 | -| total_timesteps | 2924160 | -| train/ | | -| approx_kl | 0.13687772 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | 0.0395 | -| n_updates | 228440 | -| policy_gradient_loss | 0.00348 | -| std | 0.0062 | -| value_loss | 0.000566 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22846 | -| time_elapsed | 123967 | -| total_timesteps | 2924288 | -| train/ | | -| approx_kl | 0.012255872 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.663 | -| learning_rate | 0.0003 | -| loss | 0.00159 | -| n_updates | 228450 | -| policy_gradient_loss | 0.00102 | -| std | 0.0062 | -| value_loss | 1e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22847 | -| time_elapsed | 123972 | -| total_timesteps | 2924416 | -| train/ | | -| approx_kl | 0.0115257595 | -| clip_fraction | 0.108 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | 0.00255 | -| n_updates | 228460 | -| policy_gradient_loss | 0.00156 | -| std | 0.00619 | -| value_loss | 1.25e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22848 | -| time_elapsed | 123977 | -| total_timesteps | 2924544 | -| train/ | | -| approx_kl | 0.031940907 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0905 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 228470 | -| policy_gradient_loss | 0.0308 | -| std | 0.00619 | -| value_loss | 1.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22849 | -| time_elapsed | 123981 | -| total_timesteps | 2924672 | -| train/ | | -| approx_kl | 0.11115658 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0667 | -| n_updates | 228480 | -| policy_gradient_loss | 0.0307 | -| std | 0.00619 | -| value_loss | 6.54e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22850 | -| time_elapsed | 123986 | -| total_timesteps | 2924800 | -| train/ | | -| approx_kl | 0.00026355637 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0949 | -| learning_rate | 0.0003 | -| loss | -0.000147 | -| n_updates | 228490 | -| policy_gradient_loss | 0.0323 | -| std | 0.00619 | -| value_loss | 3.14e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22851 | -| time_elapsed | 123991 | -| total_timesteps | 2924928 | -| train/ | | -| approx_kl | 0.0016131271 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.084 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 228500 | -| policy_gradient_loss | 0.0394 | -| std | 0.00619 | -| value_loss | 4.2e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22852 | -| time_elapsed | 123995 | -| total_timesteps | 2925056 | -| train/ | | -| approx_kl | 0.23351343 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 228510 | -| policy_gradient_loss | 0.0123 | -| std | 0.00619 | -| value_loss | 1.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22853 | -| time_elapsed | 124002 | -| total_timesteps | 2925184 | -| train/ | | -| approx_kl | 0.01807339 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.695 | -| learning_rate | 0.0003 | -| loss | -0.0288 | -| n_updates | 228520 | -| policy_gradient_loss | -0.0076 | -| std | 0.00619 | -| value_loss | 0.000847 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22854 | -| time_elapsed | 124008 | -| total_timesteps | 2925312 | -| train/ | | -| approx_kl | 0.08401909 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -9.81 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 228530 | -| policy_gradient_loss | 0.00469 | -| std | 0.00619 | -| value_loss | 9.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22855 | -| time_elapsed | 124011 | -| total_timesteps | 2925440 | -| train/ | | -| approx_kl | 0.054569725 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.238 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 228540 | -| policy_gradient_loss | 0.0462 | -| std | 0.00619 | -| value_loss | 8.54e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22856 | -| time_elapsed | 124015 | -| total_timesteps | 2925568 | -| train/ | | -| approx_kl | 0.13201591 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 228550 | -| policy_gradient_loss | 0.0311 | -| std | 0.00619 | -| value_loss | 1.44e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22857 | -| time_elapsed | 124020 | -| total_timesteps | 2925696 | -| train/ | | -| approx_kl | 0.0012082243 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.000827 | -| learning_rate | 0.0003 | -| loss | -0.00534 | -| n_updates | 228560 | -| policy_gradient_loss | 0.0273 | -| std | 0.00619 | -| value_loss | 6.53e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22858 | -| time_elapsed | 124026 | -| total_timesteps | 2925824 | -| train/ | | -| approx_kl | 0.61672795 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.21 | -| n_updates | 228570 | -| policy_gradient_loss | 0.06 | -| std | 0.00619 | -| value_loss | 5.02e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 22859 | -| time_elapsed | 124031 | -| total_timesteps | 2925952 | -| train/ | | -| approx_kl | 0.014278402 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 228580 | -| policy_gradient_loss | 0.0095 | -| std | 0.00619 | -| value_loss | 3.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22860 | -| time_elapsed | 124036 | -| total_timesteps | 2926080 | -| train/ | | -| approx_kl | 0.002980404 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | -0.00177 | -| n_updates | 228590 | -| policy_gradient_loss | 0.00972 | -| std | 0.00619 | -| value_loss | 1.97e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22861 | -| time_elapsed | 124045 | -| total_timesteps | 2926208 | -| train/ | | -| approx_kl | 0.0030413535 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.768 | -| learning_rate | 0.0003 | -| loss | -0.00609 | -| n_updates | 228600 | -| policy_gradient_loss | -0.00868 | -| std | 0.00619 | -| value_loss | 0.00571 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22862 | -| time_elapsed | 124052 | -| total_timesteps | 2926336 | -| train/ | | -| approx_kl | 0.06650628 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 228610 | -| policy_gradient_loss | 0.015 | -| std | 0.00619 | -| value_loss | 1.99e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22863 | -| time_elapsed | 124058 | -| total_timesteps | 2926464 | -| train/ | | -| approx_kl | 0.0814773 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00796 | -| learning_rate | 0.0003 | -| loss | 0.0454 | -| n_updates | 228620 | -| policy_gradient_loss | 0.022 | -| std | 0.00619 | -| value_loss | 2.9e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22864 | -| time_elapsed | 124064 | -| total_timesteps | 2926592 | -| train/ | | -| approx_kl | 0.010281214 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 228630 | -| policy_gradient_loss | 0.00737 | -| std | 0.00619 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22865 | -| time_elapsed | 124069 | -| total_timesteps | 2926720 | -| train/ | | -| approx_kl | 0.0009894101 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0084 | -| n_updates | 228640 | -| policy_gradient_loss | 0.00122 | -| std | 0.00619 | -| value_loss | 1.4e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22866 | -| time_elapsed | 124075 | -| total_timesteps | 2926848 | -| train/ | | -| approx_kl | 0.0061671287 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | -0.00742 | -| n_updates | 228650 | -| policy_gradient_loss | 0.00472 | -| std | 0.00619 | -| value_loss | 8.75e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22867 | -| time_elapsed | 124079 | -| total_timesteps | 2926976 | -| train/ | | -| approx_kl | 0.00013124291 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.000305 | -| n_updates | 228660 | -| policy_gradient_loss | 0.0343 | -| std | 0.00619 | -| value_loss | 5.26e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22868 | -| time_elapsed | 124085 | -| total_timesteps | 2927104 | -| train/ | | -| approx_kl | 0.21753258 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 228670 | -| policy_gradient_loss | 0.0728 | -| std | 0.00618 | -| value_loss | 3.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22869 | -| time_elapsed | 124097 | -| total_timesteps | 2927232 | -| train/ | | -| approx_kl | 0.018198678 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0259 | -| n_updates | 228680 | -| policy_gradient_loss | 0.00283 | -| std | 0.00618 | -| value_loss | 1.55e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22870 | -| time_elapsed | 124101 | -| total_timesteps | 2927360 | -| train/ | | -| approx_kl | 0.004678473 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | -0.00059 | -| n_updates | 228690 | -| policy_gradient_loss | 0.0378 | -| std | 0.00618 | -| value_loss | 2.1e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22871 | -| time_elapsed | 124106 | -| total_timesteps | 2927488 | -| train/ | | -| approx_kl | 1.0600588 | -| clip_fraction | 0.763 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.4 | -| n_updates | 228700 | -| policy_gradient_loss | 0.277 | -| std | 0.00618 | -| value_loss | 2.6e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22872 | -| time_elapsed | 124111 | -| total_timesteps | 2927616 | -| train/ | | -| approx_kl | 0.012953842 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 228710 | -| policy_gradient_loss | 0.0267 | -| std | 0.00618 | -| value_loss | 5.38e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22873 | -| time_elapsed | 124116 | -| total_timesteps | 2927744 | -| train/ | | -| approx_kl | 0.272118 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.251 | -| n_updates | 228720 | -| policy_gradient_loss | 0.128 | -| std | 0.00618 | -| value_loss | 4.81e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 22874 | -| time_elapsed | 124120 | -| total_timesteps | 2927872 | -| train/ | | -| approx_kl | 0.17328559 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 228730 | -| policy_gradient_loss | 0.0992 | -| std | 0.00618 | -| value_loss | 3.79e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22875 | -| time_elapsed | 124124 | -| total_timesteps | 2928000 | -| train/ | | -| approx_kl | 0.1892006 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 228740 | -| policy_gradient_loss | 0.166 | -| std | 0.00618 | -| value_loss | 2.53e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22876 | -| time_elapsed | 124129 | -| total_timesteps | 2928128 | -| train/ | | -| approx_kl | 0.16206619 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00401 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 228750 | -| policy_gradient_loss | 0.13 | -| std | 0.00618 | -| value_loss | 1.69e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22877 | -| time_elapsed | 124138 | -| total_timesteps | 2928256 | -| train/ | | -| approx_kl | 0.49642974 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -5.93 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 228760 | -| policy_gradient_loss | 0.00175 | -| std | 0.00618 | -| value_loss | 0.00347 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22878 | -| time_elapsed | 124143 | -| total_timesteps | 2928384 | -| train/ | | -| approx_kl | 0.070958175 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 228770 | -| policy_gradient_loss | 0.00986 | -| std | 0.00619 | -| value_loss | 5.75e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22879 | -| time_elapsed | 124149 | -| total_timesteps | 2928512 | -| train/ | | -| approx_kl | 0.012532639 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00312 | -| learning_rate | 0.0003 | -| loss | -0.00498 | -| n_updates | 228780 | -| policy_gradient_loss | 0.00529 | -| std | 0.00619 | -| value_loss | 4.26e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22880 | -| time_elapsed | 124152 | -| total_timesteps | 2928640 | -| train/ | | -| approx_kl | 7.084943e-05 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0774 | -| learning_rate | 0.0003 | -| loss | -0.000119 | -| n_updates | 228790 | -| policy_gradient_loss | 0.00844 | -| std | 0.00619 | -| value_loss | 4.39e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22881 | -| time_elapsed | 124157 | -| total_timesteps | 2928768 | -| train/ | | -| approx_kl | 0.05622974 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 0.0081 | -| n_updates | 228800 | -| policy_gradient_loss | 0.00793 | -| std | 0.0062 | -| value_loss | 2.7e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 22882 | -| time_elapsed | 124163 | -| total_timesteps | 2928896 | -| train/ | | -| approx_kl | 0.041322466 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.19 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 228810 | -| policy_gradient_loss | 0.0119 | -| std | 0.0062 | -| value_loss | 5.48e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22883 | -| time_elapsed | 124167 | -| total_timesteps | 2929024 | -| train/ | | -| approx_kl | 0.07138657 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 228820 | -| policy_gradient_loss | 0.00854 | -| std | 0.0062 | -| value_loss | 4.2e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22884 | -| time_elapsed | 124177 | -| total_timesteps | 2929152 | -| train/ | | -| approx_kl | 0.021648008 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.793 | -| learning_rate | 0.0003 | -| loss | -0.00941 | -| n_updates | 228830 | -| policy_gradient_loss | -0.00645 | -| std | 0.00621 | -| value_loss | 0.00448 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22885 | -| time_elapsed | 124182 | -| total_timesteps | 2929280 | -| train/ | | -| approx_kl | 0.07885276 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00303 | -| learning_rate | 0.0003 | -| loss | 0.0425 | -| n_updates | 228840 | -| policy_gradient_loss | 0.0166 | -| std | 0.00621 | -| value_loss | 0.000166 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22886 | -| time_elapsed | 124186 | -| total_timesteps | 2929408 | -| train/ | | -| approx_kl | 0.012564416 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00919 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 228850 | -| policy_gradient_loss | 0.00542 | -| std | 0.0062 | -| value_loss | 9.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22887 | -| time_elapsed | 124191 | -| total_timesteps | 2929536 | -| train/ | | -| approx_kl | 0.003471111 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.000785 | -| learning_rate | 0.0003 | -| loss | -0.00575 | -| n_updates | 228860 | -| policy_gradient_loss | 0.0122 | -| std | 0.0062 | -| value_loss | 2.79e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22888 | -| time_elapsed | 124195 | -| total_timesteps | 2929664 | -| train/ | | -| approx_kl | 0.11237626 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 228870 | -| policy_gradient_loss | 0.0118 | -| std | 0.00621 | -| value_loss | 2.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22889 | -| time_elapsed | 124200 | -| total_timesteps | 2929792 | -| train/ | | -| approx_kl | 0.038195264 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 228880 | -| policy_gradient_loss | 0.0467 | -| std | 0.0062 | -| value_loss | 1.12e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 22890 | -| time_elapsed | 124204 | -| total_timesteps | 2929920 | -| train/ | | -| approx_kl | 0.15479618 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0955 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 228890 | -| policy_gradient_loss | 0.054 | -| std | 0.0062 | -| value_loss | 6.92e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22891 | -| time_elapsed | 124207 | -| total_timesteps | 2930048 | -| train/ | | -| approx_kl | 0.2178871 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 228900 | -| policy_gradient_loss | 0.0333 | -| std | 0.0062 | -| value_loss | 6.35e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22892 | -| time_elapsed | 124214 | -| total_timesteps | 2930176 | -| train/ | | -| approx_kl | 0.034430005 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.456 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 228910 | -| policy_gradient_loss | -0.0108 | -| std | 0.00621 | -| value_loss | 0.00118 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22893 | -| time_elapsed | 124219 | -| total_timesteps | 2930304 | -| train/ | | -| approx_kl | 0.03125588 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -3.46 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 228920 | -| policy_gradient_loss | 0.0277 | -| std | 0.0062 | -| value_loss | 1.18e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22894 | -| time_elapsed | 124224 | -| total_timesteps | 2930432 | -| train/ | | -| approx_kl | 0.5253835 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0933 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 228930 | -| policy_gradient_loss | 0.131 | -| std | 0.0062 | -| value_loss | 4.24e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22895 | -| time_elapsed | 124230 | -| total_timesteps | 2930560 | -| train/ | | -| approx_kl | 0.08964142 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 228940 | -| policy_gradient_loss | 0.0266 | -| std | 0.0062 | -| value_loss | 1.85e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22896 | -| time_elapsed | 124235 | -| total_timesteps | 2930688 | -| train/ | | -| approx_kl | 9.434158e-05 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | 0.00077 | -| n_updates | 228950 | -| policy_gradient_loss | 0.0449 | -| std | 0.0062 | -| value_loss | 3e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22897 | -| time_elapsed | 124241 | -| total_timesteps | 2930816 | -| train/ | | -| approx_kl | 0.20969729 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0427 | -| n_updates | 228960 | -| policy_gradient_loss | 0.0131 | -| std | 0.0062 | -| value_loss | 2.24e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 22898 | -| time_elapsed | 124246 | -| total_timesteps | 2930944 | -| train/ | | -| approx_kl | 0.02494157 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 228970 | -| policy_gradient_loss | 0.00873 | -| std | 0.0062 | -| value_loss | 1.25e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22899 | -| time_elapsed | 124250 | -| total_timesteps | 2931072 | -| train/ | | -| approx_kl | 0.028945824 | -| clip_fraction | 0.46 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | 0.00852 | -| n_updates | 228980 | -| policy_gradient_loss | 0.0267 | -| std | 0.00619 | -| value_loss | 8.35e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22900 | -| time_elapsed | 124259 | -| total_timesteps | 2931200 | -| train/ | | -| approx_kl | 0.4165216 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.984 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 228990 | -| policy_gradient_loss | 0.102 | -| std | 0.00619 | -| value_loss | 0.000137 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22901 | -| time_elapsed | 124263 | -| total_timesteps | 2931328 | -| train/ | | -| approx_kl | 0.19041075 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.4 | -| learning_rate | 0.0003 | -| loss | 0.0898 | -| n_updates | 229000 | -| policy_gradient_loss | 0.0421 | -| std | 0.00619 | -| value_loss | 3.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22902 | -| time_elapsed | 124269 | -| total_timesteps | 2931456 | -| train/ | | -| approx_kl | 0.15866774 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00176 | -| learning_rate | 0.0003 | -| loss | 0.0664 | -| n_updates | 229010 | -| policy_gradient_loss | 0.0253 | -| std | 0.00619 | -| value_loss | 3.12e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22903 | -| time_elapsed | 124277 | -| total_timesteps | 2931584 | -| train/ | | -| approx_kl | 0.03916997 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.00665 | -| n_updates | 229020 | -| policy_gradient_loss | 0.0327 | -| std | 0.0062 | -| value_loss | 2.15e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22904 | -| time_elapsed | 124283 | -| total_timesteps | 2931712 | -| train/ | | -| approx_kl | 0.29971653 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 229030 | -| policy_gradient_loss | 0.138 | -| std | 0.0062 | -| value_loss | 1.98e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22905 | -| time_elapsed | 124289 | -| total_timesteps | 2931840 | -| train/ | | -| approx_kl | 0.07969652 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.00849 | -| n_updates | 229040 | -| policy_gradient_loss | 0.0379 | -| std | 0.0062 | -| value_loss | 1.78e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 22906 | -| time_elapsed | 124295 | -| total_timesteps | 2931968 | -| train/ | | -| approx_kl | 0.0011351742 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.00279 | -| n_updates | 229050 | -| policy_gradient_loss | 0.0338 | -| std | 0.0062 | -| value_loss | 1.32e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22907 | -| time_elapsed | 124300 | -| total_timesteps | 2932096 | -| train/ | | -| approx_kl | 0.21868047 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0644 | -| n_updates | 229060 | -| policy_gradient_loss | 0.0192 | -| std | 0.00619 | -| value_loss | 6e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22908 | -| time_elapsed | 124310 | -| total_timesteps | 2932224 | -| train/ | | -| approx_kl | 0.112060055 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.648 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 229070 | -| policy_gradient_loss | -0.00224 | -| std | 0.00619 | -| value_loss | 0.00741 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22909 | -| time_elapsed | 124314 | -| total_timesteps | 2932352 | -| train/ | | -| approx_kl | 8.178316e-05 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.231 | -| learning_rate | 0.0003 | -| loss | -0.000612 | -| n_updates | 229080 | -| policy_gradient_loss | 0.0809 | -| std | 0.00619 | -| value_loss | 0.000242 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22910 | -| time_elapsed | 124317 | -| total_timesteps | 2932480 | -| train/ | | -| approx_kl | 0.038359046 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0431 | -| n_updates | 229090 | -| policy_gradient_loss | 0.0553 | -| std | 0.0062 | -| value_loss | 2.06e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22911 | -| time_elapsed | 124323 | -| total_timesteps | 2932608 | -| train/ | | -| approx_kl | 0.428952 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0632 | -| learning_rate | 0.0003 | -| loss | 0.266 | -| n_updates | 229100 | -| policy_gradient_loss | 0.192 | -| std | 0.0062 | -| value_loss | 2.09e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22912 | -| time_elapsed | 124328 | -| total_timesteps | 2932736 | -| train/ | | -| approx_kl | 0.059158035 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 229110 | -| policy_gradient_loss | 0.0321 | -| std | 0.0062 | -| value_loss | 2.04e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22913 | -| time_elapsed | 124334 | -| total_timesteps | 2932864 | -| train/ | | -| approx_kl | 0.00010224618 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | -0.000208 | -| n_updates | 229120 | -| policy_gradient_loss | 0.0342 | -| std | 0.0062 | -| value_loss | 9.6e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 22914 | -| time_elapsed | 124339 | -| total_timesteps | 2932992 | -| train/ | | -| approx_kl | 0.5638455 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 229130 | -| policy_gradient_loss | 0.0688 | -| std | 0.00619 | -| value_loss | 7.68e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22915 | -| time_elapsed | 124343 | -| total_timesteps | 2933120 | -| train/ | | -| approx_kl | 0.0069905855 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 229140 | -| policy_gradient_loss | 0.00861 | -| std | 0.00619 | -| value_loss | 6.16e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22916 | -| time_elapsed | 124355 | -| total_timesteps | 2933248 | -| train/ | | -| approx_kl | 0.046371967 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -1.9 | -| learning_rate | 0.0003 | -| loss | -0.029 | -| n_updates | 229150 | -| policy_gradient_loss | -0.00705 | -| std | 0.00619 | -| value_loss | 0.00255 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22917 | -| time_elapsed | 124360 | -| total_timesteps | 2933376 | -| train/ | | -| approx_kl | 0.00080102123 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | -0.00999 | -| n_updates | 229160 | -| policy_gradient_loss | 0.0302 | -| std | 0.00619 | -| value_loss | 1.21e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22918 | -| time_elapsed | 124366 | -| total_timesteps | 2933504 | -| train/ | | -| approx_kl | 0.2732958 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0987 | -| n_updates | 229170 | -| policy_gradient_loss | 0.0284 | -| std | 0.00619 | -| value_loss | 2.41e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22919 | -| time_elapsed | 124371 | -| total_timesteps | 2933632 | -| train/ | | -| approx_kl | 0.03351401 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00865 | -| learning_rate | 0.0003 | -| loss | 0.00188 | -| n_updates | 229180 | -| policy_gradient_loss | -0.00185 | -| std | 0.00619 | -| value_loss | 1.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22920 | -| time_elapsed | 124376 | -| total_timesteps | 2933760 | -| train/ | | -| approx_kl | 0.027915023 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0077 | -| n_updates | 229190 | -| policy_gradient_loss | 0.00179 | -| std | 0.00619 | -| value_loss | 9.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 22921 | -| time_elapsed | 124381 | -| total_timesteps | 2933888 | -| train/ | | -| approx_kl | 0.026779436 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 229200 | -| policy_gradient_loss | 0.0358 | -| std | 0.00619 | -| value_loss | 5.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22922 | -| time_elapsed | 124385 | -| total_timesteps | 2934016 | -| train/ | | -| approx_kl | 0.07967293 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 229210 | -| policy_gradient_loss | 0.0254 | -| std | 0.00619 | -| value_loss | 3.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22923 | -| time_elapsed | 124396 | -| total_timesteps | 2934144 | -| train/ | | -| approx_kl | 0.31617248 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.876 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 229220 | -| policy_gradient_loss | 0.0262 | -| std | 0.00619 | -| value_loss | 0.00177 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22924 | -| time_elapsed | 124402 | -| total_timesteps | 2934272 | -| train/ | | -| approx_kl | 3.355369e-05 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0201 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 229230 | -| policy_gradient_loss | 0.0122 | -| std | 0.00619 | -| value_loss | 3.64e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22925 | -| time_elapsed | 124407 | -| total_timesteps | 2934400 | -| train/ | | -| approx_kl | 0.02529181 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -147 | -| learning_rate | 0.0003 | -| loss | -0.00441 | -| n_updates | 229240 | -| policy_gradient_loss | 0.0188 | -| std | 0.00619 | -| value_loss | 5.81e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22926 | -| time_elapsed | 124412 | -| total_timesteps | 2934528 | -| train/ | | -| approx_kl | 0.21010038 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.624 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 229250 | -| policy_gradient_loss | 0.06 | -| std | 0.00619 | -| value_loss | 9.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22927 | -| time_elapsed | 124417 | -| total_timesteps | 2934656 | -| train/ | | -| approx_kl | 0.003807283 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00823 | -| learning_rate | 0.0003 | -| loss | -0.0141 | -| n_updates | 229260 | -| policy_gradient_loss | -0.00143 | -| std | 0.00618 | -| value_loss | 8.55e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22928 | -| time_elapsed | 124422 | -| total_timesteps | 2934784 | -| train/ | | -| approx_kl | 0.10964758 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00519 | -| learning_rate | 0.0003 | -| loss | 0.0721 | -| n_updates | 229270 | -| policy_gradient_loss | 0.116 | -| std | 0.00618 | -| value_loss | 6.63e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 22929 | -| time_elapsed | 124426 | -| total_timesteps | 2934912 | -| train/ | | -| approx_kl | 0.06063338 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.0829 | -| n_updates | 229280 | -| policy_gradient_loss | 0.031 | -| std | 0.00618 | -| value_loss | 5.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22930 | -| time_elapsed | 124430 | -| total_timesteps | 2935040 | -| train/ | | -| approx_kl | 0.041407086 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0681 | -| n_updates | 229290 | -| policy_gradient_loss | 0.0143 | -| std | 0.00619 | -| value_loss | 3.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22931 | -| time_elapsed | 124439 | -| total_timesteps | 2935168 | -| train/ | | -| approx_kl | 0.18191151 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 229300 | -| policy_gradient_loss | -0.0128 | -| std | 0.00619 | -| value_loss | 0.00165 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22932 | -| time_elapsed | 124444 | -| total_timesteps | 2935296 | -| train/ | | -| approx_kl | 0.08439305 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.00658 | -| n_updates | 229310 | -| policy_gradient_loss | 0.0167 | -| std | 0.00619 | -| value_loss | 8.91e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22933 | -| time_elapsed | 124448 | -| total_timesteps | 2935424 | -| train/ | | -| approx_kl | 0.3853042 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -5.78 | -| learning_rate | 0.0003 | -| loss | 0.0773 | -| n_updates | 229320 | -| policy_gradient_loss | 0.0786 | -| std | 0.00619 | -| value_loss | 2.13e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22934 | -| time_elapsed | 124451 | -| total_timesteps | 2935552 | -| train/ | | -| approx_kl | 0.06352512 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -4.11 | -| learning_rate | 0.0003 | -| loss | 0.00764 | -| n_updates | 229330 | -| policy_gradient_loss | 0.00754 | -| std | 0.0062 | -| value_loss | 1.61e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22935 | -| time_elapsed | 124455 | -| total_timesteps | 2935680 | -| train/ | | -| approx_kl | 0.00047476962 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.29 | -| learning_rate | 0.0003 | -| loss | 0.00259 | -| n_updates | 229340 | -| policy_gradient_loss | 0.0309 | -| std | 0.0062 | -| value_loss | 3.67e-10 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22936 | -| time_elapsed | 124461 | -| total_timesteps | 2935808 | -| train/ | | -| approx_kl | 0.1737097 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.155 | -| learning_rate | 0.0003 | -| loss | 0.0804 | -| n_updates | 229350 | -| policy_gradient_loss | 0.0229 | -| std | 0.0062 | -| value_loss | 1.24e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 22937 | -| time_elapsed | 124466 | -| total_timesteps | 2935936 | -| train/ | | -| approx_kl | 0.022578208 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0896 | -| learning_rate | 0.0003 | -| loss | -0.00203 | -| n_updates | 229360 | -| policy_gradient_loss | 0.029 | -| std | 0.0062 | -| value_loss | 1.01e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22938 | -| time_elapsed | 124471 | -| total_timesteps | 2936064 | -| train/ | | -| approx_kl | 0.13502957 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 229370 | -| policy_gradient_loss | 0.0183 | -| std | 0.0062 | -| value_loss | 8.44e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22939 | -| time_elapsed | 124481 | -| total_timesteps | 2936192 | -| train/ | | -| approx_kl | 0.10652558 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.707 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 229380 | -| policy_gradient_loss | 0.0089 | -| std | 0.0062 | -| value_loss | 0.00778 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22940 | -| time_elapsed | 124487 | -| total_timesteps | 2936320 | -| train/ | | -| approx_kl | 0.0029228297 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 229390 | -| policy_gradient_loss | 0.0282 | -| std | 0.0062 | -| value_loss | 6.27e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22941 | -| time_elapsed | 124492 | -| total_timesteps | 2936448 | -| train/ | | -| approx_kl | 0.001736634 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00282 | -| learning_rate | 0.0003 | -| loss | 0.00102 | -| n_updates | 229400 | -| policy_gradient_loss | 0.0353 | -| std | 0.00621 | -| value_loss | 6.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22942 | -| time_elapsed | 124497 | -| total_timesteps | 2936576 | -| train/ | | -| approx_kl | 0.68689394 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.287 | -| n_updates | 229410 | -| policy_gradient_loss | 0.0849 | -| std | 0.00621 | -| value_loss | 3.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22943 | -| time_elapsed | 124501 | -| total_timesteps | 2936704 | -| train/ | | -| approx_kl | 0.066954255 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00794 | -| n_updates | 229420 | -| policy_gradient_loss | 0.00303 | -| std | 0.0062 | -| value_loss | 3.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22944 | -| time_elapsed | 124507 | -| total_timesteps | 2936832 | -| train/ | | -| approx_kl | 0.010239795 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 229430 | -| policy_gradient_loss | 0.00638 | -| std | 0.0062 | -| value_loss | 2.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22945 | -| time_elapsed | 124512 | -| total_timesteps | 2936960 | -| train/ | | -| approx_kl | 0.078852504 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 229440 | -| policy_gradient_loss | 0.0145 | -| std | 0.0062 | -| value_loss | 1.48e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22946 | -| time_elapsed | 124517 | -| total_timesteps | 2937088 | -| train/ | | -| approx_kl | 0.014941346 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 229450 | -| policy_gradient_loss | 0.00542 | -| std | 0.00621 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22947 | -| time_elapsed | 124527 | -| total_timesteps | 2937216 | -| train/ | | -| approx_kl | 0.041626245 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.39 | -| learning_rate | 0.0003 | -| loss | -0.0282 | -| n_updates | 229460 | -| policy_gradient_loss | -0.012 | -| std | 0.00621 | -| value_loss | 0.00166 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22948 | -| time_elapsed | 124534 | -| total_timesteps | 2937344 | -| train/ | | -| approx_kl | 0.0005795616 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0988 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 229470 | -| policy_gradient_loss | 0.0304 | -| std | 0.0062 | -| value_loss | 4.28e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22949 | -| time_elapsed | 124541 | -| total_timesteps | 2937472 | -| train/ | | -| approx_kl | 0.00087776873 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0878 | -| learning_rate | 0.0003 | -| loss | -0.00479 | -| n_updates | 229480 | -| policy_gradient_loss | 0.0273 | -| std | 0.0062 | -| value_loss | 1.92e-07 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22950 | -| time_elapsed | 124547 | -| total_timesteps | 2937600 | -| train/ | | -| approx_kl | 0.495035 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 229490 | -| policy_gradient_loss | 0.0525 | -| std | 0.0062 | -| value_loss | 1.46e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22951 | -| time_elapsed | 124552 | -| total_timesteps | 2937728 | -| train/ | | -| approx_kl | 0.043572016 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 229500 | -| policy_gradient_loss | -4.83e-05 | -| std | 0.0062 | -| value_loss | 1.24e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22952 | -| time_elapsed | 124559 | -| total_timesteps | 2937856 | -| train/ | | -| approx_kl | 0.05744529 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 229510 | -| policy_gradient_loss | 0.0111 | -| std | 0.00621 | -| value_loss | 9.36e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 22953 | -| time_elapsed | 124566 | -| total_timesteps | 2937984 | -| train/ | | -| approx_kl | 0.009527213 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 229520 | -| policy_gradient_loss | 0.00764 | -| std | 0.00621 | -| value_loss | 7.34e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22954 | -| time_elapsed | 124571 | -| total_timesteps | 2938112 | -| train/ | | -| approx_kl | 0.00093205273 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00224 | -| n_updates | 229530 | -| policy_gradient_loss | 0.00801 | -| std | 0.0062 | -| value_loss | 2.7e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22955 | -| time_elapsed | 124583 | -| total_timesteps | 2938240 | -| train/ | | -| approx_kl | 0.26238552 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.626 | -| learning_rate | 0.0003 | -| loss | 0.0727 | -| n_updates | 229540 | -| policy_gradient_loss | 0.00479 | -| std | 0.0062 | -| value_loss | 0.0012 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22956 | -| time_elapsed | 124588 | -| total_timesteps | 2938368 | -| train/ | | -| approx_kl | 0.11574722 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0877 | -| n_updates | 229550 | -| policy_gradient_loss | 0.0296 | -| std | 0.0062 | -| value_loss | 2.77e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22957 | -| time_elapsed | 124593 | -| total_timesteps | 2938496 | -| train/ | | -| approx_kl | 0.044616647 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00691 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 229560 | -| policy_gradient_loss | 0.034 | -| std | 0.0062 | -| value_loss | 5.79e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22958 | -| time_elapsed | 124598 | -| total_timesteps | 2938624 | -| train/ | | -| approx_kl | 0.12731239 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00205 | -| learning_rate | 0.0003 | -| loss | 0.0825 | -| n_updates | 229570 | -| policy_gradient_loss | 0.04 | -| std | 0.0062 | -| value_loss | 2.18e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22959 | -| time_elapsed | 124604 | -| total_timesteps | 2938752 | -| train/ | | -| approx_kl | 8.5690524e-05 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0762 | -| learning_rate | 0.0003 | -| loss | -0.00044 | -| n_updates | 229580 | -| policy_gradient_loss | 0.0423 | -| std | 0.00619 | -| value_loss | 1.38e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 22960 | -| time_elapsed | 124610 | -| total_timesteps | 2938880 | -| train/ | | -| approx_kl | 0.17058513 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.0813 | -| n_updates | 229590 | -| policy_gradient_loss | 0.0218 | -| std | 0.00619 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22961 | -| time_elapsed | 124615 | -| total_timesteps | 2939008 | -| train/ | | -| approx_kl | 0.020813132 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 229600 | -| policy_gradient_loss | -0.00994 | -| std | 0.00618 | -| value_loss | 8.26e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22962 | -| time_elapsed | 124626 | -| total_timesteps | 2939136 | -| train/ | | -| approx_kl | 0.27796173 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.11 | -| learning_rate | 0.0003 | -| loss | 0.00858 | -| n_updates | 229610 | -| policy_gradient_loss | -0.00134 | -| std | 0.00618 | -| value_loss | 0.00128 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22963 | -| time_elapsed | 124632 | -| total_timesteps | 2939264 | -| train/ | | -| approx_kl | 0.006133784 | -| clip_fraction | 0.0516 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0963 | -| learning_rate | 0.0003 | -| loss | -0.00325 | -| n_updates | 229620 | -| policy_gradient_loss | -0.000854 | -| std | 0.00618 | -| value_loss | 0.00117 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22964 | -| time_elapsed | 124638 | -| total_timesteps | 2939392 | -| train/ | | -| approx_kl | 0.011298817 | -| clip_fraction | 0.0914 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | 0.000694 | -| n_updates | 229630 | -| policy_gradient_loss | 0.000632 | -| std | 0.00619 | -| value_loss | 2.61e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22965 | -| time_elapsed | 124643 | -| total_timesteps | 2939520 | -| train/ | | -| approx_kl | 0.029357336 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0023 | -| n_updates | 229640 | -| policy_gradient_loss | 0.0253 | -| std | 0.0062 | -| value_loss | 1.47e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22966 | -| time_elapsed | 124649 | -| total_timesteps | 2939648 | -| train/ | | -| approx_kl | 0.119042665 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.349 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 229650 | -| policy_gradient_loss | 0.0158 | -| std | 0.0062 | -| value_loss | 1.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22967 | -| time_elapsed | 124653 | -| total_timesteps | 2939776 | -| train/ | | -| approx_kl | 0.008650075 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.00522 | -| n_updates | 229660 | -| policy_gradient_loss | 0.031 | -| std | 0.00619 | -| value_loss | 2.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 22968 | -| time_elapsed | 124657 | -| total_timesteps | 2939904 | -| train/ | | -| approx_kl | 0.60074973 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.248 | -| learning_rate | 0.0003 | -| loss | 0.218 | -| n_updates | 229670 | -| policy_gradient_loss | 0.0773 | -| std | 0.00619 | -| value_loss | 4.72e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22969 | -| time_elapsed | 124661 | -| total_timesteps | 2940032 | -| train/ | | -| approx_kl | 0.054830924 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 229680 | -| policy_gradient_loss | 0.0149 | -| std | 0.00619 | -| value_loss | 1.62e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22970 | -| time_elapsed | 124670 | -| total_timesteps | 2940160 | -| train/ | | -| approx_kl | 0.0032113227 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.788 | -| learning_rate | 0.0003 | -| loss | -0.00717 | -| n_updates | 229690 | -| policy_gradient_loss | 0.0281 | -| std | 0.00619 | -| value_loss | 0.00115 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22971 | -| time_elapsed | 124675 | -| total_timesteps | 2940288 | -| train/ | | -| approx_kl | 0.7477453 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.645 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 229700 | -| policy_gradient_loss | 0.043 | -| std | 0.00617 | -| value_loss | 3.79e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22972 | -| time_elapsed | 124678 | -| total_timesteps | 2940416 | -| train/ | | -| approx_kl | 0.017383376 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00926 | -| learning_rate | 0.0003 | -| loss | 0.00599 | -| n_updates | 229710 | -| policy_gradient_loss | 0.0113 | -| std | 0.00617 | -| value_loss | 4.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22973 | -| time_elapsed | 124683 | -| total_timesteps | 2940544 | -| train/ | | -| approx_kl | 0.08336775 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 229720 | -| policy_gradient_loss | 0.00897 | -| std | 0.00616 | -| value_loss | 3.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22974 | -| time_elapsed | 124688 | -| total_timesteps | 2940672 | -| train/ | | -| approx_kl | 0.054648384 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0199 | -| learning_rate | 0.0003 | -| loss | 0.00705 | -| n_updates | 229730 | -| policy_gradient_loss | 0.00471 | -| std | 0.00616 | -| value_loss | 2.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22975 | -| time_elapsed | 124693 | -| total_timesteps | 2940800 | -| train/ | | -| approx_kl | 0.007782141 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 229740 | -| policy_gradient_loss | 0.00658 | -| std | 0.00616 | -| value_loss | 1.74e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 22976 | -| time_elapsed | 124697 | -| total_timesteps | 2940928 | -| train/ | | -| approx_kl | 0.0011773524 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.0053 | -| n_updates | 229750 | -| policy_gradient_loss | 0.00562 | -| std | 0.00616 | -| value_loss | 1.32e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22977 | -| time_elapsed | 124702 | -| total_timesteps | 2941056 | -| train/ | | -| approx_kl | 0.0072447658 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | -0.00734 | -| n_updates | 229760 | -| policy_gradient_loss | 0.00914 | -| std | 0.00616 | -| value_loss | 9.96e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22978 | -| time_elapsed | 124709 | -| total_timesteps | 2941184 | -| train/ | | -| approx_kl | 0.04737635 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.663 | -| learning_rate | 0.0003 | -| loss | -0.0246 | -| n_updates | 229770 | -| policy_gradient_loss | 0.00676 | -| std | 0.00616 | -| value_loss | 0.000741 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22979 | -| time_elapsed | 124713 | -| total_timesteps | 2941312 | -| train/ | | -| approx_kl | 0.039433148 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 229780 | -| policy_gradient_loss | 0.0791 | -| std | 0.00616 | -| value_loss | 1.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22980 | -| time_elapsed | 124716 | -| total_timesteps | 2941440 | -| train/ | | -| approx_kl | 0.22914882 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00273 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 229790 | -| policy_gradient_loss | 0.0359 | -| std | 0.00616 | -| value_loss | 3.77e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22981 | -| time_elapsed | 124720 | -| total_timesteps | 2941568 | -| train/ | | -| approx_kl | 0.07951928 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0554 | -| n_updates | 229800 | -| policy_gradient_loss | 0.0971 | -| std | 0.00616 | -| value_loss | 3.52e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22982 | -| time_elapsed | 124725 | -| total_timesteps | 2941696 | -| train/ | | -| approx_kl | 1.1175871e-08 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | 1.62e-06 | -| n_updates | 229810 | -| policy_gradient_loss | 0.113 | -| std | 0.00616 | -| value_loss | 2.86e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22983 | -| time_elapsed | 124729 | -| total_timesteps | 2941824 | -| train/ | | -| approx_kl | 0.030313607 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.0262 | -| n_updates | 229820 | -| policy_gradient_loss | 0.0451 | -| std | 0.00616 | -| value_loss | 1.85e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 22984 | -| time_elapsed | 124734 | -| total_timesteps | 2941952 | -| train/ | | -| approx_kl | 0.13307258 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0594 | -| n_updates | 229830 | -| policy_gradient_loss | 0.0316 | -| std | 0.00616 | -| value_loss | 1.73e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22985 | -| time_elapsed | 124739 | -| total_timesteps | 2942080 | -| train/ | | -| approx_kl | 0.00056662643 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | -0.000577 | -| n_updates | 229840 | -| policy_gradient_loss | 0.0369 | -| std | 0.00616 | -| value_loss | 9.29e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22986 | -| time_elapsed | 124750 | -| total_timesteps | 2942208 | -| train/ | | -| approx_kl | 0.03399494 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.713 | -| learning_rate | 0.0003 | -| loss | -0.0219 | -| n_updates | 229850 | -| policy_gradient_loss | -0.00366 | -| std | 0.00616 | -| value_loss | 0.00479 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22987 | -| time_elapsed | 124754 | -| total_timesteps | 2942336 | -| train/ | | -| approx_kl | 0.011414189 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0908 | -| learning_rate | 0.0003 | -| loss | -0.00964 | -| n_updates | 229860 | -| policy_gradient_loss | 0.0113 | -| std | 0.00616 | -| value_loss | 9.36e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22988 | -| time_elapsed | 124759 | -| total_timesteps | 2942464 | -| train/ | | -| approx_kl | 0.0014031562 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00784 | -| learning_rate | 0.0003 | -| loss | 0.00495 | -| n_updates | 229870 | -| policy_gradient_loss | 0.0102 | -| std | 0.00616 | -| value_loss | 1.12e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22989 | -| time_elapsed | 124764 | -| total_timesteps | 2942592 | -| train/ | | -| approx_kl | 0.008704286 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.017 | -| learning_rate | 0.0003 | -| loss | -0.00553 | -| n_updates | 229880 | -| policy_gradient_loss | 0.0101 | -| std | 0.00616 | -| value_loss | 5.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22990 | -| time_elapsed | 124769 | -| total_timesteps | 2942720 | -| train/ | | -| approx_kl | 0.0026968373 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 229890 | -| policy_gradient_loss | 0.0125 | -| std | 0.00615 | -| value_loss | 3.38e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22991 | -| time_elapsed | 124775 | -| total_timesteps | 2942848 | -| train/ | | -| approx_kl | 0.05595371 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.0542 | -| n_updates | 229900 | -| policy_gradient_loss | 0.167 | -| std | 0.00615 | -| value_loss | 2.84e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 22992 | -| time_elapsed | 124781 | -| total_timesteps | 2942976 | -| train/ | | -| approx_kl | 0.10556021 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 229910 | -| policy_gradient_loss | 0.142 | -| std | 0.00615 | -| value_loss | 2.14e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22993 | -| time_elapsed | 124787 | -| total_timesteps | 2943104 | -| train/ | | -| approx_kl | 0.13149458 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.079 | -| n_updates | 229920 | -| policy_gradient_loss | 0.128 | -| std | 0.00615 | -| value_loss | 1.25e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22994 | -| time_elapsed | 124802 | -| total_timesteps | 2943232 | -| train/ | | -| approx_kl | 0.24977446 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 229930 | -| policy_gradient_loss | 0.0819 | -| std | 0.00615 | -| value_loss | 5.09e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22995 | -| time_elapsed | 124808 | -| total_timesteps | 2943360 | -| train/ | | -| approx_kl | 0.12419082 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 229940 | -| policy_gradient_loss | 0.0309 | -| std | 0.00615 | -| value_loss | 7.13e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22996 | -| time_elapsed | 124812 | -| total_timesteps | 2943488 | -| train/ | | -| approx_kl | 0.00055295974 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 229950 | -| policy_gradient_loss | 0.0346 | -| std | 0.00615 | -| value_loss | 5.22e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22997 | -| time_elapsed | 124818 | -| total_timesteps | 2943616 | -| train/ | | -| approx_kl | 0.6062957 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.202 | -| n_updates | 229960 | -| policy_gradient_loss | 0.071 | -| std | 0.00615 | -| value_loss | 4.31e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22998 | -| time_elapsed | 124823 | -| total_timesteps | 2943744 | -| train/ | | -| approx_kl | 0.010803249 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0208 | -| learning_rate | 0.0003 | -| loss | 0.000956 | -| n_updates | 229970 | -| policy_gradient_loss | 0.0105 | -| std | 0.00615 | -| value_loss | 2.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 22999 | -| time_elapsed | 124828 | -| total_timesteps | 2943872 | -| train/ | | -| approx_kl | 0.114528626 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0711 | -| n_updates | 229980 | -| policy_gradient_loss | 0.0271 | -| std | 0.00615 | -| value_loss | 2.33e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23000 | -| time_elapsed | 124833 | -| total_timesteps | 2944000 | -| train/ | | -| approx_kl | 0.048110895 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | -7.24e-05 | -| n_updates | 229990 | -| policy_gradient_loss | 0.00305 | -| std | 0.00615 | -| value_loss | 1.89e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23001 | -| time_elapsed | 124837 | -| total_timesteps | 2944128 | -| train/ | | -| approx_kl | 0.008002904 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00278 | -| learning_rate | 0.0003 | -| loss | -0.00855 | -| n_updates | 230000 | -| policy_gradient_loss | 0.00586 | -| std | 0.00615 | -| value_loss | 1.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23002 | -| time_elapsed | 124848 | -| total_timesteps | 2944256 | -| train/ | | -| approx_kl | 0.08304563 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.71 | -| learning_rate | 0.0003 | -| loss | 0.0448 | -| n_updates | 230010 | -| policy_gradient_loss | 0.0142 | -| std | 0.00615 | -| value_loss | 0.00222 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23003 | -| time_elapsed | 124854 | -| total_timesteps | 2944384 | -| train/ | | -| approx_kl | 0.04115536 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 230020 | -| policy_gradient_loss | 0.0155 | -| std | 0.00613 | -| value_loss | 0.000823 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23004 | -| time_elapsed | 124858 | -| total_timesteps | 2944512 | -| train/ | | -| approx_kl | 0.006742675 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00213 | -| learning_rate | 0.0003 | -| loss | -0.00901 | -| n_updates | 230030 | -| policy_gradient_loss | 0.012 | -| std | 0.00613 | -| value_loss | 7.82e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23005 | -| time_elapsed | 124864 | -| total_timesteps | 2944640 | -| train/ | | -| approx_kl | 0.0036913208 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00242 | -| n_updates | 230040 | -| policy_gradient_loss | 0.0132 | -| std | 0.00613 | -| value_loss | 4.03e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23006 | -| time_elapsed | 124869 | -| total_timesteps | 2944768 | -| train/ | | -| approx_kl | 0.11363574 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 230050 | -| policy_gradient_loss | 0.012 | -| std | 0.00613 | -| value_loss | 3.13e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 23007 | -| time_elapsed | 124875 | -| total_timesteps | 2944896 | -| train/ | | -| approx_kl | 0.04882269 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.0185 | -| n_updates | 230060 | -| policy_gradient_loss | 0.0109 | -| std | 0.00613 | -| value_loss | 2.3e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23008 | -| time_elapsed | 124880 | -| total_timesteps | 2945024 | -| train/ | | -| approx_kl | 0.010566039 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | -0.00651 | -| n_updates | 230070 | -| policy_gradient_loss | 0.00948 | -| std | 0.00613 | -| value_loss | 1.86e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23009 | -| time_elapsed | 124891 | -| total_timesteps | 2945152 | -| train/ | | -| approx_kl | 0.0023948057 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.68 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 230080 | -| policy_gradient_loss | 0.0148 | -| std | 0.00613 | -| value_loss | 0.00784 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23010 | -| time_elapsed | 124897 | -| total_timesteps | 2945280 | -| train/ | | -| approx_kl | 0.09773714 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00225 | -| learning_rate | 0.0003 | -| loss | 0.0815 | -| n_updates | 230090 | -| policy_gradient_loss | 0.0272 | -| std | 0.00612 | -| value_loss | 0.000153 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23011 | -| time_elapsed | 124900 | -| total_timesteps | 2945408 | -| train/ | | -| approx_kl | 0.00071075046 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00268 | -| learning_rate | 0.0003 | -| loss | -0.0063 | -| n_updates | 230100 | -| policy_gradient_loss | 0.00993 | -| std | 0.00612 | -| value_loss | 2.95e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23012 | -| time_elapsed | 124904 | -| total_timesteps | 2945536 | -| train/ | | -| approx_kl | 0.30348936 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 230110 | -| policy_gradient_loss | 0.0792 | -| std | 0.00611 | -| value_loss | 6.96e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23013 | -| time_elapsed | 124910 | -| total_timesteps | 2945664 | -| train/ | | -| approx_kl | 0.078726426 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.439 | -| learning_rate | 0.0003 | -| loss | 0.0607 | -| n_updates | 230120 | -| policy_gradient_loss | 0.0274 | -| std | 0.00611 | -| value_loss | 4.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23014 | -| time_elapsed | 124915 | -| total_timesteps | 2945792 | -| train/ | | -| approx_kl | 0.004785672 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0104 | -| learning_rate | 0.0003 | -| loss | 0.000171 | -| n_updates | 230130 | -| policy_gradient_loss | 0.0102 | -| std | 0.00611 | -| value_loss | 0.000165 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 23015 | -| time_elapsed | 124921 | -| total_timesteps | 2945920 | -| train/ | | -| approx_kl | 0.081843115 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00529 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 230140 | -| policy_gradient_loss | 0.0151 | -| std | 0.0061 | -| value_loss | 1.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23016 | -| time_elapsed | 124927 | -| total_timesteps | 2946048 | -| train/ | | -| approx_kl | 0.017789597 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.00519 | -| n_updates | 230150 | -| policy_gradient_loss | 0.0114 | -| std | 0.0061 | -| value_loss | 7.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23017 | -| time_elapsed | 124935 | -| total_timesteps | 2946176 | -| train/ | | -| approx_kl | 0.050420687 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | 0.0743 | -| n_updates | 230160 | -| policy_gradient_loss | 0.0459 | -| std | 0.0061 | -| value_loss | 0.0018 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23018 | -| time_elapsed | 124941 | -| total_timesteps | 2946304 | -| train/ | | -| approx_kl | 0.1472167 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 230170 | -| policy_gradient_loss | 0.0369 | -| std | 0.00609 | -| value_loss | 4.4e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23019 | -| time_elapsed | 124947 | -| total_timesteps | 2946432 | -| train/ | | -| approx_kl | 9.069685e-05 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00381 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 230180 | -| policy_gradient_loss | 0.0382 | -| std | 0.00609 | -| value_loss | 2.21e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23020 | -| time_elapsed | 124953 | -| total_timesteps | 2946560 | -| train/ | | -| approx_kl | 0.0005232813 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | 0.000569 | -| n_updates | 230190 | -| policy_gradient_loss | 0.0343 | -| std | 0.00609 | -| value_loss | 8.74e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23021 | -| time_elapsed | 124958 | -| total_timesteps | 2946688 | -| train/ | | -| approx_kl | 0.0018042931 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 230200 | -| policy_gradient_loss | 0.0411 | -| std | 0.00609 | -| value_loss | 7.36e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23022 | -| time_elapsed | 124964 | -| total_timesteps | 2946816 | -| train/ | | -| approx_kl | 0.60689837 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 230210 | -| policy_gradient_loss | 0.0677 | -| std | 0.00609 | -| value_loss | 6.21e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23023 | -| time_elapsed | 124970 | -| total_timesteps | 2946944 | -| train/ | | -| approx_kl | 0.00811964 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | -0.0017 | -| n_updates | 230220 | -| policy_gradient_loss | 0.0103 | -| std | 0.00609 | -| value_loss | 4.41e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23024 | -| time_elapsed | 124974 | -| total_timesteps | 2947072 | -| train/ | | -| approx_kl | 0.0018249517 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.00892 | -| n_updates | 230230 | -| policy_gradient_loss | 0.00149 | -| std | 0.00608 | -| value_loss | 3.29e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23025 | -| time_elapsed | 124983 | -| total_timesteps | 2947200 | -| train/ | | -| approx_kl | 0.011766067 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.765 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 230240 | -| policy_gradient_loss | -0.00886 | -| std | 0.00608 | -| value_loss | 0.000597 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23026 | -| time_elapsed | 124989 | -| total_timesteps | 2947328 | -| train/ | | -| approx_kl | 0.2269702 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 230250 | -| policy_gradient_loss | 0.0618 | -| std | 0.00608 | -| value_loss | 8.14e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23027 | -| time_elapsed | 124993 | -| total_timesteps | 2947456 | -| train/ | | -| approx_kl | 0.14221679 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0907 | -| n_updates | 230260 | -| policy_gradient_loss | 0.0289 | -| std | 0.00609 | -| value_loss | 2.33e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23028 | -| time_elapsed | 124999 | -| total_timesteps | 2947584 | -| train/ | | -| approx_kl | 0.0038957722 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 230270 | -| policy_gradient_loss | 0.0288 | -| std | 0.00609 | -| value_loss | 1.73e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23029 | -| time_elapsed | 125005 | -| total_timesteps | 2947712 | -| train/ | | -| approx_kl | 0.06316603 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.0336 | -| n_updates | 230280 | -| policy_gradient_loss | 0.0681 | -| std | 0.0061 | -| value_loss | 1e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23030 | -| time_elapsed | 125010 | -| total_timesteps | 2947840 | -| train/ | | -| approx_kl | 0.0032367962 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 230290 | -| policy_gradient_loss | 0.106 | -| std | 0.0061 | -| value_loss | 9.31e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 23031 | -| time_elapsed | 125015 | -| total_timesteps | 2947968 | -| train/ | | -| approx_kl | 1.6955844 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.37 | -| n_updates | 230300 | -| policy_gradient_loss | 0.231 | -| std | 0.00611 | -| value_loss | 4.88e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23032 | -| time_elapsed | 125020 | -| total_timesteps | 2948096 | -| train/ | | -| approx_kl | 0.044943474 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0624 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 230310 | -| policy_gradient_loss | 0.0133 | -| std | 0.00608 | -| value_loss | 3.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23033 | -| time_elapsed | 125030 | -| total_timesteps | 2948224 | -| train/ | | -| approx_kl | 0.010581739 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 230320 | -| policy_gradient_loss | 0.0759 | -| std | 0.00607 | -| value_loss | 0.000128 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23034 | -| time_elapsed | 125035 | -| total_timesteps | 2948352 | -| train/ | | -| approx_kl | 0.16385625 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 230330 | -| policy_gradient_loss | 0.0709 | -| std | 0.00606 | -| value_loss | 2.89e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23035 | -| time_elapsed | 125039 | -| total_timesteps | 2948480 | -| train/ | | -| approx_kl | 0.17303888 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -3.01 | -| learning_rate | 0.0003 | -| loss | 0.0533 | -| n_updates | 230340 | -| policy_gradient_loss | 0.0221 | -| std | 0.00606 | -| value_loss | 7.93e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23036 | -| time_elapsed | 125044 | -| total_timesteps | 2948608 | -| train/ | | -| approx_kl | 0.0016656299 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00427 | -| n_updates | 230350 | -| policy_gradient_loss | 0.032 | -| std | 0.00605 | -| value_loss | 7.77e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23037 | -| time_elapsed | 125049 | -| total_timesteps | 2948736 | -| train/ | | -| approx_kl | 0.0011409433 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.00191 | -| n_updates | 230360 | -| policy_gradient_loss | 0.0407 | -| std | 0.00605 | -| value_loss | 6.91e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23038 | -| time_elapsed | 125055 | -| total_timesteps | 2948864 | -| train/ | | -| approx_kl | 0.22477585 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | 0.0695 | -| n_updates | 230370 | -| policy_gradient_loss | 0.0198 | -| std | 0.00605 | -| value_loss | 5.23e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23039 | -| time_elapsed | 125059 | -| total_timesteps | 2948992 | -| train/ | | -| approx_kl | 0.030216457 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 230380 | -| policy_gradient_loss | 0.049 | -| std | 0.00606 | -| value_loss | 5.73e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23040 | -| time_elapsed | 125064 | -| total_timesteps | 2949120 | -| train/ | | -| approx_kl | 0.3804195 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.202 | -| n_updates | 230390 | -| policy_gradient_loss | 0.169 | -| std | 0.00606 | -| value_loss | 1.17e-10 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23041 | -| time_elapsed | 125079 | -| total_timesteps | 2949248 | -| train/ | | -| approx_kl | 0.02320055 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.86 | -| learning_rate | 0.0003 | -| loss | -0.0287 | -| n_updates | 230400 | -| policy_gradient_loss | -0.00258 | -| std | 0.00607 | -| value_loss | 0.00207 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23042 | -| time_elapsed | 125084 | -| total_timesteps | 2949376 | -| train/ | | -| approx_kl | 1.5431712 | -| clip_fraction | 0.779 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | 0.587 | -| n_updates | 230410 | -| policy_gradient_loss | 0.255 | -| std | 0.00607 | -| value_loss | 3.81e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23043 | -| time_elapsed | 125088 | -| total_timesteps | 2949504 | -| train/ | | -| approx_kl | 0.005078193 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00606 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 230420 | -| policy_gradient_loss | 0.0276 | -| std | 0.00607 | -| value_loss | 9.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23044 | -| time_elapsed | 125092 | -| total_timesteps | 2949632 | -| train/ | | -| approx_kl | 0.20042446 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.000633 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 230430 | -| policy_gradient_loss | 0.0283 | -| std | 0.00607 | -| value_loss | 4.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23045 | -| time_elapsed | 125098 | -| total_timesteps | 2949760 | -| train/ | | -| approx_kl | 0.032802302 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0164 | -| learning_rate | 0.0003 | -| loss | 0.000358 | -| n_updates | 230440 | -| policy_gradient_loss | 0.0278 | -| std | 0.00607 | -| value_loss | 3.39e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.879 | -| time/ | | -| fps | 23 | -| iterations | 23046 | -| time_elapsed | 125103 | -| total_timesteps | 2949888 | -| train/ | | -| approx_kl | 0.3832309 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 230450 | -| policy_gradient_loss | 0.133 | -| std | 0.00607 | -| value_loss | 2.52e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23047 | -| time_elapsed | 125108 | -| total_timesteps | 2950016 | -| train/ | | -| approx_kl | 0.23322096 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 230460 | -| policy_gradient_loss | 0.11 | -| std | 0.00608 | -| value_loss | 1.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23048 | -| time_elapsed | 125121 | -| total_timesteps | 2950144 | -| train/ | | -| approx_kl | 0.0046104295 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 230470 | -| policy_gradient_loss | 0.0228 | -| std | 0.00608 | -| value_loss | 0.000163 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23049 | -| time_elapsed | 125127 | -| total_timesteps | 2950272 | -| train/ | | -| approx_kl | 0.030162971 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 230480 | -| policy_gradient_loss | -0.000724 | -| std | 0.00608 | -| value_loss | 1.31e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23050 | -| time_elapsed | 125132 | -| total_timesteps | 2950400 | -| train/ | | -| approx_kl | 0.033197504 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -44.6 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 230490 | -| policy_gradient_loss | 0.018 | -| std | 0.00608 | -| value_loss | 2.2e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23051 | -| time_elapsed | 125136 | -| total_timesteps | 2950528 | -| train/ | | -| approx_kl | 0.15656082 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00303 | -| learning_rate | 0.0003 | -| loss | 0.0515 | -| n_updates | 230500 | -| policy_gradient_loss | 0.0289 | -| std | 0.00608 | -| value_loss | 3.11e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23052 | -| time_elapsed | 125142 | -| total_timesteps | 2950656 | -| train/ | | -| approx_kl | 0.15918137 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0718 | -| n_updates | 230510 | -| policy_gradient_loss | 0.0246 | -| std | 0.00608 | -| value_loss | 2.01e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23053 | -| time_elapsed | 125148 | -| total_timesteps | 2950784 | -| train/ | | -| approx_kl | 0.04578893 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 230520 | -| policy_gradient_loss | 0.0502 | -| std | 0.00608 | -| value_loss | 1.51e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23054 | -| time_elapsed | 125153 | -| total_timesteps | 2950912 | -| train/ | | -| approx_kl | 0.12795596 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.078 | -| n_updates | 230530 | -| policy_gradient_loss | 0.0364 | -| std | 0.00608 | -| value_loss | 9.68e-11 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23055 | -| time_elapsed | 125159 | -| total_timesteps | 2951040 | -| train/ | | -| approx_kl | 0.00046596956 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | -0.00186 | -| n_updates | 230540 | -| policy_gradient_loss | 0.0369 | -| std | 0.00608 | -| value_loss | 7.14e-11 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23056 | -| time_elapsed | 125168 | -| total_timesteps | 2951168 | -| train/ | | -| approx_kl | 0.006166191 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 230550 | -| policy_gradient_loss | 0.0251 | -| std | 0.00608 | -| value_loss | 0.000706 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23057 | -| time_elapsed | 125174 | -| total_timesteps | 2951296 | -| train/ | | -| approx_kl | 0.0030564894 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.585 | -| learning_rate | 0.0003 | -| loss | -0.00428 | -| n_updates | 230560 | -| policy_gradient_loss | 0.0812 | -| std | 0.00605 | -| value_loss | 5.77e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23058 | -| time_elapsed | 125179 | -| total_timesteps | 2951424 | -| train/ | | -| approx_kl | 0.20096576 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.671 | -| learning_rate | 0.0003 | -| loss | 0.0929 | -| n_updates | 230570 | -| policy_gradient_loss | 0.0849 | -| std | 0.00604 | -| value_loss | 7.58e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23059 | -| time_elapsed | 125183 | -| total_timesteps | 2951552 | -| train/ | | -| approx_kl | 0.0071363673 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -120 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 230580 | -| policy_gradient_loss | -0.00537 | -| std | 0.00603 | -| value_loss | 5.39e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23060 | -| time_elapsed | 125186 | -| total_timesteps | 2951680 | -| train/ | | -| approx_kl | 0.00013279496 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.189 | -| learning_rate | 0.0003 | -| loss | 0.000455 | -| n_updates | 230590 | -| policy_gradient_loss | 0.0131 | -| std | 0.00603 | -| value_loss | 1.31e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23061 | -| time_elapsed | 125189 | -| total_timesteps | 2951808 | -| train/ | | -| approx_kl | 0.0013681375 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | -0.00307 | -| n_updates | 230600 | -| policy_gradient_loss | 0.0145 | -| std | 0.00603 | -| value_loss | 4.91e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23062 | -| time_elapsed | 125193 | -| total_timesteps | 2951936 | -| train/ | | -| approx_kl | 0.113044545 | -| clip_fraction | 0.635 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.0587 | -| n_updates | 230610 | -| policy_gradient_loss | 0.0874 | -| std | 0.00603 | -| value_loss | 3.41e-09 | ------------------------------------------ --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23063 | -| time_elapsed | 125196 | -| total_timesteps | 2952064 | -| train/ | | -| approx_kl | 0.000103228725 | -| clip_fraction | 0.564 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | -0.00038 | -| n_updates | 230620 | -| policy_gradient_loss | 0.114 | -| std | 0.00602 | -| value_loss | 3.95e-08 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23064 | -| time_elapsed | 125203 | -| total_timesteps | 2952192 | -| train/ | | -| approx_kl | 0.06426751 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.669 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 230630 | -| policy_gradient_loss | 0.0326 | -| std | 0.00602 | -| value_loss | 0.00711 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23065 | -| time_elapsed | 125206 | -| total_timesteps | 2952320 | -| train/ | | -| approx_kl | 0.48555857 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | 0.229 | -| n_updates | 230640 | -| policy_gradient_loss | 0.18 | -| std | 0.00602 | -| value_loss | 1.72e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23066 | -| time_elapsed | 125210 | -| total_timesteps | 2952448 | -| train/ | | -| approx_kl | 0.34361774 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 230650 | -| policy_gradient_loss | 0.211 | -| std | 0.00602 | -| value_loss | 7.45e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23067 | -| time_elapsed | 125213 | -| total_timesteps | 2952576 | -| train/ | | -| approx_kl | 0.04565922 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00137 | -| learning_rate | 0.0003 | -| loss | 0.00819 | -| n_updates | 230660 | -| policy_gradient_loss | 0.0287 | -| std | 0.00602 | -| value_loss | 5.15e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23068 | -| time_elapsed | 125218 | -| total_timesteps | 2952704 | -| train/ | | -| approx_kl | 0.0009916183 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0102 | -| learning_rate | 0.0003 | -| loss | 0.00819 | -| n_updates | 230670 | -| policy_gradient_loss | 0.00382 | -| std | 0.00602 | -| value_loss | 2.89e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23069 | -| time_elapsed | 125222 | -| total_timesteps | 2952832 | -| train/ | | -| approx_kl | 0.25718358 | -| clip_fraction | 0.746 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0588 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 230680 | -| policy_gradient_loss | 0.195 | -| std | 0.00602 | -| value_loss | 1.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 23070 | -| time_elapsed | 125226 | -| total_timesteps | 2952960 | -| train/ | | -| approx_kl | 0.041073836 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 230690 | -| policy_gradient_loss | 0.0292 | -| std | 0.00602 | -| value_loss | 8.94e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23071 | -| time_elapsed | 125231 | -| total_timesteps | 2953088 | -| train/ | | -| approx_kl | 0.78389543 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 230700 | -| policy_gradient_loss | 0.0595 | -| std | 0.00602 | -| value_loss | 7.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23072 | -| time_elapsed | 125240 | -| total_timesteps | 2953216 | -| train/ | | -| approx_kl | 0.05316029 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.0272 | -| n_updates | 230710 | -| policy_gradient_loss | 0.00156 | -| std | 0.00602 | -| value_loss | 0.00125 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23073 | -| time_elapsed | 125244 | -| total_timesteps | 2953344 | -| train/ | | -| approx_kl | 1.164481 | -| clip_fraction | 0.762 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.006 | -| learning_rate | 0.0003 | -| loss | 0.387 | -| n_updates | 230720 | -| policy_gradient_loss | 0.312 | -| std | 0.00602 | -| value_loss | 1.32e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23074 | -| time_elapsed | 125248 | -| total_timesteps | 2953472 | -| train/ | | -| approx_kl | 0.011412106 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 230730 | -| policy_gradient_loss | 0.0288 | -| std | 0.00601 | -| value_loss | 5.19e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23075 | -| time_elapsed | 125252 | -| total_timesteps | 2953600 | -| train/ | | -| approx_kl | 0.2286117 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0022 | -| learning_rate | 0.0003 | -| loss | 0.0831 | -| n_updates | 230740 | -| policy_gradient_loss | 0.0275 | -| std | 0.00601 | -| value_loss | 2.17e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23076 | -| time_elapsed | 125256 | -| total_timesteps | 2953728 | -| train/ | | -| approx_kl | 0.038439848 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 230750 | -| policy_gradient_loss | 0.0417 | -| std | 0.00601 | -| value_loss | 1.47e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23077 | -| time_elapsed | 125262 | -| total_timesteps | 2953856 | -| train/ | | -| approx_kl | 0.36593905 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0252 | -| learning_rate | 0.0003 | -| loss | 0.22 | -| n_updates | 230760 | -| policy_gradient_loss | 0.183 | -| std | 0.00601 | -| value_loss | 1.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 23078 | -| time_elapsed | 125268 | -| total_timesteps | 2953984 | -| train/ | | -| approx_kl | 0.30616853 | -| clip_fraction | 0.753 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 230770 | -| policy_gradient_loss | 0.175 | -| std | 0.00601 | -| value_loss | 1.08e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23079 | -| time_elapsed | 125274 | -| total_timesteps | 2954112 | -| train/ | | -| approx_kl | 0.037922956 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 230780 | -| policy_gradient_loss | 0.0277 | -| std | 0.00601 | -| value_loss | 6.65e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23080 | -| time_elapsed | 125288 | -| total_timesteps | 2954240 | -| train/ | | -| approx_kl | 0.01238182 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.745 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 230790 | -| policy_gradient_loss | -0.0242 | -| std | 0.00601 | -| value_loss | 0.00532 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23081 | -| time_elapsed | 125292 | -| total_timesteps | 2954368 | -| train/ | | -| approx_kl | 0.16432893 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | 0.0918 | -| n_updates | 230800 | -| policy_gradient_loss | 0.0327 | -| std | 0.00602 | -| value_loss | 5.84e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23082 | -| time_elapsed | 125296 | -| total_timesteps | 2954496 | -| train/ | | -| approx_kl | 0.036907606 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00516 | -| learning_rate | 0.0003 | -| loss | 0.00417 | -| n_updates | 230810 | -| policy_gradient_loss | 0.0314 | -| std | 0.00602 | -| value_loss | 1.31e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23083 | -| time_elapsed | 125301 | -| total_timesteps | 2954624 | -| train/ | | -| approx_kl | 0.1316962 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0473 | -| n_updates | 230820 | -| policy_gradient_loss | 0.0266 | -| std | 0.00602 | -| value_loss | 1.09e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23084 | -| time_elapsed | 125305 | -| total_timesteps | 2954752 | -| train/ | | -| approx_kl | 0.16176626 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.0947 | -| n_updates | 230830 | -| policy_gradient_loss | 0.0318 | -| std | 0.00602 | -| value_loss | 5.6e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.864 | -| time/ | | -| fps | 23 | -| iterations | 23085 | -| time_elapsed | 125310 | -| total_timesteps | 2954880 | -| train/ | | -| approx_kl | 0.034216274 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 230840 | -| policy_gradient_loss | 0.0275 | -| std | 0.00602 | -| value_loss | 5.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23086 | -| time_elapsed | 125315 | -| total_timesteps | 2955008 | -| train/ | | -| approx_kl | 0.35646537 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 230850 | -| policy_gradient_loss | 0.157 | -| std | 0.00602 | -| value_loss | 3.57e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23087 | -| time_elapsed | 125327 | -| total_timesteps | 2955136 | -| train/ | | -| approx_kl | 0.03678395 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.5 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 230860 | -| policy_gradient_loss | -0.000491 | -| std | 0.00602 | -| value_loss | 0.00206 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23088 | -| time_elapsed | 125332 | -| total_timesteps | 2955264 | -| train/ | | -| approx_kl | 0.21384585 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.852 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 230870 | -| policy_gradient_loss | 0.0642 | -| std | 0.00602 | -| value_loss | 7.95e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23089 | -| time_elapsed | 125337 | -| total_timesteps | 2955392 | -| train/ | | -| approx_kl | 0.13980852 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -169 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 230880 | -| policy_gradient_loss | 0.00244 | -| std | 0.00602 | -| value_loss | 2.75e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23090 | -| time_elapsed | 125342 | -| total_timesteps | 2955520 | -| train/ | | -| approx_kl | 0.016274724 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 230890 | -| policy_gradient_loss | 0.00124 | -| std | 0.00602 | -| value_loss | 4.59e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23091 | -| time_elapsed | 125348 | -| total_timesteps | 2955648 | -| train/ | | -| approx_kl | 0.021813963 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.00557 | -| n_updates | 230900 | -| policy_gradient_loss | 0.00739 | -| std | 0.00602 | -| value_loss | 1.14e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23092 | -| time_elapsed | 125353 | -| total_timesteps | 2955776 | -| train/ | | -| approx_kl | 0.06958138 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -5.22 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 230910 | -| policy_gradient_loss | -0.0146 | -| std | 0.00602 | -| value_loss | 3.06e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.874 | -| time/ | | -| fps | 23 | -| iterations | 23093 | -| time_elapsed | 125359 | -| total_timesteps | 2955904 | -| train/ | | -| approx_kl | 0.0730795 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00889 | -| learning_rate | 0.0003 | -| loss | 0.036 | -| n_updates | 230920 | -| policy_gradient_loss | 0.018 | -| std | 0.00602 | -| value_loss | 4.05e-11 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23094 | -| time_elapsed | 125364 | -| total_timesteps | 2956032 | -| train/ | | -| approx_kl | 0.072729245 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 230930 | -| policy_gradient_loss | 0.00954 | -| std | 0.00602 | -| value_loss | 1.12e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23095 | -| time_elapsed | 125373 | -| total_timesteps | 2956160 | -| train/ | | -| approx_kl | 0.011680161 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.00614 | -| n_updates | 230940 | -| policy_gradient_loss | -0.00433 | -| std | 0.00602 | -| value_loss | 0.0037 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23096 | -| time_elapsed | 125379 | -| total_timesteps | 2956288 | -| train/ | | -| approx_kl | 0.03315496 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 230950 | -| policy_gradient_loss | 0.0145 | -| std | 0.00602 | -| value_loss | 1.36e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23097 | -| time_elapsed | 125384 | -| total_timesteps | 2956416 | -| train/ | | -| approx_kl | 0.0046774494 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00896 | -| learning_rate | 0.0003 | -| loss | -0.00376 | -| n_updates | 230960 | -| policy_gradient_loss | 0.00724 | -| std | 0.00602 | -| value_loss | 1.23e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23098 | -| time_elapsed | 125388 | -| total_timesteps | 2956544 | -| train/ | | -| approx_kl | 0.04902195 | -| clip_fraction | 0.656 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0756 | -| n_updates | 230970 | -| policy_gradient_loss | 0.171 | -| std | 0.00602 | -| value_loss | 8.07e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23099 | -| time_elapsed | 125393 | -| total_timesteps | 2956672 | -| train/ | | -| approx_kl | 0.12428936 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.0975 | -| n_updates | 230980 | -| policy_gradient_loss | 0.137 | -| std | 0.00602 | -| value_loss | 5.41e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23100 | -| time_elapsed | 125399 | -| total_timesteps | 2956800 | -| train/ | | -| approx_kl | 0.02455841 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.00735 | -| n_updates | 230990 | -| policy_gradient_loss | 0.0249 | -| std | 0.00602 | -| value_loss | 3.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 23101 | -| time_elapsed | 125403 | -| total_timesteps | 2956928 | -| train/ | | -| approx_kl | 0.26409975 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 231000 | -| policy_gradient_loss | 0.0789 | -| std | 0.006 | -| value_loss | 0.000995 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23102 | -| time_elapsed | 125408 | -| total_timesteps | 2957056 | -| train/ | | -| approx_kl | 0.12529472 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | 0.00893 | -| n_updates | 231010 | -| policy_gradient_loss | -0.00656 | -| std | 0.006 | -| value_loss | 0.00103 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23103 | -| time_elapsed | 125417 | -| total_timesteps | 2957184 | -| train/ | | -| approx_kl | 0.0044923206 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.621 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 231020 | -| policy_gradient_loss | -0.00725 | -| std | 0.006 | -| value_loss | 0.0101 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23104 | -| time_elapsed | 125422 | -| total_timesteps | 2957312 | -| train/ | | -| approx_kl | 0.051027775 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0003 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 231030 | -| policy_gradient_loss | 0.0184 | -| std | 0.00599 | -| value_loss | 9.38e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23105 | -| time_elapsed | 125426 | -| total_timesteps | 2957440 | -| train/ | | -| approx_kl | 0.012736607 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 231040 | -| policy_gradient_loss | 0.0156 | -| std | 0.00599 | -| value_loss | 6.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23106 | -| time_elapsed | 125429 | -| total_timesteps | 2957568 | -| train/ | | -| approx_kl | 0.038890097 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0324 | -| n_updates | 231050 | -| policy_gradient_loss | 0.0231 | -| std | 0.00599 | -| value_loss | 4.6e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23107 | -| time_elapsed | 125434 | -| total_timesteps | 2957696 | -| train/ | | -| approx_kl | 0.2561435 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 231060 | -| policy_gradient_loss | 0.0423 | -| std | 0.00598 | -| value_loss | 3.85e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23108 | -| time_elapsed | 125439 | -| total_timesteps | 2957824 | -| train/ | | -| approx_kl | 0.18205336 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 231070 | -| policy_gradient_loss | 0.0323 | -| std | 0.00598 | -| value_loss | 3.93e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 23109 | -| time_elapsed | 125444 | -| total_timesteps | 2957952 | -| train/ | | -| approx_kl | 0.029360373 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 231080 | -| policy_gradient_loss | 0.0294 | -| std | 0.00598 | -| value_loss | 7.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23110 | -| time_elapsed | 125449 | -| total_timesteps | 2958080 | -| train/ | | -| approx_kl | 0.17423753 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 231090 | -| policy_gradient_loss | 0.0494 | -| std | 0.00598 | -| value_loss | 5.75e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23111 | -| time_elapsed | 125458 | -| total_timesteps | 2958208 | -| train/ | | -| approx_kl | 0.10841802 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.000881 | -| n_updates | 231100 | -| policy_gradient_loss | -0.0139 | -| std | 0.00598 | -| value_loss | 0.000367 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23112 | -| time_elapsed | 125462 | -| total_timesteps | 2958336 | -| train/ | | -| approx_kl | 0.103212 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.28 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 231110 | -| policy_gradient_loss | 0.0264 | -| std | 0.00598 | -| value_loss | 3.66e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23113 | -| time_elapsed | 125466 | -| total_timesteps | 2958464 | -| train/ | | -| approx_kl | 0.13532285 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 231120 | -| policy_gradient_loss | 0.0774 | -| std | 0.00598 | -| value_loss | 4.11e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23114 | -| time_elapsed | 125473 | -| total_timesteps | 2958592 | -| train/ | | -| approx_kl | 0.2792595 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.0981 | -| n_updates | 231130 | -| policy_gradient_loss | 0.0539 | -| std | 0.00598 | -| value_loss | 3.03e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23115 | -| time_elapsed | 125477 | -| total_timesteps | 2958720 | -| train/ | | -| approx_kl | 0.00382919 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 231140 | -| policy_gradient_loss | 0.013 | -| std | 0.00597 | -| value_loss | 2.41e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23116 | -| time_elapsed | 125481 | -| total_timesteps | 2958848 | -| train/ | | -| approx_kl | 0.11253315 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0727 | -| n_updates | 231150 | -| policy_gradient_loss | 0.0975 | -| std | 0.00597 | -| value_loss | 1.48e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 23117 | -| time_elapsed | 125485 | -| total_timesteps | 2958976 | -| train/ | | -| approx_kl | 0.43383807 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.213 | -| n_updates | 231160 | -| policy_gradient_loss | 0.0699 | -| std | 0.00597 | -| value_loss | 1.33e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23118 | -| time_elapsed | 125489 | -| total_timesteps | 2959104 | -| train/ | | -| approx_kl | 0.07317501 | -| clip_fraction | 0.618 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 231170 | -| policy_gradient_loss | 0.0875 | -| std | 0.00597 | -| value_loss | 1.26e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23119 | -| time_elapsed | 125501 | -| total_timesteps | 2959232 | -| train/ | | -| approx_kl | 0.092233956 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 231180 | -| policy_gradient_loss | 0.00166 | -| std | 0.00597 | -| value_loss | 4.77e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23120 | -| time_elapsed | 125505 | -| total_timesteps | 2959360 | -| train/ | | -| approx_kl | 0.60137975 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.29 | -| n_updates | 231190 | -| policy_gradient_loss | 0.18 | -| std | 0.00597 | -| value_loss | 5.03e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23121 | -| time_elapsed | 125509 | -| total_timesteps | 2959488 | -| train/ | | -| approx_kl | 0.091090776 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | 0.05 | -| n_updates | 231200 | -| policy_gradient_loss | 0.0345 | -| std | 0.00597 | -| value_loss | 2.11e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23122 | -| time_elapsed | 125514 | -| total_timesteps | 2959616 | -| train/ | | -| approx_kl | 0.15339169 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 231210 | -| policy_gradient_loss | 0.0179 | -| std | 0.00597 | -| value_loss | 1.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23123 | -| time_elapsed | 125518 | -| total_timesteps | 2959744 | -| train/ | | -| approx_kl | 0.032622963 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.00659 | -| n_updates | 231220 | -| policy_gradient_loss | 0.0351 | -| std | 0.00597 | -| value_loss | 1.12e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23124 | -| time_elapsed | 125524 | -| total_timesteps | 2959872 | -| train/ | | -| approx_kl | 0.33326456 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 231230 | -| policy_gradient_loss | 0.165 | -| std | 0.00597 | -| value_loss | 6.23e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23125 | -| time_elapsed | 125528 | -| total_timesteps | 2960000 | -| train/ | | -| approx_kl | 0.18711998 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 231240 | -| policy_gradient_loss | 0.128 | -| std | 0.00597 | -| value_loss | 4.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23126 | -| time_elapsed | 125532 | -| total_timesteps | 2960128 | -| train/ | | -| approx_kl | 0.04422064 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00482 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 231250 | -| policy_gradient_loss | 0.0348 | -| std | 0.00597 | -| value_loss | 2.98e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23127 | -| time_elapsed | 125544 | -| total_timesteps | 2960256 | -| train/ | | -| approx_kl | 0.28292042 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.609 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 231260 | -| policy_gradient_loss | 0.0553 | -| std | 0.00597 | -| value_loss | 0.0127 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23128 | -| time_elapsed | 125550 | -| total_timesteps | 2960384 | -| train/ | | -| approx_kl | 0.012134511 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 231270 | -| policy_gradient_loss | 0.00995 | -| std | 0.00596 | -| value_loss | 0.000308 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23129 | -| time_elapsed | 125555 | -| total_timesteps | 2960512 | -| train/ | | -| approx_kl | 0.003523958 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 231280 | -| policy_gradient_loss | 0.0121 | -| std | 0.00596 | -| value_loss | 6.67e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23130 | -| time_elapsed | 125561 | -| total_timesteps | 2960640 | -| train/ | | -| approx_kl | 3.7671998e-07 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 6.22e-05 | -| n_updates | 231290 | -| policy_gradient_loss | 0.0323 | -| std | 0.00596 | -| value_loss | 3.52e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23131 | -| time_elapsed | 125566 | -| total_timesteps | 2960768 | -| train/ | | -| approx_kl | 1.2378058 | -| clip_fraction | 0.771 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.53 | -| n_updates | 231300 | -| policy_gradient_loss | 0.208 | -| std | 0.00596 | -| value_loss | 2.15e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.881 | -| time/ | | -| fps | 23 | -| iterations | 23132 | -| time_elapsed | 125572 | -| total_timesteps | 2960896 | -| train/ | | -| approx_kl | 0.015719714 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | -0.00795 | -| n_updates | 231310 | -| policy_gradient_loss | 0.0253 | -| std | 0.00596 | -| value_loss | 1.79e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23133 | -| time_elapsed | 125575 | -| total_timesteps | 2961024 | -| train/ | | -| approx_kl | 0.3446791 | -| clip_fraction | 0.743 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.179 | -| n_updates | 231320 | -| policy_gradient_loss | 0.164 | -| std | 0.00596 | -| value_loss | 1.53e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23134 | -| time_elapsed | 125589 | -| total_timesteps | 2961152 | -| train/ | | -| approx_kl | 0.0041842824 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | 0.00253 | -| n_updates | 231330 | -| policy_gradient_loss | 0.0141 | -| std | 0.00596 | -| value_loss | 0.000643 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23135 | -| time_elapsed | 125594 | -| total_timesteps | 2961280 | -| train/ | | -| approx_kl | 0.0022334312 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.000309 | -| n_updates | 231340 | -| policy_gradient_loss | 0.0283 | -| std | 0.00596 | -| value_loss | 6.37e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23136 | -| time_elapsed | 125600 | -| total_timesteps | 2961408 | -| train/ | | -| approx_kl | 0.003183995 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.0033 | -| n_updates | 231350 | -| policy_gradient_loss | 0.0352 | -| std | 0.00596 | -| value_loss | 3.73e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23137 | -| time_elapsed | 125605 | -| total_timesteps | 2961536 | -| train/ | | -| approx_kl | 0.004413054 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | -0.0115 | -| n_updates | 231360 | -| policy_gradient_loss | 0.0371 | -| std | 0.00596 | -| value_loss | 6.8e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23138 | -| time_elapsed | 125610 | -| total_timesteps | 2961664 | -| train/ | | -| approx_kl | 0.60112447 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.088 | -| n_updates | 231370 | -| policy_gradient_loss | 0.0562 | -| std | 0.00596 | -| value_loss | 4.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23139 | -| time_elapsed | 125616 | -| total_timesteps | 2961792 | -| train/ | | -| approx_kl | 0.008275484 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00605 | -| n_updates | 231380 | -| policy_gradient_loss | 0.0103 | -| std | 0.00596 | -| value_loss | 3.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23140 | -| time_elapsed | 125620 | -| total_timesteps | 2961920 | -| train/ | | -| approx_kl | 0.002179773 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.000694 | -| n_updates | 231390 | -| policy_gradient_loss | 0.00994 | -| std | 0.00596 | -| value_loss | 1.59e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23141 | -| time_elapsed | 125626 | -| total_timesteps | 2962048 | -| train/ | | -| approx_kl | 1.6819686e-05 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | 0.000384 | -| n_updates | 231400 | -| policy_gradient_loss | 0.0479 | -| std | 0.00596 | -| value_loss | 2.34e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23142 | -| time_elapsed | 125634 | -| total_timesteps | 2962176 | -| train/ | | -| approx_kl | 0.062330544 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.000607 | -| n_updates | 231410 | -| policy_gradient_loss | 0.0256 | -| std | 0.00596 | -| value_loss | 0.00105 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23143 | -| time_elapsed | 125640 | -| total_timesteps | 2962304 | -| train/ | | -| approx_kl | 0.39371842 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00808 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 231420 | -| policy_gradient_loss | 0.143 | -| std | 0.00596 | -| value_loss | 7.43e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23144 | -| time_elapsed | 125644 | -| total_timesteps | 2962432 | -| train/ | | -| approx_kl | 0.08033683 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00788 | -| learning_rate | 0.0003 | -| loss | 0.0266 | -| n_updates | 231430 | -| policy_gradient_loss | 0.0356 | -| std | 0.00596 | -| value_loss | 4.11e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23145 | -| time_elapsed | 125649 | -| total_timesteps | 2962560 | -| train/ | | -| approx_kl | 0.1966822 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00672 | -| learning_rate | 0.0003 | -| loss | 0.0683 | -| n_updates | 231440 | -| policy_gradient_loss | 0.0246 | -| std | 0.00596 | -| value_loss | 2.42e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23146 | -| time_elapsed | 125654 | -| total_timesteps | 2962688 | -| train/ | | -| approx_kl | 0.030163618 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.00334 | -| n_updates | 231450 | -| policy_gradient_loss | 0.0321 | -| std | 0.00596 | -| value_loss | 1.76e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23147 | -| time_elapsed | 125659 | -| total_timesteps | 2962816 | -| train/ | | -| approx_kl | 0.44709954 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.213 | -| n_updates | 231460 | -| policy_gradient_loss | 0.174 | -| std | 0.00596 | -| value_loss | 1.48e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23148 | -| time_elapsed | 125663 | -| total_timesteps | 2962944 | -| train/ | | -| approx_kl | 0.067262396 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 231470 | -| policy_gradient_loss | 0.0315 | -| std | 0.00596 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23149 | -| time_elapsed | 125669 | -| total_timesteps | 2963072 | -| train/ | | -| approx_kl | 0.0013266248 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.000307 | -| n_updates | 231480 | -| policy_gradient_loss | 0.0337 | -| std | 0.00596 | -| value_loss | 1.29e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23150 | -| time_elapsed | 125680 | -| total_timesteps | 2963200 | -| train/ | | -| approx_kl | 0.00573161 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.0238 | -| n_updates | 231490 | -| policy_gradient_loss | 0.0116 | -| std | 0.00596 | -| value_loss | 0.00193 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23151 | -| time_elapsed | 125685 | -| total_timesteps | 2963328 | -| train/ | | -| approx_kl | 0.5751271 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00419 | -| learning_rate | 0.0003 | -| loss | 0.256 | -| n_updates | 231500 | -| policy_gradient_loss | 0.0882 | -| std | 0.00596 | -| value_loss | 5.18e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23152 | -| time_elapsed | 125690 | -| total_timesteps | 2963456 | -| train/ | | -| approx_kl | 0.0043193107 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 231510 | -| policy_gradient_loss | 0.0124 | -| std | 0.00596 | -| value_loss | 2.16e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23153 | -| time_elapsed | 125695 | -| total_timesteps | 2963584 | -| train/ | | -| approx_kl | 0.0608523 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00998 | -| learning_rate | 0.0003 | -| loss | 0.0536 | -| n_updates | 231520 | -| policy_gradient_loss | 0.129 | -| std | 0.00596 | -| value_loss | 1.15e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23154 | -| time_elapsed | 125699 | -| total_timesteps | 2963712 | -| train/ | | -| approx_kl | 0.20805085 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 231530 | -| policy_gradient_loss | 0.0321 | -| std | 0.00596 | -| value_loss | 6.24e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23155 | -| time_elapsed | 125704 | -| total_timesteps | 2963840 | -| train/ | | -| approx_kl | 0.043431815 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00954 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 231540 | -| policy_gradient_loss | 0.0423 | -| std | 0.00597 | -| value_loss | 8.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.892 | -| time/ | | -| fps | 23 | -| iterations | 23156 | -| time_elapsed | 125708 | -| total_timesteps | 2963968 | -| train/ | | -| approx_kl | 0.43003157 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | 0.193 | -| n_updates | 231550 | -| policy_gradient_loss | 0.165 | -| std | 0.00597 | -| value_loss | 2.82e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23157 | -| time_elapsed | 125713 | -| total_timesteps | 2964096 | -| train/ | | -| approx_kl | 0.20703919 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 231560 | -| policy_gradient_loss | 0.113 | -| std | 0.00597 | -| value_loss | 1.17e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23158 | -| time_elapsed | 125723 | -| total_timesteps | 2964224 | -| train/ | | -| approx_kl | 0.03161028 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0923 | -| learning_rate | 0.0003 | -| loss | -0.00899 | -| n_updates | 231570 | -| policy_gradient_loss | 0.00152 | -| std | 0.00597 | -| value_loss | 0.00141 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23159 | -| time_elapsed | 125728 | -| total_timesteps | 2964352 | -| train/ | | -| approx_kl | 0.0090182675 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.616 | -| learning_rate | 0.0003 | -| loss | 0.00561 | -| n_updates | 231580 | -| policy_gradient_loss | 0.00868 | -| std | 0.00598 | -| value_loss | 1.37e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23160 | -| time_elapsed | 125733 | -| total_timesteps | 2964480 | -| train/ | | -| approx_kl | 0.07576761 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.576 | -| learning_rate | 0.0003 | -| loss | 0.0542 | -| n_updates | 231590 | -| policy_gradient_loss | 0.0379 | -| std | 0.00598 | -| value_loss | 4.24e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23161 | -| time_elapsed | 125737 | -| total_timesteps | 2964608 | -| train/ | | -| approx_kl | 0.0003045667 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0557 | -| learning_rate | 0.0003 | -| loss | 0.00143 | -| n_updates | 231600 | -| policy_gradient_loss | 0.0436 | -| std | 0.00597 | -| value_loss | 3.04e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23162 | -| time_elapsed | 125741 | -| total_timesteps | 2964736 | -| train/ | | -| approx_kl | 0.70667404 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 231610 | -| policy_gradient_loss | 0.0796 | -| std | 0.00597 | -| value_loss | 2.05e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23163 | -| time_elapsed | 125745 | -| total_timesteps | 2964864 | -| train/ | | -| approx_kl | 0.010017123 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.00452 | -| n_updates | 231620 | -| policy_gradient_loss | 0.0108 | -| std | 0.00598 | -| value_loss | 2.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23164 | -| time_elapsed | 125751 | -| total_timesteps | 2964992 | -| train/ | | -| approx_kl | 0.002752353 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -5.63 | -| learning_rate | 0.0003 | -| loss | -0.00968 | -| n_updates | 231630 | -| policy_gradient_loss | 0.0109 | -| std | 0.00598 | -| value_loss | 6.48e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23165 | -| time_elapsed | 125757 | -| total_timesteps | 2965120 | -| train/ | | -| approx_kl | 0.062404573 | -| clip_fraction | 0.665 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.872 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 231640 | -| policy_gradient_loss | 0.119 | -| std | 0.00598 | -| value_loss | 1.11e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23166 | -| time_elapsed | 125770 | -| total_timesteps | 2965248 | -| train/ | | -| approx_kl | 0.062250197 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.831 | -| learning_rate | 0.0003 | -| loss | 0.00877 | -| n_updates | 231650 | -| policy_gradient_loss | 0.0124 | -| std | 0.00598 | -| value_loss | 0.00294 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23167 | -| time_elapsed | 125775 | -| total_timesteps | 2965376 | -| train/ | | -| approx_kl | 0.014134403 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | 0.00813 | -| n_updates | 231660 | -| policy_gradient_loss | 0.0402 | -| std | 0.00597 | -| value_loss | 1.54e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23168 | -| time_elapsed | 125780 | -| total_timesteps | 2965504 | -| train/ | | -| approx_kl | 0.22882381 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 231670 | -| policy_gradient_loss | 0.0254 | -| std | 0.00596 | -| value_loss | 4.3e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23169 | -| time_elapsed | 125785 | -| total_timesteps | 2965632 | -| train/ | | -| approx_kl | 0.02741765 | -| clip_fraction | 0.189 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 231680 | -| policy_gradient_loss | 0.00346 | -| std | 0.00596 | -| value_loss | 1.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23170 | -| time_elapsed | 125790 | -| total_timesteps | 2965760 | -| train/ | | -| approx_kl | 0.039772805 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | 0.00693 | -| n_updates | 231690 | -| policy_gradient_loss | 0.0444 | -| std | 0.00596 | -| value_loss | 1.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 23171 | -| time_elapsed | 125795 | -| total_timesteps | 2965888 | -| train/ | | -| approx_kl | 0.38198498 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 231700 | -| policy_gradient_loss | 0.146 | -| std | 0.00596 | -| value_loss | 6.88e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23172 | -| time_elapsed | 125800 | -| total_timesteps | 2966016 | -| train/ | | -| approx_kl | 0.19809574 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 231710 | -| policy_gradient_loss | 0.145 | -| std | 0.00596 | -| value_loss | 6.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23173 | -| time_elapsed | 125815 | -| total_timesteps | 2966144 | -| train/ | | -| approx_kl | 0.055406146 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.00814 | -| n_updates | 231720 | -| policy_gradient_loss | 0.0289 | -| std | 0.00596 | -| value_loss | 0.00134 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23174 | -| time_elapsed | 125820 | -| total_timesteps | 2966272 | -| train/ | | -| approx_kl | 0.017630316 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.158 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 231730 | -| policy_gradient_loss | 0.0248 | -| std | 0.00596 | -| value_loss | 2.17e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23175 | -| time_elapsed | 125826 | -| total_timesteps | 2966400 | -| train/ | | -| approx_kl | 0.6375901 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00888 | -| learning_rate | 0.0003 | -| loss | 0.3 | -| n_updates | 231740 | -| policy_gradient_loss | 0.169 | -| std | 0.00596 | -| value_loss | 6.65e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23176 | -| time_elapsed | 125831 | -| total_timesteps | 2966528 | -| train/ | | -| approx_kl | 0.10002062 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.0381 | -| n_updates | 231750 | -| policy_gradient_loss | 0.0291 | -| std | 0.00596 | -| value_loss | 4.7e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23177 | -| time_elapsed | 125836 | -| total_timesteps | 2966656 | -| train/ | | -| approx_kl | 7.498497e-05 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 3.24e-05 | -| n_updates | 231760 | -| policy_gradient_loss | 0.0338 | -| std | 0.00596 | -| value_loss | 2.6e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23178 | -| time_elapsed | 125842 | -| total_timesteps | 2966784 | -| train/ | | -| approx_kl | 0.74670583 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0957 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 231770 | -| policy_gradient_loss | 0.0651 | -| std | 0.00596 | -| value_loss | 3.79e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 23179 | -| time_elapsed | 125847 | -| total_timesteps | 2966912 | -| train/ | | -| approx_kl | 0.05126796 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00637 | -| learning_rate | 0.0003 | -| loss | -0.00678 | -| n_updates | 231780 | -| policy_gradient_loss | -0.0019 | -| std | 0.00596 | -| value_loss | 1.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23180 | -| time_elapsed | 125853 | -| total_timesteps | 2967040 | -| train/ | | -| approx_kl | 0.008979467 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | -0.00555 | -| n_updates | 231790 | -| policy_gradient_loss | 0.00927 | -| std | 0.00596 | -| value_loss | 1.46e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23181 | -| time_elapsed | 125863 | -| total_timesteps | 2967168 | -| train/ | | -| approx_kl | 0.0028489097 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.808 | -| learning_rate | 0.0003 | -| loss | 0.00206 | -| n_updates | 231800 | -| policy_gradient_loss | 0.000374 | -| std | 0.00596 | -| value_loss | 0.00369 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23182 | -| time_elapsed | 125867 | -| total_timesteps | 2967296 | -| train/ | | -| approx_kl | 0.018027395 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.162 | -| learning_rate | 0.0003 | -| loss | 0.00307 | -| n_updates | 231810 | -| policy_gradient_loss | 0.0106 | -| std | 0.00596 | -| value_loss | 2.14e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23183 | -| time_elapsed | 125872 | -| total_timesteps | 2967424 | -| train/ | | -| approx_kl | 0.08676238 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0447 | -| n_updates | 231820 | -| policy_gradient_loss | 0.0179 | -| std | 0.00596 | -| value_loss | 4.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23184 | -| time_elapsed | 125877 | -| total_timesteps | 2967552 | -| train/ | | -| approx_kl | 0.066621155 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 231830 | -| policy_gradient_loss | 0.00858 | -| std | 0.00596 | -| value_loss | 3.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23185 | -| time_elapsed | 125883 | -| total_timesteps | 2967680 | -| train/ | | -| approx_kl | 0.062039126 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0219 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 231840 | -| policy_gradient_loss | 0.00454 | -| std | 0.00596 | -| value_loss | 2.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23186 | -| time_elapsed | 125890 | -| total_timesteps | 2967808 | -| train/ | | -| approx_kl | 0.012770351 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.00331 | -| n_updates | 231850 | -| policy_gradient_loss | 0.0152 | -| std | 0.00596 | -| value_loss | 1.61e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23187 | -| time_elapsed | 125895 | -| total_timesteps | 2967936 | -| train/ | | -| approx_kl | 0.024710964 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 231860 | -| policy_gradient_loss | 0.0181 | -| std | 0.00595 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23188 | -| time_elapsed | 125902 | -| total_timesteps | 2968064 | -| train/ | | -| approx_kl | 0.0023733503 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0564 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 231870 | -| policy_gradient_loss | 0.00428 | -| std | 0.00593 | -| value_loss | 5.74e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23189 | -| time_elapsed | 125915 | -| total_timesteps | 2968192 | -| train/ | | -| approx_kl | 0.07323873 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 231880 | -| policy_gradient_loss | 0.0174 | -| std | 0.00593 | -| value_loss | 0.00245 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23190 | -| time_elapsed | 125920 | -| total_timesteps | 2968320 | -| train/ | | -| approx_kl | 0.015649166 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.515 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 231890 | -| policy_gradient_loss | 0.0433 | -| std | 0.00593 | -| value_loss | 1.27e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23191 | -| time_elapsed | 125925 | -| total_timesteps | 2968448 | -| train/ | | -| approx_kl | 0.9117663 | -| clip_fraction | 0.774 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -4.08 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 231900 | -| policy_gradient_loss | 0.0617 | -| std | 0.00593 | -| value_loss | 4.77e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23192 | -| time_elapsed | 125929 | -| total_timesteps | 2968576 | -| train/ | | -| approx_kl | 0.007898834 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.949 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 231910 | -| policy_gradient_loss | 0.0127 | -| std | 0.00593 | -| value_loss | 1.32e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23193 | -| time_elapsed | 125934 | -| total_timesteps | 2968704 | -| train/ | | -| approx_kl | 0.64291835 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00984 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 231920 | -| policy_gradient_loss | 0.052 | -| std | 0.00593 | -| value_loss | 6.33e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23194 | -| time_elapsed | 125939 | -| total_timesteps | 2968832 | -| train/ | | -| approx_kl | 0.0143269 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00407 | -| n_updates | 231930 | -| policy_gradient_loss | 0.0108 | -| std | 0.00593 | -| value_loss | 1.55e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.9 | -| time/ | | -| fps | 23 | -| iterations | 23195 | -| time_elapsed | 125943 | -| total_timesteps | 2968960 | -| train/ | | -| approx_kl | 0.09071861 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -95.6 | -| learning_rate | 0.0003 | -| loss | 0.000688 | -| n_updates | 231940 | -| policy_gradient_loss | 0.0101 | -| std | 0.00593 | -| value_loss | 4.15e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23196 | -| time_elapsed | 125947 | -| total_timesteps | 2969088 | -| train/ | | -| approx_kl | 1.5392503 | -| clip_fraction | 0.763 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0905 | -| learning_rate | 0.0003 | -| loss | 0.277 | -| n_updates | 231950 | -| policy_gradient_loss | 0.141 | -| std | 0.00593 | -| value_loss | 7.78e-12 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23197 | -| time_elapsed | 125957 | -| total_timesteps | 2969216 | -| train/ | | -| approx_kl | 0.030737014 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 231960 | -| policy_gradient_loss | -0.0125 | -| std | 0.00593 | -| value_loss | 0.00473 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23198 | -| time_elapsed | 125962 | -| total_timesteps | 2969344 | -| train/ | | -| approx_kl | 0.00035606604 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | -0.000187 | -| n_updates | 231970 | -| policy_gradient_loss | 0.0946 | -| std | 0.00592 | -| value_loss | 2.81e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23199 | -| time_elapsed | 125966 | -| total_timesteps | 2969472 | -| train/ | | -| approx_kl | 0.14320895 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00214 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 231980 | -| policy_gradient_loss | 0.183 | -| std | 0.00592 | -| value_loss | 1.4e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23200 | -| time_elapsed | 125971 | -| total_timesteps | 2969600 | -| train/ | | -| approx_kl | 0.1238474 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.338 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 231990 | -| policy_gradient_loss | 0.0545 | -| std | 0.00592 | -| value_loss | 1.46e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23201 | -| time_elapsed | 125976 | -| total_timesteps | 2969728 | -| train/ | | -| approx_kl | 0.16434017 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | 0.0822 | -| n_updates | 232000 | -| policy_gradient_loss | 0.0357 | -| std | 0.00592 | -| value_loss | 9.54e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23202 | -| time_elapsed | 125981 | -| total_timesteps | 2969856 | -| train/ | | -| approx_kl | 0.0010008495 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | -0.00645 | -| n_updates | 232010 | -| policy_gradient_loss | 0.0341 | -| std | 0.00592 | -| value_loss | 8.47e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23203 | -| time_elapsed | 125986 | -| total_timesteps | 2969984 | -| train/ | | -| approx_kl | 0.0014204173 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 232020 | -| policy_gradient_loss | 0.0395 | -| std | 0.00592 | -| value_loss | 5.45e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23204 | -| time_elapsed | 125995 | -| total_timesteps | 2970112 | -| train/ | | -| approx_kl | 0.21835776 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 232030 | -| policy_gradient_loss | 0.00924 | -| std | 0.00592 | -| value_loss | 2.81e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23205 | -| time_elapsed | 126005 | -| total_timesteps | 2970240 | -| train/ | | -| approx_kl | 0.02520067 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 232040 | -| policy_gradient_loss | 0.00964 | -| std | 0.00592 | -| value_loss | 0.000784 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23206 | -| time_elapsed | 126013 | -| total_timesteps | 2970368 | -| train/ | | -| approx_kl | 0.13205266 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.0937 | -| n_updates | 232050 | -| policy_gradient_loss | 0.0532 | -| std | 0.00592 | -| value_loss | 4.42e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23207 | -| time_elapsed | 126020 | -| total_timesteps | 2970496 | -| train/ | | -| approx_kl | 0.68580747 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 232060 | -| policy_gradient_loss | 0.0515 | -| std | 0.00593 | -| value_loss | 3.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23208 | -| time_elapsed | 126026 | -| total_timesteps | 2970624 | -| train/ | | -| approx_kl | 0.015072316 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | 0.00932 | -| n_updates | 232070 | -| policy_gradient_loss | 0.0144 | -| std | 0.00593 | -| value_loss | 3.07e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23209 | -| time_elapsed | 126030 | -| total_timesteps | 2970752 | -| train/ | | -| approx_kl | 0.0036218744 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0437 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 232080 | -| policy_gradient_loss | 0.0116 | -| std | 0.00593 | -| value_loss | 1.97e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23210 | -| time_elapsed | 126035 | -| total_timesteps | 2970880 | -| train/ | | -| approx_kl | 0.058955424 | -| clip_fraction | 0.647 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 0.0831 | -| n_updates | 232090 | -| policy_gradient_loss | 0.119 | -| std | 0.00593 | -| value_loss | 1.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23211 | -| time_elapsed | 126040 | -| total_timesteps | 2971008 | -| train/ | | -| approx_kl | 0.017683804 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | -0.000589 | -| n_updates | 232100 | -| policy_gradient_loss | 0.036 | -| std | 0.00593 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23212 | -| time_elapsed | 126052 | -| total_timesteps | 2971136 | -| train/ | | -| approx_kl | 0.004690843 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.85 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 232110 | -| policy_gradient_loss | -0.00836 | -| std | 0.00593 | -| value_loss | 0.00277 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23213 | -| time_elapsed | 126057 | -| total_timesteps | 2971264 | -| train/ | | -| approx_kl | 0.009541968 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0357 | -| learning_rate | 0.0003 | -| loss | 0.00407 | -| n_updates | 232120 | -| policy_gradient_loss | 0.00606 | -| std | 0.00593 | -| value_loss | 0.0148 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23214 | -| time_elapsed | 126064 | -| total_timesteps | 2971392 | -| train/ | | -| approx_kl | 0.016314056 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | 0.00614 | -| n_updates | 232130 | -| policy_gradient_loss | 0.0442 | -| std | 0.00592 | -| value_loss | 0.00076 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23215 | -| time_elapsed | 126068 | -| total_timesteps | 2971520 | -| train/ | | -| approx_kl | 0.3291883 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0119 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 232140 | -| policy_gradient_loss | 0.132 | -| std | 0.00592 | -| value_loss | 0.000213 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23216 | -| time_elapsed | 126072 | -| total_timesteps | 2971648 | -| train/ | | -| approx_kl | 0.30215997 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 232150 | -| policy_gradient_loss | 0.193 | -| std | 0.00593 | -| value_loss | 0.000155 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23217 | -| time_elapsed | 126076 | -| total_timesteps | 2971776 | -| train/ | | -| approx_kl | 0.049336538 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 232160 | -| policy_gradient_loss | 0.0348 | -| std | 0.00593 | -| value_loss | 0.000134 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23218 | -| time_elapsed | 126082 | -| total_timesteps | 2971904 | -| train/ | | -| approx_kl | 0.22306146 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0808 | -| n_updates | 232170 | -| policy_gradient_loss | 0.0249 | -| std | 0.00593 | -| value_loss | 0.000109 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23219 | -| time_elapsed | 126088 | -| total_timesteps | 2972032 | -| train/ | | -| approx_kl | 0.02947939 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 232180 | -| policy_gradient_loss | 0.0308 | -| std | 0.00593 | -| value_loss | 9.08e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23220 | -| time_elapsed | 126099 | -| total_timesteps | 2972160 | -| train/ | | -| approx_kl | 0.13064724 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.788 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 232190 | -| policy_gradient_loss | -0.00679 | -| std | 0.00593 | -| value_loss | 0.00436 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23221 | -| time_elapsed | 126103 | -| total_timesteps | 2972288 | -| train/ | | -| approx_kl | 0.0032604206 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.00036 | -| n_updates | 232200 | -| policy_gradient_loss | 0.0423 | -| std | 0.00591 | -| value_loss | 1.98e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23222 | -| time_elapsed | 126108 | -| total_timesteps | 2972416 | -| train/ | | -| approx_kl | 0.09184001 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 232210 | -| policy_gradient_loss | 0.109 | -| std | 0.0059 | -| value_loss | 7.37e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23223 | -| time_elapsed | 126112 | -| total_timesteps | 2972544 | -| train/ | | -| approx_kl | 0.0036845743 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00205 | -| learning_rate | 0.0003 | -| loss | 0.00173 | -| n_updates | 232220 | -| policy_gradient_loss | 0.0106 | -| std | 0.00589 | -| value_loss | 3.73e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23224 | -| time_elapsed | 126118 | -| total_timesteps | 2972672 | -| train/ | | -| approx_kl | 0.32989797 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 232230 | -| policy_gradient_loss | 0.045 | -| std | 0.00588 | -| value_loss | 4.09e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23225 | -| time_elapsed | 126124 | -| total_timesteps | 2972800 | -| train/ | | -| approx_kl | 0.27346107 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.000421 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 232240 | -| policy_gradient_loss | 0.063 | -| std | 0.00588 | -| value_loss | 2.13e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23226 | -| time_elapsed | 126129 | -| total_timesteps | 2972928 | -| train/ | | -| approx_kl | 0.005230252 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | -0.00276 | -| n_updates | 232250 | -| policy_gradient_loss | 0.0222 | -| std | 0.00587 | -| value_loss | 1.14e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23227 | -| time_elapsed | 126133 | -| total_timesteps | 2973056 | -| train/ | | -| approx_kl | 5.517993e-05 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | 0.000835 | -| n_updates | 232260 | -| policy_gradient_loss | 0.013 | -| std | 0.00587 | -| value_loss | 7.92e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23228 | -| time_elapsed | 126144 | -| total_timesteps | 2973184 | -| train/ | | -| approx_kl | 0.20014891 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.768 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 232270 | -| policy_gradient_loss | 0.000854 | -| std | 0.00587 | -| value_loss | 0.00081 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23229 | -| time_elapsed | 126149 | -| total_timesteps | 2973312 | -| train/ | | -| approx_kl | 0.064566344 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.343 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 232280 | -| policy_gradient_loss | 0.0358 | -| std | 0.00587 | -| value_loss | 5.74e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23230 | -| time_elapsed | 126154 | -| total_timesteps | 2973440 | -| train/ | | -| approx_kl | 0.39698413 | -| clip_fraction | 0.747 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.335 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 232290 | -| policy_gradient_loss | 0.143 | -| std | 0.00587 | -| value_loss | 5.58e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23231 | -| time_elapsed | 126158 | -| total_timesteps | 2973568 | -| train/ | | -| approx_kl | 0.059947096 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 232300 | -| policy_gradient_loss | 0.0229 | -| std | 0.00587 | -| value_loss | 4.43e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23232 | -| time_elapsed | 126164 | -| total_timesteps | 2973696 | -| train/ | | -| approx_kl | 0.21314579 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 232310 | -| policy_gradient_loss | 0.0324 | -| std | 0.00587 | -| value_loss | 3.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23233 | -| time_elapsed | 126169 | -| total_timesteps | 2973824 | -| train/ | | -| approx_kl | 0.034038164 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | -0.00995 | -| n_updates | 232320 | -| policy_gradient_loss | 0.0296 | -| std | 0.00587 | -| value_loss | 1.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23234 | -| time_elapsed | 126173 | -| total_timesteps | 2973952 | -| train/ | | -| approx_kl | 0.13424824 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | 0.0629 | -| n_updates | 232330 | -| policy_gradient_loss | 0.0339 | -| std | 0.00587 | -| value_loss | 1.19e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23235 | -| time_elapsed | 126179 | -| total_timesteps | 2974080 | -| train/ | | -| approx_kl | 0.00021152431 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 232340 | -| policy_gradient_loss | 0.0326 | -| std | 0.00587 | -| value_loss | 9.69e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23236 | -| time_elapsed | 126190 | -| total_timesteps | 2974208 | -| train/ | | -| approx_kl | 0.19816817 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -3.94 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 232350 | -| policy_gradient_loss | -0.00881 | -| std | 0.00587 | -| value_loss | 0.0034 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23237 | -| time_elapsed | 126197 | -| total_timesteps | 2974336 | -| train/ | | -| approx_kl | 0.85207844 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.508 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 232360 | -| policy_gradient_loss | 0.0414 | -| std | 0.00587 | -| value_loss | 1.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23238 | -| time_elapsed | 126202 | -| total_timesteps | 2974464 | -| train/ | | -| approx_kl | 0.017486673 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | 0.000339 | -| n_updates | 232370 | -| policy_gradient_loss | 0.00927 | -| std | 0.00588 | -| value_loss | 3.58e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23239 | -| time_elapsed | 126208 | -| total_timesteps | 2974592 | -| train/ | | -| approx_kl | 0.008479 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0981 | -| learning_rate | 0.0003 | -| loss | 0.00609 | -| n_updates | 232380 | -| policy_gradient_loss | 0.0186 | -| std | 0.00586 | -| value_loss | 1.55e-07 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23240 | -| time_elapsed | 126214 | -| total_timesteps | 2974720 | -| train/ | | -| approx_kl | 0.0075299004 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0885 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 232390 | -| policy_gradient_loss | 0.015 | -| std | 0.00585 | -| value_loss | 2.46e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23241 | -| time_elapsed | 126219 | -| total_timesteps | 2974848 | -| train/ | | -| approx_kl | 0.004601464 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 232400 | -| policy_gradient_loss | 0.0143 | -| std | 0.00584 | -| value_loss | 1.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23242 | -| time_elapsed | 126223 | -| total_timesteps | 2974976 | -| train/ | | -| approx_kl | 0.06600591 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 232410 | -| policy_gradient_loss | 0.234 | -| std | 0.00584 | -| value_loss | 8.06e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23243 | -| time_elapsed | 126228 | -| total_timesteps | 2975104 | -| train/ | | -| approx_kl | 0.0148150865 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 232420 | -| policy_gradient_loss | 0.0368 | -| std | 0.00584 | -| value_loss | 7.85e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23244 | -| time_elapsed | 126239 | -| total_timesteps | 2975232 | -| train/ | | -| approx_kl | 0.020287622 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -3.75 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 232430 | -| policy_gradient_loss | -0.018 | -| std | 0.00584 | -| value_loss | 0.00302 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23245 | -| time_elapsed | 126244 | -| total_timesteps | 2975360 | -| train/ | | -| approx_kl | 0.08335842 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0831 | -| learning_rate | 0.0003 | -| loss | 0.0427 | -| n_updates | 232440 | -| policy_gradient_loss | 0.0191 | -| std | 0.00584 | -| value_loss | 6.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23246 | -| time_elapsed | 126249 | -| total_timesteps | 2975488 | -| train/ | | -| approx_kl | 0.013177473 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | 0.00415 | -| n_updates | 232450 | -| policy_gradient_loss | 0.0109 | -| std | 0.00584 | -| value_loss | 5.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23247 | -| time_elapsed | 126255 | -| total_timesteps | 2975616 | -| train/ | | -| approx_kl | 0.083797514 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0734 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 232460 | -| policy_gradient_loss | 0.0157 | -| std | 0.00584 | -| value_loss | 5.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23248 | -| time_elapsed | 126259 | -| total_timesteps | 2975744 | -| train/ | | -| approx_kl | 0.04505795 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 232470 | -| policy_gradient_loss | 0.00884 | -| std | 0.00584 | -| value_loss | 3.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 23249 | -| time_elapsed | 126264 | -| total_timesteps | 2975872 | -| train/ | | -| approx_kl | 0.010058625 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.0018 | -| n_updates | 232480 | -| policy_gradient_loss | 0.0078 | -| std | 0.00586 | -| value_loss | 2.16e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23250 | -| time_elapsed | 126268 | -| total_timesteps | 2976000 | -| train/ | | -| approx_kl | 0.0021400126 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -5.57 | -| learning_rate | 0.0003 | -| loss | -4.07e-06 | -| n_updates | 232490 | -| policy_gradient_loss | 0.00685 | -| std | 0.00587 | -| value_loss | 4.24e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23251 | -| time_elapsed | 126274 | -| total_timesteps | 2976128 | -| train/ | | -| approx_kl | 0.09380803 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00709 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 232500 | -| policy_gradient_loss | -0.00258 | -| std | 0.00587 | -| value_loss | 2.91e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23252 | -| time_elapsed | 126285 | -| total_timesteps | 2976256 | -| train/ | | -| approx_kl | 0.15288119 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.714 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 232510 | -| policy_gradient_loss | -0.0164 | -| std | 0.00587 | -| value_loss | 0.00199 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23253 | -| time_elapsed | 126291 | -| total_timesteps | 2976384 | -| train/ | | -| approx_kl | 0.042472303 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.598 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 232520 | -| policy_gradient_loss | 0.0155 | -| std | 0.00587 | -| value_loss | 4.44e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23254 | -| time_elapsed | 126297 | -| total_timesteps | 2976512 | -| train/ | | -| approx_kl | 1.2318014 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.324 | -| n_updates | 232530 | -| policy_gradient_loss | 0.284 | -| std | 0.00587 | -| value_loss | 6.93e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23255 | -| time_elapsed | 126302 | -| total_timesteps | 2976640 | -| train/ | | -| approx_kl | 0.011929296 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.003 | -| learning_rate | 0.0003 | -| loss | 0.00208 | -| n_updates | 232540 | -| policy_gradient_loss | 0.0453 | -| std | 0.00587 | -| value_loss | 3.92e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23256 | -| time_elapsed | 126307 | -| total_timesteps | 2976768 | -| train/ | | -| approx_kl | 0.3038545 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 232550 | -| policy_gradient_loss | 0.0912 | -| std | 0.00587 | -| value_loss | 2.42e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23257 | -| time_elapsed | 126312 | -| total_timesteps | 2976896 | -| train/ | | -| approx_kl | 0.05560301 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0373 | -| n_updates | 232560 | -| policy_gradient_loss | 0.0305 | -| std | 0.00587 | -| value_loss | 1.38e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23258 | -| time_elapsed | 126317 | -| total_timesteps | 2977024 | -| train/ | | -| approx_kl | 0.18711148 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | 0.0733 | -| n_updates | 232570 | -| policy_gradient_loss | 0.0211 | -| std | 0.00587 | -| value_loss | 2.88e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23259 | -| time_elapsed | 126330 | -| total_timesteps | 2977152 | -| train/ | | -| approx_kl | 0.0020745182 | -| clip_fraction | 0.184 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | -0.0198 | -| n_updates | 232580 | -| policy_gradient_loss | -0.013 | -| std | 0.00588 | -| value_loss | 0.000519 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23260 | -| time_elapsed | 126334 | -| total_timesteps | 2977280 | -| train/ | | -| approx_kl | 0.10369287 | -| clip_fraction | 0.586 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00137 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 232590 | -| policy_gradient_loss | 0.0658 | -| std | 0.00588 | -| value_loss | 7.61e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23261 | -| time_elapsed | 126340 | -| total_timesteps | 2977408 | -| train/ | | -| approx_kl | 0.00014695292 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.000842 | -| n_updates | 232600 | -| policy_gradient_loss | 0.134 | -| std | 0.00588 | -| value_loss | 1.16e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23262 | -| time_elapsed | 126345 | -| total_timesteps | 2977536 | -| train/ | | -| approx_kl | 4.8027964 | -| clip_fraction | 0.873 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.265 | -| n_updates | 232610 | -| policy_gradient_loss | 0.239 | -| std | 0.00589 | -| value_loss | 2.9e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23263 | -| time_elapsed | 126349 | -| total_timesteps | 2977664 | -| train/ | | -| approx_kl | 0.039548147 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0737 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 232620 | -| policy_gradient_loss | 0.0347 | -| std | 0.00589 | -| value_loss | 1.21e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23264 | -| time_elapsed | 126354 | -| total_timesteps | 2977792 | -| train/ | | -| approx_kl | 0.2886866 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 232630 | -| policy_gradient_loss | 0.139 | -| std | 0.00589 | -| value_loss | 1.12e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23265 | -| time_elapsed | 126360 | -| total_timesteps | 2977920 | -| train/ | | -| approx_kl | 0.23169503 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 232640 | -| policy_gradient_loss | 0.128 | -| std | 0.00589 | -| value_loss | 9.83e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23266 | -| time_elapsed | 126364 | -| total_timesteps | 2978048 | -| train/ | | -| approx_kl | 0.21024565 | -| clip_fraction | 0.744 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 232650 | -| policy_gradient_loss | 0.172 | -| std | 0.00589 | -| value_loss | 7.41e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23267 | -| time_elapsed | 126374 | -| total_timesteps | 2978176 | -| train/ | | -| approx_kl | 0.15560505 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.952 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 232660 | -| policy_gradient_loss | 0.109 | -| std | 0.00589 | -| value_loss | 0.000297 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23268 | -| time_elapsed | 126378 | -| total_timesteps | 2978304 | -| train/ | | -| approx_kl | 0.030621083 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 232670 | -| policy_gradient_loss | 0.0258 | -| std | 0.00589 | -| value_loss | 1.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23269 | -| time_elapsed | 126382 | -| total_timesteps | 2978432 | -| train/ | | -| approx_kl | 0.22844741 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 232680 | -| policy_gradient_loss | 0.0317 | -| std | 0.00589 | -| value_loss | 3.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23270 | -| time_elapsed | 126387 | -| total_timesteps | 2978560 | -| train/ | | -| approx_kl | 0.021993391 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 232690 | -| policy_gradient_loss | 0.0262 | -| std | 0.00589 | -| value_loss | 2.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23271 | -| time_elapsed | 126393 | -| total_timesteps | 2978688 | -| train/ | | -| approx_kl | 0.12123336 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.0662 | -| n_updates | 232700 | -| policy_gradient_loss | 0.0328 | -| std | 0.00589 | -| value_loss | 1.38e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23272 | -| time_elapsed | 126399 | -| total_timesteps | 2978816 | -| train/ | | -| approx_kl | 0.00014042901 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 232710 | -| policy_gradient_loss | 0.0375 | -| std | 0.00589 | -| value_loss | 1.1e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23273 | -| time_elapsed | 126405 | -| total_timesteps | 2978944 | -| train/ | | -| approx_kl | 0.22559564 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 232720 | -| policy_gradient_loss | 0.0298 | -| std | 0.00589 | -| value_loss | 7.37e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23274 | -| time_elapsed | 126409 | -| total_timesteps | 2979072 | -| train/ | | -| approx_kl | 0.02268581 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00551 | -| n_updates | 232730 | -| policy_gradient_loss | 0.0281 | -| std | 0.00589 | -| value_loss | 4.79e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23275 | -| time_elapsed | 126417 | -| total_timesteps | 2979200 | -| train/ | | -| approx_kl | 0.35426882 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 232740 | -| policy_gradient_loss | 0.172 | -| std | 0.00589 | -| value_loss | 0.000207 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23276 | -| time_elapsed | 126421 | -| total_timesteps | 2979328 | -| train/ | | -| approx_kl | 0.07602933 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00583 | -| learning_rate | 0.0003 | -| loss | 0.0621 | -| n_updates | 232750 | -| policy_gradient_loss | 0.043 | -| std | 0.00589 | -| value_loss | 3.1e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23277 | -| time_elapsed | 126427 | -| total_timesteps | 2979456 | -| train/ | | -| approx_kl | 0.00051734364 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.000914 | -| learning_rate | 0.0003 | -| loss | 0.00334 | -| n_updates | 232760 | -| policy_gradient_loss | 0.0416 | -| std | 0.00589 | -| value_loss | 2.46e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23278 | -| time_elapsed | 126431 | -| total_timesteps | 2979584 | -| train/ | | -| approx_kl | 0.65831643 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00774 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 232770 | -| policy_gradient_loss | 0.0647 | -| std | 0.00589 | -| value_loss | 7.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23279 | -| time_elapsed | 126436 | -| total_timesteps | 2979712 | -| train/ | | -| approx_kl | 0.01603587 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 232780 | -| policy_gradient_loss | 0.00751 | -| std | 0.00589 | -| value_loss | 6.52e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23280 | -| time_elapsed | 126441 | -| total_timesteps | 2979840 | -| train/ | | -| approx_kl | 0.0843318 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 232790 | -| policy_gradient_loss | 0.00288 | -| std | 0.00589 | -| value_loss | 5.11e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 23281 | -| time_elapsed | 126448 | -| total_timesteps | 2979968 | -| train/ | | -| approx_kl | 0.011668965 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | -0.00666 | -| n_updates | 232800 | -| policy_gradient_loss | 0.00658 | -| std | 0.00589 | -| value_loss | 3.86e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23282 | -| time_elapsed | 126454 | -| total_timesteps | 2980096 | -| train/ | | -| approx_kl | 0.00078504905 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0054 | -| n_updates | 232810 | -| policy_gradient_loss | 0.00222 | -| std | 0.00589 | -| value_loss | 2.93e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23283 | -| time_elapsed | 126462 | -| total_timesteps | 2980224 | -| train/ | | -| approx_kl | 0.0039002537 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.715 | -| learning_rate | 0.0003 | -| loss | -0.0302 | -| n_updates | 232820 | -| policy_gradient_loss | -0.0209 | -| std | 0.0059 | -| value_loss | 0.00781 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23284 | -| time_elapsed | 126467 | -| total_timesteps | 2980352 | -| train/ | | -| approx_kl | 0.06394294 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 232830 | -| policy_gradient_loss | 0.0412 | -| std | 0.0059 | -| value_loss | 6.64e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23285 | -| time_elapsed | 126472 | -| total_timesteps | 2980480 | -| train/ | | -| approx_kl | 0.15661818 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00395 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 232840 | -| policy_gradient_loss | 0.0743 | -| std | 0.0059 | -| value_loss | 2.14e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23286 | -| time_elapsed | 126475 | -| total_timesteps | 2980608 | -| train/ | | -| approx_kl | 0.039195895 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 232850 | -| policy_gradient_loss | 0.0412 | -| std | 0.0059 | -| value_loss | 1.51e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23287 | -| time_elapsed | 126478 | -| total_timesteps | 2980736 | -| train/ | | -| approx_kl | 1.0546091 | -| clip_fraction | 0.773 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.261 | -| n_updates | 232860 | -| policy_gradient_loss | 0.231 | -| std | 0.0059 | -| value_loss | 1.13e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23288 | -| time_elapsed | 126482 | -| total_timesteps | 2980864 | -| train/ | | -| approx_kl | 0.010420505 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.00264 | -| n_updates | 232870 | -| policy_gradient_loss | 0.0352 | -| std | 0.0059 | -| value_loss | 5.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23289 | -| time_elapsed | 126486 | -| total_timesteps | 2980992 | -| train/ | | -| approx_kl | 0.112477675 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0969 | -| learning_rate | 0.0003 | -| loss | 0.0702 | -| n_updates | 232880 | -| policy_gradient_loss | 0.0363 | -| std | 0.0059 | -| value_loss | 3.67e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23290 | -| time_elapsed | 126490 | -| total_timesteps | 2981120 | -| train/ | | -| approx_kl | 0.20202464 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0623 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 232890 | -| policy_gradient_loss | 0.0355 | -| std | 0.0059 | -| value_loss | 2.7e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23291 | -| time_elapsed | 126504 | -| total_timesteps | 2981248 | -| train/ | | -| approx_kl | 0.038143028 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | -0.0202 | -| n_updates | 232900 | -| policy_gradient_loss | 0.00368 | -| std | 0.0059 | -| value_loss | 0.00196 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23292 | -| time_elapsed | 126509 | -| total_timesteps | 2981376 | -| train/ | | -| approx_kl | 0.0089316815 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00302 | -| learning_rate | 0.0003 | -| loss | 0.00646 | -| n_updates | 232910 | -| policy_gradient_loss | 0.0222 | -| std | 0.0059 | -| value_loss | 1.13e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23293 | -| time_elapsed | 126514 | -| total_timesteps | 2981504 | -| train/ | | -| approx_kl | 0.024589892 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.00945 | -| n_updates | 232920 | -| policy_gradient_loss | 0.00263 | -| std | 0.0059 | -| value_loss | 2.65e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23294 | -| time_elapsed | 126518 | -| total_timesteps | 2981632 | -| train/ | | -| approx_kl | 0.018940862 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0978 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 232930 | -| policy_gradient_loss | -0.00694 | -| std | 0.0059 | -| value_loss | 1.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23295 | -| time_elapsed | 126521 | -| total_timesteps | 2981760 | -| train/ | | -| approx_kl | 0.03231717 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 232940 | -| policy_gradient_loss | 0.0385 | -| std | 0.0059 | -| value_loss | 2.19e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23296 | -| time_elapsed | 126526 | -| total_timesteps | 2981888 | -| train/ | | -| approx_kl | 0.28558746 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 232950 | -| policy_gradient_loss | 0.108 | -| std | 0.0059 | -| value_loss | 4.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23297 | -| time_elapsed | 126531 | -| total_timesteps | 2982016 | -| train/ | | -| approx_kl | 0.053627443 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 232960 | -| policy_gradient_loss | 0.023 | -| std | 0.00591 | -| value_loss | 4.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23298 | -| time_elapsed | 126542 | -| total_timesteps | 2982144 | -| train/ | | -| approx_kl | 0.05296398 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.792 | -| learning_rate | 0.0003 | -| loss | -0.00576 | -| n_updates | 232970 | -| policy_gradient_loss | 0.0116 | -| std | 0.00591 | -| value_loss | 0.00527 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23299 | -| time_elapsed | 126547 | -| total_timesteps | 2982272 | -| train/ | | -| approx_kl | 0.00356971 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 232980 | -| policy_gradient_loss | 0.0112 | -| std | 0.00591 | -| value_loss | 1.12e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23300 | -| time_elapsed | 126551 | -| total_timesteps | 2982400 | -| train/ | | -| approx_kl | 0.0033345507 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 232990 | -| policy_gradient_loss | 0.0163 | -| std | 0.00591 | -| value_loss | 1.91e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23301 | -| time_elapsed | 126555 | -| total_timesteps | 2982528 | -| train/ | | -| approx_kl | 0.068445064 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0432 | -| learning_rate | 0.0003 | -| loss | 0.0491 | -| n_updates | 233000 | -| policy_gradient_loss | 0.0218 | -| std | 0.0059 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23302 | -| time_elapsed | 126561 | -| total_timesteps | 2982656 | -| train/ | | -| approx_kl | 0.014543568 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.00281 | -| n_updates | 233010 | -| policy_gradient_loss | 0.00802 | -| std | 0.00589 | -| value_loss | 7.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23303 | -| time_elapsed | 126567 | -| total_timesteps | 2982784 | -| train/ | | -| approx_kl | 0.076241076 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 233020 | -| policy_gradient_loss | 0.00778 | -| std | 0.00589 | -| value_loss | 1.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.92 | -| time/ | | -| fps | 23 | -| iterations | 23304 | -| time_elapsed | 126573 | -| total_timesteps | 2982912 | -| train/ | | -| approx_kl | 0.05377462 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 233030 | -| policy_gradient_loss | 0.0166 | -| std | 0.00589 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23305 | -| time_elapsed | 126577 | -| total_timesteps | 2983040 | -| train/ | | -| approx_kl | 0.0074342713 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.00422 | -| n_updates | 233040 | -| policy_gradient_loss | 0.00531 | -| std | 0.00589 | -| value_loss | 6.58e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23306 | -| time_elapsed | 126585 | -| total_timesteps | 2983168 | -| train/ | | -| approx_kl | 0.21791285 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 233050 | -| policy_gradient_loss | 0.0335 | -| std | 0.00589 | -| value_loss | 0.000804 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23307 | -| time_elapsed | 126592 | -| total_timesteps | 2983296 | -| train/ | | -| approx_kl | 0.081546724 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | 0.0854 | -| n_updates | 233060 | -| policy_gradient_loss | 0.0452 | -| std | 0.00589 | -| value_loss | 9.62e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23308 | -| time_elapsed | 126599 | -| total_timesteps | 2983424 | -| train/ | | -| approx_kl | 0.00022396352 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -141 | -| learning_rate | 0.0003 | -| loss | -0.000271 | -| n_updates | 233070 | -| policy_gradient_loss | 0.0435 | -| std | 0.00589 | -| value_loss | 5.23e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23309 | -| time_elapsed | 126604 | -| total_timesteps | 2983552 | -| train/ | | -| approx_kl | 5.0926046 | -| clip_fraction | 0.874 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.309 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 233080 | -| policy_gradient_loss | 0.203 | -| std | 0.0059 | -| value_loss | 2.05e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23310 | -| time_elapsed | 126610 | -| total_timesteps | 2983680 | -| train/ | | -| approx_kl | 0.006876179 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.014 | -| learning_rate | 0.0003 | -| loss | -0.0195 | -| n_updates | 233090 | -| policy_gradient_loss | 0.0406 | -| std | 0.0059 | -| value_loss | 5.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23311 | -| time_elapsed | 126614 | -| total_timesteps | 2983808 | -| train/ | | -| approx_kl | 0.08448139 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 233100 | -| policy_gradient_loss | 0.0304 | -| std | 0.00591 | -| value_loss | 7.92e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23312 | -| time_elapsed | 126619 | -| total_timesteps | 2983936 | -| train/ | | -| approx_kl | 0.18857647 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0941 | -| n_updates | 233110 | -| policy_gradient_loss | 0.0288 | -| std | 0.00591 | -| value_loss | 3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23313 | -| time_elapsed | 126624 | -| total_timesteps | 2984064 | -| train/ | | -| approx_kl | 0.028327873 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | -0.0056 | -| n_updates | 233120 | -| policy_gradient_loss | 0.0271 | -| std | 0.00591 | -| value_loss | 3.13e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23314 | -| time_elapsed | 126632 | -| total_timesteps | 2984192 | -| train/ | | -| approx_kl | 0.26859498 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 233130 | -| policy_gradient_loss | 0.0204 | -| std | 0.00591 | -| value_loss | 0.000212 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23315 | -| time_elapsed | 126637 | -| total_timesteps | 2984320 | -| train/ | | -| approx_kl | 0.11748053 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 233140 | -| policy_gradient_loss | 1.43 | -| std | 0.0059 | -| value_loss | 2.31e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23316 | -| time_elapsed | 126642 | -| total_timesteps | 2984448 | -| train/ | | -| approx_kl | 0.022484306 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00969 | -| learning_rate | 0.0003 | -| loss | -0.00258 | -| n_updates | 233150 | -| policy_gradient_loss | 0.0364 | -| std | 0.0059 | -| value_loss | 9.27e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23317 | -| time_elapsed | 126647 | -| total_timesteps | 2984576 | -| train/ | | -| approx_kl | 0.6115439 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00382 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 233160 | -| policy_gradient_loss | 0.0566 | -| std | 0.0059 | -| value_loss | 5.06e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23318 | -| time_elapsed | 126651 | -| total_timesteps | 2984704 | -| train/ | | -| approx_kl | 0.01115641 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 233170 | -| policy_gradient_loss | 0.00132 | -| std | 0.0059 | -| value_loss | 3.9e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23319 | -| time_elapsed | 126656 | -| total_timesteps | 2984832 | -| train/ | | -| approx_kl | 0.046943735 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | 0.0641 | -| n_updates | 233180 | -| policy_gradient_loss | 0.146 | -| std | 0.0059 | -| value_loss | 2.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23320 | -| time_elapsed | 126660 | -| total_timesteps | 2984960 | -| train/ | | -| approx_kl | 0.102674425 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | 0.0547 | -| n_updates | 233190 | -| policy_gradient_loss | 0.0808 | -| std | 0.0059 | -| value_loss | 4.2e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23321 | -| time_elapsed | 126665 | -| total_timesteps | 2985088 | -| train/ | | -| approx_kl | 0.026736395 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.00531 | -| n_updates | 233200 | -| policy_gradient_loss | 0.0398 | -| std | 0.00591 | -| value_loss | 2.38e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23322 | -| time_elapsed | 126675 | -| total_timesteps | 2985216 | -| train/ | | -| approx_kl | 0.08265865 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0366 | -| learning_rate | 0.0003 | -| loss | 0.00282 | -| n_updates | 233210 | -| policy_gradient_loss | -0.00206 | -| std | 0.0059 | -| value_loss | 0.00199 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23323 | -| time_elapsed | 126681 | -| total_timesteps | 2985344 | -| train/ | | -| approx_kl | 0.019547446 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.00456 | -| n_updates | 233220 | -| policy_gradient_loss | 0.0367 | -| std | 0.0059 | -| value_loss | 7.48e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23324 | -| time_elapsed | 126689 | -| total_timesteps | 2985472 | -| train/ | | -| approx_kl | 0.3248887 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.179 | -| n_updates | 233230 | -| policy_gradient_loss | 0.166 | -| std | 0.0059 | -| value_loss | 1.02e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23325 | -| time_elapsed | 126694 | -| total_timesteps | 2985600 | -| train/ | | -| approx_kl | 0.061150193 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 233240 | -| policy_gradient_loss | 0.0298 | -| std | 0.0059 | -| value_loss | 3.55e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23326 | -| time_elapsed | 126698 | -| total_timesteps | 2985728 | -| train/ | | -| approx_kl | 0.18510067 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0976 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 233250 | -| policy_gradient_loss | 0.0241 | -| std | 0.0059 | -| value_loss | 2.13e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23327 | -| time_elapsed | 126701 | -| total_timesteps | 2985856 | -| train/ | | -| approx_kl | 0.028038546 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0952 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 233260 | -| policy_gradient_loss | 0.0232 | -| std | 0.0059 | -| value_loss | 1.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23328 | -| time_elapsed | 126705 | -| total_timesteps | 2985984 | -| train/ | | -| approx_kl | 0.38223368 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 233270 | -| policy_gradient_loss | 0.167 | -| std | 0.0059 | -| value_loss | 9.52e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23329 | -| time_elapsed | 126711 | -| total_timesteps | 2986112 | -| train/ | | -| approx_kl | 0.05706484 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.00651 | -| n_updates | 233280 | -| policy_gradient_loss | 0.0265 | -| std | 0.0059 | -| value_loss | 9.27e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23330 | -| time_elapsed | 126726 | -| total_timesteps | 2986240 | -| train/ | | -| approx_kl | 0.25371507 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.324 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 233290 | -| policy_gradient_loss | -0.00137 | -| std | 0.0059 | -| value_loss | 0.00149 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23331 | -| time_elapsed | 126731 | -| total_timesteps | 2986368 | -| train/ | | -| approx_kl | 0.051801078 | -| clip_fraction | 0.625 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | -0.0049 | -| n_updates | 233300 | -| policy_gradient_loss | 0.0658 | -| std | 0.0059 | -| value_loss | 3.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23332 | -| time_elapsed | 126735 | -| total_timesteps | 2986496 | -| train/ | | -| approx_kl | 0.024013886 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | -0.00437 | -| n_updates | 233310 | -| policy_gradient_loss | 0.0176 | -| std | 0.0059 | -| value_loss | 5.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23333 | -| time_elapsed | 126739 | -| total_timesteps | 2986624 | -| train/ | | -| approx_kl | 0.046307653 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 233320 | -| policy_gradient_loss | 0.036 | -| std | 0.0059 | -| value_loss | 1.66e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23334 | -| time_elapsed | 126743 | -| total_timesteps | 2986752 | -| train/ | | -| approx_kl | 0.2033527 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.0996 | -| n_updates | 233330 | -| policy_gradient_loss | 0.0498 | -| std | 0.0059 | -| value_loss | 1.21e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23335 | -| time_elapsed | 126747 | -| total_timesteps | 2986880 | -| train/ | | -| approx_kl | 0.0045136176 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.00877 | -| n_updates | 233340 | -| policy_gradient_loss | 0.004 | -| std | 0.0059 | -| value_loss | 9.41e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23336 | -| time_elapsed | 126751 | -| total_timesteps | 2987008 | -| train/ | | -| approx_kl | 6.625615e-05 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.00165 | -| n_updates | 233350 | -| policy_gradient_loss | 0.00224 | -| std | 0.0059 | -| value_loss | 7.45e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23337 | -| time_elapsed | 126761 | -| total_timesteps | 2987136 | -| train/ | | -| approx_kl | 0.016261242 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.643 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 233360 | -| policy_gradient_loss | -0.0153 | -| std | 0.0059 | -| value_loss | 0.001 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23338 | -| time_elapsed | 126767 | -| total_timesteps | 2987264 | -| train/ | | -| approx_kl | 0.24713582 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.136 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 233370 | -| policy_gradient_loss | 0.0921 | -| std | 0.0059 | -| value_loss | 0.000376 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23339 | -| time_elapsed | 126771 | -| total_timesteps | 2987392 | -| train/ | | -| approx_kl | 0.0027102926 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00963 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 233380 | -| policy_gradient_loss | 0.103 | -| std | 0.0059 | -| value_loss | 4.31e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23340 | -| time_elapsed | 126777 | -| total_timesteps | 2987520 | -| train/ | | -| approx_kl | 0.22988877 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | 0.243 | -| n_updates | 233390 | -| policy_gradient_loss | 0.131 | -| std | 0.0059 | -| value_loss | 6.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23341 | -| time_elapsed | 126781 | -| total_timesteps | 2987648 | -| train/ | | -| approx_kl | 0.022960266 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0632 | -| learning_rate | 0.0003 | -| loss | 0.00904 | -| n_updates | 233400 | -| policy_gradient_loss | 0.0103 | -| std | 0.00591 | -| value_loss | 5.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23342 | -| time_elapsed | 126786 | -| total_timesteps | 2987776 | -| train/ | | -| approx_kl | 0.027323665 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.00185 | -| n_updates | 233410 | -| policy_gradient_loss | 0.0353 | -| std | 0.00591 | -| value_loss | 2.22e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23343 | -| time_elapsed | 126792 | -| total_timesteps | 2987904 | -| train/ | | -| approx_kl | 0.3597454 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.191 | -| n_updates | 233420 | -| policy_gradient_loss | 0.149 | -| std | 0.00592 | -| value_loss | 1.86e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23344 | -| time_elapsed | 126798 | -| total_timesteps | 2988032 | -| train/ | | -| approx_kl | 0.06329179 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 233430 | -| policy_gradient_loss | 0.0263 | -| std | 0.00592 | -| value_loss | 1.45e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23345 | -| time_elapsed | 126811 | -| total_timesteps | 2988160 | -| train/ | | -| approx_kl | 0.018940024 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.582 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 233440 | -| policy_gradient_loss | 0.00315 | -| std | 0.0059 | -| value_loss | 0.0153 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23346 | -| time_elapsed | 126815 | -| total_timesteps | 2988288 | -| train/ | | -| approx_kl | 0.5748383 | -| clip_fraction | 0.551 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.919 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 233450 | -| policy_gradient_loss | 0.07 | -| std | 0.0059 | -| value_loss | 0.000286 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23347 | -| time_elapsed | 126819 | -| total_timesteps | 2988416 | -| train/ | | -| approx_kl | 0.00483061 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 233460 | -| policy_gradient_loss | 0.0104 | -| std | 0.00589 | -| value_loss | 0.000131 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23348 | -| time_elapsed | 126825 | -| total_timesteps | 2988544 | -| train/ | | -| approx_kl | 0.0019044988 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 233470 | -| policy_gradient_loss | 0.0133 | -| std | 0.00589 | -| value_loss | 9.12e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23349 | -| time_elapsed | 126830 | -| total_timesteps | 2988672 | -| train/ | | -| approx_kl | 6.546732e-06 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.000186 | -| n_updates | 233480 | -| policy_gradient_loss | 0.0449 | -| std | 0.00589 | -| value_loss | 5.74e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23350 | -| time_elapsed | 126834 | -| total_timesteps | 2988800 | -| train/ | | -| approx_kl | 0.20224185 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 233490 | -| policy_gradient_loss | 0.0574 | -| std | 0.00589 | -| value_loss | 4.77e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23351 | -| time_elapsed | 126838 | -| total_timesteps | 2988928 | -| train/ | | -| approx_kl | 0.07323939 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 233500 | -| policy_gradient_loss | 0.0699 | -| std | 0.00589 | -| value_loss | 3.58e-05 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23352 | -| time_elapsed | 126841 | -| total_timesteps | 2989056 | -| train/ | | -| approx_kl | 1.024669 | -| clip_fraction | 0.751 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.311 | -| n_updates | 233510 | -| policy_gradient_loss | 0.176 | -| std | 0.00589 | -| value_loss | 2.23e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23353 | -| time_elapsed | 126850 | -| total_timesteps | 2989184 | -| train/ | | -| approx_kl | 0.05127666 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -3.81 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 233520 | -| policy_gradient_loss | -0.00194 | -| std | 0.00589 | -| value_loss | 0.00369 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23354 | -| time_elapsed | 126855 | -| total_timesteps | 2989312 | -| train/ | | -| approx_kl | 0.0037706988 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.0029 | -| n_updates | 233530 | -| policy_gradient_loss | 0.0406 | -| std | 0.00589 | -| value_loss | 0.000419 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23355 | -| time_elapsed | 126860 | -| total_timesteps | 2989440 | -| train/ | | -| approx_kl | 0.79255533 | -| clip_fraction | 0.768 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00607 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 233540 | -| policy_gradient_loss | 0.149 | -| std | 0.00589 | -| value_loss | 0.0125 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23356 | -| time_elapsed | 126866 | -| total_timesteps | 2989568 | -| train/ | | -| approx_kl | 0.002655955 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 0.00497 | -| n_updates | 233550 | -| policy_gradient_loss | 0.00165 | -| std | 0.00589 | -| value_loss | 0.00101 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23357 | -| time_elapsed | 126871 | -| total_timesteps | 2989696 | -| train/ | | -| approx_kl | 0.02415388 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | 0.00848 | -| n_updates | 233560 | -| policy_gradient_loss | 0.00196 | -| std | 0.00589 | -| value_loss | 0.000175 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23358 | -| time_elapsed | 126879 | -| total_timesteps | 2989824 | -| train/ | | -| approx_kl | 0.020675767 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.29 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 233570 | -| policy_gradient_loss | -0.00722 | -| std | 0.00589 | -| value_loss | 5.15e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.909 | -| time/ | | -| fps | 23 | -| iterations | 23359 | -| time_elapsed | 126885 | -| total_timesteps | 2989952 | -| train/ | | -| approx_kl | 0.02741523 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 233580 | -| policy_gradient_loss | 0.0352 | -| std | 0.00589 | -| value_loss | 4.04e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23360 | -| time_elapsed | 126892 | -| total_timesteps | 2990080 | -| train/ | | -| approx_kl | 0.1376378 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.0822 | -| n_updates | 233590 | -| policy_gradient_loss | 0.0378 | -| std | 0.00588 | -| value_loss | 2.95e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23361 | -| time_elapsed | 126905 | -| total_timesteps | 2990208 | -| train/ | | -| approx_kl | 0.18022485 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 233600 | -| policy_gradient_loss | -0.00245 | -| std | 0.00588 | -| value_loss | 0.000626 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23362 | -| time_elapsed | 126911 | -| total_timesteps | 2990336 | -| train/ | | -| approx_kl | 0.07036018 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0558 | -| learning_rate | 0.0003 | -| loss | 0.0553 | -| n_updates | 233610 | -| policy_gradient_loss | 0.0341 | -| std | 0.00587 | -| value_loss | 1.61e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23363 | -| time_elapsed | 126916 | -| total_timesteps | 2990464 | -| train/ | | -| approx_kl | 0.7844159 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.305 | -| n_updates | 233620 | -| policy_gradient_loss | 0.206 | -| std | 0.00587 | -| value_loss | 1.61e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23364 | -| time_elapsed | 126921 | -| total_timesteps | 2990592 | -| train/ | | -| approx_kl | 0.24053642 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 233630 | -| policy_gradient_loss | 0.123 | -| std | 0.00587 | -| value_loss | 1.52e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23365 | -| time_elapsed | 126926 | -| total_timesteps | 2990720 | -| train/ | | -| approx_kl | 0.06128299 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.0372 | -| n_updates | 233640 | -| policy_gradient_loss | 0.0364 | -| std | 0.00587 | -| value_loss | 1.11e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23366 | -| time_elapsed | 126931 | -| total_timesteps | 2990848 | -| train/ | | -| approx_kl | 0.0011062585 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00327 | -| n_updates | 233650 | -| policy_gradient_loss | 0.0394 | -| std | 0.00587 | -| value_loss | 1.09e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23367 | -| time_elapsed | 126936 | -| total_timesteps | 2990976 | -| train/ | | -| approx_kl | 0.24624394 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 233660 | -| policy_gradient_loss | 0.0314 | -| std | 0.00587 | -| value_loss | 5.74e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23368 | -| time_elapsed | 126941 | -| total_timesteps | 2991104 | -| train/ | | -| approx_kl | 0.030499518 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.076 | -| learning_rate | 0.0003 | -| loss | 0.00763 | -| n_updates | 233670 | -| policy_gradient_loss | 0.0415 | -| std | 0.00587 | -| value_loss | 4.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23369 | -| time_elapsed | 126952 | -| total_timesteps | 2991232 | -| train/ | | -| approx_kl | 0.25998425 | -| clip_fraction | 0.739 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 233680 | -| policy_gradient_loss | 0.139 | -| std | 0.00587 | -| value_loss | 0.000343 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23370 | -| time_elapsed | 126957 | -| total_timesteps | 2991360 | -| train/ | | -| approx_kl | 0.23619369 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 233690 | -| policy_gradient_loss | 0.141 | -| std | 0.00587 | -| value_loss | 5.43e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23371 | -| time_elapsed | 126961 | -| total_timesteps | 2991488 | -| train/ | | -| approx_kl | 0.14662142 | -| clip_fraction | 0.701 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00755 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 233700 | -| policy_gradient_loss | 0.119 | -| std | 0.00587 | -| value_loss | 4.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23372 | -| time_elapsed | 126967 | -| total_timesteps | 2991616 | -| train/ | | -| approx_kl | 0.033017732 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0116 | -| learning_rate | 0.0003 | -| loss | 0.000262 | -| n_updates | 233710 | -| policy_gradient_loss | 0.0254 | -| std | 0.00587 | -| value_loss | 4.14e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23373 | -| time_elapsed | 126971 | -| total_timesteps | 2991744 | -| train/ | | -| approx_kl | 0.7376133 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 233720 | -| policy_gradient_loss | 0.0764 | -| std | 0.00588 | -| value_loss | 3.77e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 23374 | -| time_elapsed | 126976 | -| total_timesteps | 2991872 | -| train/ | | -| approx_kl | 0.016281644 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | -0.00524 | -| n_updates | 233730 | -| policy_gradient_loss | 0.00701 | -| std | 0.00587 | -| value_loss | 3.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23375 | -| time_elapsed | 126981 | -| total_timesteps | 2992000 | -| train/ | | -| approx_kl | 0.07770556 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0553 | -| n_updates | 233740 | -| policy_gradient_loss | 0.0229 | -| std | 0.00587 | -| value_loss | 2.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23376 | -| time_elapsed | 126985 | -| total_timesteps | 2992128 | -| train/ | | -| approx_kl | 0.051809352 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00338 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 233750 | -| policy_gradient_loss | 0.00821 | -| std | 0.00587 | -| value_loss | 1.27e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23377 | -| time_elapsed | 126998 | -| total_timesteps | 2992256 | -| train/ | | -| approx_kl | 0.04095399 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.983 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 233760 | -| policy_gradient_loss | -0.00528 | -| std | 0.00587 | -| value_loss | 0.000149 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23378 | -| time_elapsed | 127003 | -| total_timesteps | 2992384 | -| train/ | | -| approx_kl | 0.059577797 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00529 | -| learning_rate | 0.0003 | -| loss | 0.0249 | -| n_updates | 233770 | -| policy_gradient_loss | 0.00987 | -| std | 0.00587 | -| value_loss | 2.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23379 | -| time_elapsed | 127007 | -| total_timesteps | 2992512 | -| train/ | | -| approx_kl | 0.04743279 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00636 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 233780 | -| policy_gradient_loss | 0.0131 | -| std | 0.00587 | -| value_loss | 1.26e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23380 | -| time_elapsed | 127012 | -| total_timesteps | 2992640 | -| train/ | | -| approx_kl | 0.06249262 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 233790 | -| policy_gradient_loss | 0.0129 | -| std | 0.00587 | -| value_loss | 8.91e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23381 | -| time_elapsed | 127017 | -| total_timesteps | 2992768 | -| train/ | | -| approx_kl | 0.010336639 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.00174 | -| n_updates | 233800 | -| policy_gradient_loss | 0.00923 | -| std | 0.00587 | -| value_loss | 7.87e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23382 | -| time_elapsed | 127022 | -| total_timesteps | 2992896 | -| train/ | | -| approx_kl | 0.11094856 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 233810 | -| policy_gradient_loss | 0.0258 | -| std | 0.00587 | -| value_loss | 7.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23383 | -| time_elapsed | 127028 | -| total_timesteps | 2993024 | -| train/ | | -| approx_kl | 0.014359448 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0196 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 233820 | -| policy_gradient_loss | 0.0116 | -| std | 0.00586 | -| value_loss | 3.09e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23384 | -| time_elapsed | 127039 | -| total_timesteps | 2993152 | -| train/ | | -| approx_kl | 0.0153043475 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 233830 | -| policy_gradient_loss | 0.00468 | -| std | 0.00586 | -| value_loss | 0.000202 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23385 | -| time_elapsed | 127043 | -| total_timesteps | 2993280 | -| train/ | | -| approx_kl | 0.055559326 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.0569 | -| n_updates | 233840 | -| policy_gradient_loss | 0.162 | -| std | 0.00585 | -| value_loss | 6.89e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23386 | -| time_elapsed | 127047 | -| total_timesteps | 2993408 | -| train/ | | -| approx_kl | 0.015396772 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00927 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 233850 | -| policy_gradient_loss | 0.035 | -| std | 0.00585 | -| value_loss | 2.83e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23387 | -| time_elapsed | 127051 | -| total_timesteps | 2993536 | -| train/ | | -| approx_kl | 1.1119992e-06 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00949 | -| learning_rate | 0.0003 | -| loss | 0.000169 | -| n_updates | 233860 | -| policy_gradient_loss | 0.0322 | -| std | 0.00585 | -| value_loss | 1.36e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23388 | -| time_elapsed | 127056 | -| total_timesteps | 2993664 | -| train/ | | -| approx_kl | 0.2545985 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.0872 | -| n_updates | 233870 | -| policy_gradient_loss | 0.022 | -| std | 0.00586 | -| value_loss | 7.17e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23389 | -| time_elapsed | 127061 | -| total_timesteps | 2993792 | -| train/ | | -| approx_kl | 0.018436987 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.00926 | -| n_updates | 233880 | -| policy_gradient_loss | 0.0372 | -| std | 0.00586 | -| value_loss | 4.06e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23390 | -| time_elapsed | 127065 | -| total_timesteps | 2993920 | -| train/ | | -| approx_kl | 0.16027044 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0561 | -| learning_rate | 0.0003 | -| loss | 0.0961 | -| n_updates | 233890 | -| policy_gradient_loss | 0.0447 | -| std | 0.00585 | -| value_loss | 3.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23391 | -| time_elapsed | 127069 | -| total_timesteps | 2994048 | -| train/ | | -| approx_kl | 0.20617723 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0973 | -| n_updates | 233900 | -| policy_gradient_loss | 0.0389 | -| std | 0.00584 | -| value_loss | 1.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23392 | -| time_elapsed | 127076 | -| total_timesteps | 2994176 | -| train/ | | -| approx_kl | 0.048877038 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | -0.00929 | -| n_updates | 233910 | -| policy_gradient_loss | 0.00821 | -| std | 0.00584 | -| value_loss | 6.73e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23393 | -| time_elapsed | 127082 | -| total_timesteps | 2994304 | -| train/ | | -| approx_kl | 0.0030471897 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | -0.00181 | -| n_updates | 233920 | -| policy_gradient_loss | 0.0378 | -| std | 0.00584 | -| value_loss | 1.21e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23394 | -| time_elapsed | 127087 | -| total_timesteps | 2994432 | -| train/ | | -| approx_kl | 0.0045392364 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 233930 | -| policy_gradient_loss | 0.0393 | -| std | 0.00584 | -| value_loss | 1.15e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23395 | -| time_elapsed | 127091 | -| total_timesteps | 2994560 | -| train/ | | -| approx_kl | 0.52738655 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.204 | -| n_updates | 233940 | -| policy_gradient_loss | 0.0731 | -| std | 0.00584 | -| value_loss | 1.05e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23396 | -| time_elapsed | 127095 | -| total_timesteps | 2994688 | -| train/ | | -| approx_kl | 0.0068193125 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.000561 | -| n_updates | 233950 | -| policy_gradient_loss | 0.0125 | -| std | 0.00585 | -| value_loss | 4.43e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23397 | -| time_elapsed | 127099 | -| total_timesteps | 2994816 | -| train/ | | -| approx_kl | 0.0018296517 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0697 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 233960 | -| policy_gradient_loss | 0.0108 | -| std | 0.00586 | -| value_loss | 4.83e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 23398 | -| time_elapsed | 127104 | -| total_timesteps | 2994944 | -| train/ | | -| approx_kl | 4.1816384e-06 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.00024 | -| n_updates | 233970 | -| policy_gradient_loss | 0.0296 | -| std | 0.00586 | -| value_loss | 2.45e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23399 | -| time_elapsed | 127108 | -| total_timesteps | 2995072 | -| train/ | | -| approx_kl | 0.33195126 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 233980 | -| policy_gradient_loss | 0.0808 | -| std | 0.00586 | -| value_loss | 2.7e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23400 | -| time_elapsed | 127116 | -| total_timesteps | 2995200 | -| train/ | | -| approx_kl | 0.3042459 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 233990 | -| policy_gradient_loss | 0.052 | -| std | 0.00586 | -| value_loss | 0.000373 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23401 | -| time_elapsed | 127120 | -| total_timesteps | 2995328 | -| train/ | | -| approx_kl | 0.29663166 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0807 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 234000 | -| policy_gradient_loss | 0.0371 | -| std | 0.00586 | -| value_loss | 1.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23402 | -| time_elapsed | 127126 | -| total_timesteps | 2995456 | -| train/ | | -| approx_kl | 0.033539467 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00223 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 234010 | -| policy_gradient_loss | 0.0268 | -| std | 0.00586 | -| value_loss | 6.3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23403 | -| time_elapsed | 127129 | -| total_timesteps | 2995584 | -| train/ | | -| approx_kl | 0.15546441 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00813 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 234020 | -| policy_gradient_loss | 0.03 | -| std | 0.00586 | -| value_loss | 4.2e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23404 | -| time_elapsed | 127134 | -| total_timesteps | 2995712 | -| train/ | | -| approx_kl | 0.16740103 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00518 | -| learning_rate | 0.0003 | -| loss | 0.0694 | -| n_updates | 234030 | -| policy_gradient_loss | 0.0249 | -| std | 0.00586 | -| value_loss | 3.16e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23405 | -| time_elapsed | 127138 | -| total_timesteps | 2995840 | -| train/ | | -| approx_kl | 0.01442573 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.000957 | -| n_updates | 234040 | -| policy_gradient_loss | 0.000817 | -| std | 0.00586 | -| value_loss | 2.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 23406 | -| time_elapsed | 127143 | -| total_timesteps | 2995968 | -| train/ | | -| approx_kl | 0.036437992 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 234050 | -| policy_gradient_loss | 0.0324 | -| std | 0.00586 | -| value_loss | 1.98e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23407 | -| time_elapsed | 127149 | -| total_timesteps | 2996096 | -| train/ | | -| approx_kl | 0.3977138 | -| clip_fraction | 0.722 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 234060 | -| policy_gradient_loss | 0.206 | -| std | 0.00586 | -| value_loss | 1.92e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23408 | -| time_elapsed | 127158 | -| total_timesteps | 2996224 | -| train/ | | -| approx_kl | 0.051029406 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | -0.025 | -| n_updates | 234070 | -| policy_gradient_loss | -0.0101 | -| std | 0.00586 | -| value_loss | 0.00194 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23409 | -| time_elapsed | 127162 | -| total_timesteps | 2996352 | -| train/ | | -| approx_kl | 0.0017179223 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.52 | -| learning_rate | 0.0003 | -| loss | -0.00399 | -| n_updates | 234080 | -| policy_gradient_loss | 0.0257 | -| std | 0.00586 | -| value_loss | 6.89e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23410 | -| time_elapsed | 127167 | -| total_timesteps | 2996480 | -| train/ | | -| approx_kl | 0.26301974 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 234090 | -| policy_gradient_loss | 0.0767 | -| std | 0.00587 | -| value_loss | 3.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23411 | -| time_elapsed | 127172 | -| total_timesteps | 2996608 | -| train/ | | -| approx_kl | 0.010103197 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | 0.00611 | -| n_updates | 234100 | -| policy_gradient_loss | 0.0079 | -| std | 0.00587 | -| value_loss | 8.72e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23412 | -| time_elapsed | 127177 | -| total_timesteps | 2996736 | -| train/ | | -| approx_kl | 0.09293914 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 234110 | -| policy_gradient_loss | 0.0146 | -| std | 0.00587 | -| value_loss | 5.7e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23413 | -| time_elapsed | 127182 | -| total_timesteps | 2996864 | -| train/ | | -| approx_kl | 0.5329863 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0762 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 234120 | -| policy_gradient_loss | 0.0386 | -| std | 0.0059 | -| value_loss | 6.49e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.887 | -| time/ | | -| fps | 23 | -| iterations | 23414 | -| time_elapsed | 127187 | -| total_timesteps | 2996992 | -| train/ | | -| approx_kl | 0.7359852 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.119 | -| n_updates | 234130 | -| policy_gradient_loss | 0.0479 | -| std | 0.00592 | -| value_loss | 7.22e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23415 | -| time_elapsed | 127192 | -| total_timesteps | 2997120 | -| train/ | | -| approx_kl | 0.0082039805 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00388 | -| learning_rate | 0.0003 | -| loss | -0.000855 | -| n_updates | 234140 | -| policy_gradient_loss | 0.00811 | -| std | 0.00593 | -| value_loss | 3.62e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23416 | -| time_elapsed | 127203 | -| total_timesteps | 2997248 | -| train/ | | -| approx_kl | 0.13089035 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.939 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 234150 | -| policy_gradient_loss | -0.00559 | -| std | 0.00593 | -| value_loss | 0.00073 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23417 | -| time_elapsed | 127208 | -| total_timesteps | 2997376 | -| train/ | | -| approx_kl | 0.37400773 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -2.56 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 234160 | -| policy_gradient_loss | 0.0387 | -| std | 0.00593 | -| value_loss | 9.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23418 | -| time_elapsed | 127213 | -| total_timesteps | 2997504 | -| train/ | | -| approx_kl | 0.09403933 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 234170 | -| policy_gradient_loss | 0.104 | -| std | 0.00594 | -| value_loss | 1.41e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23419 | -| time_elapsed | 127219 | -| total_timesteps | 2997632 | -| train/ | | -| approx_kl | 4.239427e-05 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.000663 | -| learning_rate | 0.0003 | -| loss | 0.000492 | -| n_updates | 234180 | -| policy_gradient_loss | 0.0867 | -| std | 0.00594 | -| value_loss | 9.81e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23420 | -| time_elapsed | 127224 | -| total_timesteps | 2997760 | -| train/ | | -| approx_kl | 0.17409739 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 234190 | -| policy_gradient_loss | 0.161 | -| std | 0.00594 | -| value_loss | 7.36e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23421 | -| time_elapsed | 127230 | -| total_timesteps | 2997888 | -| train/ | | -| approx_kl | 0.01236284 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0158 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 234200 | -| policy_gradient_loss | 0.0253 | -| std | 0.00594 | -| value_loss | 4.74e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23422 | -| time_elapsed | 127235 | -| total_timesteps | 2998016 | -| train/ | | -| approx_kl | 0.6142687 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.322 | -| n_updates | 234210 | -| policy_gradient_loss | 0.175 | -| std | 0.00594 | -| value_loss | 4.26e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23423 | -| time_elapsed | 127247 | -| total_timesteps | 2998144 | -| train/ | | -| approx_kl | 0.022321105 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 234220 | -| policy_gradient_loss | 0.00142 | -| std | 0.00594 | -| value_loss | 0.0018 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23424 | -| time_elapsed | 127254 | -| total_timesteps | 2998272 | -| train/ | | -| approx_kl | 0.15209815 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | 0.058 | -| n_updates | 234230 | -| policy_gradient_loss | 0.0547 | -| std | 0.00594 | -| value_loss | 6.03e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23425 | -| time_elapsed | 127260 | -| total_timesteps | 2998400 | -| train/ | | -| approx_kl | 0.010441506 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00481 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 234240 | -| policy_gradient_loss | 0.000215 | -| std | 0.00593 | -| value_loss | 1.29e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23426 | -| time_elapsed | 127264 | -| total_timesteps | 2998528 | -| train/ | | -| approx_kl | 0.00046240445 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0134 | -| learning_rate | 0.0003 | -| loss | 0.00643 | -| n_updates | 234250 | -| policy_gradient_loss | -0.00424 | -| std | 0.00593 | -| value_loss | 6.01e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23427 | -| time_elapsed | 127268 | -| total_timesteps | 2998656 | -| train/ | | -| approx_kl | 0.08996505 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.048 | -| n_updates | 234260 | -| policy_gradient_loss | 0.0877 | -| std | 0.00593 | -| value_loss | 4.39e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23428 | -| time_elapsed | 127272 | -| total_timesteps | 2998784 | -| train/ | | -| approx_kl | 0.02203009 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00963 | -| n_updates | 234270 | -| policy_gradient_loss | 0.0101 | -| std | 0.00593 | -| value_loss | 4.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 23429 | -| time_elapsed | 127276 | -| total_timesteps | 2998912 | -| train/ | | -| approx_kl | 0.044720918 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 234280 | -| policy_gradient_loss | 0.0558 | -| std | 0.00593 | -| value_loss | 3.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23430 | -| time_elapsed | 127280 | -| total_timesteps | 2999040 | -| train/ | | -| approx_kl | 0.28091183 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 234290 | -| policy_gradient_loss | 0.0646 | -| std | 0.00593 | -| value_loss | 3.54e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23431 | -| time_elapsed | 127289 | -| total_timesteps | 2999168 | -| train/ | | -| approx_kl | 0.004533626 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.809 | -| learning_rate | 0.0003 | -| loss | -0.00898 | -| n_updates | 234300 | -| policy_gradient_loss | -0.0051 | -| std | 0.00593 | -| value_loss | 0.00416 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23432 | -| time_elapsed | 127293 | -| total_timesteps | 2999296 | -| train/ | | -| approx_kl | 0.0029113744 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | -0.00726 | -| n_updates | 234310 | -| policy_gradient_loss | 0.0104 | -| std | 0.00593 | -| value_loss | 1.43e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23433 | -| time_elapsed | 127298 | -| total_timesteps | 2999424 | -| train/ | | -| approx_kl | 0.08813371 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00696 | -| learning_rate | 0.0003 | -| loss | 0.00097 | -| n_updates | 234320 | -| policy_gradient_loss | 0.0636 | -| std | 0.00593 | -| value_loss | 4.6e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23434 | -| time_elapsed | 127303 | -| total_timesteps | 2999552 | -| train/ | | -| approx_kl | 0.2731102 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00121 | -| learning_rate | 0.0003 | -| loss | 0.079 | -| n_updates | 234330 | -| policy_gradient_loss | 0.0397 | -| std | 0.00593 | -| value_loss | 3.21e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23435 | -| time_elapsed | 127307 | -| total_timesteps | 2999680 | -| train/ | | -| approx_kl | 0.08123816 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 234340 | -| policy_gradient_loss | 0.0854 | -| std | 0.00593 | -| value_loss | 2.54e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23436 | -| time_elapsed | 127311 | -| total_timesteps | 2999808 | -| train/ | | -| approx_kl | 0.00025491742 | -| clip_fraction | 0.586 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 7.65e-05 | -| n_updates | 234350 | -| policy_gradient_loss | 0.116 | -| std | 0.00593 | -| value_loss | 1.66e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 23437 | -| time_elapsed | 127316 | -| total_timesteps | 2999936 | -| train/ | | -| approx_kl | 0.20351315 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 234360 | -| policy_gradient_loss | 0.195 | -| std | 0.00594 | -| value_loss | 1.14e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23438 | -| time_elapsed | 127320 | -| total_timesteps | 3000064 | -| train/ | | -| approx_kl | 0.08230275 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 234370 | -| policy_gradient_loss | 0.02 | -| std | 0.00595 | -| value_loss | 8e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23439 | -| time_elapsed | 127330 | -| total_timesteps | 3000192 | -| train/ | | -| approx_kl | 0.28702807 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | 0.0529 | -| n_updates | 234380 | -| policy_gradient_loss | 0.0167 | -| std | 0.00595 | -| value_loss | 0.00677 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23440 | -| time_elapsed | 127335 | -| total_timesteps | 3000320 | -| train/ | | -| approx_kl | 0.09505321 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | 0.0468 | -| n_updates | 234390 | -| policy_gradient_loss | 0.0879 | -| std | 0.00595 | -| value_loss | 8.08e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23441 | -| time_elapsed | 127339 | -| total_timesteps | 3000448 | -| train/ | | -| approx_kl | 3.0826777e-07 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | -4.89e-05 | -| n_updates | 234400 | -| policy_gradient_loss | 0.0952 | -| std | 0.00595 | -| value_loss | 2.56e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23442 | -| time_elapsed | 127345 | -| total_timesteps | 3000576 | -| train/ | | -| approx_kl | 0.17751503 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0085 | -| learning_rate | 0.0003 | -| loss | 0.0997 | -| n_updates | 234410 | -| policy_gradient_loss | 0.283 | -| std | 0.00596 | -| value_loss | 1.14e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23443 | -| time_elapsed | 127351 | -| total_timesteps | 3000704 | -| train/ | | -| approx_kl | 0.09664191 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | 0.0679 | -| n_updates | 234420 | -| policy_gradient_loss | 0.0552 | -| std | 0.00596 | -| value_loss | 5.19e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23444 | -| time_elapsed | 127356 | -| total_timesteps | 3000832 | -| train/ | | -| approx_kl | 0.34775236 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 234430 | -| policy_gradient_loss | 0.121 | -| std | 0.00597 | -| value_loss | 3.44e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 23445 | -| time_elapsed | 127361 | -| total_timesteps | 3000960 | -| train/ | | -| approx_kl | 0.24210188 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 234440 | -| policy_gradient_loss | 0.172 | -| std | 0.00596 | -| value_loss | 4.67e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23446 | -| time_elapsed | 127365 | -| total_timesteps | 3001088 | -| train/ | | -| approx_kl | 0.15367356 | -| clip_fraction | 0.694 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.307 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 234450 | -| policy_gradient_loss | 0.135 | -| std | 0.00596 | -| value_loss | 8.56e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23447 | -| time_elapsed | 127373 | -| total_timesteps | 3001216 | -| train/ | | -| approx_kl | 0.64720047 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.24 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 234460 | -| policy_gradient_loss | 0.0236 | -| std | 0.00596 | -| value_loss | 0.00344 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23448 | -| time_elapsed | 127377 | -| total_timesteps | 3001344 | -| train/ | | -| approx_kl | 0.079979 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.34 | -| learning_rate | 0.0003 | -| loss | 0.00892 | -| n_updates | 234470 | -| policy_gradient_loss | 0.0181 | -| std | 0.00596 | -| value_loss | 4.12e-06 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23449 | -| time_elapsed | 127382 | -| total_timesteps | 3001472 | -| train/ | | -| approx_kl | 0.0033003665 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -5.69 | -| learning_rate | 0.0003 | -| loss | 0.00134 | -| n_updates | 234480 | -| policy_gradient_loss | 0.00159 | -| std | 0.00596 | -| value_loss | 2.58e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23450 | -| time_elapsed | 127387 | -| total_timesteps | 3001600 | -| train/ | | -| approx_kl | 0.28342754 | -| clip_fraction | 0.742 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00653 | -| learning_rate | 0.0003 | -| loss | 0.182 | -| n_updates | 234490 | -| policy_gradient_loss | 0.235 | -| std | 0.00597 | -| value_loss | 1.2e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23451 | -| time_elapsed | 127391 | -| total_timesteps | 3001728 | -| train/ | | -| approx_kl | 0.2059382 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 234500 | -| policy_gradient_loss | 0.0979 | -| std | 0.00597 | -| value_loss | 1.25e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23452 | -| time_elapsed | 127395 | -| total_timesteps | 3001856 | -| train/ | | -| approx_kl | 0.031453855 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 234510 | -| policy_gradient_loss | 0.0208 | -| std | 0.00597 | -| value_loss | 1.16e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 23453 | -| time_elapsed | 127398 | -| total_timesteps | 3001984 | -| train/ | | -| approx_kl | 0.00065878546 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 234520 | -| policy_gradient_loss | 0.0361 | -| std | 0.00597 | -| value_loss | 8.52e-09 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23454 | -| time_elapsed | 127403 | -| total_timesteps | 3002112 | -| train/ | | -| approx_kl | 0.6057366 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.335 | -| n_updates | 234530 | -| policy_gradient_loss | 0.0932 | -| std | 0.00596 | -| value_loss | 6.62e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23455 | -| time_elapsed | 127414 | -| total_timesteps | 3002240 | -| train/ | | -| approx_kl | 0.11946317 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 234540 | -| policy_gradient_loss | -0.0102 | -| std | 0.00596 | -| value_loss | 5.79e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23456 | -| time_elapsed | 127419 | -| total_timesteps | 3002368 | -| train/ | | -| approx_kl | 0.00029126555 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -50.6 | -| learning_rate | 0.0003 | -| loss | -0.000391 | -| n_updates | 234550 | -| policy_gradient_loss | 0.00576 | -| std | 0.00595 | -| value_loss | 9.01e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23457 | -| time_elapsed | 127424 | -| total_timesteps | 3002496 | -| train/ | | -| approx_kl | 4.6029687e-05 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.488 | -| learning_rate | 0.0003 | -| loss | -0.000449 | -| n_updates | 234560 | -| policy_gradient_loss | 0.0406 | -| std | 0.00593 | -| value_loss | 4.15e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23458 | -| time_elapsed | 127430 | -| total_timesteps | 3002624 | -| train/ | | -| approx_kl | 0.8750684 | -| clip_fraction | 0.774 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | 0.444 | -| n_updates | 234570 | -| policy_gradient_loss | 0.28 | -| std | 0.00593 | -| value_loss | 8.79e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23459 | -| time_elapsed | 127433 | -| total_timesteps | 3002752 | -| train/ | | -| approx_kl | 0.032104228 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.00433 | -| n_updates | 234580 | -| policy_gradient_loss | -0.00229 | -| std | 0.00593 | -| value_loss | 5.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 23460 | -| time_elapsed | 127439 | -| total_timesteps | 3002880 | -| train/ | | -| approx_kl | 0.017832294 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0074 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 234590 | -| policy_gradient_loss | -0.00396 | -| std | 0.00593 | -| value_loss | 3.32e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23461 | -| time_elapsed | 127445 | -| total_timesteps | 3003008 | -| train/ | | -| approx_kl | 0.035131425 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.00719 | -| n_updates | 234600 | -| policy_gradient_loss | 0.0328 | -| std | 0.00593 | -| value_loss | 2.35e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23462 | -| time_elapsed | 127459 | -| total_timesteps | 3003136 | -| train/ | | -| approx_kl | 0.031855956 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.772 | -| learning_rate | 0.0003 | -| loss | 0.00397 | -| n_updates | 234610 | -| policy_gradient_loss | 0.00705 | -| std | 0.00593 | -| value_loss | 0.00594 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23463 | -| time_elapsed | 127465 | -| total_timesteps | 3003264 | -| train/ | | -| approx_kl | 0.016601235 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.13 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 234620 | -| policy_gradient_loss | 0.017 | -| std | 0.00593 | -| value_loss | 0.000433 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23464 | -| time_elapsed | 127470 | -| total_timesteps | 3003392 | -| train/ | | -| approx_kl | 0.15331677 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.000794 | -| learning_rate | 0.0003 | -| loss | 0.094 | -| n_updates | 234630 | -| policy_gradient_loss | 0.046 | -| std | 0.00593 | -| value_loss | 8.22e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23465 | -| time_elapsed | 127474 | -| total_timesteps | 3003520 | -| train/ | | -| approx_kl | 0.15212408 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00129 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 234640 | -| policy_gradient_loss | 0.0282 | -| std | 0.00593 | -| value_loss | 2.62e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23466 | -| time_elapsed | 127478 | -| total_timesteps | 3003648 | -| train/ | | -| approx_kl | 0.03803962 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 234650 | -| policy_gradient_loss | 0.0301 | -| std | 0.00593 | -| value_loss | 2.49e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23467 | -| time_elapsed | 127484 | -| total_timesteps | 3003776 | -| train/ | | -| approx_kl | 0.11661546 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.0697 | -| n_updates | 234660 | -| policy_gradient_loss | 0.0325 | -| std | 0.00594 | -| value_loss | 1.99e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.899 | -| time/ | | -| fps | 23 | -| iterations | 23468 | -| time_elapsed | 127489 | -| total_timesteps | 3003904 | -| train/ | | -| approx_kl | 0.00017549936 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | -0.000958 | -| n_updates | 234670 | -| policy_gradient_loss | 0.0232 | -| std | 0.00594 | -| value_loss | 1.47e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23469 | -| time_elapsed | 127493 | -| total_timesteps | 3004032 | -| train/ | | -| approx_kl | 0.002130161 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 234680 | -| policy_gradient_loss | 0.0395 | -| std | 0.00594 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23470 | -| time_elapsed | 127507 | -| total_timesteps | 3004160 | -| train/ | | -| approx_kl | 0.014957111 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.316 | -| learning_rate | 0.0003 | -| loss | -0.0279 | -| n_updates | 234690 | -| policy_gradient_loss | -0.0147 | -| std | 0.00594 | -| value_loss | 0.00213 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23471 | -| time_elapsed | 127512 | -| total_timesteps | 3004288 | -| train/ | | -| approx_kl | 0.0093154125 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.3 | -| learning_rate | 0.0003 | -| loss | -0.00689 | -| n_updates | 234700 | -| policy_gradient_loss | 0.0331 | -| std | 0.00594 | -| value_loss | 3.02e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23472 | -| time_elapsed | 127518 | -| total_timesteps | 3004416 | -| train/ | | -| approx_kl | 2.9097311e-05 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.000552 | -| n_updates | 234710 | -| policy_gradient_loss | 0.0271 | -| std | 0.00594 | -| value_loss | 1.53e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23473 | -| time_elapsed | 127522 | -| total_timesteps | 3004544 | -| train/ | | -| approx_kl | 0.2970706 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.253 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 234720 | -| policy_gradient_loss | 0.0234 | -| std | 0.00594 | -| value_loss | 5.62e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23474 | -| time_elapsed | 127526 | -| total_timesteps | 3004672 | -| train/ | | -| approx_kl | 0.018913135 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.273 | -| learning_rate | 0.0003 | -| loss | -0.000377 | -| n_updates | 234730 | -| policy_gradient_loss | 0.0292 | -| std | 0.00594 | -| value_loss | 9.6e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23475 | -| time_elapsed | 127530 | -| total_timesteps | 3004800 | -| train/ | | -| approx_kl | 0.3642238 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.203 | -| n_updates | 234740 | -| policy_gradient_loss | 0.155 | -| std | 0.00594 | -| value_loss | 6.39e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 23476 | -| time_elapsed | 127536 | -| total_timesteps | 3004928 | -| train/ | | -| approx_kl | 0.2912729 | -| clip_fraction | 0.747 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 234750 | -| policy_gradient_loss | 0.197 | -| std | 0.00594 | -| value_loss | 5.57e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23477 | -| time_elapsed | 127542 | -| total_timesteps | 3005056 | -| train/ | | -| approx_kl | 0.15722416 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 234760 | -| policy_gradient_loss | 0.121 | -| std | 0.00594 | -| value_loss | 4.85e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23478 | -| time_elapsed | 127551 | -| total_timesteps | 3005184 | -| train/ | | -| approx_kl | 0.092434995 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | 0.0869 | -| n_updates | 234770 | -| policy_gradient_loss | 0.0773 | -| std | 0.00594 | -| value_loss | 0.00429 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23479 | -| time_elapsed | 127556 | -| total_timesteps | 3005312 | -| train/ | | -| approx_kl | 0.21548715 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 234780 | -| policy_gradient_loss | 0.183 | -| std | 0.00594 | -| value_loss | 2.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23480 | -| time_elapsed | 127561 | -| total_timesteps | 3005440 | -| train/ | | -| approx_kl | 0.19643745 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00152 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 234790 | -| policy_gradient_loss | 0.166 | -| std | 0.00594 | -| value_loss | 8.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23481 | -| time_elapsed | 127567 | -| total_timesteps | 3005568 | -| train/ | | -| approx_kl | 0.030748785 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00433 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 234800 | -| policy_gradient_loss | 0.029 | -| std | 0.00594 | -| value_loss | 4.68e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23482 | -| time_elapsed | 127572 | -| total_timesteps | 3005696 | -| train/ | | -| approx_kl | 0.19680442 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0889 | -| n_updates | 234810 | -| policy_gradient_loss | 0.0239 | -| std | 0.00594 | -| value_loss | 3.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23483 | -| time_elapsed | 127577 | -| total_timesteps | 3005824 | -| train/ | | -| approx_kl | 0.019904189 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.025 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 234820 | -| policy_gradient_loss | 0.00542 | -| std | 0.00595 | -| value_loss | 1.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 23484 | -| time_elapsed | 127582 | -| total_timesteps | 3005952 | -| train/ | | -| approx_kl | 0.01843534 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0722 | -| learning_rate | 0.0003 | -| loss | 0.00722 | -| n_updates | 234830 | -| policy_gradient_loss | 0.00351 | -| std | 0.00595 | -| value_loss | 1.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23485 | -| time_elapsed | 127587 | -| total_timesteps | 3006080 | -| train/ | | -| approx_kl | 0.015250767 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 234840 | -| policy_gradient_loss | -0.00522 | -| std | 0.00595 | -| value_loss | 9.4e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23486 | -| time_elapsed | 127595 | -| total_timesteps | 3006208 | -| train/ | | -| approx_kl | 0.7453259 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.342 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 234850 | -| policy_gradient_loss | -0.00171 | -| std | 0.00595 | -| value_loss | 0.00145 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23487 | -| time_elapsed | 127599 | -| total_timesteps | 3006336 | -| train/ | | -| approx_kl | 0.045950096 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -120 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 234860 | -| policy_gradient_loss | -0.000756 | -| std | 0.00596 | -| value_loss | 3.43e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23488 | -| time_elapsed | 127606 | -| total_timesteps | 3006464 | -| train/ | | -| approx_kl | 0.06322664 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | -0.0271 | -| n_updates | 234870 | -| policy_gradient_loss | -0.0144 | -| std | 0.00596 | -| value_loss | 8.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23489 | -| time_elapsed | 127610 | -| total_timesteps | 3006592 | -| train/ | | -| approx_kl | 0.062313847 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -12.9 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 234880 | -| policy_gradient_loss | 0.00707 | -| std | 0.00596 | -| value_loss | 6.78e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23490 | -| time_elapsed | 127615 | -| total_timesteps | 3006720 | -| train/ | | -| approx_kl | 0.06007778 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.089 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 234890 | -| policy_gradient_loss | -0.00155 | -| std | 0.00596 | -| value_loss | 2.92e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23491 | -| time_elapsed | 127621 | -| total_timesteps | 3006848 | -| train/ | | -| approx_kl | 0.009421998 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 234900 | -| policy_gradient_loss | 0.0054 | -| std | 0.00596 | -| value_loss | 3.36e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 23492 | -| time_elapsed | 127630 | -| total_timesteps | 3006976 | -| train/ | | -| approx_kl | 0.09231216 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 234910 | -| policy_gradient_loss | 0.00628 | -| std | 0.00596 | -| value_loss | 2.79e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23493 | -| time_elapsed | 127635 | -| total_timesteps | 3007104 | -| train/ | | -| approx_kl | 0.015078908 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0222 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 234920 | -| policy_gradient_loss | 0.00666 | -| std | 0.00596 | -| value_loss | 2.62e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23494 | -| time_elapsed | 127648 | -| total_timesteps | 3007232 | -| train/ | | -| approx_kl | 0.013307288 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.764 | -| learning_rate | 0.0003 | -| loss | -0.00444 | -| n_updates | 234930 | -| policy_gradient_loss | -0.01 | -| std | 0.00595 | -| value_loss | 0.00648 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23495 | -| time_elapsed | 127652 | -| total_timesteps | 3007360 | -| train/ | | -| approx_kl | 0.037720807 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | -0.00223 | -| n_updates | 234940 | -| policy_gradient_loss | 0.00374 | -| std | 0.00595 | -| value_loss | 1.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23496 | -| time_elapsed | 127660 | -| total_timesteps | 3007488 | -| train/ | | -| approx_kl | 0.008182616 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00344 | -| learning_rate | 0.0003 | -| loss | -0.00679 | -| n_updates | 234950 | -| policy_gradient_loss | 0.00936 | -| std | 0.00595 | -| value_loss | 3.31e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23497 | -| time_elapsed | 127666 | -| total_timesteps | 3007616 | -| train/ | | -| approx_kl | 0.03792781 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 234960 | -| policy_gradient_loss | 0.107 | -| std | 0.00595 | -| value_loss | 2.75e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23498 | -| time_elapsed | 127671 | -| total_timesteps | 3007744 | -| train/ | | -| approx_kl | 0.11158848 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.456 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 234970 | -| policy_gradient_loss | 0.106 | -| std | 0.00595 | -| value_loss | 4.56e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.902 | -| time/ | | -| fps | 23 | -| iterations | 23499 | -| time_elapsed | 127675 | -| total_timesteps | 3007872 | -| train/ | | -| approx_kl | 0.15202406 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.0886 | -| n_updates | 234980 | -| policy_gradient_loss | 0.203 | -| std | 0.00595 | -| value_loss | 3.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23500 | -| time_elapsed | 127680 | -| total_timesteps | 3008000 | -| train/ | | -| approx_kl | 0.028244214 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.416 | -| learning_rate | 0.0003 | -| loss | -0.0284 | -| n_updates | 234990 | -| policy_gradient_loss | 0.0194 | -| std | 0.00595 | -| value_loss | 3.95e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23501 | -| time_elapsed | 127686 | -| total_timesteps | 3008128 | -| train/ | | -| approx_kl | 0.6464695 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00843 | -| learning_rate | 0.0003 | -| loss | 0.201 | -| n_updates | 235000 | -| policy_gradient_loss | 0.0724 | -| std | 0.00595 | -| value_loss | 2.33e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23502 | -| time_elapsed | 127699 | -| total_timesteps | 3008256 | -| train/ | | -| approx_kl | 0.033659842 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.786 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 235010 | -| policy_gradient_loss | 0.00192 | -| std | 0.00595 | -| value_loss | 0.00476 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23503 | -| time_elapsed | 127706 | -| total_timesteps | 3008384 | -| train/ | | -| approx_kl | 0.09741232 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 235020 | -| policy_gradient_loss | 0.0128 | -| std | 0.00595 | -| value_loss | 2.06e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23504 | -| time_elapsed | 127712 | -| total_timesteps | 3008512 | -| train/ | | -| approx_kl | 0.054094434 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00829 | -| learning_rate | 0.0003 | -| loss | 0.00201 | -| n_updates | 235030 | -| policy_gradient_loss | 0.00294 | -| std | 0.00595 | -| value_loss | 5.82e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23505 | -| time_elapsed | 127715 | -| total_timesteps | 3008640 | -| train/ | | -| approx_kl | 0.0075102746 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00426 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 235040 | -| policy_gradient_loss | 0.00415 | -| std | 0.00595 | -| value_loss | 3.41e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23506 | -| time_elapsed | 127720 | -| total_timesteps | 3008768 | -| train/ | | -| approx_kl | 0.026095647 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0163 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 235050 | -| policy_gradient_loss | 0.0169 | -| std | 0.00596 | -| value_loss | 1.48e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 23507 | -| time_elapsed | 127723 | -| total_timesteps | 3008896 | -| train/ | | -| approx_kl | 0.00013984414 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0776 | -| learning_rate | 0.0003 | -| loss | 0.000542 | -| n_updates | 235060 | -| policy_gradient_loss | 0.0151 | -| std | 0.00598 | -| value_loss | 8.78e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23508 | -| time_elapsed | 127726 | -| total_timesteps | 3009024 | -| train/ | | -| approx_kl | 0.24542248 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 235070 | -| policy_gradient_loss | 0.0373 | -| std | 0.00599 | -| value_loss | 5.15e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23509 | -| time_elapsed | 127737 | -| total_timesteps | 3009152 | -| train/ | | -| approx_kl | 0.004001087 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.772 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 235080 | -| policy_gradient_loss | 0.00365 | -| std | 0.00599 | -| value_loss | 0.00618 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23510 | -| time_elapsed | 127743 | -| total_timesteps | 3009280 | -| train/ | | -| approx_kl | 0.015045943 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 235090 | -| policy_gradient_loss | 0.0285 | -| std | 0.00599 | -| value_loss | 8.86e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23511 | -| time_elapsed | 127746 | -| total_timesteps | 3009408 | -| train/ | | -| approx_kl | 0.19038302 | -| clip_fraction | 0.551 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 235100 | -| policy_gradient_loss | 0.0827 | -| std | 0.00599 | -| value_loss | 3.33e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23512 | -| time_elapsed | 127751 | -| total_timesteps | 3009536 | -| train/ | | -| approx_kl | 0.0077216234 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00595 | -| learning_rate | 0.0003 | -| loss | 0.00975 | -| n_updates | 235110 | -| policy_gradient_loss | 0.0112 | -| std | 0.00599 | -| value_loss | 2.06e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23513 | -| time_elapsed | 127758 | -| total_timesteps | 3009664 | -| train/ | | -| approx_kl | 0.030668776 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | 0.0134 | -| n_updates | 235120 | -| policy_gradient_loss | 0.0372 | -| std | 0.00598 | -| value_loss | 8.35e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23514 | -| time_elapsed | 127764 | -| total_timesteps | 3009792 | -| train/ | | -| approx_kl | 0.1430781 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 235130 | -| policy_gradient_loss | 0.0473 | -| std | 0.00598 | -| value_loss | 4.87e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 23515 | -| time_elapsed | 127769 | -| total_timesteps | 3009920 | -| train/ | | -| approx_kl | 0.0004917793 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.0027 | -| n_updates | 235140 | -| policy_gradient_loss | 0.0108 | -| std | 0.00597 | -| value_loss | 4.11e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23516 | -| time_elapsed | 127774 | -| total_timesteps | 3010048 | -| train/ | | -| approx_kl | 0.04463067 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -44.8 | -| learning_rate | 0.0003 | -| loss | -0.000981 | -| n_updates | 235150 | -| policy_gradient_loss | 0.00522 | -| std | 0.00597 | -| value_loss | 2.82e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23517 | -| time_elapsed | 127783 | -| total_timesteps | 3010176 | -| train/ | | -| approx_kl | 0.60341376 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.74 | -| learning_rate | 0.0003 | -| loss | 0.0507 | -| n_updates | 235160 | -| policy_gradient_loss | 0.0151 | -| std | 0.00597 | -| value_loss | 0.00326 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23518 | -| time_elapsed | 127786 | -| total_timesteps | 3010304 | -| train/ | | -| approx_kl | 0.040232174 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.116 | -| learning_rate | 0.0003 | -| loss | 0.0098 | -| n_updates | 235170 | -| policy_gradient_loss | 0.00668 | -| std | 0.00597 | -| value_loss | 1.3e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23519 | -| time_elapsed | 127789 | -| total_timesteps | 3010432 | -| train/ | | -| approx_kl | 0.008010676 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00905 | -| learning_rate | 0.0003 | -| loss | -0.00761 | -| n_updates | 235180 | -| policy_gradient_loss | 0.00583 | -| std | 0.00597 | -| value_loss | 1.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23520 | -| time_elapsed | 127792 | -| total_timesteps | 3010560 | -| train/ | | -| approx_kl | 0.08180278 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 235190 | -| policy_gradient_loss | 0.0131 | -| std | 0.00597 | -| value_loss | 9.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23521 | -| time_elapsed | 127797 | -| total_timesteps | 3010688 | -| train/ | | -| approx_kl | 0.013118857 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | -0.00535 | -| n_updates | 235200 | -| policy_gradient_loss | 0.00378 | -| std | 0.00597 | -| value_loss | 7.87e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23522 | -| time_elapsed | 127802 | -| total_timesteps | 3010816 | -| train/ | | -| approx_kl | 0.15486032 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0656 | -| n_updates | 235210 | -| policy_gradient_loss | 0.0172 | -| std | 0.006 | -| value_loss | 8.69e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.922 | -| time/ | | -| fps | 23 | -| iterations | 23523 | -| time_elapsed | 127808 | -| total_timesteps | 3010944 | -| train/ | | -| approx_kl | 0.2601213 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.65 | -| learning_rate | 0.0003 | -| loss | 0.0624 | -| n_updates | 235220 | -| policy_gradient_loss | 0.0026 | -| std | 0.00601 | -| value_loss | 1.4e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23524 | -| time_elapsed | 127813 | -| total_timesteps | 3011072 | -| train/ | | -| approx_kl | 0.051555857 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.358 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 235230 | -| policy_gradient_loss | 0.0452 | -| std | 0.00601 | -| value_loss | 3.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23525 | -| time_elapsed | 127822 | -| total_timesteps | 3011200 | -| train/ | | -| approx_kl | 0.11674401 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.911 | -| learning_rate | 0.0003 | -| loss | 0.0133 | -| n_updates | 235240 | -| policy_gradient_loss | -0.00358 | -| std | 0.00601 | -| value_loss | 0.00137 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23526 | -| time_elapsed | 127828 | -| total_timesteps | 3011328 | -| train/ | | -| approx_kl | 0.014453332 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | 0.00468 | -| n_updates | 235250 | -| policy_gradient_loss | 0.00151 | -| std | 0.00601 | -| value_loss | 7.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23527 | -| time_elapsed | 127833 | -| total_timesteps | 3011456 | -| train/ | | -| approx_kl | 0.02586631 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00703 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 235260 | -| policy_gradient_loss | 0.0341 | -| std | 0.00601 | -| value_loss | 1.56e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23528 | -| time_elapsed | 127838 | -| total_timesteps | 3011584 | -| train/ | | -| approx_kl | 0.46364537 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 235270 | -| policy_gradient_loss | 0.14 | -| std | 0.00601 | -| value_loss | 2.27e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23529 | -| time_elapsed | 127842 | -| total_timesteps | 3011712 | -| train/ | | -| approx_kl | 0.0027997354 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0884 | -| learning_rate | 0.0003 | -| loss | -5.71e-05 | -| n_updates | 235280 | -| policy_gradient_loss | 0.0794 | -| std | 0.00601 | -| value_loss | 4.61e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23530 | -| time_elapsed | 127848 | -| total_timesteps | 3011840 | -| train/ | | -| approx_kl | 0.025474988 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.14 | -| learning_rate | 0.0003 | -| loss | -0.00644 | -| n_updates | 235290 | -| policy_gradient_loss | 0.0271 | -| std | 0.00602 | -| value_loss | 3.13e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 23531 | -| time_elapsed | 127854 | -| total_timesteps | 3011968 | -| train/ | | -| approx_kl | 0.008670976 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | -0.00113 | -| n_updates | 235300 | -| policy_gradient_loss | 0.0283 | -| std | 0.00602 | -| value_loss | 2.17e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23532 | -| time_elapsed | 127859 | -| total_timesteps | 3012096 | -| train/ | | -| approx_kl | 0.045345873 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0699 | -| learning_rate | 0.0003 | -| loss | 0.00946 | -| n_updates | 235310 | -| policy_gradient_loss | 0.0283 | -| std | 0.00602 | -| value_loss | 1.66e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23533 | -| time_elapsed | 127868 | -| total_timesteps | 3012224 | -| train/ | | -| approx_kl | 0.0063328673 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.766 | -| learning_rate | 0.0003 | -| loss | -0.00185 | -| n_updates | 235320 | -| policy_gradient_loss | 0.134 | -| std | 0.00602 | -| value_loss | 0.00319 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23534 | -| time_elapsed | 127872 | -| total_timesteps | 3012352 | -| train/ | | -| approx_kl | 0.021592256 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.47 | -| learning_rate | 0.0003 | -| loss | 0.00908 | -| n_updates | 235330 | -| policy_gradient_loss | 0.0296 | -| std | 0.00602 | -| value_loss | 2.14e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23535 | -| time_elapsed | 127876 | -| total_timesteps | 3012480 | -| train/ | | -| approx_kl | 0.065245464 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.000398 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 235340 | -| policy_gradient_loss | 0.0312 | -| std | 0.00602 | -| value_loss | 1.91e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23536 | -| time_elapsed | 127881 | -| total_timesteps | 3012608 | -| train/ | | -| approx_kl | 0.6590431 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0746 | -| learning_rate | 0.0003 | -| loss | 0.237 | -| n_updates | 235350 | -| policy_gradient_loss | 0.185 | -| std | 0.00602 | -| value_loss | 9.88e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23537 | -| time_elapsed | 127887 | -| total_timesteps | 3012736 | -| train/ | | -| approx_kl | 0.104980245 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | 0.0625 | -| n_updates | 235360 | -| policy_gradient_loss | 0.0353 | -| std | 0.00602 | -| value_loss | 6.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23538 | -| time_elapsed | 127891 | -| total_timesteps | 3012864 | -| train/ | | -| approx_kl | 0.005285882 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 235370 | -| policy_gradient_loss | 0.0097 | -| std | 0.00602 | -| value_loss | 5.61e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 23539 | -| time_elapsed | 127896 | -| total_timesteps | 3012992 | -| train/ | | -| approx_kl | 0.2078599 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 235380 | -| policy_gradient_loss | 0.122 | -| std | 0.00602 | -| value_loss | 3.3e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23540 | -| time_elapsed | 127900 | -| total_timesteps | 3013120 | -| train/ | | -| approx_kl | 0.1326121 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | 0.0906 | -| n_updates | 235390 | -| policy_gradient_loss | 0.108 | -| std | 0.00602 | -| value_loss | 3.14e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23541 | -| time_elapsed | 127913 | -| total_timesteps | 3013248 | -| train/ | | -| approx_kl | 0.23896447 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 235400 | -| policy_gradient_loss | 0.0336 | -| std | 0.00602 | -| value_loss | 0.000408 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23542 | -| time_elapsed | 127918 | -| total_timesteps | 3013376 | -| train/ | | -| approx_kl | 0.19885159 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0818 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 235410 | -| policy_gradient_loss | 0.13 | -| std | 0.00602 | -| value_loss | 9.69e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23543 | -| time_elapsed | 127924 | -| total_timesteps | 3013504 | -| train/ | | -| approx_kl | 0.035827905 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0912 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 235420 | -| policy_gradient_loss | 0.0279 | -| std | 0.00602 | -| value_loss | 7.08e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23544 | -| time_elapsed | 127929 | -| total_timesteps | 3013632 | -| train/ | | -| approx_kl | 0.17101671 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.0865 | -| n_updates | 235430 | -| policy_gradient_loss | 0.0238 | -| std | 0.00602 | -| value_loss | 4.67e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23545 | -| time_elapsed | 127934 | -| total_timesteps | 3013760 | -| train/ | | -| approx_kl | 0.01600999 | -| clip_fraction | 0.137 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0562 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 235440 | -| policy_gradient_loss | -0.00921 | -| std | 0.00602 | -| value_loss | 3.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23546 | -| time_elapsed | 127939 | -| total_timesteps | 3013888 | -| train/ | | -| approx_kl | 0.01861943 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.00864 | -| n_updates | 235450 | -| policy_gradient_loss | -0.00474 | -| std | 0.00602 | -| value_loss | 2.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23547 | -| time_elapsed | 127944 | -| total_timesteps | 3014016 | -| train/ | | -| approx_kl | 0.015716529 | -| clip_fraction | 0.133 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | -0.00914 | -| n_updates | 235460 | -| policy_gradient_loss | -0.0047 | -| std | 0.00602 | -| value_loss | 2.25e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23548 | -| time_elapsed | 127956 | -| total_timesteps | 3014144 | -| train/ | | -| approx_kl | 0.00465988 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.0269 | -| n_updates | 235470 | -| policy_gradient_loss | -0.00887 | -| std | 0.00602 | -| value_loss | 0.000151 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23549 | -| time_elapsed | 127961 | -| total_timesteps | 3014272 | -| train/ | | -| approx_kl | 0.0047971406 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.472 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 235480 | -| policy_gradient_loss | 0.0284 | -| std | 0.00602 | -| value_loss | 2.94e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23550 | -| time_elapsed | 127966 | -| total_timesteps | 3014400 | -| train/ | | -| approx_kl | 1.1735218 | -| clip_fraction | 0.782 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.883 | -| learning_rate | 0.0003 | -| loss | 0.332 | -| n_updates | 235490 | -| policy_gradient_loss | 0.156 | -| std | 0.00602 | -| value_loss | 6.09e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23551 | -| time_elapsed | 127969 | -| total_timesteps | 3014528 | -| train/ | | -| approx_kl | 0.010133686 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -8.17 | -| learning_rate | 0.0003 | -| loss | -0.00917 | -| n_updates | 235500 | -| policy_gradient_loss | 0.0102 | -| std | 0.00602 | -| value_loss | 4.35e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23552 | -| time_elapsed | 127974 | -| total_timesteps | 3014656 | -| train/ | | -| approx_kl | 0.0014031152 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.92 | -| learning_rate | 0.0003 | -| loss | -0.00296 | -| n_updates | 235510 | -| policy_gradient_loss | 0.00379 | -| std | 0.00602 | -| value_loss | 7.53e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23553 | -| time_elapsed | 127979 | -| total_timesteps | 3014784 | -| train/ | | -| approx_kl | 0.12487023 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | 0.0581 | -| n_updates | 235520 | -| policy_gradient_loss | 0.11 | -| std | 0.00601 | -| value_loss | 6.52e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23554 | -| time_elapsed | 127984 | -| total_timesteps | 3014912 | -| train/ | | -| approx_kl | 0.057410825 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00863 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 235530 | -| policy_gradient_loss | 0.0267 | -| std | 0.00601 | -| value_loss | 2.85e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23555 | -| time_elapsed | 127990 | -| total_timesteps | 3015040 | -| train/ | | -| approx_kl | 0.25681844 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 235540 | -| policy_gradient_loss | 0.0539 | -| std | 0.00602 | -| value_loss | 1.1e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23556 | -| time_elapsed | 128004 | -| total_timesteps | 3015168 | -| train/ | | -| approx_kl | 0.04645127 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.564 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 235550 | -| policy_gradient_loss | 0.0599 | -| std | 0.00602 | -| value_loss | 0.0108 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23557 | -| time_elapsed | 128010 | -| total_timesteps | 3015296 | -| train/ | | -| approx_kl | 0.025180953 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.704 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 235560 | -| policy_gradient_loss | 0.00719 | -| std | 0.00602 | -| value_loss | 2.53e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23558 | -| time_elapsed | 128015 | -| total_timesteps | 3015424 | -| train/ | | -| approx_kl | 0.18474464 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0817 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 235570 | -| policy_gradient_loss | 0.0474 | -| std | 0.00601 | -| value_loss | 4.76e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23559 | -| time_elapsed | 128020 | -| total_timesteps | 3015552 | -| train/ | | -| approx_kl | 0.0706698 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -8.01 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 235580 | -| policy_gradient_loss | 0.0322 | -| std | 0.00601 | -| value_loss | 1.34e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23560 | -| time_elapsed | 128025 | -| total_timesteps | 3015680 | -| train/ | | -| approx_kl | 0.0027980558 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00791 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 235590 | -| policy_gradient_loss | 0.112 | -| std | 0.00601 | -| value_loss | 5.44e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23561 | -| time_elapsed | 128030 | -| total_timesteps | 3015808 | -| train/ | | -| approx_kl | 0.04048878 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.25 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 235600 | -| policy_gradient_loss | 0.04 | -| std | 0.00601 | -| value_loss | 2.56e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23562 | -| time_elapsed | 128034 | -| total_timesteps | 3015936 | -| train/ | | -| approx_kl | 0.33747005 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | 0.267 | -| n_updates | 235610 | -| policy_gradient_loss | 0.197 | -| std | 0.00601 | -| value_loss | 4.67e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23563 | -| time_elapsed | 128039 | -| total_timesteps | 3016064 | -| train/ | | -| approx_kl | 0.067387275 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | -0.00596 | -| n_updates | 235620 | -| policy_gradient_loss | 0.0198 | -| std | 0.00601 | -| value_loss | 4.59e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23564 | -| time_elapsed | 128048 | -| total_timesteps | 3016192 | -| train/ | | -| approx_kl | 0.0028062942 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 235630 | -| policy_gradient_loss | 0.00763 | -| std | 0.00601 | -| value_loss | 0.00579 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23565 | -| time_elapsed | 128053 | -| total_timesteps | 3016320 | -| train/ | | -| approx_kl | 0.012011537 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.372 | -| learning_rate | 0.0003 | -| loss | -0.00935 | -| n_updates | 235640 | -| policy_gradient_loss | 0.0229 | -| std | 0.00601 | -| value_loss | 2.81e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23566 | -| time_elapsed | 128056 | -| total_timesteps | 3016448 | -| train/ | | -| approx_kl | 0.39643708 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 235650 | -| policy_gradient_loss | 0.218 | -| std | 0.00601 | -| value_loss | 5.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23567 | -| time_elapsed | 128059 | -| total_timesteps | 3016576 | -| train/ | | -| approx_kl | 0.049568534 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00121 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 235660 | -| policy_gradient_loss | 0.0292 | -| std | 0.00601 | -| value_loss | 2.78e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23568 | -| time_elapsed | 128064 | -| total_timesteps | 3016704 | -| train/ | | -| approx_kl | 0.0009772489 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.00119 | -| n_updates | 235670 | -| policy_gradient_loss | 0.0338 | -| std | 0.00601 | -| value_loss | 1.76e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23569 | -| time_elapsed | 128070 | -| total_timesteps | 3016832 | -| train/ | | -| approx_kl | 0.6352013 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0707 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 235680 | -| policy_gradient_loss | 0.0508 | -| std | 0.00601 | -| value_loss | 7.95e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23570 | -| time_elapsed | 128076 | -| total_timesteps | 3016960 | -| train/ | | -| approx_kl | 0.044617448 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0997 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 235690 | -| policy_gradient_loss | 0.00757 | -| std | 0.00601 | -| value_loss | 6.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23571 | -| time_elapsed | 128081 | -| total_timesteps | 3017088 | -| train/ | | -| approx_kl | 0.06532672 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 235700 | -| policy_gradient_loss | 0.0211 | -| std | 0.00601 | -| value_loss | 4.77e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23572 | -| time_elapsed | 128090 | -| total_timesteps | 3017216 | -| train/ | | -| approx_kl | 0.0023560426 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.00653 | -| n_updates | 235710 | -| policy_gradient_loss | -0.000231 | -| std | 0.006 | -| value_loss | 0.00151 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23573 | -| time_elapsed | 128095 | -| total_timesteps | 3017344 | -| train/ | | -| approx_kl | 0.009242449 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00337 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 235720 | -| policy_gradient_loss | 0.00894 | -| std | 0.00599 | -| value_loss | 6.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23574 | -| time_elapsed | 128100 | -| total_timesteps | 3017472 | -| train/ | | -| approx_kl | 0.032579154 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0119 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 235730 | -| policy_gradient_loss | 0.0251 | -| std | 0.00601 | -| value_loss | 5.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23575 | -| time_elapsed | 128104 | -| total_timesteps | 3017600 | -| train/ | | -| approx_kl | 0.015756423 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 235740 | -| policy_gradient_loss | 0.0109 | -| std | 0.00601 | -| value_loss | 1.46e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23576 | -| time_elapsed | 128109 | -| total_timesteps | 3017728 | -| train/ | | -| approx_kl | 0.09339595 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 235750 | -| policy_gradient_loss | 0.0185 | -| std | 0.00601 | -| value_loss | 3.35e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23577 | -| time_elapsed | 128115 | -| total_timesteps | 3017856 | -| train/ | | -| approx_kl | 0.17420524 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 235760 | -| policy_gradient_loss | 0.0848 | -| std | 0.00602 | -| value_loss | 2.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23578 | -| time_elapsed | 128120 | -| total_timesteps | 3017984 | -| train/ | | -| approx_kl | 0.20752433 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 235770 | -| policy_gradient_loss | 0.0259 | -| std | 0.00602 | -| value_loss | 1.67e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23579 | -| time_elapsed | 128126 | -| total_timesteps | 3018112 | -| train/ | | -| approx_kl | 0.5849284 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 235780 | -| policy_gradient_loss | 0.0524 | -| std | 0.00602 | -| value_loss | 7.94e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23580 | -| time_elapsed | 128138 | -| total_timesteps | 3018240 | -| train/ | | -| approx_kl | 0.12854366 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.897 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 235790 | -| policy_gradient_loss | -0.0123 | -| std | 0.00602 | -| value_loss | 0.00174 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23581 | -| time_elapsed | 128142 | -| total_timesteps | 3018368 | -| train/ | | -| approx_kl | 0.0021188506 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.00365 | -| n_updates | 235800 | -| policy_gradient_loss | 0.0102 | -| std | 0.00602 | -| value_loss | 6.51e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23582 | -| time_elapsed | 128147 | -| total_timesteps | 3018496 | -| train/ | | -| approx_kl | 0.006546137 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00625 | -| learning_rate | 0.0003 | -| loss | -0.000858 | -| n_updates | 235810 | -| policy_gradient_loss | 0.00976 | -| std | 0.00601 | -| value_loss | 1.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23583 | -| time_elapsed | 128152 | -| total_timesteps | 3018624 | -| train/ | | -| approx_kl | 0.08984044 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 235820 | -| policy_gradient_loss | 0.0355 | -| std | 0.00601 | -| value_loss | 1.18e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23584 | -| time_elapsed | 128156 | -| total_timesteps | 3018752 | -| train/ | | -| approx_kl | 0.99762994 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.394 | -| n_updates | 235830 | -| policy_gradient_loss | 0.23 | -| std | 0.00601 | -| value_loss | 9.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 23585 | -| time_elapsed | 128160 | -| total_timesteps | 3018880 | -| train/ | | -| approx_kl | 0.06028151 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0485 | -| n_updates | 235840 | -| policy_gradient_loss | 0.0101 | -| std | 0.00601 | -| value_loss | 5.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23586 | -| time_elapsed | 128165 | -| total_timesteps | 3019008 | -| train/ | | -| approx_kl | 0.75559646 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0611 | -| learning_rate | 0.0003 | -| loss | 0.234 | -| n_updates | 235850 | -| policy_gradient_loss | 0.0763 | -| std | 0.00602 | -| value_loss | 4.22e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23587 | -| time_elapsed | 128176 | -| total_timesteps | 3019136 | -| train/ | | -| approx_kl | 0.12392253 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 235860 | -| policy_gradient_loss | -0.0169 | -| std | 0.00601 | -| value_loss | 0.000166 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23588 | -| time_elapsed | 128182 | -| total_timesteps | 3019264 | -| train/ | | -| approx_kl | 0.05851374 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.235 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 235870 | -| policy_gradient_loss | 0.0341 | -| std | 0.00601 | -| value_loss | 0.000153 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23589 | -| time_elapsed | 128186 | -| total_timesteps | 3019392 | -| train/ | | -| approx_kl | 0.9351659 | -| clip_fraction | 0.759 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.284 | -| n_updates | 235880 | -| policy_gradient_loss | 0.15 | -| std | 0.00602 | -| value_loss | 5.4e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23590 | -| time_elapsed | 128192 | -| total_timesteps | 3019520 | -| train/ | | -| approx_kl | 0.006667675 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00569 | -| n_updates | 235890 | -| policy_gradient_loss | 0.0212 | -| std | 0.00602 | -| value_loss | 1.44e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23591 | -| time_elapsed | 128198 | -| total_timesteps | 3019648 | -| train/ | | -| approx_kl | 0.00031261705 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 235900 | -| policy_gradient_loss | 0.0419 | -| std | 0.00602 | -| value_loss | 5.82e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23592 | -| time_elapsed | 128203 | -| total_timesteps | 3019776 | -| train/ | | -| approx_kl | 0.0030813655 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 235910 | -| policy_gradient_loss | 0.0381 | -| std | 0.00602 | -| value_loss | 4.89e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 23593 | -| time_elapsed | 128206 | -| total_timesteps | 3019904 | -| train/ | | -| approx_kl | 0.21710013 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 235920 | -| policy_gradient_loss | 0.0124 | -| std | 0.00602 | -| value_loss | 4.02e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23594 | -| time_elapsed | 128211 | -| total_timesteps | 3020032 | -| train/ | | -| approx_kl | 0.02095045 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.00671 | -| n_updates | 235930 | -| policy_gradient_loss | 0.00216 | -| std | 0.00602 | -| value_loss | 2.31e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23595 | -| time_elapsed | 128222 | -| total_timesteps | 3020160 | -| train/ | | -| approx_kl | 0.002979008 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0276 | -| n_updates | 235940 | -| policy_gradient_loss | -0.00314 | -| std | 0.00602 | -| value_loss | 0.000313 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23596 | -| time_elapsed | 128227 | -| total_timesteps | 3020288 | -| train/ | | -| approx_kl | 0.04665314 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 235950 | -| policy_gradient_loss | 0.0203 | -| std | 0.00602 | -| value_loss | 4.86e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23597 | -| time_elapsed | 128231 | -| total_timesteps | 3020416 | -| train/ | | -| approx_kl | 0.15914734 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.0854 | -| n_updates | 235960 | -| policy_gradient_loss | 0.0243 | -| std | 0.00602 | -| value_loss | 7.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23598 | -| time_elapsed | 128235 | -| total_timesteps | 3020544 | -| train/ | | -| approx_kl | 0.014556233 | -| clip_fraction | 0.114 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 235970 | -| policy_gradient_loss | -0.0105 | -| std | 0.00602 | -| value_loss | 3.16e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23599 | -| time_elapsed | 128240 | -| total_timesteps | 3020672 | -| train/ | | -| approx_kl | 0.014112009 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 235980 | -| policy_gradient_loss | -0.00575 | -| std | 0.00602 | -| value_loss | 1.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23600 | -| time_elapsed | 128244 | -| total_timesteps | 3020800 | -| train/ | | -| approx_kl | 0.035225317 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 235990 | -| policy_gradient_loss | 0.0449 | -| std | 0.00602 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 23601 | -| time_elapsed | 128250 | -| total_timesteps | 3020928 | -| train/ | | -| approx_kl | 0.13084164 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0841 | -| n_updates | 236000 | -| policy_gradient_loss | 0.0408 | -| std | 0.00601 | -| value_loss | 1.36e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23602 | -| time_elapsed | 128254 | -| total_timesteps | 3021056 | -| train/ | | -| approx_kl | 0.00027247472 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.00271 | -| n_updates | 236010 | -| policy_gradient_loss | 0.0291 | -| std | 0.00601 | -| value_loss | 1.13e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23603 | -| time_elapsed | 128265 | -| total_timesteps | 3021184 | -| train/ | | -| approx_kl | 0.19844288 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 236020 | -| policy_gradient_loss | 0.00758 | -| std | 0.00602 | -| value_loss | 0.000122 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23604 | -| time_elapsed | 128270 | -| total_timesteps | 3021312 | -| train/ | | -| approx_kl | 0.015430131 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 236030 | -| policy_gradient_loss | -0.00167 | -| std | 0.00602 | -| value_loss | 2.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23605 | -| time_elapsed | 128275 | -| total_timesteps | 3021440 | -| train/ | | -| approx_kl | 0.015158657 | -| clip_fraction | 0.103 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 236040 | -| policy_gradient_loss | -0.00536 | -| std | 0.00602 | -| value_loss | 3.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23606 | -| time_elapsed | 128280 | -| total_timesteps | 3021568 | -| train/ | | -| approx_kl | 0.015030855 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.09 | -| learning_rate | 0.0003 | -| loss | -0.0236 | -| n_updates | 236050 | -| policy_gradient_loss | -0.0118 | -| std | 0.00601 | -| value_loss | 2.36e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23607 | -| time_elapsed | 128285 | -| total_timesteps | 3021696 | -| train/ | | -| approx_kl | 0.02763136 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0603 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 236060 | -| policy_gradient_loss | 0.0352 | -| std | 0.00602 | -| value_loss | 1.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23608 | -| time_elapsed | 128288 | -| total_timesteps | 3021824 | -| train/ | | -| approx_kl | 0.32618967 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0985 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 236070 | -| policy_gradient_loss | 0.156 | -| std | 0.00602 | -| value_loss | 7.47e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.904 | -| time/ | | -| fps | 23 | -| iterations | 23609 | -| time_elapsed | 128293 | -| total_timesteps | 3021952 | -| train/ | | -| approx_kl | 0.055485163 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 236080 | -| policy_gradient_loss | 0.0214 | -| std | 0.00602 | -| value_loss | 5.51e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23610 | -| time_elapsed | 128297 | -| total_timesteps | 3022080 | -| train/ | | -| approx_kl | 0.0018842923 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.00222 | -| n_updates | 236090 | -| policy_gradient_loss | 0.0332 | -| std | 0.00601 | -| value_loss | 4.21e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23611 | -| time_elapsed | 128305 | -| total_timesteps | 3022208 | -| train/ | | -| approx_kl | 0.20681387 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | 0.0765 | -| n_updates | 236100 | -| policy_gradient_loss | 0.0194 | -| std | 0.00601 | -| value_loss | 0.000254 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23612 | -| time_elapsed | 128310 | -| total_timesteps | 3022336 | -| train/ | | -| approx_kl | 0.026493486 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.00207 | -| n_updates | 236110 | -| policy_gradient_loss | 0.0346 | -| std | 0.00601 | -| value_loss | 3.79e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23613 | -| time_elapsed | 128316 | -| total_timesteps | 3022464 | -| train/ | | -| approx_kl | 0.13130796 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00892 | -| learning_rate | 0.0003 | -| loss | 0.0619 | -| n_updates | 236120 | -| policy_gradient_loss | 0.0328 | -| std | 0.00601 | -| value_loss | 1.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23614 | -| time_elapsed | 128321 | -| total_timesteps | 3022592 | -| train/ | | -| approx_kl | 0.16854212 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00672 | -| learning_rate | 0.0003 | -| loss | 0.0756 | -| n_updates | 236130 | -| policy_gradient_loss | 0.028 | -| std | 0.00601 | -| value_loss | 5.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23615 | -| time_elapsed | 128325 | -| total_timesteps | 3022720 | -| train/ | | -| approx_kl | 0.033835992 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 236140 | -| policy_gradient_loss | 0.0301 | -| std | 0.00601 | -| value_loss | 3.68e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23616 | -| time_elapsed | 128330 | -| total_timesteps | 3022848 | -| train/ | | -| approx_kl | 0.26934803 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0348 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 236150 | -| policy_gradient_loss | 0.109 | -| std | 0.00602 | -| value_loss | 2.39e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 23617 | -| time_elapsed | 128336 | -| total_timesteps | 3022976 | -| train/ | | -| approx_kl | 0.04396108 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 236160 | -| policy_gradient_loss | 0.0119 | -| std | 0.00602 | -| value_loss | 2.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23618 | -| time_elapsed | 128341 | -| total_timesteps | 3023104 | -| train/ | | -| approx_kl | 0.17476514 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 236170 | -| policy_gradient_loss | 0.0236 | -| std | 0.00602 | -| value_loss | 1.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23619 | -| time_elapsed | 128350 | -| total_timesteps | 3023232 | -| train/ | | -| approx_kl | 0.031686895 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 236180 | -| policy_gradient_loss | 0.0108 | -| std | 0.00602 | -| value_loss | 0.00141 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23620 | -| time_elapsed | 128355 | -| total_timesteps | 3023360 | -| train/ | | -| approx_kl | 0.14021903 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 236190 | -| policy_gradient_loss | 0.0454 | -| std | 0.00602 | -| value_loss | 2.64e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23621 | -| time_elapsed | 128360 | -| total_timesteps | 3023488 | -| train/ | | -| approx_kl | 0.00079056993 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00972 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 236200 | -| policy_gradient_loss | 0.0374 | -| std | 0.00602 | -| value_loss | 4.59e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23622 | -| time_elapsed | 128365 | -| total_timesteps | 3023616 | -| train/ | | -| approx_kl | 0.18608142 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 236210 | -| policy_gradient_loss | 0.0197 | -| std | 0.00602 | -| value_loss | 4.15e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23623 | -| time_elapsed | 128369 | -| total_timesteps | 3023744 | -| train/ | | -| approx_kl | 0.028904688 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 236220 | -| policy_gradient_loss | 0.0395 | -| std | 0.00602 | -| value_loss | 2.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 23624 | -| time_elapsed | 128374 | -| total_timesteps | 3023872 | -| train/ | | -| approx_kl | 0.43952715 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.216 | -| n_updates | 236230 | -| policy_gradient_loss | 0.17 | -| std | 0.00602 | -| value_loss | 2e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23625 | -| time_elapsed | 128378 | -| total_timesteps | 3024000 | -| train/ | | -| approx_kl | 0.2527646 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 236240 | -| policy_gradient_loss | 0.156 | -| std | 0.00602 | -| value_loss | 1.12e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23626 | -| time_elapsed | 128381 | -| total_timesteps | 3024128 | -| train/ | | -| approx_kl | 0.16069223 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00833 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 236250 | -| policy_gradient_loss | 0.134 | -| std | 0.00602 | -| value_loss | 6.83e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23627 | -| time_elapsed | 128392 | -| total_timesteps | 3024256 | -| train/ | | -| approx_kl | 0.12677537 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.999 | -| learning_rate | 0.0003 | -| loss | 0.0671 | -| n_updates | 236260 | -| policy_gradient_loss | 0.0906 | -| std | 0.00602 | -| value_loss | 8.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23628 | -| time_elapsed | 128396 | -| total_timesteps | 3024384 | -| train/ | | -| approx_kl | 0.049570765 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.000363 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 236270 | -| policy_gradient_loss | 0.0332 | -| std | 0.00603 | -| value_loss | 1.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23629 | -| time_elapsed | 128401 | -| total_timesteps | 3024512 | -| train/ | | -| approx_kl | 0.18833068 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00389 | -| learning_rate | 0.0003 | -| loss | 0.0812 | -| n_updates | 236280 | -| policy_gradient_loss | 0.0237 | -| std | 0.00603 | -| value_loss | 5.92e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23630 | -| time_elapsed | 128405 | -| total_timesteps | 3024640 | -| train/ | | -| approx_kl | 0.030500315 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 236290 | -| policy_gradient_loss | 0.0333 | -| std | 0.00603 | -| value_loss | 4.45e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23631 | -| time_elapsed | 128410 | -| total_timesteps | 3024768 | -| train/ | | -| approx_kl | 0.12564966 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 236300 | -| policy_gradient_loss | 0.0267 | -| std | 0.00602 | -| value_loss | 3.64e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 23632 | -| time_elapsed | 128416 | -| total_timesteps | 3024896 | -| train/ | | -| approx_kl | 0.0002572583 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.000254 | -| n_updates | 236310 | -| policy_gradient_loss | 0.0416 | -| std | 0.00603 | -| value_loss | 1.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23633 | -| time_elapsed | 128422 | -| total_timesteps | 3025024 | -| train/ | | -| approx_kl | 0.003132536 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0917 | -| learning_rate | 0.0003 | -| loss | -0.000821 | -| n_updates | 236320 | -| policy_gradient_loss | 0.0417 | -| std | 0.00604 | -| value_loss | 1.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23634 | -| time_elapsed | 128433 | -| total_timesteps | 3025152 | -| train/ | | -| approx_kl | 0.15046676 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 236330 | -| policy_gradient_loss | 0.00857 | -| std | 0.00605 | -| value_loss | 0.00382 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23635 | -| time_elapsed | 128437 | -| total_timesteps | 3025280 | -| train/ | | -| approx_kl | 0.024889914 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.06 | -| learning_rate | 0.0003 | -| loss | 0.00544 | -| n_updates | 236340 | -| policy_gradient_loss | 0.0225 | -| std | 0.00605 | -| value_loss | 3.24e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23636 | -| time_elapsed | 128442 | -| total_timesteps | 3025408 | -| train/ | | -| approx_kl | 0.12197399 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0038 | -| learning_rate | 0.0003 | -| loss | 0.0352 | -| n_updates | 236350 | -| policy_gradient_loss | 0.0219 | -| std | 0.00605 | -| value_loss | 6.31e-06 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23637 | -| time_elapsed | 128447 | -| total_timesteps | 3025536 | -| train/ | | -| approx_kl | 0.145754 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 236360 | -| policy_gradient_loss | 0.0221 | -| std | 0.00605 | -| value_loss | 3.77e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23638 | -| time_elapsed | 128452 | -| total_timesteps | 3025664 | -| train/ | | -| approx_kl | 0.016790582 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | -0.000333 | -| n_updates | 236370 | -| policy_gradient_loss | 0.000181 | -| std | 0.00605 | -| value_loss | 2.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23639 | -| time_elapsed | 128456 | -| total_timesteps | 3025792 | -| train/ | | -| approx_kl | 0.01335791 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0386 | -| learning_rate | 0.0003 | -| loss | 0.0036 | -| n_updates | 236380 | -| policy_gradient_loss | 0.00197 | -| std | 0.00606 | -| value_loss | 2.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 23640 | -| time_elapsed | 128462 | -| total_timesteps | 3025920 | -| train/ | | -| approx_kl | 0.012230906 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.00479 | -| n_updates | 236390 | -| policy_gradient_loss | 0.0025 | -| std | 0.00607 | -| value_loss | 4.04e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23641 | -| time_elapsed | 128467 | -| total_timesteps | 3026048 | -| train/ | | -| approx_kl | 0.015477646 | -| clip_fraction | 0.119 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.344 | -| learning_rate | 0.0003 | -| loss | 9.38e-05 | -| n_updates | 236400 | -| policy_gradient_loss | 0.000112 | -| std | 0.00607 | -| value_loss | 9.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23642 | -| time_elapsed | 128476 | -| total_timesteps | 3026176 | -| train/ | | -| approx_kl | 0.022072323 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.915 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 236410 | -| policy_gradient_loss | -0.00314 | -| std | 0.00607 | -| value_loss | 0.00141 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23643 | -| time_elapsed | 128481 | -| total_timesteps | 3026304 | -| train/ | | -| approx_kl | 0.013386123 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | -0.000629 | -| n_updates | 236420 | -| policy_gradient_loss | 0.00058 | -| std | 0.00607 | -| value_loss | 1.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23644 | -| time_elapsed | 128485 | -| total_timesteps | 3026432 | -| train/ | | -| approx_kl | 0.13216811 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 236430 | -| policy_gradient_loss | 0.0146 | -| std | 0.00607 | -| value_loss | 2.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23645 | -| time_elapsed | 128490 | -| total_timesteps | 3026560 | -| train/ | | -| approx_kl | 0.025688019 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 236440 | -| policy_gradient_loss | 0.0262 | -| std | 0.00608 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23646 | -| time_elapsed | 128495 | -| total_timesteps | 3026688 | -| train/ | | -| approx_kl | 0.060284685 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.0626 | -| n_updates | 236450 | -| policy_gradient_loss | 0.0109 | -| std | 0.00608 | -| value_loss | 6.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23647 | -| time_elapsed | 128500 | -| total_timesteps | 3026816 | -| train/ | | -| approx_kl | 0.098253176 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | 0.0422 | -| n_updates | 236460 | -| policy_gradient_loss | 0.024 | -| std | 0.00608 | -| value_loss | 9.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23648 | -| time_elapsed | 128505 | -| total_timesteps | 3026944 | -| train/ | | -| approx_kl | 0.11054474 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.871 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 236470 | -| policy_gradient_loss | 0.0187 | -| std | 0.00608 | -| value_loss | 3.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23649 | -| time_elapsed | 128509 | -| total_timesteps | 3027072 | -| train/ | | -| approx_kl | 0.001066226 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.00305 | -| n_updates | 236480 | -| policy_gradient_loss | 0.0209 | -| std | 0.00607 | -| value_loss | 7.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23650 | -| time_elapsed | 128519 | -| total_timesteps | 3027200 | -| train/ | | -| approx_kl | 0.07699151 | -| clip_fraction | 0.483 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 236490 | -| policy_gradient_loss | 0.00841 | -| std | 0.00606 | -| value_loss | 1.56e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23651 | -| time_elapsed | 128524 | -| total_timesteps | 3027328 | -| train/ | | -| approx_kl | 0.01654411 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.438 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 236500 | -| policy_gradient_loss | 0.0809 | -| std | 0.00606 | -| value_loss | 1.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23652 | -| time_elapsed | 128528 | -| total_timesteps | 3027456 | -| train/ | | -| approx_kl | 0.014382521 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 236510 | -| policy_gradient_loss | 0.0107 | -| std | 0.00606 | -| value_loss | 4.58e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23653 | -| time_elapsed | 128534 | -| total_timesteps | 3027584 | -| train/ | | -| approx_kl | 0.046369474 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 236520 | -| policy_gradient_loss | 0.0518 | -| std | 0.00606 | -| value_loss | 1.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23654 | -| time_elapsed | 128540 | -| total_timesteps | 3027712 | -| train/ | | -| approx_kl | 0.019828305 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 236530 | -| policy_gradient_loss | 0.00903 | -| std | 0.00606 | -| value_loss | 2.23e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23655 | -| time_elapsed | 128546 | -| total_timesteps | 3027840 | -| train/ | | -| approx_kl | 0.21130478 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | 0.0524 | -| n_updates | 236540 | -| policy_gradient_loss | 0.0458 | -| std | 0.00606 | -| value_loss | 1.85e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 23656 | -| time_elapsed | 128550 | -| total_timesteps | 3027968 | -| train/ | | -| approx_kl | 0.003752463 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00577 | -| n_updates | 236550 | -| policy_gradient_loss | 0.0147 | -| std | 0.00606 | -| value_loss | 1.36e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23657 | -| time_elapsed | 128556 | -| total_timesteps | 3028096 | -| train/ | | -| approx_kl | 0.029813206 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0952 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 236560 | -| policy_gradient_loss | 0.0392 | -| std | 0.00604 | -| value_loss | 1.15e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23658 | -| time_elapsed | 128567 | -| total_timesteps | 3028224 | -| train/ | | -| approx_kl | 0.4386959 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | 0.218 | -| n_updates | 236570 | -| policy_gradient_loss | 0.165 | -| std | 0.00603 | -| value_loss | 0.000545 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23659 | -| time_elapsed | 128573 | -| total_timesteps | 3028352 | -| train/ | | -| approx_kl | 0.3146041 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.354 | -| learning_rate | 0.0003 | -| loss | 0.184 | -| n_updates | 236580 | -| policy_gradient_loss | 0.179 | -| std | 0.00603 | -| value_loss | 0.000123 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23660 | -| time_elapsed | 128578 | -| total_timesteps | 3028480 | -| train/ | | -| approx_kl | 0.22119349 | -| clip_fraction | 0.722 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0147 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 236590 | -| policy_gradient_loss | 0.151 | -| std | 0.00603 | -| value_loss | 4.98e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23661 | -| time_elapsed | 128583 | -| total_timesteps | 3028608 | -| train/ | | -| approx_kl | 0.03406404 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00454 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 236600 | -| policy_gradient_loss | 0.0298 | -| std | 0.00603 | -| value_loss | 1.68e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23662 | -| time_elapsed | 128588 | -| total_timesteps | 3028736 | -| train/ | | -| approx_kl | 0.56258523 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 236610 | -| policy_gradient_loss | 0.0535 | -| std | 0.00603 | -| value_loss | 1.14e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23663 | -| time_elapsed | 128593 | -| total_timesteps | 3028864 | -| train/ | | -| approx_kl | 0.011594058 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | 0.000302 | -| n_updates | 236620 | -| policy_gradient_loss | 0.00805 | -| std | 0.00603 | -| value_loss | 8.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 23664 | -| time_elapsed | 128598 | -| total_timesteps | 3028992 | -| train/ | | -| approx_kl | 0.06921704 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | 0.00874 | -| n_updates | 236630 | -| policy_gradient_loss | 0.000414 | -| std | 0.00603 | -| value_loss | 6.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23665 | -| time_elapsed | 128602 | -| total_timesteps | 3029120 | -| train/ | | -| approx_kl | 0.015664123 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -0.000331 | -| n_updates | 236640 | -| policy_gradient_loss | 0.0101 | -| std | 0.00602 | -| value_loss | 4.88e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23666 | -| time_elapsed | 128618 | -| total_timesteps | 3029248 | -| train/ | | -| approx_kl | 0.009539029 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.992 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 236650 | -| policy_gradient_loss | 0.000511 | -| std | 0.00602 | -| value_loss | 6.59e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23667 | -| time_elapsed | 128622 | -| total_timesteps | 3029376 | -| train/ | | -| approx_kl | 0.1297944 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 236660 | -| policy_gradient_loss | 0.00971 | -| std | 0.00602 | -| value_loss | 1.49e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23668 | -| time_elapsed | 128627 | -| total_timesteps | 3029504 | -| train/ | | -| approx_kl | 0.044042718 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0517 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 236670 | -| policy_gradient_loss | 0.00875 | -| std | 0.00602 | -| value_loss | 1.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23669 | -| time_elapsed | 128632 | -| total_timesteps | 3029632 | -| train/ | | -| approx_kl | 0.057114102 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 236680 | -| policy_gradient_loss | 0.0134 | -| std | 0.00602 | -| value_loss | 6.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23670 | -| time_elapsed | 128637 | -| total_timesteps | 3029760 | -| train/ | | -| approx_kl | 0.049475856 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 236690 | -| policy_gradient_loss | 0.0125 | -| std | 0.00602 | -| value_loss | 4.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23671 | -| time_elapsed | 128643 | -| total_timesteps | 3029888 | -| train/ | | -| approx_kl | 0.009950828 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 236700 | -| policy_gradient_loss | 0.00784 | -| std | 0.00602 | -| value_loss | 8.58e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23672 | -| time_elapsed | 128648 | -| total_timesteps | 3030016 | -| train/ | | -| approx_kl | 0.0023913602 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 236710 | -| policy_gradient_loss | 0.0105 | -| std | 0.00602 | -| value_loss | 5.45e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23673 | -| time_elapsed | 128661 | -| total_timesteps | 3030144 | -| train/ | | -| approx_kl | 0.07375887 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.879 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 236720 | -| policy_gradient_loss | 0.0282 | -| std | 0.00602 | -| value_loss | 0.00237 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23674 | -| time_elapsed | 128667 | -| total_timesteps | 3030272 | -| train/ | | -| approx_kl | 0.21731746 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0829 | -| n_updates | 236730 | -| policy_gradient_loss | 0.0785 | -| std | 0.00602 | -| value_loss | 2.71e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23675 | -| time_elapsed | 128672 | -| total_timesteps | 3030400 | -| train/ | | -| approx_kl | 0.047597192 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 236740 | -| policy_gradient_loss | 0.0289 | -| std | 0.00602 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23676 | -| time_elapsed | 128677 | -| total_timesteps | 3030528 | -| train/ | | -| approx_kl | 0.0014034491 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.228 | -| learning_rate | 0.0003 | -| loss | 0.00338 | -| n_updates | 236750 | -| policy_gradient_loss | 0.0322 | -| std | 0.00602 | -| value_loss | 4.09e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23677 | -| time_elapsed | 128681 | -| total_timesteps | 3030656 | -| train/ | | -| approx_kl | 0.64318025 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 236760 | -| policy_gradient_loss | 0.0641 | -| std | 0.00602 | -| value_loss | 2.7e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23678 | -| time_elapsed | 128687 | -| total_timesteps | 3030784 | -| train/ | | -| approx_kl | 0.05005272 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | -0.0326 | -| n_updates | 236770 | -| policy_gradient_loss | -0.0163 | -| std | 0.00602 | -| value_loss | 2.34e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 23679 | -| time_elapsed | 128692 | -| total_timesteps | 3030912 | -| train/ | | -| approx_kl | 0.008377206 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.00186 | -| n_updates | 236780 | -| policy_gradient_loss | 0.0083 | -| std | 0.00602 | -| value_loss | 1.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23680 | -| time_elapsed | 128696 | -| total_timesteps | 3031040 | -| train/ | | -| approx_kl | 0.08121467 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0896 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 236790 | -| policy_gradient_loss | 0.015 | -| std | 0.00603 | -| value_loss | 8.89e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23681 | -| time_elapsed | 128704 | -| total_timesteps | 3031168 | -| train/ | | -| approx_kl | 0.014171517 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | -0.0183 | -| n_updates | 236800 | -| policy_gradient_loss | -0.00953 | -| std | 0.00603 | -| value_loss | 0.00045 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23682 | -| time_elapsed | 128710 | -| total_timesteps | 3031296 | -| train/ | | -| approx_kl | 0.080399066 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.663 | -| learning_rate | 0.0003 | -| loss | 0.000949 | -| n_updates | 236810 | -| policy_gradient_loss | -0.000763 | -| std | 0.00603 | -| value_loss | 5.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23683 | -| time_elapsed | 128715 | -| total_timesteps | 3031424 | -| train/ | | -| approx_kl | 0.013785878 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 236820 | -| policy_gradient_loss | 0.00396 | -| std | 0.00603 | -| value_loss | 9.74e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23684 | -| time_elapsed | 128721 | -| total_timesteps | 3031552 | -| train/ | | -| approx_kl | 0.0034959177 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -4.86 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 236830 | -| policy_gradient_loss | 0.00722 | -| std | 0.00603 | -| value_loss | 5.55e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23685 | -| time_elapsed | 128724 | -| total_timesteps | 3031680 | -| train/ | | -| approx_kl | 0.048069056 | -| clip_fraction | 0.65 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00512 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 236840 | -| policy_gradient_loss | 0.129 | -| std | 0.00603 | -| value_loss | 4.86e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23686 | -| time_elapsed | 128728 | -| total_timesteps | 3031808 | -| train/ | | -| approx_kl | 0.10375281 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0642 | -| learning_rate | 0.0003 | -| loss | 0.0504 | -| n_updates | 236850 | -| policy_gradient_loss | 0.0743 | -| std | 0.00603 | -| value_loss | 3.26e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 23687 | -| time_elapsed | 128733 | -| total_timesteps | 3031936 | -| train/ | | -| approx_kl | 0.15181176 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 236860 | -| policy_gradient_loss | 0.175 | -| std | 0.00604 | -| value_loss | 2.85e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23688 | -| time_elapsed | 128739 | -| total_timesteps | 3032064 | -| train/ | | -| approx_kl | 0.03096167 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 236870 | -| policy_gradient_loss | 0.0195 | -| std | 0.00604 | -| value_loss | 4.02e-10 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23689 | -| time_elapsed | 128747 | -| total_timesteps | 3032192 | -| train/ | | -| approx_kl | 0.3589102 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 236880 | -| policy_gradient_loss | 0.0183 | -| std | 0.00605 | -| value_loss | 0.00358 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23690 | -| time_elapsed | 128753 | -| total_timesteps | 3032320 | -| train/ | | -| approx_kl | 0.04552579 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.541 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 236890 | -| policy_gradient_loss | 0.0466 | -| std | 0.00605 | -| value_loss | 1.12e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23691 | -| time_elapsed | 128763 | -| total_timesteps | 3032448 | -| train/ | | -| approx_kl | 0.8989433 | -| clip_fraction | 0.76 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00639 | -| learning_rate | 0.0003 | -| loss | 0.253 | -| n_updates | 236900 | -| policy_gradient_loss | 0.205 | -| std | 0.00605 | -| value_loss | 1.06e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23692 | -| time_elapsed | 128767 | -| total_timesteps | 3032576 | -| train/ | | -| approx_kl | 0.009232596 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 236910 | -| policy_gradient_loss | 0.0364 | -| std | 0.00605 | -| value_loss | 7.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23693 | -| time_elapsed | 128773 | -| total_timesteps | 3032704 | -| train/ | | -| approx_kl | 0.113837376 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.0779 | -| n_updates | 236920 | -| policy_gradient_loss | 0.0404 | -| std | 0.00605 | -| value_loss | 4.71e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23694 | -| time_elapsed | 128779 | -| total_timesteps | 3032832 | -| train/ | | -| approx_kl | 0.14827205 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.068 | -| learning_rate | 0.0003 | -| loss | 0.0812 | -| n_updates | 236930 | -| policy_gradient_loss | 0.0259 | -| std | 0.00605 | -| value_loss | 3.59e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 23695 | -| time_elapsed | 128785 | -| total_timesteps | 3032960 | -| train/ | | -| approx_kl | 0.015200602 | -| clip_fraction | 0.125 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0508 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 236940 | -| policy_gradient_loss | -0.00947 | -| std | 0.00605 | -| value_loss | 2.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23696 | -| time_elapsed | 128789 | -| total_timesteps | 3033088 | -| train/ | | -| approx_kl | 0.026077053 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 236950 | -| policy_gradient_loss | 0.0338 | -| std | 0.00605 | -| value_loss | 1.68e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23697 | -| time_elapsed | 128800 | -| total_timesteps | 3033216 | -| train/ | | -| approx_kl | 0.1341844 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 236960 | -| policy_gradient_loss | 0.0187 | -| std | 0.00605 | -| value_loss | 0.00108 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23698 | -| time_elapsed | 128807 | -| total_timesteps | 3033344 | -| train/ | | -| approx_kl | 0.00840971 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 236970 | -| policy_gradient_loss | 0.0131 | -| std | 0.00605 | -| value_loss | 1.07e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23699 | -| time_elapsed | 128813 | -| total_timesteps | 3033472 | -| train/ | | -| approx_kl | 0.18871698 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0143 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 236980 | -| policy_gradient_loss | 0.12 | -| std | 0.00605 | -| value_loss | 1.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23700 | -| time_elapsed | 128819 | -| total_timesteps | 3033600 | -| train/ | | -| approx_kl | 0.041596226 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | 0.00936 | -| n_updates | 236990 | -| policy_gradient_loss | 0.0231 | -| std | 0.00605 | -| value_loss | 6.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23701 | -| time_elapsed | 128823 | -| total_timesteps | 3033728 | -| train/ | | -| approx_kl | 0.21756837 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0576 | -| learning_rate | 0.0003 | -| loss | 0.0913 | -| n_updates | 237000 | -| policy_gradient_loss | 0.027 | -| std | 0.00606 | -| value_loss | 5.02e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23702 | -| time_elapsed | 128828 | -| total_timesteps | 3033856 | -| train/ | | -| approx_kl | 0.015088802 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.00833 | -| n_updates | 237010 | -| policy_gradient_loss | -0.00484 | -| std | 0.00606 | -| value_loss | 3.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.936 | -| time/ | | -| fps | 23 | -| iterations | 23703 | -| time_elapsed | 128835 | -| total_timesteps | 3033984 | -| train/ | | -| approx_kl | 0.027895516 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 237020 | -| policy_gradient_loss | 0.042 | -| std | 0.00605 | -| value_loss | 3.14e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23704 | -| time_elapsed | 128841 | -| total_timesteps | 3034112 | -| train/ | | -| approx_kl | 0.1381591 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | 0.0685 | -| n_updates | 237030 | -| policy_gradient_loss | 0.0365 | -| std | 0.00605 | -| value_loss | 1.02e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23705 | -| time_elapsed | 128853 | -| total_timesteps | 3034240 | -| train/ | | -| approx_kl | 0.033594374 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 237040 | -| policy_gradient_loss | -0.0127 | -| std | 0.00604 | -| value_loss | 0.00548 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23706 | -| time_elapsed | 128859 | -| total_timesteps | 3034368 | -| train/ | | -| approx_kl | 0.09111903 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.249 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 237050 | -| policy_gradient_loss | 0.0363 | -| std | 0.00604 | -| value_loss | 8.56e-05 | ----------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23707 | -| time_elapsed | 128865 | -| total_timesteps | 3034496 | -| train/ | | -| approx_kl | 1.44992955e-05 | -| clip_fraction | 0.46 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00844 | -| learning_rate | 0.0003 | -| loss | 8.34e-05 | -| n_updates | 237060 | -| policy_gradient_loss | 0.0322 | -| std | 0.00603 | -| value_loss | 2.41e-05 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23708 | -| time_elapsed | 128871 | -| total_timesteps | 3034624 | -| train/ | | -| approx_kl | 0.56533486 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.64 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 237070 | -| policy_gradient_loss | 0.0387 | -| std | 0.00602 | -| value_loss | 0.00022 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23709 | -| time_elapsed | 128877 | -| total_timesteps | 3034752 | -| train/ | | -| approx_kl | 0.012357108 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -2.39 | -| learning_rate | 0.0003 | -| loss | -0.00505 | -| n_updates | 237080 | -| policy_gradient_loss | 0.00422 | -| std | 0.00601 | -| value_loss | 1.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.944 | -| time/ | | -| fps | 23 | -| iterations | 23710 | -| time_elapsed | 128882 | -| total_timesteps | 3034880 | -| train/ | | -| approx_kl | 0.08072007 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.0404 | -| n_updates | 237090 | -| policy_gradient_loss | 0.0163 | -| std | 0.00601 | -| value_loss | 6.72e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23711 | -| time_elapsed | 128889 | -| total_timesteps | 3035008 | -| train/ | | -| approx_kl | 0.014703301 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 237100 | -| policy_gradient_loss | 0.00133 | -| std | 0.00601 | -| value_loss | 5.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23712 | -| time_elapsed | 128900 | -| total_timesteps | 3035136 | -| train/ | | -| approx_kl | 0.07765288 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0133 | -| n_updates | 237110 | -| policy_gradient_loss | -0.000335 | -| std | 0.00602 | -| value_loss | 0.00412 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23713 | -| time_elapsed | 128905 | -| total_timesteps | 3035264 | -| train/ | | -| approx_kl | 0.12284424 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.566 | -| learning_rate | 0.0003 | -| loss | 0.0605 | -| n_updates | 237120 | -| policy_gradient_loss | 0.0435 | -| std | 0.00602 | -| value_loss | 3.06e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23714 | -| time_elapsed | 128910 | -| total_timesteps | 3035392 | -| train/ | | -| approx_kl | 9.113364e-05 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0962 | -| learning_rate | 0.0003 | -| loss | -0.000814 | -| n_updates | 237130 | -| policy_gradient_loss | 0.0117 | -| std | 0.00602 | -| value_loss | 8.51e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23715 | -| time_elapsed | 128915 | -| total_timesteps | 3035520 | -| train/ | | -| approx_kl | 0.19631197 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 237140 | -| policy_gradient_loss | 0.0317 | -| std | 0.00602 | -| value_loss | 2.85e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23716 | -| time_elapsed | 128920 | -| total_timesteps | 3035648 | -| train/ | | -| approx_kl | 0.8575783 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0925 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 237150 | -| policy_gradient_loss | 0.071 | -| std | 0.00602 | -| value_loss | 1.88e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23717 | -| time_elapsed | 128925 | -| total_timesteps | 3035776 | -| train/ | | -| approx_kl | 0.04693027 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 237160 | -| policy_gradient_loss | 0.0134 | -| std | 0.00602 | -| value_loss | 1.53e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 23718 | -| time_elapsed | 128929 | -| total_timesteps | 3035904 | -| train/ | | -| approx_kl | 0.069249325 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 237170 | -| policy_gradient_loss | 0.0207 | -| std | 0.00602 | -| value_loss | 9.07e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23719 | -| time_elapsed | 128934 | -| total_timesteps | 3036032 | -| train/ | | -| approx_kl | 0.01018875 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0853 | -| learning_rate | 0.0003 | -| loss | -0.00857 | -| n_updates | 237180 | -| policy_gradient_loss | 0.00687 | -| std | 0.00602 | -| value_loss | 6.62e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23720 | -| time_elapsed | 128945 | -| total_timesteps | 3036160 | -| train/ | | -| approx_kl | 0.0066122585 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.509 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 237190 | -| policy_gradient_loss | -0.00772 | -| std | 0.00602 | -| value_loss | 0.00169 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23721 | -| time_elapsed | 128949 | -| total_timesteps | 3036288 | -| train/ | | -| approx_kl | 0.09058642 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.297 | -| learning_rate | 0.0003 | -| loss | -0.00232 | -| n_updates | 237200 | -| policy_gradient_loss | -0.00113 | -| std | 0.00602 | -| value_loss | 1.55e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23722 | -| time_elapsed | 128952 | -| total_timesteps | 3036416 | -| train/ | | -| approx_kl | 0.04228212 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | 0.00448 | -| n_updates | 237210 | -| policy_gradient_loss | 0.0253 | -| std | 0.00602 | -| value_loss | 1.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23723 | -| time_elapsed | 128955 | -| total_timesteps | 3036544 | -| train/ | | -| approx_kl | 0.040861573 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0966 | -| learning_rate | 0.0003 | -| loss | 0.0338 | -| n_updates | 237220 | -| policy_gradient_loss | 0.0211 | -| std | 0.006 | -| value_loss | 7.14e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23724 | -| time_elapsed | 128959 | -| total_timesteps | 3036672 | -| train/ | | -| approx_kl | 6.944407e-06 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.259 | -| learning_rate | 0.0003 | -| loss | 0.00044 | -| n_updates | 237230 | -| policy_gradient_loss | 0.00104 | -| std | 0.006 | -| value_loss | 6.33e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23725 | -| time_elapsed | 128962 | -| total_timesteps | 3036800 | -| train/ | | -| approx_kl | 0.07395762 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -25.6 | -| learning_rate | 0.0003 | -| loss | 0.00271 | -| n_updates | 237240 | -| policy_gradient_loss | 0.00109 | -| std | 0.00599 | -| value_loss | 3.13e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 23726 | -| time_elapsed | 128966 | -| total_timesteps | 3036928 | -| train/ | | -| approx_kl | 0.011071742 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 237250 | -| policy_gradient_loss | 0.0036 | -| std | 0.00599 | -| value_loss | 4.39e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23727 | -| time_elapsed | 128970 | -| total_timesteps | 3037056 | -| train/ | | -| approx_kl | 0.04509208 | -| clip_fraction | 0.658 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0855 | -| learning_rate | 0.0003 | -| loss | 0.0553 | -| n_updates | 237260 | -| policy_gradient_loss | 0.12 | -| std | 0.00599 | -| value_loss | 5.23e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23728 | -| time_elapsed | 128982 | -| total_timesteps | 3037184 | -| train/ | | -| approx_kl | 0.22969545 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.874 | -| learning_rate | 0.0003 | -| loss | 0.0941 | -| n_updates | 237270 | -| policy_gradient_loss | 0.0643 | -| std | 0.00599 | -| value_loss | 0.00294 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23729 | -| time_elapsed | 128988 | -| total_timesteps | 3037312 | -| train/ | | -| approx_kl | 0.09525993 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.064 | -| n_updates | 237280 | -| policy_gradient_loss | 0.0373 | -| std | 0.00599 | -| value_loss | 1.55e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23730 | -| time_elapsed | 128993 | -| total_timesteps | 3037440 | -| train/ | | -| approx_kl | 0.17019473 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00654 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 237290 | -| policy_gradient_loss | 0.0301 | -| std | 0.00599 | -| value_loss | 2.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23731 | -| time_elapsed | 128998 | -| total_timesteps | 3037568 | -| train/ | | -| approx_kl | 0.013366563 | -| clip_fraction | 0.0992 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.00623 | -| n_updates | 237300 | -| policy_gradient_loss | 0.00302 | -| std | 0.00599 | -| value_loss | 1.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23732 | -| time_elapsed | 129002 | -| total_timesteps | 3037696 | -| train/ | | -| approx_kl | 0.016091263 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | -0.0037 | -| n_updates | 237310 | -| policy_gradient_loss | -0.00184 | -| std | 0.00599 | -| value_loss | 5.81e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23733 | -| time_elapsed | 129007 | -| total_timesteps | 3037824 | -| train/ | | -| approx_kl | 0.013311366 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00741 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 237320 | -| policy_gradient_loss | -0.00824 | -| std | 0.006 | -| value_loss | 9.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 23734 | -| time_elapsed | 129013 | -| total_timesteps | 3037952 | -| train/ | | -| approx_kl | 0.026624363 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 237330 | -| policy_gradient_loss | 0.0314 | -| std | 0.006 | -| value_loss | 6.82e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23735 | -| time_elapsed | 129017 | -| total_timesteps | 3038080 | -| train/ | | -| approx_kl | 0.13629133 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 237340 | -| policy_gradient_loss | 0.0324 | -| std | 0.006 | -| value_loss | 4.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23736 | -| time_elapsed | 129027 | -| total_timesteps | 3038208 | -| train/ | | -| approx_kl | 0.024387946 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.91 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 237350 | -| policy_gradient_loss | -0.00857 | -| std | 0.006 | -| value_loss | 0.00457 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23737 | -| time_elapsed | 129033 | -| total_timesteps | 3038336 | -| train/ | | -| approx_kl | 0.0032717092 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 237360 | -| policy_gradient_loss | 0.0093 | -| std | 0.006 | -| value_loss | 8.82e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23738 | -| time_elapsed | 129037 | -| total_timesteps | 3038464 | -| train/ | | -| approx_kl | 0.065512136 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 237370 | -| policy_gradient_loss | 0.0718 | -| std | 0.006 | -| value_loss | 2.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23739 | -| time_elapsed | 129041 | -| total_timesteps | 3038592 | -| train/ | | -| approx_kl | 0.050694894 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00648 | -| learning_rate | 0.0003 | -| loss | 0.0571 | -| n_updates | 237380 | -| policy_gradient_loss | 0.0282 | -| std | 0.006 | -| value_loss | 2.01e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23740 | -| time_elapsed | 129046 | -| total_timesteps | 3038720 | -| train/ | | -| approx_kl | 0.2795485 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 237390 | -| policy_gradient_loss | 0.0436 | -| std | 0.006 | -| value_loss | 1.09e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23741 | -| time_elapsed | 129049 | -| total_timesteps | 3038848 | -| train/ | | -| approx_kl | 0.0023533646 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.00957 | -| n_updates | 237400 | -| policy_gradient_loss | 0.00162 | -| std | 0.006 | -| value_loss | 9.91e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 23742 | -| time_elapsed | 129055 | -| total_timesteps | 3038976 | -| train/ | | -| approx_kl | 2.3748726e-07 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 2.53e-05 | -| n_updates | 237410 | -| policy_gradient_loss | 0.0185 | -| std | 0.006 | -| value_loss | 6.08e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23743 | -| time_elapsed | 129058 | -| total_timesteps | 3039104 | -| train/ | | -| approx_kl | 0.07650851 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0556 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 237420 | -| policy_gradient_loss | 0.0712 | -| std | 0.006 | -| value_loss | 4.85e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23744 | -| time_elapsed | 129070 | -| total_timesteps | 3039232 | -| train/ | | -| approx_kl | 0.16739368 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.873 | -| learning_rate | 0.0003 | -| loss | -0.00514 | -| n_updates | 237430 | -| policy_gradient_loss | -0.0104 | -| std | 0.006 | -| value_loss | 0.00272 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23745 | -| time_elapsed | 129076 | -| total_timesteps | 3039360 | -| train/ | | -| approx_kl | 0.16382472 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | 0.0362 | -| n_updates | 237440 | -| policy_gradient_loss | 0.0166 | -| std | 0.006 | -| value_loss | 8.46e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23746 | -| time_elapsed | 129080 | -| total_timesteps | 3039488 | -| train/ | | -| approx_kl | 0.13489304 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00208 | -| learning_rate | 0.0003 | -| loss | 0.0696 | -| n_updates | 237450 | -| policy_gradient_loss | 0.0292 | -| std | 0.006 | -| value_loss | 1.05e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23747 | -| time_elapsed | 129084 | -| total_timesteps | 3039616 | -| train/ | | -| approx_kl | 0.012342499 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00183 | -| n_updates | 237460 | -| policy_gradient_loss | 0.00157 | -| std | 0.006 | -| value_loss | 4.95e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23748 | -| time_elapsed | 129088 | -| total_timesteps | 3039744 | -| train/ | | -| approx_kl | 0.034766648 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | 0.00554 | -| n_updates | 237470 | -| policy_gradient_loss | 0.0329 | -| std | 0.006 | -| value_loss | 4.05e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 23749 | -| time_elapsed | 129093 | -| total_timesteps | 3039872 | -| train/ | | -| approx_kl | 0.2910721 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.209 | -| n_updates | 237480 | -| policy_gradient_loss | 0.146 | -| std | 0.006 | -| value_loss | 3.48e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23750 | -| time_elapsed | 129097 | -| total_timesteps | 3040000 | -| train/ | | -| approx_kl | 0.17532857 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 237490 | -| policy_gradient_loss | 0.111 | -| std | 0.006 | -| value_loss | 2.67e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23751 | -| time_elapsed | 129102 | -| total_timesteps | 3040128 | -| train/ | | -| approx_kl | 0.15703881 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00417 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 237500 | -| policy_gradient_loss | 0.153 | -| std | 0.006 | -| value_loss | 1.24e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23752 | -| time_elapsed | 129114 | -| total_timesteps | 3040256 | -| train/ | | -| approx_kl | 0.32708362 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.906 | -| learning_rate | 0.0003 | -| loss | 0.0671 | -| n_updates | 237510 | -| policy_gradient_loss | 0.0529 | -| std | 0.006 | -| value_loss | 0.00176 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23753 | -| time_elapsed | 129120 | -| total_timesteps | 3040384 | -| train/ | | -| approx_kl | 0.3272673 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 237520 | -| policy_gradient_loss | 0.134 | -| std | 0.006 | -| value_loss | 3.56e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23754 | -| time_elapsed | 129126 | -| total_timesteps | 3040512 | -| train/ | | -| approx_kl | 0.2509676 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 237530 | -| policy_gradient_loss | 0.154 | -| std | 0.006 | -| value_loss | 1.06e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23755 | -| time_elapsed | 129131 | -| total_timesteps | 3040640 | -| train/ | | -| approx_kl | 0.14566736 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 237540 | -| policy_gradient_loss | 0.104 | -| std | 0.00601 | -| value_loss | 6.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23756 | -| time_elapsed | 129135 | -| total_timesteps | 3040768 | -| train/ | | -| approx_kl | 0.03280741 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.00806 | -| n_updates | 237550 | -| policy_gradient_loss | 0.0278 | -| std | 0.00601 | -| value_loss | 4.5e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.968 | -| time/ | | -| fps | 23 | -| iterations | 23757 | -| time_elapsed | 129139 | -| total_timesteps | 3040896 | -| train/ | | -| approx_kl | 0.8585238 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.309 | -| n_updates | 237560 | -| policy_gradient_loss | 0.096 | -| std | 0.00601 | -| value_loss | 3.22e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23758 | -| time_elapsed | 129144 | -| total_timesteps | 3041024 | -| train/ | | -| approx_kl | 0.012331035 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0393 | -| learning_rate | 0.0003 | -| loss | 0.00161 | -| n_updates | 237570 | -| policy_gradient_loss | 0.0081 | -| std | 0.006 | -| value_loss | 1.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23759 | -| time_elapsed | 129156 | -| total_timesteps | 3041152 | -| train/ | | -| approx_kl | 0.04285773 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.00348 | -| n_updates | 237580 | -| policy_gradient_loss | -0.00282 | -| std | 0.006 | -| value_loss | 0.00119 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23760 | -| time_elapsed | 129164 | -| total_timesteps | 3041280 | -| train/ | | -| approx_kl | 0.00057003926 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.00303 | -| n_updates | 237590 | -| policy_gradient_loss | 0.00922 | -| std | 0.006 | -| value_loss | 4.86e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23761 | -| time_elapsed | 129170 | -| total_timesteps | 3041408 | -| train/ | | -| approx_kl | 0.0004156325 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00867 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 237600 | -| policy_gradient_loss | 0.0105 | -| std | 0.006 | -| value_loss | 8.64e-07 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23762 | -| time_elapsed | 129176 | -| total_timesteps | 3041536 | -| train/ | | -| approx_kl | 0.000117311254 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 237610 | -| policy_gradient_loss | 0.0112 | -| std | 0.006 | -| value_loss | 6.03e-07 | --------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23763 | -| time_elapsed | 129181 | -| total_timesteps | 3041664 | -| train/ | | -| approx_kl | 0.00017386442 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | -0.000803 | -| n_updates | 237620 | -| policy_gradient_loss | 0.0117 | -| std | 0.006 | -| value_loss | 3.59e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23764 | -| time_elapsed | 129186 | -| total_timesteps | 3041792 | -| train/ | | -| approx_kl | 0.00019131042 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0724 | -| learning_rate | 0.0003 | -| loss | -0.00153 | -| n_updates | 237630 | -| policy_gradient_loss | 0.0105 | -| std | 0.006 | -| value_loss | 2.64e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23765 | -| time_elapsed | 129191 | -| total_timesteps | 3041920 | -| train/ | | -| approx_kl | 0.09992019 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 237640 | -| policy_gradient_loss | 0.0817 | -| std | 0.00599 | -| value_loss | 1.83e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23766 | -| time_elapsed | 129197 | -| total_timesteps | 3042048 | -| train/ | | -| approx_kl | 0.09465748 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.0607 | -| n_updates | 237650 | -| policy_gradient_loss | 0.0282 | -| std | 0.00599 | -| value_loss | 3.66e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23767 | -| time_elapsed | 129206 | -| total_timesteps | 3042176 | -| train/ | | -| approx_kl | 0.09174858 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.748 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 237660 | -| policy_gradient_loss | 0.0604 | -| std | 0.00599 | -| value_loss | 0.00247 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23768 | -| time_elapsed | 129210 | -| total_timesteps | 3042304 | -| train/ | | -| approx_kl | 0.002337928 | -| clip_fraction | 0.613 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | -0.00477 | -| n_updates | 237670 | -| policy_gradient_loss | 0.11 | -| std | 0.00599 | -| value_loss | 3.86e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23769 | -| time_elapsed | 129214 | -| total_timesteps | 3042432 | -| train/ | | -| approx_kl | 0.026363825 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0042 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 237680 | -| policy_gradient_loss | 0.0373 | -| std | 0.00599 | -| value_loss | 4.96e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23770 | -| time_elapsed | 129218 | -| total_timesteps | 3042560 | -| train/ | | -| approx_kl | 0.34865028 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 237690 | -| policy_gradient_loss | 0.137 | -| std | 0.00599 | -| value_loss | 3.55e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23771 | -| time_elapsed | 129223 | -| total_timesteps | 3042688 | -| train/ | | -| approx_kl | 0.07121501 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.0425 | -| n_updates | 237700 | -| policy_gradient_loss | 0.0409 | -| std | 0.00599 | -| value_loss | 2.75e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23772 | -| time_elapsed | 129228 | -| total_timesteps | 3042816 | -| train/ | | -| approx_kl | 0.002612228 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.00738 | -| n_updates | 237710 | -| policy_gradient_loss | 0.0458 | -| std | 0.00599 | -| value_loss | 1.92e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 23773 | -| time_elapsed | 129232 | -| total_timesteps | 3042944 | -| train/ | | -| approx_kl | 0.64053863 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 237720 | -| policy_gradient_loss | 0.0651 | -| std | 0.00599 | -| value_loss | 1.19e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23774 | -| time_elapsed | 129238 | -| total_timesteps | 3043072 | -| train/ | | -| approx_kl | 0.010655051 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.00871 | -| n_updates | 237730 | -| policy_gradient_loss | 0.00836 | -| std | 0.006 | -| value_loss | 9.5e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23775 | -| time_elapsed | 129248 | -| total_timesteps | 3043200 | -| train/ | | -| approx_kl | 0.049042773 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.647 | -| learning_rate | 0.0003 | -| loss | 0.00977 | -| n_updates | 237740 | -| policy_gradient_loss | 0.00477 | -| std | 0.00599 | -| value_loss | 0.0094 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23776 | -| time_elapsed | 129253 | -| total_timesteps | 3043328 | -| train/ | | -| approx_kl | 0.00038910285 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.243 | -| learning_rate | 0.0003 | -| loss | 0.0042 | -| n_updates | 237750 | -| policy_gradient_loss | 0.0022 | -| std | 0.00599 | -| value_loss | 0.000206 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23777 | -| time_elapsed | 129258 | -| total_timesteps | 3043456 | -| train/ | | -| approx_kl | 0.0874731 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0129 | -| learning_rate | 0.0003 | -| loss | 0.054 | -| n_updates | 237760 | -| policy_gradient_loss | 0.0249 | -| std | 0.006 | -| value_loss | 2.6e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23778 | -| time_elapsed | 129261 | -| total_timesteps | 3043584 | -| train/ | | -| approx_kl | 0.048774455 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.0081 | -| n_updates | 237770 | -| policy_gradient_loss | 0.00431 | -| std | 0.006 | -| value_loss | 2.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23779 | -| time_elapsed | 129266 | -| total_timesteps | 3043712 | -| train/ | | -| approx_kl | 0.010807328 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.00346 | -| n_updates | 237780 | -| policy_gradient_loss | 0.00921 | -| std | 0.00601 | -| value_loss | 1.64e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23780 | -| time_elapsed | 129270 | -| total_timesteps | 3043840 | -| train/ | | -| approx_kl | 0.085896984 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 237790 | -| policy_gradient_loss | 0.00625 | -| std | 0.00601 | -| value_loss | 1.35e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23781 | -| time_elapsed | 129274 | -| total_timesteps | 3043968 | -| train/ | | -| approx_kl | 0.013492273 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 237800 | -| policy_gradient_loss | 0.00626 | -| std | 0.006 | -| value_loss | 9.43e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23782 | -| time_elapsed | 129279 | -| total_timesteps | 3044096 | -| train/ | | -| approx_kl | 0.0027880007 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 237810 | -| policy_gradient_loss | 0.00708 | -| std | 0.006 | -| value_loss | 5.24e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23783 | -| time_elapsed | 129288 | -| total_timesteps | 3044224 | -| train/ | | -| approx_kl | 0.06297187 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.408 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 237820 | -| policy_gradient_loss | 0.0544 | -| std | 0.006 | -| value_loss | 0.00299 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23784 | -| time_elapsed | 129292 | -| total_timesteps | 3044352 | -| train/ | | -| approx_kl | 0.11555429 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 237830 | -| policy_gradient_loss | 0.13 | -| std | 0.006 | -| value_loss | 2.88e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23785 | -| time_elapsed | 129296 | -| total_timesteps | 3044480 | -| train/ | | -| approx_kl | 0.030717582 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00915 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 237840 | -| policy_gradient_loss | 0.0326 | -| std | 0.006 | -| value_loss | 1.34e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23786 | -| time_elapsed | 129301 | -| total_timesteps | 3044608 | -| train/ | | -| approx_kl | 0.7140434 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 237850 | -| policy_gradient_loss | 0.0674 | -| std | 0.006 | -| value_loss | 7.59e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23787 | -| time_elapsed | 129305 | -| total_timesteps | 3044736 | -| train/ | | -| approx_kl | 0.04734567 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | 0.0369 | -| n_updates | 237860 | -| policy_gradient_loss | 0.0184 | -| std | 0.00601 | -| value_loss | 0.000647 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23788 | -| time_elapsed | 129310 | -| total_timesteps | 3044864 | -| train/ | | -| approx_kl | 0.06792376 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.44 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 237870 | -| policy_gradient_loss | 0.00165 | -| std | 0.00601 | -| value_loss | 0.0194 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 23789 | -| time_elapsed | 129313 | -| total_timesteps | 3044992 | -| train/ | | -| approx_kl | 0.013011832 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | 0.00757 | -| n_updates | 237880 | -| policy_gradient_loss | 0.0137 | -| std | 0.00601 | -| value_loss | 0.00346 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23790 | -| time_elapsed | 129318 | -| total_timesteps | 3045120 | -| train/ | | -| approx_kl | 0.001035939 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | 0.00425 | -| n_updates | 237890 | -| policy_gradient_loss | 0.00569 | -| std | 0.00602 | -| value_loss | 0.0018 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23791 | -| time_elapsed | 129329 | -| total_timesteps | 3045248 | -| train/ | | -| approx_kl | 0.012997497 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.539 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 237900 | -| policy_gradient_loss | 0.00114 | -| std | 0.00602 | -| value_loss | 0.00498 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23792 | -| time_elapsed | 129333 | -| total_timesteps | 3045376 | -| train/ | | -| approx_kl | 2.9985793e-05 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.000504 | -| n_updates | 237910 | -| policy_gradient_loss | 0.052 | -| std | 0.00602 | -| value_loss | 0.000674 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23793 | -| time_elapsed | 129338 | -| total_timesteps | 3045504 | -| train/ | | -| approx_kl | 0.20302527 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 237920 | -| policy_gradient_loss | 0.0532 | -| std | 0.00602 | -| value_loss | 0.000585 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23794 | -| time_elapsed | 129343 | -| total_timesteps | 3045632 | -| train/ | | -| approx_kl | 0.28665057 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 237930 | -| policy_gradient_loss | 0.0313 | -| std | 0.00602 | -| value_loss | 0.000506 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23795 | -| time_elapsed | 129347 | -| total_timesteps | 3045760 | -| train/ | | -| approx_kl | 0.18797617 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 237940 | -| policy_gradient_loss | 0.012 | -| std | 0.00603 | -| value_loss | 0.000224 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23796 | -| time_elapsed | 129353 | -| total_timesteps | 3045888 | -| train/ | | -| approx_kl | 0.0195867 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0681 | -| learning_rate | 0.0003 | -| loss | 0.0057 | -| n_updates | 237950 | -| policy_gradient_loss | 0.00204 | -| std | 0.00604 | -| value_loss | 0.000195 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23797 | -| time_elapsed | 129358 | -| total_timesteps | 3046016 | -| train/ | | -| approx_kl | 0.01949964 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0371 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 237960 | -| policy_gradient_loss | 0.00945 | -| std | 0.00603 | -| value_loss | 0.000179 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23798 | -| time_elapsed | 129370 | -| total_timesteps | 3046144 | -| train/ | | -| approx_kl | 0.005467032 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.735 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 237970 | -| policy_gradient_loss | 0.00853 | -| std | 0.00602 | -| value_loss | 0.00171 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23799 | -| time_elapsed | 129376 | -| total_timesteps | 3046272 | -| train/ | | -| approx_kl | 0.76377153 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 237980 | -| policy_gradient_loss | 0.0542 | -| std | 0.00602 | -| value_loss | 0.000134 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23800 | -| time_elapsed | 129381 | -| total_timesteps | 3046400 | -| train/ | | -| approx_kl | 0.013662083 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00634 | -| n_updates | 237990 | -| policy_gradient_loss | 0.00888 | -| std | 0.00602 | -| value_loss | 0.000126 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23801 | -| time_elapsed | 129386 | -| total_timesteps | 3046528 | -| train/ | | -| approx_kl | 0.09067257 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 238000 | -| policy_gradient_loss | 0.016 | -| std | 0.00602 | -| value_loss | 0.000111 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23802 | -| time_elapsed | 129390 | -| total_timesteps | 3046656 | -| train/ | | -| approx_kl | 0.045958363 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.00766 | -| n_updates | 238010 | -| policy_gradient_loss | 0.00479 | -| std | 0.00602 | -| value_loss | 9.71e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23803 | -| time_elapsed | 129395 | -| total_timesteps | 3046784 | -| train/ | | -| approx_kl | 0.07467181 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 238020 | -| policy_gradient_loss | 0.0195 | -| std | 0.00602 | -| value_loss | 8.67e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23804 | -| time_elapsed | 129400 | -| total_timesteps | 3046912 | -| train/ | | -| approx_kl | 0.010003656 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 238030 | -| policy_gradient_loss | 0.00845 | -| std | 0.00602 | -| value_loss | 4.89e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23805 | -| time_elapsed | 129407 | -| total_timesteps | 3047040 | -| train/ | | -| approx_kl | 0.0026357346 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.00228 | -| n_updates | 238040 | -| policy_gradient_loss | 0.00765 | -| std | 0.00602 | -| value_loss | 4.72e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23806 | -| time_elapsed | 129419 | -| total_timesteps | 3047168 | -| train/ | | -| approx_kl | 0.15156363 | -| clip_fraction | 0.701 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -6.85 | -| learning_rate | 0.0003 | -| loss | 0.00834 | -| n_updates | 238050 | -| policy_gradient_loss | 0.0322 | -| std | 0.00602 | -| value_loss | 0.00497 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23807 | -| time_elapsed | 129424 | -| total_timesteps | 3047296 | -| train/ | | -| approx_kl | 0.12273239 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | 0.0535 | -| n_updates | 238060 | -| policy_gradient_loss | 0.0333 | -| std | 0.00602 | -| value_loss | 3.76e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23808 | -| time_elapsed | 129428 | -| total_timesteps | 3047424 | -| train/ | | -| approx_kl | 1.3634562e-06 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | 7.44e-05 | -| n_updates | 238070 | -| policy_gradient_loss | 0.0251 | -| std | 0.00602 | -| value_loss | 3.49e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23809 | -| time_elapsed | 129434 | -| total_timesteps | 3047552 | -| train/ | | -| approx_kl | 0.00048981793 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.000473 | -| n_updates | 238080 | -| policy_gradient_loss | 0.032 | -| std | 0.00603 | -| value_loss | 2.52e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23810 | -| time_elapsed | 129438 | -| total_timesteps | 3047680 | -| train/ | | -| approx_kl | 0.0011092639 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | -0.00221 | -| n_updates | 238090 | -| policy_gradient_loss | 0.0409 | -| std | 0.00603 | -| value_loss | 2.17e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23811 | -| time_elapsed | 129443 | -| total_timesteps | 3047808 | -| train/ | | -| approx_kl | 0.5417515 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.195 | -| n_updates | 238100 | -| policy_gradient_loss | 0.0778 | -| std | 0.00603 | -| value_loss | 2.12e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23812 | -| time_elapsed | 129447 | -| total_timesteps | 3047936 | -| train/ | | -| approx_kl | 0.008089729 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.00442 | -| n_updates | 238110 | -| policy_gradient_loss | 0.00886 | -| std | 0.00603 | -| value_loss | 1.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23813 | -| time_elapsed | 129451 | -| total_timesteps | 3048064 | -| train/ | | -| approx_kl | 0.002412131 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | -0.00799 | -| n_updates | 238120 | -| policy_gradient_loss | 0.0191 | -| std | 0.00603 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23814 | -| time_elapsed | 129460 | -| total_timesteps | 3048192 | -| train/ | | -| approx_kl | 0.059352655 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 238130 | -| policy_gradient_loss | 0.0348 | -| std | 0.00603 | -| value_loss | 0.000509 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23815 | -| time_elapsed | 129466 | -| total_timesteps | 3048320 | -| train/ | | -| approx_kl | 0.018707117 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0416 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 238140 | -| policy_gradient_loss | 0.0358 | -| std | 0.00602 | -| value_loss | 9.43e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23816 | -| time_elapsed | 129472 | -| total_timesteps | 3048448 | -| train/ | | -| approx_kl | 0.17616704 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.072 | -| n_updates | 238150 | -| policy_gradient_loss | 0.0207 | -| std | 0.00602 | -| value_loss | 7.81e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23817 | -| time_elapsed | 129477 | -| total_timesteps | 3048576 | -| train/ | | -| approx_kl | 0.026522659 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 238160 | -| policy_gradient_loss | 0.0294 | -| std | 0.00602 | -| value_loss | 7.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23818 | -| time_elapsed | 129482 | -| total_timesteps | 3048704 | -| train/ | | -| approx_kl | 0.09869294 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.013 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 238170 | -| policy_gradient_loss | 0.0205 | -| std | 0.00603 | -| value_loss | 6.42e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23819 | -| time_elapsed | 129487 | -| total_timesteps | 3048832 | -| train/ | | -| approx_kl | 0.00018464308 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00078 | -| n_updates | 238180 | -| policy_gradient_loss | 0.0319 | -| std | 0.00603 | -| value_loss | 5.26e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23820 | -| time_elapsed | 129492 | -| total_timesteps | 3048960 | -| train/ | | -| approx_kl | 0.0006984826 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 5.85e-05 | -| n_updates | 238190 | -| policy_gradient_loss | 0.037 | -| std | 0.00603 | -| value_loss | 1.44e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23821 | -| time_elapsed | 129497 | -| total_timesteps | 3049088 | -| train/ | | -| approx_kl | 0.5527194 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 238200 | -| policy_gradient_loss | 0.067 | -| std | 0.00603 | -| value_loss | 9.39e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23822 | -| time_elapsed | 129507 | -| total_timesteps | 3049216 | -| train/ | | -| approx_kl | 0.053553175 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 238210 | -| policy_gradient_loss | -0.0055 | -| std | 0.00603 | -| value_loss | 0.000119 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23823 | -| time_elapsed | 129512 | -| total_timesteps | 3049344 | -| train/ | | -| approx_kl | 0.16023415 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00664 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 238220 | -| policy_gradient_loss | 0.0846 | -| std | 0.00603 | -| value_loss | 1.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23824 | -| time_elapsed | 129518 | -| total_timesteps | 3049472 | -| train/ | | -| approx_kl | 0.015355643 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 238230 | -| policy_gradient_loss | 0.0157 | -| std | 0.00602 | -| value_loss | 7.79e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23825 | -| time_elapsed | 129522 | -| total_timesteps | 3049600 | -| train/ | | -| approx_kl | 0.0009872364 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.00466 | -| n_updates | 238240 | -| policy_gradient_loss | 0.0072 | -| std | 0.00601 | -| value_loss | 4.27e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23826 | -| time_elapsed | 129526 | -| total_timesteps | 3049728 | -| train/ | | -| approx_kl | 0.072577305 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 238250 | -| policy_gradient_loss | 0.0155 | -| std | 0.00601 | -| value_loss | 4.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23827 | -| time_elapsed | 129530 | -| total_timesteps | 3049856 | -| train/ | | -| approx_kl | 0.008637556 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 238260 | -| policy_gradient_loss | 0.00305 | -| std | 0.00602 | -| value_loss | 3.53e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23828 | -| time_elapsed | 129534 | -| total_timesteps | 3049984 | -| train/ | | -| approx_kl | 0.0030063274 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 238270 | -| policy_gradient_loss | 0.00741 | -| std | 0.00602 | -| value_loss | 2.49e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23829 | -| time_elapsed | 129538 | -| total_timesteps | 3050112 | -| train/ | | -| approx_kl | 0.037748426 | -| clip_fraction | 0.621 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 238280 | -| policy_gradient_loss | 0.107 | -| std | 0.00602 | -| value_loss | 1.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23830 | -| time_elapsed | 129550 | -| total_timesteps | 3050240 | -| train/ | | -| approx_kl | 0.03128578 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.977 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 238290 | -| policy_gradient_loss | 0.041 | -| std | 0.00603 | -| value_loss | 0.000233 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23831 | -| time_elapsed | 129555 | -| total_timesteps | 3050368 | -| train/ | | -| approx_kl | 0.15875115 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.805 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 238300 | -| policy_gradient_loss | 0.0328 | -| std | 0.00603 | -| value_loss | 1.72e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23832 | -| time_elapsed | 129560 | -| total_timesteps | 3050496 | -| train/ | | -| approx_kl | 0.0062597883 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.42 | -| learning_rate | 0.0003 | -| loss | 0.00541 | -| n_updates | 238310 | -| policy_gradient_loss | 0.00411 | -| std | 0.00603 | -| value_loss | 1.21e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23833 | -| time_elapsed | 129564 | -| total_timesteps | 3050624 | -| train/ | | -| approx_kl | 0.3474213 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.427 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 238320 | -| policy_gradient_loss | 0.0376 | -| std | 0.00605 | -| value_loss | 3.13e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23834 | -| time_elapsed | 129568 | -| total_timesteps | 3050752 | -| train/ | | -| approx_kl | 0.08266733 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.403 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 238330 | -| policy_gradient_loss | 0.0111 | -| std | 0.00606 | -| value_loss | 5.87e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23835 | -| time_elapsed | 129571 | -| total_timesteps | 3050880 | -| train/ | | -| approx_kl | 0.050186824 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 238340 | -| policy_gradient_loss | 0.0146 | -| std | 0.00606 | -| value_loss | 1.9e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23836 | -| time_elapsed | 129575 | -| total_timesteps | 3051008 | -| train/ | | -| approx_kl | 0.06634918 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0628 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 238350 | -| policy_gradient_loss | 0.00492 | -| std | 0.00606 | -| value_loss | 1.83e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23837 | -| time_elapsed | 129583 | -| total_timesteps | 3051136 | -| train/ | | -| approx_kl | 0.041673876 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.853 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 238360 | -| policy_gradient_loss | -0.000386 | -| std | 0.00606 | -| value_loss | 0.00262 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23838 | -| time_elapsed | 129587 | -| total_timesteps | 3051264 | -| train/ | | -| approx_kl | 0.7486057 | -| clip_fraction | 0.773 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.479 | -| learning_rate | 0.0003 | -| loss | 0.263 | -| n_updates | 238370 | -| policy_gradient_loss | 0.117 | -| std | 0.00606 | -| value_loss | 1.39e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23839 | -| time_elapsed | 129591 | -| total_timesteps | 3051392 | -| train/ | | -| approx_kl | 0.013495778 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00756 | -| learning_rate | 0.0003 | -| loss | 0.00162 | -| n_updates | 238380 | -| policy_gradient_loss | 0.0481 | -| std | 0.00606 | -| value_loss | 2.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23840 | -| time_elapsed | 129595 | -| total_timesteps | 3051520 | -| train/ | | -| approx_kl | 0.11995439 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00469 | -| learning_rate | 0.0003 | -| loss | 0.0631 | -| n_updates | 238390 | -| policy_gradient_loss | 0.0327 | -| std | 0.00607 | -| value_loss | 1.56e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23841 | -| time_elapsed | 129598 | -| total_timesteps | 3051648 | -| train/ | | -| approx_kl | 0.7283074 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0133 | -| learning_rate | 0.0003 | -| loss | 0.0969 | -| n_updates | 238400 | -| policy_gradient_loss | 0.0379 | -| std | 0.00607 | -| value_loss | 1.23e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23842 | -| time_elapsed | 129603 | -| total_timesteps | 3051776 | -| train/ | | -| approx_kl | 0.01604703 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.00253 | -| n_updates | 238410 | -| policy_gradient_loss | 0.00735 | -| std | 0.00607 | -| value_loss | 9.68e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23843 | -| time_elapsed | 129608 | -| total_timesteps | 3051904 | -| train/ | | -| approx_kl | 0.00428067 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.00196 | -| n_updates | 238420 | -| policy_gradient_loss | 0.0106 | -| std | 0.00607 | -| value_loss | 8.09e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23844 | -| time_elapsed | 129612 | -| total_timesteps | 3052032 | -| train/ | | -| approx_kl | 0.0018387125 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.000839 | -| n_updates | 238430 | -| policy_gradient_loss | 0.00929 | -| std | 0.00607 | -| value_loss | 5.3e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23845 | -| time_elapsed | 129622 | -| total_timesteps | 3052160 | -| train/ | | -| approx_kl | 0.023143211 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.37 | -| learning_rate | 0.0003 | -| loss | -0.0184 | -| n_updates | 238440 | -| policy_gradient_loss | -0.0107 | -| std | 0.00608 | -| value_loss | 0.00223 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23846 | -| time_elapsed | 129627 | -| total_timesteps | 3052288 | -| train/ | | -| approx_kl | 0.13560562 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0592 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 238450 | -| policy_gradient_loss | 0.119 | -| std | 0.00608 | -| value_loss | 1.13e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23847 | -| time_elapsed | 129631 | -| total_timesteps | 3052416 | -| train/ | | -| approx_kl | 0.14620207 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00862 | -| learning_rate | 0.0003 | -| loss | 0.091 | -| n_updates | 238460 | -| policy_gradient_loss | 0.177 | -| std | 0.00608 | -| value_loss | 2.54e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23848 | -| time_elapsed | 129636 | -| total_timesteps | 3052544 | -| train/ | | -| approx_kl | 0.028585445 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00233 | -| learning_rate | 0.0003 | -| loss | 0.00588 | -| n_updates | 238470 | -| policy_gradient_loss | 0.0197 | -| std | 0.00609 | -| value_loss | 1.73e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23849 | -| time_elapsed | 129641 | -| total_timesteps | 3052672 | -| train/ | | -| approx_kl | 0.0005234638 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 0.00163 | -| n_updates | 238480 | -| policy_gradient_loss | 0.0256 | -| std | 0.00609 | -| value_loss | 1.31e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23850 | -| time_elapsed | 129645 | -| total_timesteps | 3052800 | -| train/ | | -| approx_kl | 0.00095061446 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.000961 | -| n_updates | 238490 | -| policy_gradient_loss | 0.0165 | -| std | 0.0061 | -| value_loss | 7e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23851 | -| time_elapsed | 129652 | -| total_timesteps | 3052928 | -| train/ | | -| approx_kl | 0.5274452 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 238500 | -| policy_gradient_loss | 0.0992 | -| std | 0.0061 | -| value_loss | 5.99e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23852 | -| time_elapsed | 129658 | -| total_timesteps | 3053056 | -| train/ | | -| approx_kl | 0.006611618 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.000608 | -| n_updates | 238510 | -| policy_gradient_loss | 0.00493 | -| std | 0.00611 | -| value_loss | 3.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23853 | -| time_elapsed | 129668 | -| total_timesteps | 3053184 | -| train/ | | -| approx_kl | 0.010862121 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.785 | -| learning_rate | 0.0003 | -| loss | -0.00918 | -| n_updates | 238520 | -| policy_gradient_loss | -0.00224 | -| std | 0.0061 | -| value_loss | 0.00583 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23854 | -| time_elapsed | 129673 | -| total_timesteps | 3053312 | -| train/ | | -| approx_kl | 0.00656647 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -21.1 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 238530 | -| policy_gradient_loss | 0.00429 | -| std | 0.0061 | -| value_loss | 1.16e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23855 | -| time_elapsed | 129678 | -| total_timesteps | 3053440 | -| train/ | | -| approx_kl | 0.025553176 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 238540 | -| policy_gradient_loss | 0.0163 | -| std | 0.00612 | -| value_loss | 3.88e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23856 | -| time_elapsed | 129682 | -| total_timesteps | 3053568 | -| train/ | | -| approx_kl | 0.0397951 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0711 | -| learning_rate | 0.0003 | -| loss | -0.00512 | -| n_updates | 238550 | -| policy_gradient_loss | 0.0213 | -| std | 0.00613 | -| value_loss | 2.1e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23857 | -| time_elapsed | 129688 | -| total_timesteps | 3053696 | -| train/ | | -| approx_kl | 0.97548157 | -| clip_fraction | 0.751 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.441 | -| n_updates | 238560 | -| policy_gradient_loss | 0.189 | -| std | 0.00614 | -| value_loss | 2.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23858 | -| time_elapsed | 129694 | -| total_timesteps | 3053824 | -| train/ | | -| approx_kl | 0.024915524 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 238570 | -| policy_gradient_loss | 0.026 | -| std | 0.00612 | -| value_loss | 2.43e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 23859 | -| time_elapsed | 129700 | -| total_timesteps | 3053952 | -| train/ | | -| approx_kl | 0.19719422 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.293 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 238580 | -| policy_gradient_loss | 0.0214 | -| std | 0.00611 | -| value_loss | 4.27e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23860 | -| time_elapsed | 129705 | -| total_timesteps | 3054080 | -| train/ | | -| approx_kl | 0.016146066 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0864 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 238590 | -| policy_gradient_loss | -0.00664 | -| std | 0.00611 | -| value_loss | 2.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23861 | -| time_elapsed | 129715 | -| total_timesteps | 3054208 | -| train/ | | -| approx_kl | 0.003980785 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 238600 | -| policy_gradient_loss | 0.00414 | -| std | 0.0061 | -| value_loss | 0.0045 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23862 | -| time_elapsed | 129720 | -| total_timesteps | 3054336 | -| train/ | | -| approx_kl | 0.50637746 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 238610 | -| policy_gradient_loss | 0.057 | -| std | 0.0061 | -| value_loss | 4.16e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23863 | -| time_elapsed | 129724 | -| total_timesteps | 3054464 | -| train/ | | -| approx_kl | 0.0501716 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0119 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 238620 | -| policy_gradient_loss | 0.0144 | -| std | 0.00611 | -| value_loss | 9.08e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23864 | -| time_elapsed | 129729 | -| total_timesteps | 3054592 | -| train/ | | -| approx_kl | 0.048235077 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 238630 | -| policy_gradient_loss | 0.00993 | -| std | 0.00611 | -| value_loss | 3.05e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23865 | -| time_elapsed | 129733 | -| total_timesteps | 3054720 | -| train/ | | -| approx_kl | 0.010082 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | -0.00409 | -| n_updates | 238640 | -| policy_gradient_loss | 0.00946 | -| std | 0.00611 | -| value_loss | 3.09e-07 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23866 | -| time_elapsed | 129738 | -| total_timesteps | 3054848 | -| train/ | | -| approx_kl | 0.06923734 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 238650 | -| policy_gradient_loss | 0.00374 | -| std | 0.00611 | -| value_loss | 2.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23867 | -| time_elapsed | 129743 | -| total_timesteps | 3054976 | -| train/ | | -| approx_kl | 0.04476691 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 238660 | -| policy_gradient_loss | 0.0142 | -| std | 0.00611 | -| value_loss | 2.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23868 | -| time_elapsed | 129748 | -| total_timesteps | 3055104 | -| train/ | | -| approx_kl | 0.008772235 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | -0.000984 | -| n_updates | 238670 | -| policy_gradient_loss | 0.00969 | -| std | 0.00611 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23869 | -| time_elapsed | 129761 | -| total_timesteps | 3055232 | -| train/ | | -| approx_kl | 0.006555342 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.925 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 238680 | -| policy_gradient_loss | -0.0088 | -| std | 0.00611 | -| value_loss | 0.0011 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23870 | -| time_elapsed | 129766 | -| total_timesteps | 3055360 | -| train/ | | -| approx_kl | 0.0001383773 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.000834 | -| n_updates | 238690 | -| policy_gradient_loss | 0.0402 | -| std | 0.00611 | -| value_loss | 4.25e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23871 | -| time_elapsed | 129770 | -| total_timesteps | 3055488 | -| train/ | | -| approx_kl | 0.7170465 | -| clip_fraction | 0.762 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.245 | -| n_updates | 238700 | -| policy_gradient_loss | 0.146 | -| std | 0.00611 | -| value_loss | 1.64e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23872 | -| time_elapsed | 129775 | -| total_timesteps | 3055616 | -| train/ | | -| approx_kl | 0.014643662 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00111 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 238710 | -| policy_gradient_loss | 0.0323 | -| std | 0.00611 | -| value_loss | 1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23873 | -| time_elapsed | 129780 | -| total_timesteps | 3055744 | -| train/ | | -| approx_kl | 0.12523696 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0126 | -| learning_rate | 0.0003 | -| loss | 0.0589 | -| n_updates | 238720 | -| policy_gradient_loss | 0.0315 | -| std | 0.00612 | -| value_loss | 8.76e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23874 | -| time_elapsed | 129785 | -| total_timesteps | 3055872 | -| train/ | | -| approx_kl | 4.8676506e-05 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00076 | -| n_updates | 238730 | -| policy_gradient_loss | 0.0275 | -| std | 0.00612 | -| value_loss | 7.62e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23875 | -| time_elapsed | 129791 | -| total_timesteps | 3056000 | -| train/ | | -| approx_kl | 0.6342959 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 238740 | -| policy_gradient_loss | 0.0653 | -| std | 0.00612 | -| value_loss | 5.77e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23876 | -| time_elapsed | 129795 | -| total_timesteps | 3056128 | -| train/ | | -| approx_kl | 0.05296622 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00401 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 238750 | -| policy_gradient_loss | 0.0105 | -| std | 0.00612 | -| value_loss | 2.35e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23877 | -| time_elapsed | 129805 | -| total_timesteps | 3056256 | -| train/ | | -| approx_kl | 0.009865828 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.00568 | -| n_updates | 238760 | -| policy_gradient_loss | -0.00667 | -| std | 0.00612 | -| value_loss | 0.002 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23878 | -| time_elapsed | 129810 | -| total_timesteps | 3056384 | -| train/ | | -| approx_kl | 0.07230501 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00462 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 238770 | -| policy_gradient_loss | 0.00354 | -| std | 0.00612 | -| value_loss | 4.44e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23879 | -| time_elapsed | 129816 | -| total_timesteps | 3056512 | -| train/ | | -| approx_kl | 0.05533545 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0127 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 238780 | -| policy_gradient_loss | 0.0153 | -| std | 0.00612 | -| value_loss | 1.82e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23880 | -| time_elapsed | 129821 | -| total_timesteps | 3056640 | -| train/ | | -| approx_kl | 0.0076735932 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00387 | -| learning_rate | 0.0003 | -| loss | -0.00836 | -| n_updates | 238790 | -| policy_gradient_loss | 0.00563 | -| std | 0.00612 | -| value_loss | 1.09e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23881 | -| time_elapsed | 129825 | -| total_timesteps | 3056768 | -| train/ | | -| approx_kl | 0.0012107855 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.00392 | -| n_updates | 238800 | -| policy_gradient_loss | 0.00487 | -| std | 0.00612 | -| value_loss | 7.11e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23882 | -| time_elapsed | 129829 | -| total_timesteps | 3056896 | -| train/ | | -| approx_kl | 0.062709816 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 238810 | -| policy_gradient_loss | 0.0134 | -| std | 0.00612 | -| value_loss | 6.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23883 | -| time_elapsed | 129835 | -| total_timesteps | 3057024 | -| train/ | | -| approx_kl | 0.047740392 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 238820 | -| policy_gradient_loss | 0.0191 | -| std | 0.00612 | -| value_loss | 4.99e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23884 | -| time_elapsed | 129844 | -| total_timesteps | 3057152 | -| train/ | | -| approx_kl | 0.00072625745 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | 0.00381 | -| n_updates | 238830 | -| policy_gradient_loss | -0.00125 | -| std | 0.00612 | -| value_loss | 0.00623 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23885 | -| time_elapsed | 129851 | -| total_timesteps | 3057280 | -| train/ | | -| approx_kl | 0.10229096 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 238840 | -| policy_gradient_loss | 0.0279 | -| std | 0.00609 | -| value_loss | 2.24e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23886 | -| time_elapsed | 129856 | -| total_timesteps | 3057408 | -| train/ | | -| approx_kl | 0.020721361 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -30.9 | -| learning_rate | 0.0003 | -| loss | -0.0191 | -| n_updates | 238850 | -| policy_gradient_loss | -0.00183 | -| std | 0.00608 | -| value_loss | 1.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23887 | -| time_elapsed | 129862 | -| total_timesteps | 3057536 | -| train/ | | -| approx_kl | 0.13818946 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -5.68 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 238860 | -| policy_gradient_loss | 0.036 | -| std | 0.00608 | -| value_loss | 5.18e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23888 | -| time_elapsed | 129866 | -| total_timesteps | 3057664 | -| train/ | | -| approx_kl | 0.34251904 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 238870 | -| policy_gradient_loss | 0.144 | -| std | 0.00608 | -| value_loss | 1.66e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23889 | -| time_elapsed | 129870 | -| total_timesteps | 3057792 | -| train/ | | -| approx_kl | 0.20366497 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 238880 | -| policy_gradient_loss | 0.1 | -| std | 0.00608 | -| value_loss | 1.86e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23890 | -| time_elapsed | 129874 | -| total_timesteps | 3057920 | -| train/ | | -| approx_kl | 0.032608677 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 238890 | -| policy_gradient_loss | 0.023 | -| std | 0.00608 | -| value_loss | 1.7e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23891 | -| time_elapsed | 129878 | -| total_timesteps | 3058048 | -| train/ | | -| approx_kl | 0.6713778 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0176 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 238900 | -| policy_gradient_loss | 0.0462 | -| std | 0.00608 | -| value_loss | 1.6e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23892 | -| time_elapsed | 129889 | -| total_timesteps | 3058176 | -| train/ | | -| approx_kl | 0.007526674 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.00902 | -| n_updates | 238910 | -| policy_gradient_loss | -0.00664 | -| std | 0.00608 | -| value_loss | 0.0027 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23893 | -| time_elapsed | 129894 | -| total_timesteps | 3058304 | -| train/ | | -| approx_kl | 0.074256234 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.375 | -| learning_rate | 0.0003 | -| loss | 0.0403 | -| n_updates | 238920 | -| policy_gradient_loss | 0.0161 | -| std | 0.00608 | -| value_loss | 1.08e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23894 | -| time_elapsed | 129899 | -| total_timesteps | 3058432 | -| train/ | | -| approx_kl | 0.011553137 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | -0.00625 | -| n_updates | 238930 | -| policy_gradient_loss | 0.00605 | -| std | 0.00608 | -| value_loss | 2.83e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23895 | -| time_elapsed | 129904 | -| total_timesteps | 3058560 | -| train/ | | -| approx_kl | 0.0008206959 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00585 | -| learning_rate | 0.0003 | -| loss | 0.00478 | -| n_updates | 238940 | -| policy_gradient_loss | 0.00248 | -| std | 0.00608 | -| value_loss | 1.58e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23896 | -| time_elapsed | 129909 | -| total_timesteps | 3058688 | -| train/ | | -| approx_kl | 0.059225004 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 238950 | -| policy_gradient_loss | 0.0186 | -| std | 0.00608 | -| value_loss | 8.25e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23897 | -| time_elapsed | 129914 | -| total_timesteps | 3058816 | -| train/ | | -| approx_kl | 0.05046925 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 238960 | -| policy_gradient_loss | 0.013 | -| std | 0.00609 | -| value_loss | 4.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.98 | -| time/ | | -| fps | 23 | -| iterations | 23898 | -| time_elapsed | 129919 | -| total_timesteps | 3058944 | -| train/ | | -| approx_kl | 0.010066405 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.00362 | -| n_updates | 238970 | -| policy_gradient_loss | 0.012 | -| std | 0.00611 | -| value_loss | 5.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23899 | -| time_elapsed | 129923 | -| total_timesteps | 3059072 | -| train/ | | -| approx_kl | 0.002650416 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 238980 | -| policy_gradient_loss | 0.0106 | -| std | 0.00611 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23900 | -| time_elapsed | 129932 | -| total_timesteps | 3059200 | -| train/ | | -| approx_kl | 0.025515074 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.204 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 238990 | -| policy_gradient_loss | -0.00488 | -| std | 0.00612 | -| value_loss | 0.00226 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23901 | -| time_elapsed | 129937 | -| total_timesteps | 3059328 | -| train/ | | -| approx_kl | 0.22454576 | -| clip_fraction | 0.536 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 239000 | -| policy_gradient_loss | 0.0758 | -| std | 0.00612 | -| value_loss | 1.87e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23902 | -| time_elapsed | 129942 | -| total_timesteps | 3059456 | -| train/ | | -| approx_kl | 0.045675628 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.661 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 239010 | -| policy_gradient_loss | 0.0498 | -| std | 0.00612 | -| value_loss | 3.41e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23903 | -| time_elapsed | 129947 | -| total_timesteps | 3059584 | -| train/ | | -| approx_kl | 0.18798277 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0104 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 239020 | -| policy_gradient_loss | 0.065 | -| std | 0.00612 | -| value_loss | 1.27e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23904 | -| time_elapsed | 129952 | -| total_timesteps | 3059712 | -| train/ | | -| approx_kl | 0.00014013983 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.000841 | -| learning_rate | 0.0003 | -| loss | 7.05e-05 | -| n_updates | 239030 | -| policy_gradient_loss | 0.0181 | -| std | 0.00611 | -| value_loss | 4.22e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23905 | -| time_elapsed | 129957 | -| total_timesteps | 3059840 | -| train/ | | -| approx_kl | 0.059300903 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 239040 | -| policy_gradient_loss | 0.0343 | -| std | 0.00611 | -| value_loss | 3.53e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 23906 | -| time_elapsed | 129961 | -| total_timesteps | 3059968 | -| train/ | | -| approx_kl | 2.0353217 | -| clip_fraction | 0.764 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.546 | -| n_updates | 239050 | -| policy_gradient_loss | 0.282 | -| std | 0.00611 | -| value_loss | 1.34e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23907 | -| time_elapsed | 129966 | -| total_timesteps | 3060096 | -| train/ | | -| approx_kl | 0.008410437 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -1.41 | -| learning_rate | 0.0003 | -| loss | -0.00936 | -| n_updates | 239060 | -| policy_gradient_loss | 0.0118 | -| std | 0.00611 | -| value_loss | 1.22e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23908 | -| time_elapsed | 129977 | -| total_timesteps | 3060224 | -| train/ | | -| approx_kl | 0.018436447 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -2.22 | -| learning_rate | 0.0003 | -| loss | -0.0258 | -| n_updates | 239070 | -| policy_gradient_loss | -0.00741 | -| std | 0.00611 | -| value_loss | 0.00334 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23909 | -| time_elapsed | 129984 | -| total_timesteps | 3060352 | -| train/ | | -| approx_kl | 0.0017686551 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0145 | -| learning_rate | 0.0003 | -| loss | -0.00463 | -| n_updates | 239080 | -| policy_gradient_loss | 0.0952 | -| std | 0.00611 | -| value_loss | 5.78e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23910 | -| time_elapsed | 129989 | -| total_timesteps | 3060480 | -| train/ | | -| approx_kl | 0.13160428 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 239090 | -| policy_gradient_loss | 0.165 | -| std | 0.00611 | -| value_loss | 1.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23911 | -| time_elapsed | 129994 | -| total_timesteps | 3060608 | -| train/ | | -| approx_kl | 0.021912854 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00364 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 239100 | -| policy_gradient_loss | 0.0214 | -| std | 0.00611 | -| value_loss | 4.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23912 | -| time_elapsed | 129999 | -| total_timesteps | 3060736 | -| train/ | | -| approx_kl | 0.018454457 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.00989 | -| n_updates | 239110 | -| policy_gradient_loss | 0.00419 | -| std | 0.00611 | -| value_loss | 2.46e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23913 | -| time_elapsed | 130004 | -| total_timesteps | 3060864 | -| train/ | | -| approx_kl | 0.016963057 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | -0.0052 | -| n_updates | 239120 | -| policy_gradient_loss | -0.00288 | -| std | 0.00611 | -| value_loss | 4.93e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.986 | -| time/ | | -| fps | 23 | -| iterations | 23914 | -| time_elapsed | 130011 | -| total_timesteps | 3060992 | -| train/ | | -| approx_kl | 0.033495195 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00384 | -| learning_rate | 0.0003 | -| loss | 0.00411 | -| n_updates | 239130 | -| policy_gradient_loss | 0.023 | -| std | 0.00611 | -| value_loss | 2.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23915 | -| time_elapsed | 130017 | -| total_timesteps | 3061120 | -| train/ | | -| approx_kl | 0.13597913 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0589 | -| n_updates | 239140 | -| policy_gradient_loss | 0.0287 | -| std | 0.00611 | -| value_loss | 1.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23916 | -| time_elapsed | 130030 | -| total_timesteps | 3061248 | -| train/ | | -| approx_kl | 0.26101092 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 239150 | -| policy_gradient_loss | 0.0015 | -| std | 0.00611 | -| value_loss | 0.000223 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23917 | -| time_elapsed | 130036 | -| total_timesteps | 3061376 | -| train/ | | -| approx_kl | 0.46487784 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.194 | -| n_updates | 239160 | -| policy_gradient_loss | 0.08 | -| std | 0.00611 | -| value_loss | 4.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23918 | -| time_elapsed | 130041 | -| total_timesteps | 3061504 | -| train/ | | -| approx_kl | 0.094275095 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0128 | -| n_updates | 239170 | -| policy_gradient_loss | 0.00218 | -| std | 0.00611 | -| value_loss | 3.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23919 | -| time_elapsed | 130046 | -| total_timesteps | 3061632 | -| train/ | | -| approx_kl | 0.012838749 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 239180 | -| policy_gradient_loss | 0.00617 | -| std | 0.00611 | -| value_loss | 3.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23920 | -| time_elapsed | 130050 | -| total_timesteps | 3061760 | -| train/ | | -| approx_kl | 0.07924204 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0261 | -| learning_rate | 0.0003 | -| loss | 0.0319 | -| n_updates | 239190 | -| policy_gradient_loss | 0.0113 | -| std | 0.00611 | -| value_loss | 3.09e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.972 | -| time/ | | -| fps | 23 | -| iterations | 23921 | -| time_elapsed | 130054 | -| total_timesteps | 3061888 | -| train/ | | -| approx_kl | 0.010715365 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.00021 | -| n_updates | 239200 | -| policy_gradient_loss | 0.00672 | -| std | 0.00611 | -| value_loss | 2.48e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23922 | -| time_elapsed | 130059 | -| total_timesteps | 3062016 | -| train/ | | -| approx_kl | 0.07050753 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 239210 | -| policy_gradient_loss | -0.0105 | -| std | 0.00611 | -| value_loss | 2.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23923 | -| time_elapsed | 130075 | -| total_timesteps | 3062144 | -| train/ | | -| approx_kl | 0.070017226 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 239220 | -| policy_gradient_loss | 0.01 | -| std | 0.00611 | -| value_loss | 0.00032 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23924 | -| time_elapsed | 130083 | -| total_timesteps | 3062272 | -| train/ | | -| approx_kl | 0.07126361 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00237 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 239230 | -| policy_gradient_loss | 0.00173 | -| std | 0.00611 | -| value_loss | 5.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23925 | -| time_elapsed | 130090 | -| total_timesteps | 3062400 | -| train/ | | -| approx_kl | 0.048849527 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 239240 | -| policy_gradient_loss | 0.0149 | -| std | 0.0061 | -| value_loss | 5.63e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23926 | -| time_elapsed | 130096 | -| total_timesteps | 3062528 | -| train/ | | -| approx_kl | 0.008710223 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00413 | -| learning_rate | 0.0003 | -| loss | -0.00365 | -| n_updates | 239250 | -| policy_gradient_loss | 0.00753 | -| std | 0.0061 | -| value_loss | 2.42e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23927 | -| time_elapsed | 130102 | -| total_timesteps | 3062656 | -| train/ | | -| approx_kl | 0.0011857697 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.00648 | -| n_updates | 239260 | -| policy_gradient_loss | 0.00441 | -| std | 0.0061 | -| value_loss | 2.17e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23928 | -| time_elapsed | 130107 | -| total_timesteps | 3062784 | -| train/ | | -| approx_kl | 0.07742571 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 239270 | -| policy_gradient_loss | 0.00648 | -| std | 0.00609 | -| value_loss | 1.83e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23929 | -| time_elapsed | 130111 | -| total_timesteps | 3062912 | -| train/ | | -| approx_kl | 0.011397418 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00692 | -| n_updates | 239280 | -| policy_gradient_loss | 0.00818 | -| std | 0.00609 | -| value_loss | 1.72e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23930 | -| time_elapsed | 130115 | -| total_timesteps | 3063040 | -| train/ | | -| approx_kl | 0.0780487 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.0484 | -| n_updates | 239290 | -| policy_gradient_loss | 0.0198 | -| std | 0.00609 | -| value_loss | 1.33e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23931 | -| time_elapsed | 130126 | -| total_timesteps | 3063168 | -| train/ | | -| approx_kl | 0.015554268 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 239300 | -| policy_gradient_loss | -0.0181 | -| std | 0.00609 | -| value_loss | 0.00221 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23932 | -| time_elapsed | 130130 | -| total_timesteps | 3063296 | -| train/ | | -| approx_kl | 0.06692013 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 239310 | -| policy_gradient_loss | 0.0105 | -| std | 0.00609 | -| value_loss | 5.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23933 | -| time_elapsed | 130135 | -| total_timesteps | 3063424 | -| train/ | | -| approx_kl | 0.010096801 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00852 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 239320 | -| policy_gradient_loss | 0.0056 | -| std | 0.00609 | -| value_loss | 1.45e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23934 | -| time_elapsed | 130141 | -| total_timesteps | 3063552 | -| train/ | | -| approx_kl | 0.0026394436 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00053 | -| learning_rate | 0.0003 | -| loss | -6.12e-05 | -| n_updates | 239330 | -| policy_gradient_loss | 0.0107 | -| std | 0.00609 | -| value_loss | 2.02e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23935 | -| time_elapsed | 130146 | -| total_timesteps | 3063680 | -| train/ | | -| approx_kl | 0.0032844045 | -| clip_fraction | 0.0414 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00194 | -| n_updates | 239340 | -| policy_gradient_loss | -0.000368 | -| std | 0.00608 | -| value_loss | 0.000104 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23936 | -| time_elapsed | 130153 | -| total_timesteps | 3063808 | -| train/ | | -| approx_kl | 0.41339874 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0146 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 239350 | -| policy_gradient_loss | 0.13 | -| std | 0.00609 | -| value_loss | 9.8e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 23937 | -| time_elapsed | 130158 | -| total_timesteps | 3063936 | -| train/ | | -| approx_kl | 0.08126305 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -2.9 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 239360 | -| policy_gradient_loss | 0.0136 | -| std | 0.00609 | -| value_loss | 4.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23938 | -| time_elapsed | 130163 | -| total_timesteps | 3064064 | -| train/ | | -| approx_kl | 0.18128657 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0135 | -| learning_rate | 0.0003 | -| loss | 0.084 | -| n_updates | 239370 | -| policy_gradient_loss | 0.0267 | -| std | 0.00609 | -| value_loss | 1.02e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23939 | -| time_elapsed | 130171 | -| total_timesteps | 3064192 | -| train/ | | -| approx_kl | 0.03420724 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.0218 | -| n_updates | 239380 | -| policy_gradient_loss | 0.00243 | -| std | 0.00609 | -| value_loss | 0.00032 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23940 | -| time_elapsed | 130177 | -| total_timesteps | 3064320 | -| train/ | | -| approx_kl | 0.003818376 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.000978 | -| n_updates | 239390 | -| policy_gradient_loss | 0.0292 | -| std | 0.00612 | -| value_loss | 5.39e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23941 | -| time_elapsed | 130182 | -| total_timesteps | 3064448 | -| train/ | | -| approx_kl | 0.25259954 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -4.67 | -| learning_rate | 0.0003 | -| loss | 0.0726 | -| n_updates | 239400 | -| policy_gradient_loss | 0.0324 | -| std | 0.00613 | -| value_loss | 6.3e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23942 | -| time_elapsed | 130185 | -| total_timesteps | 3064576 | -| train/ | | -| approx_kl | 0.3271724 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00974 | -| learning_rate | 0.0003 | -| loss | 0.311 | -| n_updates | 239410 | -| policy_gradient_loss | 0.0607 | -| std | 0.00613 | -| value_loss | 1.43e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23943 | -| time_elapsed | 130188 | -| total_timesteps | 3064704 | -| train/ | | -| approx_kl | 0.0033977907 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00215 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 239420 | -| policy_gradient_loss | 0.0435 | -| std | 0.00612 | -| value_loss | 1.08e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23944 | -| time_elapsed | 130192 | -| total_timesteps | 3064832 | -| train/ | | -| approx_kl | 0.0181903 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.97 | -| learning_rate | 0.0003 | -| loss | 0.00485 | -| n_updates | 239430 | -| policy_gradient_loss | 0.00155 | -| std | 0.0061 | -| value_loss | 7.86e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 23945 | -| time_elapsed | 130196 | -| total_timesteps | 3064960 | -| train/ | | -| approx_kl | 0.030491214 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -4.35 | -| learning_rate | 0.0003 | -| loss | -0.0216 | -| n_updates | 239440 | -| policy_gradient_loss | 0.0102 | -| std | 0.00609 | -| value_loss | 2.51e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23946 | -| time_elapsed | 130200 | -| total_timesteps | 3065088 | -| train/ | | -| approx_kl | 0.40825662 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0138 | -| learning_rate | 0.0003 | -| loss | 0.25 | -| n_updates | 239450 | -| policy_gradient_loss | 0.163 | -| std | 0.00608 | -| value_loss | 8.95e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23947 | -| time_elapsed | 130210 | -| total_timesteps | 3065216 | -| train/ | | -| approx_kl | 0.057549763 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 239460 | -| policy_gradient_loss | 0.017 | -| std | 0.00608 | -| value_loss | 0.00101 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23948 | -| time_elapsed | 130216 | -| total_timesteps | 3065344 | -| train/ | | -| approx_kl | 0.00011088373 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.000745 | -| n_updates | 239470 | -| policy_gradient_loss | 0.0366 | -| std | 0.00608 | -| value_loss | 1.38e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23949 | -| time_elapsed | 130221 | -| total_timesteps | 3065472 | -| train/ | | -| approx_kl | 0.6419603 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00526 | -| learning_rate | 0.0003 | -| loss | 0.233 | -| n_updates | 239480 | -| policy_gradient_loss | 0.0742 | -| std | 0.00608 | -| value_loss | 3.36e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23950 | -| time_elapsed | 130227 | -| total_timesteps | 3065600 | -| train/ | | -| approx_kl | 0.0124623235 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -3.76e-05 | -| learning_rate | 0.0003 | -| loss | 0.000483 | -| n_updates | 239490 | -| policy_gradient_loss | 0.00921 | -| std | 0.00608 | -| value_loss | 2.07e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23951 | -| time_elapsed | 130234 | -| total_timesteps | 3065728 | -| train/ | | -| approx_kl | 0.07361691 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 239500 | -| policy_gradient_loss | 0.0169 | -| std | 0.00608 | -| value_loss | 1.66e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23952 | -| time_elapsed | 130238 | -| total_timesteps | 3065856 | -| train/ | | -| approx_kl | 0.013476843 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.019 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 239510 | -| policy_gradient_loss | 0.00861 | -| std | 0.00608 | -| value_loss | 1.19e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 23953 | -| time_elapsed | 130243 | -| total_timesteps | 3065984 | -| train/ | | -| approx_kl | 0.0032173134 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | -0.000826 | -| n_updates | 239520 | -| policy_gradient_loss | 0.0101 | -| std | 0.00608 | -| value_loss | 8.03e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23954 | -| time_elapsed | 130247 | -| total_timesteps | 3066112 | -| train/ | | -| approx_kl | 0.0027618455 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.00565 | -| n_updates | 239530 | -| policy_gradient_loss | 0.00915 | -| std | 0.00608 | -| value_loss | 7.26e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23955 | -| time_elapsed | 130258 | -| total_timesteps | 3066240 | -| train/ | | -| approx_kl | 0.2624178 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.657 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 239540 | -| policy_gradient_loss | -0.019 | -| std | 0.00608 | -| value_loss | 0.0011 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23956 | -| time_elapsed | 130263 | -| total_timesteps | 3066368 | -| train/ | | -| approx_kl | 0.040673643 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00888 | -| learning_rate | 0.0003 | -| loss | 0.00559 | -| n_updates | 239550 | -| policy_gradient_loss | 0.0248 | -| std | 0.00608 | -| value_loss | 2.5e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23957 | -| time_elapsed | 130268 | -| total_timesteps | 3066496 | -| train/ | | -| approx_kl | 0.1493256 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0167 | -| learning_rate | 0.0003 | -| loss | 0.0852 | -| n_updates | 239560 | -| policy_gradient_loss | 0.038 | -| std | 0.00608 | -| value_loss | 7.21e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23958 | -| time_elapsed | 130272 | -| total_timesteps | 3066624 | -| train/ | | -| approx_kl | 0.12050192 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0744 | -| learning_rate | 0.0003 | -| loss | 0.0713 | -| n_updates | 239570 | -| policy_gradient_loss | 0.0215 | -| std | 0.00608 | -| value_loss | 9e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23959 | -| time_elapsed | 130277 | -| total_timesteps | 3066752 | -| train/ | | -| approx_kl | 0.0099970875 | -| clip_fraction | 0.082 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00442 | -| learning_rate | 0.0003 | -| loss | -0.000936 | -| n_updates | 239580 | -| policy_gradient_loss | -0.000253 | -| std | 0.00608 | -| value_loss | 4.08e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 23960 | -| time_elapsed | 130280 | -| total_timesteps | 3066880 | -| train/ | | -| approx_kl | 0.035913445 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.00927 | -| n_updates | 239590 | -| policy_gradient_loss | 0.0351 | -| std | 0.00608 | -| value_loss | 3.1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23961 | -| time_elapsed | 130285 | -| total_timesteps | 3067008 | -| train/ | | -| approx_kl | 0.46592763 | -| clip_fraction | 0.744 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 239600 | -| policy_gradient_loss | 0.169 | -| std | 0.00608 | -| value_loss | 2.61e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23962 | -| time_elapsed | 130298 | -| total_timesteps | 3067136 | -| train/ | | -| approx_kl | 0.08495794 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.815 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 239610 | -| policy_gradient_loss | -0.00472 | -| std | 0.00608 | -| value_loss | 0.00455 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23963 | -| time_elapsed | 130303 | -| total_timesteps | 3067264 | -| train/ | | -| approx_kl | 0.041383244 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.449 | -| learning_rate | 0.0003 | -| loss | 0.00523 | -| n_updates | 239620 | -| policy_gradient_loss | -0.00169 | -| std | 0.00608 | -| value_loss | 4.09e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23964 | -| time_elapsed | 130309 | -| total_timesteps | 3067392 | -| train/ | | -| approx_kl | 0.021256257 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00177 | -| learning_rate | 0.0003 | -| loss | 0.00839 | -| n_updates | 239630 | -| policy_gradient_loss | 0.00321 | -| std | 0.00608 | -| value_loss | 2.26e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23965 | -| time_elapsed | 130316 | -| total_timesteps | 3067520 | -| train/ | | -| approx_kl | 0.026637254 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | -0.00744 | -| n_updates | 239640 | -| policy_gradient_loss | 0.0216 | -| std | 0.00607 | -| value_loss | 9.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23966 | -| time_elapsed | 130320 | -| total_timesteps | 3067648 | -| train/ | | -| approx_kl | 0.15847996 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.082 | -| n_updates | 239650 | -| policy_gradient_loss | 0.042 | -| std | 0.00607 | -| value_loss | 1.02e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23967 | -| time_elapsed | 130325 | -| total_timesteps | 3067776 | -| train/ | | -| approx_kl | 0.0001811427 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.000896 | -| n_updates | 239660 | -| policy_gradient_loss | 0.0226 | -| std | 0.00607 | -| value_loss | 8.73e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23968 | -| time_elapsed | 130329 | -| total_timesteps | 3067904 | -| train/ | | -| approx_kl | 0.00065329066 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.000456 | -| n_updates | 239670 | -| policy_gradient_loss | 0.0333 | -| std | 0.00607 | -| value_loss | 4.4e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23969 | -| time_elapsed | 130334 | -| total_timesteps | 3068032 | -| train/ | | -| approx_kl | 0.5576421 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 239680 | -| policy_gradient_loss | 0.0578 | -| std | 0.00607 | -| value_loss | 4.56e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23970 | -| time_elapsed | 130344 | -| total_timesteps | 3068160 | -| train/ | | -| approx_kl | 0.033817537 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.168 | -| learning_rate | 0.0003 | -| loss | -0.0319 | -| n_updates | 239690 | -| policy_gradient_loss | -0.0189 | -| std | 0.00607 | -| value_loss | 0.0019 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23971 | -| time_elapsed | 130347 | -| total_timesteps | 3068288 | -| train/ | | -| approx_kl | 0.023078334 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -2.13 | -| learning_rate | 0.0003 | -| loss | -0.00932 | -| n_updates | 239700 | -| policy_gradient_loss | 0.0219 | -| std | 0.00607 | -| value_loss | 4.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23972 | -| time_elapsed | 130352 | -| total_timesteps | 3068416 | -| train/ | | -| approx_kl | 0.70220065 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 239710 | -| policy_gradient_loss | 0.0598 | -| std | 0.00607 | -| value_loss | 3.75e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23973 | -| time_elapsed | 130357 | -| total_timesteps | 3068544 | -| train/ | | -| approx_kl | 0.0511291 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 239720 | -| policy_gradient_loss | 0.0109 | -| std | 0.00607 | -| value_loss | 1.3e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23974 | -| time_elapsed | 130361 | -| total_timesteps | 3068672 | -| train/ | | -| approx_kl | 0.057699144 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00875 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 239730 | -| policy_gradient_loss | 0.0121 | -| std | 0.00607 | -| value_loss | 6.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23975 | -| time_elapsed | 130366 | -| total_timesteps | 3068800 | -| train/ | | -| approx_kl | 0.06864365 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 239740 | -| policy_gradient_loss | 0.0101 | -| std | 0.00607 | -| value_loss | 4.78e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 23976 | -| time_elapsed | 130372 | -| total_timesteps | 3068928 | -| train/ | | -| approx_kl | 0.051557627 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.0226 | -| n_updates | 239750 | -| policy_gradient_loss | 0.0108 | -| std | 0.00607 | -| value_loss | 3.49e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23977 | -| time_elapsed | 130379 | -| total_timesteps | 3069056 | -| train/ | | -| approx_kl | 0.059135046 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 239760 | -| policy_gradient_loss | -0.00149 | -| std | 0.00607 | -| value_loss | 2.8e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23978 | -| time_elapsed | 130389 | -| total_timesteps | 3069184 | -| train/ | | -| approx_kl | 0.009053435 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 239770 | -| policy_gradient_loss | 0.00825 | -| std | 0.00607 | -| value_loss | 0.00013 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23979 | -| time_elapsed | 130395 | -| total_timesteps | 3069312 | -| train/ | | -| approx_kl | 0.0010352684 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -2.52 | -| learning_rate | 0.0003 | -| loss | -0.00216 | -| n_updates | 239780 | -| policy_gradient_loss | 0.0184 | -| std | 0.00607 | -| value_loss | 1.94e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23980 | -| time_elapsed | 130399 | -| total_timesteps | 3069440 | -| train/ | | -| approx_kl | 0.0012486991 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | 0.00154 | -| n_updates | 239790 | -| policy_gradient_loss | 0.0441 | -| std | 0.00607 | -| value_loss | 2e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23981 | -| time_elapsed | 130403 | -| total_timesteps | 3069568 | -| train/ | | -| approx_kl | 0.003753278 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.000562 | -| n_updates | 239800 | -| policy_gradient_loss | 0.0401 | -| std | 0.00606 | -| value_loss | 4.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23982 | -| time_elapsed | 130407 | -| total_timesteps | 3069696 | -| train/ | | -| approx_kl | 0.59146595 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.617 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 239810 | -| policy_gradient_loss | 0.053 | -| std | 0.00606 | -| value_loss | 1.33e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23983 | -| time_elapsed | 130413 | -| total_timesteps | 3069824 | -| train/ | | -| approx_kl | 0.055127863 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 239820 | -| policy_gradient_loss | 0.016 | -| std | 0.00605 | -| value_loss | 2.04e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23984 | -| time_elapsed | 130418 | -| total_timesteps | 3069952 | -| train/ | | -| approx_kl | 0.044635873 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0919 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 239830 | -| policy_gradient_loss | 0.012 | -| std | 0.00605 | -| value_loss | 2.35e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23985 | -| time_elapsed | 130422 | -| total_timesteps | 3070080 | -| train/ | | -| approx_kl | 0.07514 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 239840 | -| policy_gradient_loss | 0.0121 | -| std | 0.00605 | -| value_loss | 1.21e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23986 | -| time_elapsed | 130431 | -| total_timesteps | 3070208 | -| train/ | | -| approx_kl | 0.13349338 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | 0.00821 | -| n_updates | 239850 | -| policy_gradient_loss | -0.00383 | -| std | 0.00604 | -| value_loss | 0.0027 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23987 | -| time_elapsed | 130435 | -| total_timesteps | 3070336 | -| train/ | | -| approx_kl | 0.016584795 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.216 | -| learning_rate | 0.0003 | -| loss | -0.0049 | -| n_updates | 239860 | -| policy_gradient_loss | 0.0365 | -| std | 0.00604 | -| value_loss | 9.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23988 | -| time_elapsed | 130440 | -| total_timesteps | 3070464 | -| train/ | | -| approx_kl | 0.93931735 | -| clip_fraction | 0.754 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00668 | -| learning_rate | 0.0003 | -| loss | 0.332 | -| n_updates | 239870 | -| policy_gradient_loss | 0.184 | -| std | 0.00604 | -| value_loss | 2.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23989 | -| time_elapsed | 130443 | -| total_timesteps | 3070592 | -| train/ | | -| approx_kl | 0.033241764 | -| clip_fraction | 0.178 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00449 | -| learning_rate | 0.0003 | -| loss | -0.00579 | -| n_updates | 239880 | -| policy_gradient_loss | -0.00856 | -| std | 0.00604 | -| value_loss | 1.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23990 | -| time_elapsed | 130448 | -| total_timesteps | 3070720 | -| train/ | | -| approx_kl | 0.023184147 | -| clip_fraction | 0.506 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 239890 | -| policy_gradient_loss | 0.0292 | -| std | 0.00604 | -| value_loss | 1.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23991 | -| time_elapsed | 130452 | -| total_timesteps | 3070848 | -| train/ | | -| approx_kl | 0.13643631 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.0735 | -| n_updates | 239900 | -| policy_gradient_loss | 0.0359 | -| std | 0.00605 | -| value_loss | 9.74e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 23992 | -| time_elapsed | 130456 | -| total_timesteps | 3070976 | -| train/ | | -| approx_kl | 8.870941e-05 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.000221 | -| n_updates | 239910 | -| policy_gradient_loss | 0.0294 | -| std | 0.00605 | -| value_loss | 5.85e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23993 | -| time_elapsed | 130460 | -| total_timesteps | 3071104 | -| train/ | | -| approx_kl | 0.24214554 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0874 | -| n_updates | 239920 | -| policy_gradient_loss | 0.0266 | -| std | 0.00605 | -| value_loss | 5.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23994 | -| time_elapsed | 130472 | -| total_timesteps | 3071232 | -| train/ | | -| approx_kl | 0.19131793 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 239930 | -| policy_gradient_loss | -0.0159 | -| std | 0.00605 | -| value_loss | 0.000846 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23995 | -| time_elapsed | 130476 | -| total_timesteps | 3071360 | -| train/ | | -| approx_kl | 0.087696016 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -3.52 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 239940 | -| policy_gradient_loss | 0.0129 | -| std | 0.00605 | -| value_loss | 1.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23996 | -| time_elapsed | 130479 | -| total_timesteps | 3071488 | -| train/ | | -| approx_kl | 0.0033436916 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -11.4 | -| learning_rate | 0.0003 | -| loss | -0.00343 | -| n_updates | 239950 | -| policy_gradient_loss | 0.0146 | -| std | 0.00605 | -| value_loss | 5.9e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23997 | -| time_elapsed | 130482 | -| total_timesteps | 3071616 | -| train/ | | -| approx_kl | 0.090963766 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00717 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 239960 | -| policy_gradient_loss | 0.0301 | -| std | 0.00605 | -| value_loss | 5.04e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23998 | -| time_elapsed | 130485 | -| total_timesteps | 3071744 | -| train/ | | -| approx_kl | 0.20230532 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 239970 | -| policy_gradient_loss | 0.0123 | -| std | 0.00605 | -| value_loss | 4.32e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 23999 | -| time_elapsed | 130489 | -| total_timesteps | 3071872 | -| train/ | | -| approx_kl | 0.012275413 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 239980 | -| policy_gradient_loss | 0.0178 | -| std | 0.00605 | -| value_loss | 3.57e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24000 | -| time_elapsed | 130494 | -| total_timesteps | 3072000 | -| train/ | | -| approx_kl | 0.07716896 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 239990 | -| policy_gradient_loss | 0.031 | -| std | 0.00605 | -| value_loss | 2.15e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24001 | -| time_elapsed | 130500 | -| total_timesteps | 3072128 | -| train/ | | -| approx_kl | 0.8361077 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00472 | -| learning_rate | 0.0003 | -| loss | 0.28 | -| n_updates | 240000 | -| policy_gradient_loss | 0.0787 | -| std | 0.00605 | -| value_loss | 1.31e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24002 | -| time_elapsed | 130515 | -| total_timesteps | 3072256 | -| train/ | | -| approx_kl | 0.0038354155 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.00581 | -| n_updates | 240010 | -| policy_gradient_loss | 0.00209 | -| std | 0.00605 | -| value_loss | 0.00253 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24003 | -| time_elapsed | 130521 | -| total_timesteps | 3072384 | -| train/ | | -| approx_kl | 0.3896045 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.357 | -| learning_rate | 0.0003 | -| loss | 0.247 | -| n_updates | 240020 | -| policy_gradient_loss | 0.212 | -| std | 0.00604 | -| value_loss | 5.66e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24004 | -| time_elapsed | 130526 | -| total_timesteps | 3072512 | -| train/ | | -| approx_kl | 0.21817409 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00101 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 240030 | -| policy_gradient_loss | 0.171 | -| std | 0.00605 | -| value_loss | 1.25e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24005 | -| time_elapsed | 130530 | -| total_timesteps | 3072640 | -| train/ | | -| approx_kl | 0.04001437 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.377 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 240040 | -| policy_gradient_loss | 0.0338 | -| std | 0.00605 | -| value_loss | 2.6e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24006 | -| time_elapsed | 130535 | -| total_timesteps | 3072768 | -| train/ | | -| approx_kl | 0.6616281 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.215 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 240050 | -| policy_gradient_loss | 0.0568 | -| std | 0.00605 | -| value_loss | 7.22e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24007 | -| time_elapsed | 130541 | -| total_timesteps | 3072896 | -| train/ | | -| approx_kl | 0.012070296 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0643 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 240060 | -| policy_gradient_loss | 0.00752 | -| std | 0.00605 | -| value_loss | 7.12e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24008 | -| time_elapsed | 130546 | -| total_timesteps | 3073024 | -| train/ | | -| approx_kl | 0.0031716349 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.000373 | -| n_updates | 240070 | -| policy_gradient_loss | 0.0165 | -| std | 0.00605 | -| value_loss | 3.42e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24009 | -| time_elapsed | 130555 | -| total_timesteps | 3073152 | -| train/ | | -| approx_kl | 0.033021566 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -5.88 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 240080 | -| policy_gradient_loss | -0.0125 | -| std | 0.00606 | -| value_loss | 0.00439 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24010 | -| time_elapsed | 130559 | -| total_timesteps | 3073280 | -| train/ | | -| approx_kl | 0.72954255 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.34 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 240090 | -| policy_gradient_loss | 0.0438 | -| std | 0.00606 | -| value_loss | 4.06e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24011 | -| time_elapsed | 130564 | -| total_timesteps | 3073408 | -| train/ | | -| approx_kl | 0.024026798 | -| clip_fraction | 0.563 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.000759 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 240100 | -| policy_gradient_loss | 0.123 | -| std | 0.00607 | -| value_loss | 3.34e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24012 | -| time_elapsed | 130568 | -| total_timesteps | 3073536 | -| train/ | | -| approx_kl | 0.3420465 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 240110 | -| policy_gradient_loss | 0.0471 | -| std | 0.00607 | -| value_loss | 2.99e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24013 | -| time_elapsed | 130573 | -| total_timesteps | 3073664 | -| train/ | | -| approx_kl | 0.07846995 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 240120 | -| policy_gradient_loss | 0.0728 | -| std | 0.00607 | -| value_loss | 2.41e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24014 | -| time_elapsed | 130578 | -| total_timesteps | 3073792 | -| train/ | | -| approx_kl | 0.26464826 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 240130 | -| policy_gradient_loss | 0.0486 | -| std | 0.00607 | -| value_loss | 1.96e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24015 | -| time_elapsed | 130583 | -| total_timesteps | 3073920 | -| train/ | | -| approx_kl | 0.0013240459 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | -0.00191 | -| n_updates | 240140 | -| policy_gradient_loss | 0.0143 | -| std | 0.00607 | -| value_loss | 1.34e-07 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24016 | -| time_elapsed | 130587 | -| total_timesteps | 3074048 | -| train/ | | -| approx_kl | 0.000108784996 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | -0.000538 | -| n_updates | 240150 | -| policy_gradient_loss | 0.0132 | -| std | 0.00607 | -| value_loss | 8.16e-08 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24017 | -| time_elapsed | 130597 | -| total_timesteps | 3074176 | -| train/ | | -| approx_kl | 0.31722096 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | 0.0789 | -| n_updates | 240160 | -| policy_gradient_loss | 0.0239 | -| std | 0.00607 | -| value_loss | 0.000125 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24018 | -| time_elapsed | 130602 | -| total_timesteps | 3074304 | -| train/ | | -| approx_kl | 0.014220164 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.67 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 240170 | -| policy_gradient_loss | 0.0198 | -| std | 0.00607 | -| value_loss | 2.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24019 | -| time_elapsed | 130608 | -| total_timesteps | 3074432 | -| train/ | | -| approx_kl | 0.034802906 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00875 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 240180 | -| policy_gradient_loss | 0.00905 | -| std | 0.00607 | -| value_loss | 4.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24020 | -| time_elapsed | 130612 | -| total_timesteps | 3074560 | -| train/ | | -| approx_kl | 0.033147603 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00972 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 240190 | -| policy_gradient_loss | 0.0476 | -| std | 0.00607 | -| value_loss | 1.62e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24021 | -| time_elapsed | 130618 | -| total_timesteps | 3074688 | -| train/ | | -| approx_kl | 0.12100685 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.00972 | -| n_updates | 240200 | -| policy_gradient_loss | 0.0138 | -| std | 0.00607 | -| value_loss | 1.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24022 | -| time_elapsed | 130623 | -| total_timesteps | 3074816 | -| train/ | | -| approx_kl | 0.17145966 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 240210 | -| policy_gradient_loss | 0.0295 | -| std | 0.00607 | -| value_loss | 1.39e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24023 | -| time_elapsed | 130628 | -| total_timesteps | 3074944 | -| train/ | | -| approx_kl | 0.013658805 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.00429 | -| n_updates | 240220 | -| policy_gradient_loss | 0.00237 | -| std | 0.00607 | -| value_loss | 6.91e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24024 | -| time_elapsed | 130632 | -| total_timesteps | 3075072 | -| train/ | | -| approx_kl | 0.035981562 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.076 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 240230 | -| policy_gradient_loss | 0.0442 | -| std | 0.00607 | -| value_loss | 5.36e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24025 | -| time_elapsed | 130643 | -| total_timesteps | 3075200 | -| train/ | | -| approx_kl | 0.1966716 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.807 | -| learning_rate | 0.0003 | -| loss | 0.0532 | -| n_updates | 240240 | -| policy_gradient_loss | 0.00777 | -| std | 0.00607 | -| value_loss | 0.00331 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24026 | -| time_elapsed | 130648 | -| total_timesteps | 3075328 | -| train/ | | -| approx_kl | 0.012367822 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | 0.0148 | -| n_updates | 240250 | -| policy_gradient_loss | 0.0179 | -| std | 0.00607 | -| value_loss | 1.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24027 | -| time_elapsed | 130652 | -| total_timesteps | 3075456 | -| train/ | | -| approx_kl | 0.020659473 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0115 | -| learning_rate | 0.0003 | -| loss | 0.00806 | -| n_updates | 240260 | -| policy_gradient_loss | 0.00265 | -| std | 0.00607 | -| value_loss | 2.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24028 | -| time_elapsed | 130657 | -| total_timesteps | 3075584 | -| train/ | | -| approx_kl | 0.016675921 | -| clip_fraction | 0.144 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 240270 | -| policy_gradient_loss | 0.000401 | -| std | 0.00607 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24029 | -| time_elapsed | 130661 | -| total_timesteps | 3075712 | -| train/ | | -| approx_kl | 0.013986213 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0516 | -| learning_rate | 0.0003 | -| loss | 0.00603 | -| n_updates | 240280 | -| policy_gradient_loss | 0.00375 | -| std | 0.00605 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24030 | -| time_elapsed | 130666 | -| total_timesteps | 3075840 | -| train/ | | -| approx_kl | 0.035728153 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | -0.0167 | -| n_updates | 240290 | -| policy_gradient_loss | 0.0146 | -| std | 0.00604 | -| value_loss | 4.09e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24031 | -| time_elapsed | 130670 | -| total_timesteps | 3075968 | -| train/ | | -| approx_kl | 0.4318438 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0138 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 240300 | -| policy_gradient_loss | 0.197 | -| std | 0.00604 | -| value_loss | 1.04e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24032 | -| time_elapsed | 130676 | -| total_timesteps | 3076096 | -| train/ | | -| approx_kl | 0.10543843 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 240310 | -| policy_gradient_loss | 0.038 | -| std | 0.00603 | -| value_loss | 1.08e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24033 | -| time_elapsed | 130684 | -| total_timesteps | 3076224 | -| train/ | | -| approx_kl | 0.06253839 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 240320 | -| policy_gradient_loss | 0.0089 | -| std | 0.00603 | -| value_loss | 0.00572 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24034 | -| time_elapsed | 130688 | -| total_timesteps | 3076352 | -| train/ | | -| approx_kl | 0.69441694 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00532 | -| learning_rate | 0.0003 | -| loss | 0.246 | -| n_updates | 240330 | -| policy_gradient_loss | 0.0869 | -| std | 0.00603 | -| value_loss | 9.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24035 | -| time_elapsed | 130693 | -| total_timesteps | 3076480 | -| train/ | | -| approx_kl | 0.008450289 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00975 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 240340 | -| policy_gradient_loss | 0.00841 | -| std | 0.00603 | -| value_loss | 2.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24036 | -| time_elapsed | 130696 | -| total_timesteps | 3076608 | -| train/ | | -| approx_kl | 0.004963714 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | -0.00088 | -| n_updates | 240350 | -| policy_gradient_loss | 0.0112 | -| std | 0.00602 | -| value_loss | 4.13e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24037 | -| time_elapsed | 130700 | -| total_timesteps | 3076736 | -| train/ | | -| approx_kl | 0.0010220609 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.446 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 240360 | -| policy_gradient_loss | 0.0199 | -| std | 0.00601 | -| value_loss | 4.42e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24038 | -| time_elapsed | 130704 | -| total_timesteps | 3076864 | -| train/ | | -| approx_kl | 0.17272869 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0143 | -| learning_rate | 0.0003 | -| loss | 0.0944 | -| n_updates | 240370 | -| policy_gradient_loss | 0.0541 | -| std | 0.00598 | -| value_loss | 1.56e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24039 | -| time_elapsed | 130708 | -| total_timesteps | 3076992 | -| train/ | | -| approx_kl | 0.0068330485 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 240380 | -| policy_gradient_loss | 0.0218 | -| std | 0.00597 | -| value_loss | 3.42e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24040 | -| time_elapsed | 130713 | -| total_timesteps | 3077120 | -| train/ | | -| approx_kl | 0.15090865 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00367 | -| learning_rate | 0.0003 | -| loss | 0.0517 | -| n_updates | 240390 | -| policy_gradient_loss | 0.0506 | -| std | 0.00597 | -| value_loss | 1.13e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24041 | -| time_elapsed | 130725 | -| total_timesteps | 3077248 | -| train/ | | -| approx_kl | 0.02589455 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 240400 | -| policy_gradient_loss | 0.0467 | -| std | 0.00597 | -| value_loss | 0.00202 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24042 | -| time_elapsed | 130730 | -| total_timesteps | 3077376 | -| train/ | | -| approx_kl | 0.0731976 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0599 | -| n_updates | 240410 | -| policy_gradient_loss | 0.0372 | -| std | 0.00596 | -| value_loss | 2.29e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24043 | -| time_elapsed | 130734 | -| total_timesteps | 3077504 | -| train/ | | -| approx_kl | 0.11942214 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0111 | -| learning_rate | 0.0003 | -| loss | 0.063 | -| n_updates | 240420 | -| policy_gradient_loss | 0.0184 | -| std | 0.00596 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24044 | -| time_elapsed | 130739 | -| total_timesteps | 3077632 | -| train/ | | -| approx_kl | 0.05340528 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 240430 | -| policy_gradient_loss | 0.0313 | -| std | 0.00596 | -| value_loss | 1.12e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24045 | -| time_elapsed | 130743 | -| total_timesteps | 3077760 | -| train/ | | -| approx_kl | 0.3656019 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 240440 | -| policy_gradient_loss | 0.164 | -| std | 0.00596 | -| value_loss | 9.04e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 24046 | -| time_elapsed | 130748 | -| total_timesteps | 3077888 | -| train/ | | -| approx_kl | 0.25101942 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0212 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 240450 | -| policy_gradient_loss | 0.157 | -| std | 0.00596 | -| value_loss | 7.68e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24047 | -| time_elapsed | 130753 | -| total_timesteps | 3078016 | -| train/ | | -| approx_kl | 0.2392326 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0204 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 240460 | -| policy_gradient_loss | 0.245 | -| std | 0.00596 | -| value_loss | 7.29e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24048 | -| time_elapsed | 130765 | -| total_timesteps | 3078144 | -| train/ | | -| approx_kl | 0.21939825 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | 0.0706 | -| n_updates | 240470 | -| policy_gradient_loss | 0.1 | -| std | 0.00596 | -| value_loss | 0.000791 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24049 | -| time_elapsed | 130770 | -| total_timesteps | 3078272 | -| train/ | | -| approx_kl | 0.22399685 | -| clip_fraction | 0.728 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.168 | -| learning_rate | 0.0003 | -| loss | 0.0856 | -| n_updates | 240480 | -| policy_gradient_loss | 0.116 | -| std | 0.00596 | -| value_loss | 1.63e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24050 | -| time_elapsed | 130776 | -| total_timesteps | 3078400 | -| train/ | | -| approx_kl | 0.056523718 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 240490 | -| policy_gradient_loss | 0.0313 | -| std | 0.00596 | -| value_loss | 1.34e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24051 | -| time_elapsed | 130780 | -| total_timesteps | 3078528 | -| train/ | | -| approx_kl | 0.7033722 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0982 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 240500 | -| policy_gradient_loss | 0.0733 | -| std | 0.00595 | -| value_loss | 1.07e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24052 | -| time_elapsed | 130785 | -| total_timesteps | 3078656 | -| train/ | | -| approx_kl | 0.053418294 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 240510 | -| policy_gradient_loss | 0.00749 | -| std | 0.00595 | -| value_loss | 1.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24053 | -| time_elapsed | 130790 | -| total_timesteps | 3078784 | -| train/ | | -| approx_kl | 0.080448896 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 240520 | -| policy_gradient_loss | 0.0176 | -| std | 0.00595 | -| value_loss | 8.87e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24054 | -| time_elapsed | 130795 | -| total_timesteps | 3078912 | -| train/ | | -| approx_kl | 0.012678944 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.00439 | -| n_updates | 240530 | -| policy_gradient_loss | 0.0132 | -| std | 0.00595 | -| value_loss | 2.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24055 | -| time_elapsed | 130800 | -| total_timesteps | 3079040 | -| train/ | | -| approx_kl | 0.003332585 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.682 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 240540 | -| policy_gradient_loss | 0.0135 | -| std | 0.00594 | -| value_loss | 1.31e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24056 | -| time_elapsed | 130807 | -| total_timesteps | 3079168 | -| train/ | | -| approx_kl | 0.05632638 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.679 | -| learning_rate | 0.0003 | -| loss | 0.05 | -| n_updates | 240550 | -| policy_gradient_loss | 0.14 | -| std | 0.00594 | -| value_loss | 0.00612 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24057 | -| time_elapsed | 130812 | -| total_timesteps | 3079296 | -| train/ | | -| approx_kl | 0.12173928 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.883 | -| learning_rate | 0.0003 | -| loss | 0.092 | -| n_updates | 240560 | -| policy_gradient_loss | 0.123 | -| std | 0.00594 | -| value_loss | 1.57e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24058 | -| time_elapsed | 130817 | -| total_timesteps | 3079424 | -| train/ | | -| approx_kl | 0.14260127 | -| clip_fraction | 0.701 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00252 | -| learning_rate | 0.0003 | -| loss | 0.0876 | -| n_updates | 240570 | -| policy_gradient_loss | 0.127 | -| std | 0.00594 | -| value_loss | 3.9e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24059 | -| time_elapsed | 130821 | -| total_timesteps | 3079552 | -| train/ | | -| approx_kl | 0.035374314 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.000227 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 240580 | -| policy_gradient_loss | 0.0393 | -| std | 0.00594 | -| value_loss | 2.18e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24060 | -| time_elapsed | 130826 | -| total_timesteps | 3079680 | -| train/ | | -| approx_kl | 0.0002705278 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.000367 | -| n_updates | 240590 | -| policy_gradient_loss | 0.0377 | -| std | 0.00595 | -| value_loss | 1.33e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24061 | -| time_elapsed | 130831 | -| total_timesteps | 3079808 | -| train/ | | -| approx_kl | 0.0017461311 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 240600 | -| policy_gradient_loss | 0.0468 | -| std | 0.00595 | -| value_loss | 9.58e-07 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24062 | -| time_elapsed | 130836 | -| total_timesteps | 3079936 | -| train/ | | -| approx_kl | 0.53329 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.236 | -| n_updates | 240610 | -| policy_gradient_loss | 0.0847 | -| std | 0.00595 | -| value_loss | 6.33e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24063 | -| time_elapsed | 130841 | -| total_timesteps | 3080064 | -| train/ | | -| approx_kl | 0.009367993 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | -0.0031 | -| n_updates | 240620 | -| policy_gradient_loss | 0.0119 | -| std | 0.00595 | -| value_loss | 5.61e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24064 | -| time_elapsed | 130849 | -| total_timesteps | 3080192 | -| train/ | | -| approx_kl | 0.044698775 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.934 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 240630 | -| policy_gradient_loss | -0.00966 | -| std | 0.00595 | -| value_loss | 0.00036 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24065 | -| time_elapsed | 130853 | -| total_timesteps | 3080320 | -| train/ | | -| approx_kl | 0.08643932 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.13 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 240640 | -| policy_gradient_loss | 0.0169 | -| std | 0.00595 | -| value_loss | 1.61e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24066 | -| time_elapsed | 130857 | -| total_timesteps | 3080448 | -| train/ | | -| approx_kl | 0.05172614 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 240650 | -| policy_gradient_loss | 0.0147 | -| std | 0.00595 | -| value_loss | 8.17e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24067 | -| time_elapsed | 130860 | -| total_timesteps | 3080576 | -| train/ | | -| approx_kl | 0.0070995297 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | -0.000727 | -| n_updates | 240660 | -| policy_gradient_loss | 0.00969 | -| std | 0.00596 | -| value_loss | 2.12e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24068 | -| time_elapsed | 130865 | -| total_timesteps | 3080704 | -| train/ | | -| approx_kl | 0.0023733922 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00737 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 240670 | -| policy_gradient_loss | 0.00951 | -| std | 0.00596 | -| value_loss | 7.28e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24069 | -| time_elapsed | 130870 | -| total_timesteps | 3080832 | -| train/ | | -| approx_kl | 0.13205226 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 240680 | -| policy_gradient_loss | 0.00972 | -| std | 0.00596 | -| value_loss | 5.94e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24070 | -| time_elapsed | 130876 | -| total_timesteps | 3080960 | -| train/ | | -| approx_kl | 0.052619472 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 240690 | -| policy_gradient_loss | 0.0143 | -| std | 0.00596 | -| value_loss | 4.76e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24071 | -| time_elapsed | 130880 | -| total_timesteps | 3081088 | -| train/ | | -| approx_kl | 1.0536476 | -| clip_fraction | 0.763 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.311 | -| n_updates | 240700 | -| policy_gradient_loss | 0.235 | -| std | 0.00596 | -| value_loss | 4.29e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24072 | -| time_elapsed | 130891 | -| total_timesteps | 3081216 | -| train/ | | -| approx_kl | 0.77941525 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 240710 | -| policy_gradient_loss | 0.0782 | -| std | 0.00597 | -| value_loss | 0.000619 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24073 | -| time_elapsed | 130896 | -| total_timesteps | 3081344 | -| train/ | | -| approx_kl | 0.05754575 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.642 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 240720 | -| policy_gradient_loss | 0.0735 | -| std | 0.00597 | -| value_loss | 0.000119 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24074 | -| time_elapsed | 130901 | -| total_timesteps | 3081472 | -| train/ | | -| approx_kl | 0.0004283879 | -| clip_fraction | 0.558 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00103 | -| learning_rate | 0.0003 | -| loss | 0.00128 | -| n_updates | 240730 | -| policy_gradient_loss | 0.114 | -| std | 0.00597 | -| value_loss | 3.41e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24075 | -| time_elapsed | 130906 | -| total_timesteps | 3081600 | -| train/ | | -| approx_kl | 0.02958698 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00199 | -| learning_rate | 0.0003 | -| loss | 0.0531 | -| n_updates | 240740 | -| policy_gradient_loss | 0.0657 | -| std | 0.00597 | -| value_loss | 1.8e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24076 | -| time_elapsed | 130911 | -| total_timesteps | 3081728 | -| train/ | | -| approx_kl | 0.29359478 | -| clip_fraction | 0.742 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 240750 | -| policy_gradient_loss | 0.138 | -| std | 0.00597 | -| value_loss | 1.25e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24077 | -| time_elapsed | 130916 | -| total_timesteps | 3081856 | -| train/ | | -| approx_kl | 0.067984596 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 240760 | -| policy_gradient_loss | 0.032 | -| std | 0.00597 | -| value_loss | 1.07e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24078 | -| time_elapsed | 130922 | -| total_timesteps | 3081984 | -| train/ | | -| approx_kl | 0.1834833 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 240770 | -| policy_gradient_loss | 0.02 | -| std | 0.00597 | -| value_loss | 8.64e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24079 | -| time_elapsed | 130928 | -| total_timesteps | 3082112 | -| train/ | | -| approx_kl | 0.017725104 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.00749 | -| n_updates | 240780 | -| policy_gradient_loss | 0.00331 | -| std | 0.00597 | -| value_loss | 4.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24080 | -| time_elapsed | 130941 | -| total_timesteps | 3082240 | -| train/ | | -| approx_kl | 0.06424127 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.00299 | -| n_updates | 240790 | -| policy_gradient_loss | 0.00724 | -| std | 0.00596 | -| value_loss | 0.00567 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24081 | -| time_elapsed | 130946 | -| total_timesteps | 3082368 | -| train/ | | -| approx_kl | 0.28407115 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0127 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 240800 | -| policy_gradient_loss | 0.134 | -| std | 0.00596 | -| value_loss | 1.89e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24082 | -| time_elapsed | 130951 | -| total_timesteps | 3082496 | -| train/ | | -| approx_kl | 0.24080525 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0093 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 240810 | -| policy_gradient_loss | 0.149 | -| std | 0.00596 | -| value_loss | 8.7e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24083 | -| time_elapsed | 130955 | -| total_timesteps | 3082624 | -| train/ | | -| approx_kl | 0.22990881 | -| clip_fraction | 0.758 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 240820 | -| policy_gradient_loss | 0.177 | -| std | 0.00596 | -| value_loss | 6.06e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24084 | -| time_elapsed | 130960 | -| total_timesteps | 3082752 | -| train/ | | -| approx_kl | 0.1500943 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 240830 | -| policy_gradient_loss | 0.116 | -| std | 0.00596 | -| value_loss | 5.18e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.989 | -| time/ | | -| fps | 23 | -| iterations | 24085 | -| time_elapsed | 130965 | -| total_timesteps | 3082880 | -| train/ | | -| approx_kl | 0.14934543 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.0946 | -| n_updates | 240840 | -| policy_gradient_loss | 0.115 | -| std | 0.00596 | -| value_loss | 3.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24086 | -| time_elapsed | 130969 | -| total_timesteps | 3083008 | -| train/ | | -| approx_kl | 0.034072887 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 240850 | -| policy_gradient_loss | 0.0346 | -| std | 0.00597 | -| value_loss | 1.15e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24087 | -| time_elapsed | 130980 | -| total_timesteps | 3083136 | -| train/ | | -| approx_kl | 0.021935986 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.00715 | -| n_updates | 240860 | -| policy_gradient_loss | 0.0135 | -| std | 0.00597 | -| value_loss | 0.00389 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24088 | -| time_elapsed | 130985 | -| total_timesteps | 3083264 | -| train/ | | -| approx_kl | 0.43702203 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.238 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 240870 | -| policy_gradient_loss | 0.057 | -| std | 0.00597 | -| value_loss | 0.000194 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24089 | -| time_elapsed | 130989 | -| total_timesteps | 3083392 | -| train/ | | -| approx_kl | 0.071058154 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.0411 | -| n_updates | 240880 | -| policy_gradient_loss | 0.0184 | -| std | 0.00596 | -| value_loss | 7.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24090 | -| time_elapsed | 130994 | -| total_timesteps | 3083520 | -| train/ | | -| approx_kl | 0.058187596 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00515 | -| learning_rate | 0.0003 | -| loss | 0.0119 | -| n_updates | 240890 | -| policy_gradient_loss | 0.00642 | -| std | 0.00596 | -| value_loss | 3.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24091 | -| time_elapsed | 130998 | -| total_timesteps | 3083648 | -| train/ | | -| approx_kl | 0.052131556 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | -0.000712 | -| n_updates | 240900 | -| policy_gradient_loss | -0.000539 | -| std | 0.00596 | -| value_loss | 2.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24092 | -| time_elapsed | 131002 | -| total_timesteps | 3083776 | -| train/ | | -| approx_kl | 0.059909135 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 240910 | -| policy_gradient_loss | 0.0132 | -| std | 0.00596 | -| value_loss | 1.92e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24093 | -| time_elapsed | 131005 | -| total_timesteps | 3083904 | -| train/ | | -| approx_kl | 0.011293475 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | -0.00526 | -| n_updates | 240920 | -| policy_gradient_loss | 0.00818 | -| std | 0.00596 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24094 | -| time_elapsed | 131011 | -| total_timesteps | 3084032 | -| train/ | | -| approx_kl | 0.0012561707 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.00591 | -| n_updates | 240930 | -| policy_gradient_loss | 0.00866 | -| std | 0.00597 | -| value_loss | 1.14e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24095 | -| time_elapsed | 131022 | -| total_timesteps | 3084160 | -| train/ | | -| approx_kl | 0.02581703 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0215 | -| n_updates | 240940 | -| policy_gradient_loss | 0.00486 | -| std | 0.00597 | -| value_loss | 7.03e-05 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24096 | -| time_elapsed | 131027 | -| total_timesteps | 3084288 | -| train/ | | -| approx_kl | 0.91801 | -| clip_fraction | 0.775 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0179 | -| learning_rate | 0.0003 | -| loss | 0.372 | -| n_updates | 240950 | -| policy_gradient_loss | 0.217 | -| std | 0.00597 | -| value_loss | 2.73e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24097 | -| time_elapsed | 131031 | -| total_timesteps | 3084416 | -| train/ | | -| approx_kl | 0.030552357 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.00925 | -| n_updates | 240960 | -| policy_gradient_loss | 0.00159 | -| std | 0.00597 | -| value_loss | 1.51e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24098 | -| time_elapsed | 131036 | -| total_timesteps | 3084544 | -| train/ | | -| approx_kl | 0.019890204 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.00321 | -| n_updates | 240970 | -| policy_gradient_loss | 0.000158 | -| std | 0.00597 | -| value_loss | 6.7e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24099 | -| time_elapsed | 131041 | -| total_timesteps | 3084672 | -| train/ | | -| approx_kl | 0.018735413 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | -0.0073 | -| n_updates | 240980 | -| policy_gradient_loss | -0.00402 | -| std | 0.00597 | -| value_loss | 5.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24100 | -| time_elapsed | 131046 | -| total_timesteps | 3084800 | -| train/ | | -| approx_kl | 0.01715834 | -| clip_fraction | 0.142 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0316 | -| learning_rate | 0.0003 | -| loss | -0.0213 | -| n_updates | 240990 | -| policy_gradient_loss | -0.0108 | -| std | 0.00597 | -| value_loss | 3.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24101 | -| time_elapsed | 131051 | -| total_timesteps | 3084928 | -| train/ | | -| approx_kl | 0.012262721 | -| clip_fraction | 0.0977 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | -0.0095 | -| n_updates | 241000 | -| policy_gradient_loss | -0.00487 | -| std | 0.00596 | -| value_loss | 2.17e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24102 | -| time_elapsed | 131056 | -| total_timesteps | 3085056 | -| train/ | | -| approx_kl | 0.032013018 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 241010 | -| policy_gradient_loss | 0.013 | -| std | 0.00596 | -| value_loss | 1.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24103 | -| time_elapsed | 131067 | -| total_timesteps | 3085184 | -| train/ | | -| approx_kl | 0.015087553 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.0249 | -| n_updates | 241020 | -| policy_gradient_loss | -0.0063 | -| std | 0.00596 | -| value_loss | 0.000159 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24104 | -| time_elapsed | 131072 | -| total_timesteps | 3085312 | -| train/ | | -| approx_kl | 0.7025174 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00779 | -| learning_rate | 0.0003 | -| loss | 0.261 | -| n_updates | 241030 | -| policy_gradient_loss | 0.0887 | -| std | 0.00596 | -| value_loss | 8.45e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24105 | -| time_elapsed | 131078 | -| total_timesteps | 3085440 | -| train/ | | -| approx_kl | 0.007670365 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 241040 | -| policy_gradient_loss | 0.00814 | -| std | 0.00597 | -| value_loss | 8.89e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24106 | -| time_elapsed | 131084 | -| total_timesteps | 3085568 | -| train/ | | -| approx_kl | 0.002403513 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.000835 | -| n_updates | 241050 | -| policy_gradient_loss | 0.0116 | -| std | 0.00596 | -| value_loss | 3.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24107 | -| time_elapsed | 131089 | -| total_timesteps | 3085696 | -| train/ | | -| approx_kl | 0.049745243 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.0429 | -| n_updates | 241060 | -| policy_gradient_loss | 0.131 | -| std | 0.00596 | -| value_loss | 4.8e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24108 | -| time_elapsed | 131095 | -| total_timesteps | 3085824 | -| train/ | | -| approx_kl | 0.10448211 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0215 | -| learning_rate | 0.0003 | -| loss | 0.0917 | -| n_updates | 241070 | -| policy_gradient_loss | 0.121 | -| std | 0.00596 | -| value_loss | 3.41e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24109 | -| time_elapsed | 131100 | -| total_timesteps | 3085952 | -| train/ | | -| approx_kl | 0.026225857 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.00592 | -| n_updates | 241080 | -| policy_gradient_loss | 0.0251 | -| std | 0.00596 | -| value_loss | 1.99e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24110 | -| time_elapsed | 131105 | -| total_timesteps | 3086080 | -| train/ | | -| approx_kl | 0.5802617 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 241090 | -| policy_gradient_loss | 0.0683 | -| std | 0.00596 | -| value_loss | 1.55e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24111 | -| time_elapsed | 131114 | -| total_timesteps | 3086208 | -| train/ | | -| approx_kl | 0.019683177 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 241100 | -| policy_gradient_loss | -0.0024 | -| std | 0.00596 | -| value_loss | 0.00244 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24112 | -| time_elapsed | 131119 | -| total_timesteps | 3086336 | -| train/ | | -| approx_kl | 0.07770784 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.0417 | -| n_updates | 241110 | -| policy_gradient_loss | 0.0164 | -| std | 0.00596 | -| value_loss | 0.000149 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24113 | -| time_elapsed | 131124 | -| total_timesteps | 3086464 | -| train/ | | -| approx_kl | 0.0015091845 | -| clip_fraction | 0.585 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 241120 | -| policy_gradient_loss | 0.0999 | -| std | 0.00596 | -| value_loss | 5.82e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24114 | -| time_elapsed | 131128 | -| total_timesteps | 3086592 | -| train/ | | -| approx_kl | 0.08171859 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00972 | -| learning_rate | 0.0003 | -| loss | 0.0865 | -| n_updates | 241130 | -| policy_gradient_loss | 0.0501 | -| std | 0.00596 | -| value_loss | 2.88e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24115 | -| time_elapsed | 131133 | -| total_timesteps | 3086720 | -| train/ | | -| approx_kl | 0.10677096 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.036 | -| n_updates | 241140 | -| policy_gradient_loss | 0.061 | -| std | 0.00596 | -| value_loss | 2.19e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24116 | -| time_elapsed | 131138 | -| total_timesteps | 3086848 | -| train/ | | -| approx_kl | 0.0154604465 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 241150 | -| policy_gradient_loss | 0.217 | -| std | 0.00596 | -| value_loss | 1.65e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24117 | -| time_elapsed | 131143 | -| total_timesteps | 3086976 | -| train/ | | -| approx_kl | 0.047762416 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 241160 | -| policy_gradient_loss | 0.0123 | -| std | 0.00596 | -| value_loss | 0.000112 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24118 | -| time_elapsed | 131149 | -| total_timesteps | 3087104 | -| train/ | | -| approx_kl | 0.020867605 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.000342 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 241170 | -| policy_gradient_loss | 0.00844 | -| std | 0.00597 | -| value_loss | 0.000146 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24119 | -| time_elapsed | 131160 | -| total_timesteps | 3087232 | -| train/ | | -| approx_kl | 0.22699627 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.0572 | -| n_updates | 241180 | -| policy_gradient_loss | 0.0329 | -| std | 0.00597 | -| value_loss | 0.00014 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24120 | -| time_elapsed | 131165 | -| total_timesteps | 3087360 | -| train/ | | -| approx_kl | 0.048602253 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 241190 | -| policy_gradient_loss | 0.0842 | -| std | 0.00597 | -| value_loss | 3.44e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24121 | -| time_elapsed | 131170 | -| total_timesteps | 3087488 | -| train/ | | -| approx_kl | 0.003589557 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0065 | -| learning_rate | 0.0003 | -| loss | 0.006 | -| n_updates | 241200 | -| policy_gradient_loss | 0.105 | -| std | 0.00597 | -| value_loss | 1.41e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24122 | -| time_elapsed | 131175 | -| total_timesteps | 3087616 | -| train/ | | -| approx_kl | 11.371069 | -| clip_fraction | 0.872 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0599 | -| learning_rate | 0.0003 | -| loss | 0.278 | -| n_updates | 241210 | -| policy_gradient_loss | 0.235 | -| std | 0.00598 | -| value_loss | 7.25e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24123 | -| time_elapsed | 131180 | -| total_timesteps | 3087744 | -| train/ | | -| approx_kl | 0.05675973 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 241220 | -| policy_gradient_loss | 0.0967 | -| std | 0.00598 | -| value_loss | 9.92e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24124 | -| time_elapsed | 131186 | -| total_timesteps | 3087872 | -| train/ | | -| approx_kl | 0.2981112 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00197 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 241230 | -| policy_gradient_loss | 0.0425 | -| std | 0.00598 | -| value_loss | 6.23e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24125 | -| time_elapsed | 131192 | -| total_timesteps | 3088000 | -| train/ | | -| approx_kl | 0.006652309 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | -0.00404 | -| n_updates | 241240 | -| policy_gradient_loss | 0.0233 | -| std | 0.00598 | -| value_loss | 4.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24126 | -| time_elapsed | 131197 | -| total_timesteps | 3088128 | -| train/ | | -| approx_kl | 0.23461828 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00446 | -| learning_rate | 0.0003 | -| loss | 0.082 | -| n_updates | 241250 | -| policy_gradient_loss | 0.0451 | -| std | 0.00598 | -| value_loss | 1.69e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24127 | -| time_elapsed | 131210 | -| total_timesteps | 3088256 | -| train/ | | -| approx_kl | 0.021942383 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 241260 | -| policy_gradient_loss | 0.0498 | -| std | 0.00599 | -| value_loss | 0.000554 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24128 | -| time_elapsed | 131215 | -| total_timesteps | 3088384 | -| train/ | | -| approx_kl | 0.17530069 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00683 | -| learning_rate | 0.0003 | -| loss | 0.071 | -| n_updates | 241270 | -| policy_gradient_loss | 0.0488 | -| std | 0.00599 | -| value_loss | 2.56e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24129 | -| time_elapsed | 131218 | -| total_timesteps | 3088512 | -| train/ | | -| approx_kl | 5.8794394e-06 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.014 | -| learning_rate | 0.0003 | -| loss | 0.000495 | -| n_updates | 241280 | -| policy_gradient_loss | 0.03 | -| std | 0.00599 | -| value_loss | 9.31e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24130 | -| time_elapsed | 131223 | -| total_timesteps | 3088640 | -| train/ | | -| approx_kl | 0.055219643 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00669 | -| learning_rate | 0.0003 | -| loss | 0.00878 | -| n_updates | 241290 | -| policy_gradient_loss | 0.0308 | -| std | 0.00598 | -| value_loss | 2.99e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24131 | -| time_elapsed | 131228 | -| total_timesteps | 3088768 | -| train/ | | -| approx_kl | 0.0042394595 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.33 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 241300 | -| policy_gradient_loss | 0.00942 | -| std | 0.00598 | -| value_loss | 3.32e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24132 | -| time_elapsed | 131233 | -| total_timesteps | 3088896 | -| train/ | | -| approx_kl | 0.12094411 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 241310 | -| policy_gradient_loss | 0.0323 | -| std | 0.00598 | -| value_loss | 1.44e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24133 | -| time_elapsed | 131237 | -| total_timesteps | 3089024 | -| train/ | | -| approx_kl | 0.118636236 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.0747 | -| n_updates | 241320 | -| policy_gradient_loss | 0.0177 | -| std | 0.00598 | -| value_loss | 4.05e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24134 | -| time_elapsed | 131249 | -| total_timesteps | 3089152 | -| train/ | | -| approx_kl | 0.018630892 | -| clip_fraction | 0.185 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.907 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 241330 | -| policy_gradient_loss | -0.0153 | -| std | 0.00598 | -| value_loss | 0.00173 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24135 | -| time_elapsed | 131256 | -| total_timesteps | 3089280 | -| train/ | | -| approx_kl | 0.0012372937 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.769 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 241340 | -| policy_gradient_loss | 0.0357 | -| std | 0.00598 | -| value_loss | 7.8e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24136 | -| time_elapsed | 131261 | -| total_timesteps | 3089408 | -| train/ | | -| approx_kl | 0.11203134 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00425 | -| learning_rate | 0.0003 | -| loss | 0.0763 | -| n_updates | 241350 | -| policy_gradient_loss | 0.0608 | -| std | 0.00598 | -| value_loss | 1.66e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24137 | -| time_elapsed | 131266 | -| total_timesteps | 3089536 | -| train/ | | -| approx_kl | 0.47428262 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.318 | -| learning_rate | 0.0003 | -| loss | 0.213 | -| n_updates | 241360 | -| policy_gradient_loss | 0.145 | -| std | 0.00598 | -| value_loss | 4.68e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24138 | -| time_elapsed | 131272 | -| total_timesteps | 3089664 | -| train/ | | -| approx_kl | 0.10328648 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.0545 | -| n_updates | 241370 | -| policy_gradient_loss | 0.0405 | -| std | 0.00598 | -| value_loss | 3.47e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24139 | -| time_elapsed | 131276 | -| total_timesteps | 3089792 | -| train/ | | -| approx_kl | 0.00022797938 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 241380 | -| policy_gradient_loss | 0.0432 | -| std | 0.00598 | -| value_loss | 3.03e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24140 | -| time_elapsed | 131282 | -| total_timesteps | 3089920 | -| train/ | | -| approx_kl | 0.10466297 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0537 | -| n_updates | 241390 | -| policy_gradient_loss | 0.0252 | -| std | 0.00596 | -| value_loss | 1.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24141 | -| time_elapsed | 131287 | -| total_timesteps | 3090048 | -| train/ | | -| approx_kl | 0.057726543 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -3.77 | -| learning_rate | 0.0003 | -| loss | 0.0359 | -| n_updates | 241400 | -| policy_gradient_loss | 0.0529 | -| std | 0.00595 | -| value_loss | 3.29e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24142 | -| time_elapsed | 131298 | -| total_timesteps | 3090176 | -| train/ | | -| approx_kl | 0.8110507 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.988 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 241410 | -| policy_gradient_loss | 0.0217 | -| std | 0.00595 | -| value_loss | 8.98e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24143 | -| time_elapsed | 131304 | -| total_timesteps | 3090304 | -| train/ | | -| approx_kl | 0.009642189 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.0121 | -| n_updates | 241420 | -| policy_gradient_loss | 0.0339 | -| std | 0.00595 | -| value_loss | 1.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24144 | -| time_elapsed | 131313 | -| total_timesteps | 3090432 | -| train/ | | -| approx_kl | 0.017710527 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.163 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 241430 | -| policy_gradient_loss | 0.0148 | -| std | 0.00595 | -| value_loss | 5.75e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24145 | -| time_elapsed | 131320 | -| total_timesteps | 3090560 | -| train/ | | -| approx_kl | 0.13437997 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | 0.078 | -| n_updates | 241440 | -| policy_gradient_loss | 0.0355 | -| std | 0.00595 | -| value_loss | 4.45e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24146 | -| time_elapsed | 131327 | -| total_timesteps | 3090688 | -| train/ | | -| approx_kl | 0.01192325 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.0192 | -| n_updates | 241450 | -| policy_gradient_loss | 0.0133 | -| std | 0.00595 | -| value_loss | 3.46e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24147 | -| time_elapsed | 131331 | -| total_timesteps | 3090816 | -| train/ | | -| approx_kl | 0.06256297 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -128 | -| learning_rate | 0.0003 | -| loss | 0.000467 | -| n_updates | 241460 | -| policy_gradient_loss | 0.00964 | -| std | 0.00595 | -| value_loss | 4.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24148 | -| time_elapsed | 131336 | -| total_timesteps | 3090944 | -| train/ | | -| approx_kl | 0.20246434 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.36 | -| learning_rate | 0.0003 | -| loss | 0.0665 | -| n_updates | 241470 | -| policy_gradient_loss | 0.0225 | -| std | 0.00595 | -| value_loss | 2.43e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24149 | -| time_elapsed | 131341 | -| total_timesteps | 3091072 | -| train/ | | -| approx_kl | 0.022993874 | -| clip_fraction | 0.164 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.000974 | -| learning_rate | 0.0003 | -| loss | 0.00306 | -| n_updates | 241480 | -| policy_gradient_loss | 0.00125 | -| std | 0.00595 | -| value_loss | 1.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24150 | -| time_elapsed | 131348 | -| total_timesteps | 3091200 | -| train/ | | -| approx_kl | 0.13425834 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.612 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 241490 | -| policy_gradient_loss | 0.00347 | -| std | 0.00595 | -| value_loss | 0.00173 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24151 | -| time_elapsed | 131353 | -| total_timesteps | 3091328 | -| train/ | | -| approx_kl | 0.055216186 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 241500 | -| policy_gradient_loss | 0.0913 | -| std | 0.00595 | -| value_loss | 1.67e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24152 | -| time_elapsed | 131358 | -| total_timesteps | 3091456 | -| train/ | | -| approx_kl | 0.0052267746 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.000601 | -| learning_rate | 0.0003 | -| loss | -0.00976 | -| n_updates | 241510 | -| policy_gradient_loss | 0.0839 | -| std | 0.00595 | -| value_loss | 5.33e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24153 | -| time_elapsed | 131363 | -| total_timesteps | 3091584 | -| train/ | | -| approx_kl | 0.030701295 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00321 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 241520 | -| policy_gradient_loss | 0.0443 | -| std | 0.00596 | -| value_loss | 2.46e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24154 | -| time_elapsed | 131368 | -| total_timesteps | 3091712 | -| train/ | | -| approx_kl | 0.40035334 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.22 | -| n_updates | 241530 | -| policy_gradient_loss | 0.156 | -| std | 0.00596 | -| value_loss | 1.95e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24155 | -| time_elapsed | 131374 | -| total_timesteps | 3091840 | -| train/ | | -| approx_kl | 0.0632098 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 241540 | -| policy_gradient_loss | 0.0346 | -| std | 0.00596 | -| value_loss | 1.51e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24156 | -| time_elapsed | 131379 | -| total_timesteps | 3091968 | -| train/ | | -| approx_kl | 0.87084705 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.245 | -| n_updates | 241550 | -| policy_gradient_loss | 0.0789 | -| std | 0.00596 | -| value_loss | 1.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24157 | -| time_elapsed | 131384 | -| total_timesteps | 3092096 | -| train/ | | -| approx_kl | 0.06385187 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 241560 | -| policy_gradient_loss | 0.0109 | -| std | 0.00596 | -| value_loss | 1.07e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24158 | -| time_elapsed | 131395 | -| total_timesteps | 3092224 | -| train/ | | -| approx_kl | 0.023165928 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -6.66 | -| learning_rate | 0.0003 | -| loss | -0.0206 | -| n_updates | 241570 | -| policy_gradient_loss | -0.00396 | -| std | 0.00596 | -| value_loss | 0.00491 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24159 | -| time_elapsed | 131400 | -| total_timesteps | 3092352 | -| train/ | | -| approx_kl | 0.004368266 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -102 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 241580 | -| policy_gradient_loss | 0.00168 | -| std | 0.00596 | -| value_loss | 7.03e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24160 | -| time_elapsed | 131406 | -| total_timesteps | 3092480 | -| train/ | | -| approx_kl | 0.0038081883 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 241590 | -| policy_gradient_loss | 0.00719 | -| std | 0.00596 | -| value_loss | 1.83e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24161 | -| time_elapsed | 131411 | -| total_timesteps | 3092608 | -| train/ | | -| approx_kl | 0.10654333 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -5.98 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 241600 | -| policy_gradient_loss | 0.00702 | -| std | 0.00597 | -| value_loss | 6.84e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24162 | -| time_elapsed | 131416 | -| total_timesteps | 3092736 | -| train/ | | -| approx_kl | 0.32619774 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00431 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 241610 | -| policy_gradient_loss | 0.041 | -| std | 0.00597 | -| value_loss | 3.68e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24163 | -| time_elapsed | 131420 | -| total_timesteps | 3092864 | -| train/ | | -| approx_kl | 0.00051401975 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.000353 | -| n_updates | 241620 | -| policy_gradient_loss | 0.0345 | -| std | 0.00597 | -| value_loss | 1.62e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24164 | -| time_elapsed | 131424 | -| total_timesteps | 3092992 | -| train/ | | -| approx_kl | 0.008576292 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0742 | -| learning_rate | 0.0003 | -| loss | 0.00445 | -| n_updates | 241630 | -| policy_gradient_loss | 0.0531 | -| std | 0.00597 | -| value_loss | 1.23e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24165 | -| time_elapsed | 131429 | -| total_timesteps | 3093120 | -| train/ | | -| approx_kl | 0.7390218 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.259 | -| n_updates | 241640 | -| policy_gradient_loss | 0.0822 | -| std | 0.00597 | -| value_loss | 7.26e-10 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24166 | -| time_elapsed | 131443 | -| total_timesteps | 3093248 | -| train/ | | -| approx_kl | 0.014793247 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 241650 | -| policy_gradient_loss | -0.00218 | -| std | 0.00597 | -| value_loss | 0.000686 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24167 | -| time_elapsed | 131448 | -| total_timesteps | 3093376 | -| train/ | | -| approx_kl | 0.0333245 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.289 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 241660 | -| policy_gradient_loss | -0.00377 | -| std | 0.00597 | -| value_loss | 3.29e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24168 | -| time_elapsed | 131454 | -| total_timesteps | 3093504 | -| train/ | | -| approx_kl | 0.014766652 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | -0.00548 | -| n_updates | 241670 | -| policy_gradient_loss | -0.00201 | -| std | 0.00596 | -| value_loss | 4.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24169 | -| time_elapsed | 131458 | -| total_timesteps | 3093632 | -| train/ | | -| approx_kl | 0.048011694 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00049 | -| learning_rate | 0.0003 | -| loss | 0.0247 | -| n_updates | 241680 | -| policy_gradient_loss | 0.057 | -| std | 0.00596 | -| value_loss | 2.19e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24170 | -| time_elapsed | 131463 | -| total_timesteps | 3093760 | -| train/ | | -| approx_kl | 0.45271403 | -| clip_fraction | 0.753 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.225 | -| n_updates | 241690 | -| policy_gradient_loss | 0.23 | -| std | 0.00596 | -| value_loss | 1.93e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24171 | -| time_elapsed | 131468 | -| total_timesteps | 3093888 | -| train/ | | -| approx_kl | 0.059437204 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0171 | -| learning_rate | 0.0003 | -| loss | 0.00923 | -| n_updates | 241700 | -| policy_gradient_loss | 0.0355 | -| std | 0.00596 | -| value_loss | 1.75e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24172 | -| time_elapsed | 131472 | -| total_timesteps | 3094016 | -| train/ | | -| approx_kl | 0.82557607 | -| clip_fraction | 0.558 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | 0.209 | -| n_updates | 241710 | -| policy_gradient_loss | 0.0766 | -| std | 0.00596 | -| value_loss | 1.48e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24173 | -| time_elapsed | 131484 | -| total_timesteps | 3094144 | -| train/ | | -| approx_kl | 0.027245324 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 241720 | -| policy_gradient_loss | 0.0014 | -| std | 0.00596 | -| value_loss | 0.000134 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24174 | -| time_elapsed | 131489 | -| total_timesteps | 3094272 | -| train/ | | -| approx_kl | 0.033327084 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0581 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 241730 | -| policy_gradient_loss | 0.156 | -| std | 0.00596 | -| value_loss | 2.26e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24175 | -| time_elapsed | 131494 | -| total_timesteps | 3094400 | -| train/ | | -| approx_kl | 0.18133661 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00803 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 241740 | -| policy_gradient_loss | 0.153 | -| std | 0.00596 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24176 | -| time_elapsed | 131498 | -| total_timesteps | 3094528 | -| train/ | | -| approx_kl | 0.03435516 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00461 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 241750 | -| policy_gradient_loss | 0.031 | -| std | 0.00596 | -| value_loss | 4.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24177 | -| time_elapsed | 131502 | -| total_timesteps | 3094656 | -| train/ | | -| approx_kl | 0.0061228364 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.082 | -| learning_rate | 0.0003 | -| loss | 0.00498 | -| n_updates | 241760 | -| policy_gradient_loss | 0.0367 | -| std | 0.00596 | -| value_loss | 2.74e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24178 | -| time_elapsed | 131507 | -| total_timesteps | 3094784 | -| train/ | | -| approx_kl | 0.18219894 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.0678 | -| n_updates | 241770 | -| policy_gradient_loss | 0.0204 | -| std | 0.00597 | -| value_loss | 2.15e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24179 | -| time_elapsed | 131513 | -| total_timesteps | 3094912 | -| train/ | | -| approx_kl | 0.011334274 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.00172 | -| n_updates | 241780 | -| policy_gradient_loss | 0.00202 | -| std | 0.00596 | -| value_loss | 1.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24180 | -| time_elapsed | 131517 | -| total_timesteps | 3095040 | -| train/ | | -| approx_kl | 0.082748234 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0851 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 241790 | -| policy_gradient_loss | 0.00708 | -| std | 0.00596 | -| value_loss | 8.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24181 | -| time_elapsed | 131529 | -| total_timesteps | 3095168 | -| train/ | | -| approx_kl | 0.038147047 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.91 | -| learning_rate | 0.0003 | -| loss | 0.0469 | -| n_updates | 241800 | -| policy_gradient_loss | 0.0165 | -| std | 0.00596 | -| value_loss | 0.0016 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24182 | -| time_elapsed | 131534 | -| total_timesteps | 3095296 | -| train/ | | -| approx_kl | 0.5738085 | -| clip_fraction | 0.568 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.192 | -| learning_rate | 0.0003 | -| loss | 0.249 | -| n_updates | 241810 | -| policy_gradient_loss | 0.0906 | -| std | 0.00596 | -| value_loss | 1.57e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24183 | -| time_elapsed | 131538 | -| total_timesteps | 3095424 | -| train/ | | -| approx_kl | 0.045654062 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00449 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 241820 | -| policy_gradient_loss | 0.0176 | -| std | 0.00597 | -| value_loss | 2.65e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24184 | -| time_elapsed | 131542 | -| total_timesteps | 3095552 | -| train/ | | -| approx_kl | 0.0030264272 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 241830 | -| policy_gradient_loss | 0.0157 | -| std | 0.00598 | -| value_loss | 3.34e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24185 | -| time_elapsed | 131546 | -| total_timesteps | 3095680 | -| train/ | | -| approx_kl | 0.002327648 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | -0.000191 | -| n_updates | 241840 | -| policy_gradient_loss | 0.0154 | -| std | 0.00598 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24186 | -| time_elapsed | 131549 | -| total_timesteps | 3095808 | -| train/ | | -| approx_kl | 0.013695705 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | -0.00631 | -| n_updates | 241850 | -| policy_gradient_loss | 0.018 | -| std | 0.00596 | -| value_loss | 0.000173 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24187 | -| time_elapsed | 131554 | -| total_timesteps | 3095936 | -| train/ | | -| approx_kl | 0.0028085252 | -| clip_fraction | 0.579 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.476 | -| learning_rate | 0.0003 | -| loss | 0.0002 | -| n_updates | 241860 | -| policy_gradient_loss | 0.0947 | -| std | 0.00594 | -| value_loss | 0.00042 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24188 | -| time_elapsed | 131558 | -| total_timesteps | 3096064 | -| train/ | | -| approx_kl | 0.022115983 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 241870 | -| policy_gradient_loss | 0.0432 | -| std | 0.00594 | -| value_loss | 3.46e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24189 | -| time_elapsed | 131567 | -| total_timesteps | 3096192 | -| train/ | | -| approx_kl | 0.6886163 | -| clip_fraction | 0.722 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.895 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 241880 | -| policy_gradient_loss | 0.0833 | -| std | 0.00594 | -| value_loss | 0.000639 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24190 | -| time_elapsed | 131572 | -| total_timesteps | 3096320 | -| train/ | | -| approx_kl | 0.49327722 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.184 | -| learning_rate | 0.0003 | -| loss | 0.274 | -| n_updates | 241890 | -| policy_gradient_loss | 0.17 | -| std | 0.00594 | -| value_loss | 8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24191 | -| time_elapsed | 131575 | -| total_timesteps | 3096448 | -| train/ | | -| approx_kl | 0.25603598 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0899 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 241900 | -| policy_gradient_loss | 0.181 | -| std | 0.00594 | -| value_loss | 5.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24192 | -| time_elapsed | 131581 | -| total_timesteps | 3096576 | -| train/ | | -| approx_kl | 0.048953656 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.00873 | -| n_updates | 241910 | -| policy_gradient_loss | 0.0263 | -| std | 0.00594 | -| value_loss | 2.82e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24193 | -| time_elapsed | 131587 | -| total_timesteps | 3096704 | -| train/ | | -| approx_kl | 0.0015158383 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | 0.000242 | -| n_updates | 241920 | -| policy_gradient_loss | 0.0449 | -| std | 0.00594 | -| value_loss | 1.9e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24194 | -| time_elapsed | 131593 | -| total_timesteps | 3096832 | -| train/ | | -| approx_kl | 0.60590786 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 241930 | -| policy_gradient_loss | 0.0707 | -| std | 0.00594 | -| value_loss | 2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24195 | -| time_elapsed | 131598 | -| total_timesteps | 3096960 | -| train/ | | -| approx_kl | 0.008619651 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00359 | -| n_updates | 241940 | -| policy_gradient_loss | 0.00458 | -| std | 0.00595 | -| value_loss | 1.34e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24196 | -| time_elapsed | 131604 | -| total_timesteps | 3097088 | -| train/ | | -| approx_kl | 0.0891218 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 241950 | -| policy_gradient_loss | 0.0127 | -| std | 0.00595 | -| value_loss | 7.72e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24197 | -| time_elapsed | 131615 | -| total_timesteps | 3097216 | -| train/ | | -| approx_kl | 0.011298606 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 241960 | -| policy_gradient_loss | -0.00227 | -| std | 0.00595 | -| value_loss | 0.000551 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24198 | -| time_elapsed | 131619 | -| total_timesteps | 3097344 | -| train/ | | -| approx_kl | 0.44237968 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.49 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 241970 | -| policy_gradient_loss | 0.0498 | -| std | 0.00595 | -| value_loss | 2.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24199 | -| time_elapsed | 131625 | -| total_timesteps | 3097472 | -| train/ | | -| approx_kl | 0.12557408 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -18 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 241980 | -| policy_gradient_loss | 0.0284 | -| std | 0.00595 | -| value_loss | 2.61e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24200 | -| time_elapsed | 131629 | -| total_timesteps | 3097600 | -| train/ | | -| approx_kl | 1.0872566 | -| clip_fraction | 0.762 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.372 | -| learning_rate | 0.0003 | -| loss | 0.271 | -| n_updates | 241990 | -| policy_gradient_loss | 0.14 | -| std | 0.00595 | -| value_loss | 5.78e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24201 | -| time_elapsed | 131634 | -| total_timesteps | 3097728 | -| train/ | | -| approx_kl | 0.009745207 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0167 | -| learning_rate | 0.0003 | -| loss | -0.00486 | -| n_updates | 242000 | -| policy_gradient_loss | 0.0281 | -| std | 0.00595 | -| value_loss | 1.11e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24202 | -| time_elapsed | 131639 | -| total_timesteps | 3097856 | -| train/ | | -| approx_kl | 0.1334479 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 242010 | -| policy_gradient_loss | 0.0304 | -| std | 0.00595 | -| value_loss | 9.08e-10 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24203 | -| time_elapsed | 131644 | -| total_timesteps | 3097984 | -| train/ | | -| approx_kl | 4.7419686e-05 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | -0.000391 | -| n_updates | 242020 | -| policy_gradient_loss | 0.0333 | -| std | 0.00595 | -| value_loss | 6.87e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24204 | -| time_elapsed | 131649 | -| total_timesteps | 3098112 | -| train/ | | -| approx_kl | 0.81158686 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.228 | -| n_updates | 242030 | -| policy_gradient_loss | 0.0762 | -| std | 0.00595 | -| value_loss | 5.9e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24205 | -| time_elapsed | 131665 | -| total_timesteps | 3098240 | -| train/ | | -| approx_kl | 0.051733036 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.42 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 242040 | -| policy_gradient_loss | 0.00264 | -| std | 0.00595 | -| value_loss | 0.00323 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24206 | -| time_elapsed | 131671 | -| total_timesteps | 3098368 | -| train/ | | -| approx_kl | 0.18392085 | -| clip_fraction | 0.588 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.383 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 242050 | -| policy_gradient_loss | 0.0897 | -| std | 0.00595 | -| value_loss | 1.35e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24207 | -| time_elapsed | 131675 | -| total_timesteps | 3098496 | -| train/ | | -| approx_kl | 0.057270274 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0281 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 242060 | -| policy_gradient_loss | 0.051 | -| std | 0.00595 | -| value_loss | 2.35e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24208 | -| time_elapsed | 131681 | -| total_timesteps | 3098624 | -| train/ | | -| approx_kl | 1.0951921 | -| clip_fraction | 0.779 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.015 | -| learning_rate | 0.0003 | -| loss | 0.271 | -| n_updates | 242070 | -| policy_gradient_loss | 0.261 | -| std | 0.00595 | -| value_loss | 7.81e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24209 | -| time_elapsed | 131686 | -| total_timesteps | 3098752 | -| train/ | | -| approx_kl | 0.011916135 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 242080 | -| policy_gradient_loss | 0.0341 | -| std | 0.00595 | -| value_loss | 6.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24210 | -| time_elapsed | 131690 | -| total_timesteps | 3098880 | -| train/ | | -| approx_kl | 0.15415666 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | 0.096 | -| n_updates | 242090 | -| policy_gradient_loss | 0.0494 | -| std | 0.00595 | -| value_loss | 5.06e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24211 | -| time_elapsed | 131696 | -| total_timesteps | 3099008 | -| train/ | | -| approx_kl | 8.633593e-05 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | -0.000774 | -| n_updates | 242100 | -| policy_gradient_loss | 0.0414 | -| std | 0.00595 | -| value_loss | 4.28e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24212 | -| time_elapsed | 131708 | -| total_timesteps | 3099136 | -| train/ | | -| approx_kl | 0.5527837 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.94 | -| learning_rate | 0.0003 | -| loss | 0.0728 | -| n_updates | 242110 | -| policy_gradient_loss | 0.021 | -| std | 0.00595 | -| value_loss | 0.000905 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24213 | -| time_elapsed | 131712 | -| total_timesteps | 3099264 | -| train/ | | -| approx_kl | 0.061646953 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.145 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 242120 | -| policy_gradient_loss | 0.0111 | -| std | 0.00595 | -| value_loss | 0.000663 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24214 | -| time_elapsed | 131718 | -| total_timesteps | 3099392 | -| train/ | | -| approx_kl | 0.004288477 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00422 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 242130 | -| policy_gradient_loss | 0.00552 | -| std | 0.00595 | -| value_loss | 1.27e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24215 | -| time_elapsed | 131723 | -| total_timesteps | 3099520 | -| train/ | | -| approx_kl | 0.06770057 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 242140 | -| policy_gradient_loss | 0.00922 | -| std | 0.00595 | -| value_loss | 3.31e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24216 | -| time_elapsed | 131729 | -| total_timesteps | 3099648 | -| train/ | | -| approx_kl | 0.056708872 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0257 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 242150 | -| policy_gradient_loss | -0.00278 | -| std | 0.00595 | -| value_loss | 2.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24217 | -| time_elapsed | 131733 | -| total_timesteps | 3099776 | -| train/ | | -| approx_kl | 0.011473631 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | -0.00944 | -| n_updates | 242160 | -| policy_gradient_loss | 0.00981 | -| std | 0.00595 | -| value_loss | 1.96e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24218 | -| time_elapsed | 131739 | -| total_timesteps | 3099904 | -| train/ | | -| approx_kl | 0.0032682274 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 242170 | -| policy_gradient_loss | 0.0147 | -| std | 0.00595 | -| value_loss | 1.09e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24219 | -| time_elapsed | 131744 | -| total_timesteps | 3100032 | -| train/ | | -| approx_kl | 2.4270266e-06 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.047 | -| learning_rate | 0.0003 | -| loss | 0.000135 | -| n_updates | 242180 | -| policy_gradient_loss | 0.0455 | -| std | 0.00595 | -| value_loss | 9.8e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24220 | -| time_elapsed | 131754 | -| total_timesteps | 3100160 | -| train/ | | -| approx_kl | 0.035314996 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.13 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 242190 | -| policy_gradient_loss | -0.00466 | -| std | 0.00595 | -| value_loss | 0.00316 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24221 | -| time_elapsed | 131760 | -| total_timesteps | 3100288 | -| train/ | | -| approx_kl | 0.00012884382 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.32 | -| learning_rate | 0.0003 | -| loss | 5.76e-05 | -| n_updates | 242200 | -| policy_gradient_loss | 0.0354 | -| std | 0.00595 | -| value_loss | 5.63e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24222 | -| time_elapsed | 131766 | -| total_timesteps | 3100416 | -| train/ | | -| approx_kl | 0.26271984 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -2.19 | -| learning_rate | 0.0003 | -| loss | 0.0958 | -| n_updates | 242210 | -| policy_gradient_loss | 0.0314 | -| std | 0.00595 | -| value_loss | 2.5e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24223 | -| time_elapsed | 131770 | -| total_timesteps | 3100544 | -| train/ | | -| approx_kl | 0.022669192 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.139 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 242220 | -| policy_gradient_loss | -0.0106 | -| std | 0.00595 | -| value_loss | 1.25e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24224 | -| time_elapsed | 131776 | -| total_timesteps | 3100672 | -| train/ | | -| approx_kl | 0.02905197 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 242230 | -| policy_gradient_loss | 0.0313 | -| std | 0.00595 | -| value_loss | 6.84e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24225 | -| time_elapsed | 131781 | -| total_timesteps | 3100800 | -| train/ | | -| approx_kl | 0.37379813 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0805 | -| learning_rate | 0.0003 | -| loss | 0.252 | -| n_updates | 242240 | -| policy_gradient_loss | 0.168 | -| std | 0.00595 | -| value_loss | 6.23e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24226 | -| time_elapsed | 131785 | -| total_timesteps | 3100928 | -| train/ | | -| approx_kl | 0.2129027 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 242250 | -| policy_gradient_loss | 0.142 | -| std | 0.00595 | -| value_loss | 4.46e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24227 | -| time_elapsed | 131788 | -| total_timesteps | 3101056 | -| train/ | | -| approx_kl | 0.17754003 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 242260 | -| policy_gradient_loss | 0.111 | -| std | 0.00595 | -| value_loss | 3.8e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24228 | -| time_elapsed | 131797 | -| total_timesteps | 3101184 | -| train/ | | -| approx_kl | 0.22208777 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 242270 | -| policy_gradient_loss | 0.213 | -| std | 0.00596 | -| value_loss | 0.00596 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24229 | -| time_elapsed | 131802 | -| total_timesteps | 3101312 | -| train/ | | -| approx_kl | 0.033401746 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.888 | -| learning_rate | 0.0003 | -| loss | 0.00673 | -| n_updates | 242280 | -| policy_gradient_loss | 0.0282 | -| std | 0.00596 | -| value_loss | 2.07e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24230 | -| time_elapsed | 131806 | -| total_timesteps | 3101440 | -| train/ | | -| approx_kl | 0.60876536 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00306 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 242290 | -| policy_gradient_loss | 0.0718 | -| std | 0.00596 | -| value_loss | 3.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24231 | -| time_elapsed | 131811 | -| total_timesteps | 3101568 | -| train/ | | -| approx_kl | 0.065101095 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.0365 | -| n_updates | 242300 | -| policy_gradient_loss | 0.0184 | -| std | 0.00596 | -| value_loss | 2.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24232 | -| time_elapsed | 131817 | -| total_timesteps | 3101696 | -| train/ | | -| approx_kl | 0.052076105 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 242310 | -| policy_gradient_loss | 0.0146 | -| std | 0.00596 | -| value_loss | 1.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24233 | -| time_elapsed | 131821 | -| total_timesteps | 3101824 | -| train/ | | -| approx_kl | 0.010518754 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0701 | -| learning_rate | 0.0003 | -| loss | -0.00983 | -| n_updates | 242320 | -| policy_gradient_loss | 0.00666 | -| std | 0.00596 | -| value_loss | 9.46e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24234 | -| time_elapsed | 131826 | -| total_timesteps | 3101952 | -| train/ | | -| approx_kl | 0.0030804244 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | -0.000996 | -| n_updates | 242330 | -| policy_gradient_loss | 0.0147 | -| std | 0.00596 | -| value_loss | 5.47e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24235 | -| time_elapsed | 131832 | -| total_timesteps | 3102080 | -| train/ | | -| approx_kl | 0.13352302 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | 0.0472 | -| n_updates | 242340 | -| policy_gradient_loss | 0.0137 | -| std | 0.00595 | -| value_loss | 5.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24236 | -| time_elapsed | 131841 | -| total_timesteps | 3102208 | -| train/ | | -| approx_kl | 0.052480984 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.206 | -| learning_rate | 0.0003 | -| loss | -0.027 | -| n_updates | 242350 | -| policy_gradient_loss | -0.00901 | -| std | 0.00595 | -| value_loss | 0.00196 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24237 | -| time_elapsed | 131844 | -| total_timesteps | 3102336 | -| train/ | | -| approx_kl | 0.6054975 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.83 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 242360 | -| policy_gradient_loss | 0.0482 | -| std | 0.00595 | -| value_loss | 1.63e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24238 | -| time_elapsed | 131849 | -| total_timesteps | 3102464 | -| train/ | | -| approx_kl | 0.014813019 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -10.8 | -| learning_rate | 0.0003 | -| loss | -0.00198 | -| n_updates | 242370 | -| policy_gradient_loss | 0.00659 | -| std | 0.00595 | -| value_loss | 5.45e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24239 | -| time_elapsed | 131854 | -| total_timesteps | 3102592 | -| train/ | | -| approx_kl | 0.0036152722 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | -0.00317 | -| n_updates | 242380 | -| policy_gradient_loss | 0.0123 | -| std | 0.00595 | -| value_loss | 1.12e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24240 | -| time_elapsed | 131860 | -| total_timesteps | 3102720 | -| train/ | | -| approx_kl | 0.064475454 | -| clip_fraction | 0.682 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | 0.0792 | -| n_updates | 242390 | -| policy_gradient_loss | 0.175 | -| std | 0.00595 | -| value_loss | 1.11e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24241 | -| time_elapsed | 131866 | -| total_timesteps | 3102848 | -| train/ | | -| approx_kl | 0.15354075 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 242400 | -| policy_gradient_loss | 0.164 | -| std | 0.00595 | -| value_loss | 1.02e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 24242 | -| time_elapsed | 131871 | -| total_timesteps | 3102976 | -| train/ | | -| approx_kl | 0.17366238 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 242410 | -| policy_gradient_loss | 0.184 | -| std | 0.00595 | -| value_loss | 9.39e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24243 | -| time_elapsed | 131877 | -| total_timesteps | 3103104 | -| train/ | | -| approx_kl | 0.03298159 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 242420 | -| policy_gradient_loss | 0.0354 | -| std | 0.00595 | -| value_loss | 7.02e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24244 | -| time_elapsed | 131885 | -| total_timesteps | 3103232 | -| train/ | | -| approx_kl | 0.013271059 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.71 | -| learning_rate | 0.0003 | -| loss | -0.0193 | -| n_updates | 242430 | -| policy_gradient_loss | 0.00493 | -| std | 0.00595 | -| value_loss | 0.00334 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24245 | -| time_elapsed | 131889 | -| total_timesteps | 3103360 | -| train/ | | -| approx_kl | 0.626794 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.354 | -| learning_rate | 0.0003 | -| loss | 0.312 | -| n_updates | 242440 | -| policy_gradient_loss | 0.0978 | -| std | 0.00595 | -| value_loss | 3.73e-06 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24246 | -| time_elapsed | 131895 | -| total_timesteps | 3103488 | -| train/ | | -| approx_kl | 0.0070468956 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00951 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 242450 | -| policy_gradient_loss | 0.00472 | -| std | 0.00595 | -| value_loss | 8.17e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24247 | -| time_elapsed | 131899 | -| total_timesteps | 3103616 | -| train/ | | -| approx_kl | 0.047553096 | -| clip_fraction | 0.642 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | 0.0534 | -| n_updates | 242460 | -| policy_gradient_loss | 0.138 | -| std | 0.00595 | -| value_loss | 8.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24248 | -| time_elapsed | 131903 | -| total_timesteps | 3103744 | -| train/ | | -| approx_kl | 0.003605125 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -12.4 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 242470 | -| policy_gradient_loss | 0.00521 | -| std | 0.00596 | -| value_loss | 3.45e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24249 | -| time_elapsed | 131909 | -| total_timesteps | 3103872 | -| train/ | | -| approx_kl | 0.6601327 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -36.5 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 242480 | -| policy_gradient_loss | 0.00376 | -| std | 0.00597 | -| value_loss | 2.86e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24250 | -| time_elapsed | 131913 | -| total_timesteps | 3104000 | -| train/ | | -| approx_kl | 0.034878295 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0201 | -| n_updates | 242490 | -| policy_gradient_loss | 0.0448 | -| std | 0.00598 | -| value_loss | 7.79e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24251 | -| time_elapsed | 131919 | -| total_timesteps | 3104128 | -| train/ | | -| approx_kl | 0.3264155 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 242500 | -| policy_gradient_loss | 0.135 | -| std | 0.00598 | -| value_loss | 1.39e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24252 | -| time_elapsed | 131928 | -| total_timesteps | 3104256 | -| train/ | | -| approx_kl | 0.32791215 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 242510 | -| policy_gradient_loss | 0.11 | -| std | 0.00598 | -| value_loss | 0.00235 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24253 | -| time_elapsed | 131933 | -| total_timesteps | 3104384 | -| train/ | | -| approx_kl | 0.12136479 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.459 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 242520 | -| policy_gradient_loss | 0.0229 | -| std | 0.00598 | -| value_loss | 1.58e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24254 | -| time_elapsed | 131937 | -| total_timesteps | 3104512 | -| train/ | | -| approx_kl | 0.7466971 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 242530 | -| policy_gradient_loss | 0.0504 | -| std | 0.00599 | -| value_loss | 3.3e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24255 | -| time_elapsed | 131943 | -| total_timesteps | 3104640 | -| train/ | | -| approx_kl | 0.053461373 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00285 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 242540 | -| policy_gradient_loss | 0.0146 | -| std | 0.00598 | -| value_loss | 1.17e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24256 | -| time_elapsed | 131947 | -| total_timesteps | 3104768 | -| train/ | | -| approx_kl | 0.07330903 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 242550 | -| policy_gradient_loss | 0.0117 | -| std | 0.00599 | -| value_loss | 9.67e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24257 | -| time_elapsed | 131952 | -| total_timesteps | 3104896 | -| train/ | | -| approx_kl | 0.013737964 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 242560 | -| policy_gradient_loss | 0.00902 | -| std | 0.00599 | -| value_loss | 8.25e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24258 | -| time_elapsed | 131957 | -| total_timesteps | 3105024 | -| train/ | | -| approx_kl | 0.09604496 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0509 | -| n_updates | 242570 | -| policy_gradient_loss | 0.0202 | -| std | 0.00599 | -| value_loss | 5.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24259 | -| time_elapsed | 131969 | -| total_timesteps | 3105152 | -| train/ | | -| approx_kl | 0.060541652 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 242580 | -| policy_gradient_loss | -0.00359 | -| std | 0.00599 | -| value_loss | 0.000383 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24260 | -| time_elapsed | 131974 | -| total_timesteps | 3105280 | -| train/ | | -| approx_kl | 0.0066679367 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00188 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 242590 | -| policy_gradient_loss | 0.0083 | -| std | 0.00599 | -| value_loss | 1.75e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24261 | -| time_elapsed | 131979 | -| total_timesteps | 3105408 | -| train/ | | -| approx_kl | 0.13231196 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00931 | -| learning_rate | 0.0003 | -| loss | 0.0919 | -| n_updates | 242600 | -| policy_gradient_loss | 0.0379 | -| std | 0.00599 | -| value_loss | 2.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24262 | -| time_elapsed | 131983 | -| total_timesteps | 3105536 | -| train/ | | -| approx_kl | 0.017284563 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0668 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 242610 | -| policy_gradient_loss | 0.00449 | -| std | 0.00599 | -| value_loss | 1.32e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24263 | -| time_elapsed | 131988 | -| total_timesteps | 3105664 | -| train/ | | -| approx_kl | 0.0042338353 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0595 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 242620 | -| policy_gradient_loss | 0.0127 | -| std | 0.00599 | -| value_loss | 1.21e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24264 | -| time_elapsed | 131994 | -| total_timesteps | 3105792 | -| train/ | | -| approx_kl | 0.00018855976 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | -0.000255 | -| n_updates | 242630 | -| policy_gradient_loss | 0.0432 | -| std | 0.006 | -| value_loss | 1.44e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24265 | -| time_elapsed | 131999 | -| total_timesteps | 3105920 | -| train/ | | -| approx_kl | 0.79578835 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.789 | -| learning_rate | 0.0003 | -| loss | 0.465 | -| n_updates | 242640 | -| policy_gradient_loss | 0.183 | -| std | 0.006 | -| value_loss | 6.96e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24266 | -| time_elapsed | 132005 | -| total_timesteps | 3106048 | -| train/ | | -| approx_kl | 0.033941742 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 242650 | -| policy_gradient_loss | 0.00485 | -| std | 0.006 | -| value_loss | 8.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24267 | -| time_elapsed | 132013 | -| total_timesteps | 3106176 | -| train/ | | -| approx_kl | 0.012962415 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -3.09 | -| learning_rate | 0.0003 | -| loss | -0.0261 | -| n_updates | 242660 | -| policy_gradient_loss | -0.00687 | -| std | 0.006 | -| value_loss | 0.00407 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24268 | -| time_elapsed | 132018 | -| total_timesteps | 3106304 | -| train/ | | -| approx_kl | 0.06329204 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.272 | -| learning_rate | 0.0003 | -| loss | 0.0282 | -| n_updates | 242670 | -| policy_gradient_loss | 0.0666 | -| std | 0.00601 | -| value_loss | 9.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24269 | -| time_elapsed | 132024 | -| total_timesteps | 3106432 | -| train/ | | -| approx_kl | 0.005501502 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.83 | -| learning_rate | 0.0003 | -| loss | -0.00693 | -| n_updates | 242680 | -| policy_gradient_loss | 0.0671 | -| std | 0.00601 | -| value_loss | 2.15e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24270 | -| time_elapsed | 132030 | -| total_timesteps | 3106560 | -| train/ | | -| approx_kl | 2.8743482 | -| clip_fraction | 0.857 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 242690 | -| policy_gradient_loss | 0.172 | -| std | 0.00603 | -| value_loss | 1.92e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24271 | -| time_elapsed | 132035 | -| total_timesteps | 3106688 | -| train/ | | -| approx_kl | 0.4376048 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 242700 | -| policy_gradient_loss | 0.0467 | -| std | 0.00604 | -| value_loss | 4.37e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24272 | -| time_elapsed | 132040 | -| total_timesteps | 3106816 | -| train/ | | -| approx_kl | 0.09527324 | -| clip_fraction | 0.639 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00623 | -| learning_rate | 0.0003 | -| loss | 0.0668 | -| n_updates | 242710 | -| policy_gradient_loss | 0.103 | -| std | 0.00605 | -| value_loss | 7.9e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24273 | -| time_elapsed | 132045 | -| total_timesteps | 3106944 | -| train/ | | -| approx_kl | 0.07123525 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0043 | -| learning_rate | 0.0003 | -| loss | 0.0724 | -| n_updates | 242720 | -| policy_gradient_loss | 0.0376 | -| std | 0.00605 | -| value_loss | 4.97e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24274 | -| time_elapsed | 132050 | -| total_timesteps | 3107072 | -| train/ | | -| approx_kl | 0.24962065 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 242730 | -| policy_gradient_loss | 0.046 | -| std | 0.00605 | -| value_loss | 2.11e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24275 | -| time_elapsed | 132059 | -| total_timesteps | 3107200 | -| train/ | | -| approx_kl | 0.070037186 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.904 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 242740 | -| policy_gradient_loss | -0.0159 | -| std | 0.00605 | -| value_loss | 0.000462 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24276 | -| time_elapsed | 132064 | -| total_timesteps | 3107328 | -| train/ | | -| approx_kl | 0.02102939 | -| clip_fraction | 0.607 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 242750 | -| policy_gradient_loss | 0.0648 | -| std | 0.00605 | -| value_loss | 3.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24277 | -| time_elapsed | 132068 | -| total_timesteps | 3107456 | -| train/ | | -| approx_kl | 0.098748095 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00479 | -| learning_rate | 0.0003 | -| loss | 0.0789 | -| n_updates | 242760 | -| policy_gradient_loss | 0.0368 | -| std | 0.00606 | -| value_loss | 6.93e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24278 | -| time_elapsed | 132072 | -| total_timesteps | 3107584 | -| train/ | | -| approx_kl | 0.7696173 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.294 | -| learning_rate | 0.0003 | -| loss | 0.354 | -| n_updates | 242770 | -| policy_gradient_loss | 0.198 | -| std | 0.00606 | -| value_loss | 1.02e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24279 | -| time_elapsed | 132078 | -| total_timesteps | 3107712 | -| train/ | | -| approx_kl | 0.10370504 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.039 | -| n_updates | 242780 | -| policy_gradient_loss | 0.0242 | -| std | 0.00606 | -| value_loss | 5.23e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24280 | -| time_elapsed | 132083 | -| total_timesteps | 3107840 | -| train/ | | -| approx_kl | 0.15350898 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | 0.089 | -| n_updates | 242790 | -| policy_gradient_loss | 0.0276 | -| std | 0.00606 | -| value_loss | 3.75e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24281 | -| time_elapsed | 132088 | -| total_timesteps | 3107968 | -| train/ | | -| approx_kl | 0.018415935 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.00371 | -| n_updates | 242800 | -| policy_gradient_loss | -0.00182 | -| std | 0.00606 | -| value_loss | 2.73e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24282 | -| time_elapsed | 132094 | -| total_timesteps | 3108096 | -| train/ | | -| approx_kl | 0.03078061 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.00776 | -| n_updates | 242810 | -| policy_gradient_loss | 0.0345 | -| std | 0.00606 | -| value_loss | 2.15e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24283 | -| time_elapsed | 132104 | -| total_timesteps | 3108224 | -| train/ | | -| approx_kl | 0.017418947 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 242820 | -| policy_gradient_loss | 0.0103 | -| std | 0.00605 | -| value_loss | 0.0042 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24284 | -| time_elapsed | 132108 | -| total_timesteps | 3108352 | -| train/ | | -| approx_kl | 0.00026240945 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.308 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 242830 | -| policy_gradient_loss | 0.0342 | -| std | 0.00605 | -| value_loss | 9.92e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24285 | -| time_elapsed | 132113 | -| total_timesteps | 3108480 | -| train/ | | -| approx_kl | 0.71730983 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -15 | -| learning_rate | 0.0003 | -| loss | 0.199 | -| n_updates | 242840 | -| policy_gradient_loss | 0.054 | -| std | 0.00605 | -| value_loss | 6.47e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24286 | -| time_elapsed | 132118 | -| total_timesteps | 3108608 | -| train/ | | -| approx_kl | 0.013663067 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.826 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 242850 | -| policy_gradient_loss | 0.00416 | -| std | 0.00605 | -| value_loss | 9.25e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24287 | -| time_elapsed | 132122 | -| total_timesteps | 3108736 | -| train/ | | -| approx_kl | 0.003336269 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 242860 | -| policy_gradient_loss | 0.0078 | -| std | 0.00605 | -| value_loss | 3.37e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24288 | -| time_elapsed | 132127 | -| total_timesteps | 3108864 | -| train/ | | -| approx_kl | 0.12126727 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0203 | -| learning_rate | 0.0003 | -| loss | 0.0553 | -| n_updates | 242870 | -| policy_gradient_loss | 0.0149 | -| std | 0.00605 | -| value_loss | 1.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24289 | -| time_elapsed | 132132 | -| total_timesteps | 3108992 | -| train/ | | -| approx_kl | 0.29724765 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.214 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 242880 | -| policy_gradient_loss | 0.0425 | -| std | 0.00604 | -| value_loss | 7.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24290 | -| time_elapsed | 132136 | -| total_timesteps | 3109120 | -| train/ | | -| approx_kl | 0.85878474 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 242890 | -| policy_gradient_loss | 0.0691 | -| std | 0.00604 | -| value_loss | 6.84e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24291 | -| time_elapsed | 132147 | -| total_timesteps | 3109248 | -| train/ | | -| approx_kl | 0.024343248 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.127 | -| learning_rate | 0.0003 | -| loss | -0.0294 | -| n_updates | 242900 | -| policy_gradient_loss | -0.0185 | -| std | 0.00604 | -| value_loss | 0.00191 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24292 | -| time_elapsed | 132151 | -| total_timesteps | 3109376 | -| train/ | | -| approx_kl | 0.14875686 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.32 | -| learning_rate | 0.0003 | -| loss | 0.0974 | -| n_updates | 242910 | -| policy_gradient_loss | 0.148 | -| std | 0.00604 | -| value_loss | 1.42e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24293 | -| time_elapsed | 132155 | -| total_timesteps | 3109504 | -| train/ | | -| approx_kl | 0.02164732 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -24.2 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 242920 | -| policy_gradient_loss | 0.0157 | -| std | 0.00604 | -| value_loss | 1.29e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24294 | -| time_elapsed | 132160 | -| total_timesteps | 3109632 | -| train/ | | -| approx_kl | 9.4915275e-05 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.000158 | -| n_updates | 242930 | -| policy_gradient_loss | 0.0562 | -| std | 0.00603 | -| value_loss | 6.69e-09 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24295 | -| time_elapsed | 132165 | -| total_timesteps | 3109760 | -| train/ | | -| approx_kl | 0.5690843 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 242940 | -| policy_gradient_loss | 0.0537 | -| std | 0.00603 | -| value_loss | 4.41e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 24296 | -| time_elapsed | 132170 | -| total_timesteps | 3109888 | -| train/ | | -| approx_kl | 0.06534036 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.0509 | -| n_updates | 242950 | -| policy_gradient_loss | 0.0224 | -| std | 0.00603 | -| value_loss | 2.57e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24297 | -| time_elapsed | 132175 | -| total_timesteps | 3110016 | -| train/ | | -| approx_kl | 0.014880745 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.00601 | -| n_updates | 242960 | -| policy_gradient_loss | 0.0152 | -| std | 0.00602 | -| value_loss | 1.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24298 | -| time_elapsed | 132187 | -| total_timesteps | 3110144 | -| train/ | | -| approx_kl | 0.023423847 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.895 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 242970 | -| policy_gradient_loss | -0.0211 | -| std | 0.00602 | -| value_loss | 0.00183 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24299 | -| time_elapsed | 132193 | -| total_timesteps | 3110272 | -| train/ | | -| approx_kl | 0.005205158 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00375 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 242980 | -| policy_gradient_loss | 0.0104 | -| std | 0.00602 | -| value_loss | 2.38e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24300 | -| time_elapsed | 132197 | -| total_timesteps | 3110400 | -| train/ | | -| approx_kl | 0.110318 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0239 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 242990 | -| policy_gradient_loss | 0.00325 | -| std | 0.00602 | -| value_loss | 2.78e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24301 | -| time_elapsed | 132202 | -| total_timesteps | 3110528 | -| train/ | | -| approx_kl | 0.04879028 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00387 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 243000 | -| policy_gradient_loss | 0.0117 | -| std | 0.00602 | -| value_loss | 1.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24302 | -| time_elapsed | 132206 | -| total_timesteps | 3110656 | -| train/ | | -| approx_kl | 0.06392273 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 243010 | -| policy_gradient_loss | 0.00988 | -| std | 0.00602 | -| value_loss | 7.65e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24303 | -| time_elapsed | 132211 | -| total_timesteps | 3110784 | -| train/ | | -| approx_kl | 0.010458183 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00497 | -| n_updates | 243020 | -| policy_gradient_loss | 0.00719 | -| std | 0.00603 | -| value_loss | 5.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.983 | -| time/ | | -| fps | 23 | -| iterations | 24304 | -| time_elapsed | 132217 | -| total_timesteps | 3110912 | -| train/ | | -| approx_kl | 0.09171496 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.0552 | -| n_updates | 243030 | -| policy_gradient_loss | 0.0226 | -| std | 0.00603 | -| value_loss | 3.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24305 | -| time_elapsed | 132222 | -| total_timesteps | 3111040 | -| train/ | | -| approx_kl | 0.012245031 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 243040 | -| policy_gradient_loss | 0.00393 | -| std | 0.00602 | -| value_loss | 2.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24306 | -| time_elapsed | 132231 | -| total_timesteps | 3111168 | -| train/ | | -| approx_kl | 0.06847919 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 243050 | -| policy_gradient_loss | 0.0453 | -| std | 0.00603 | -| value_loss | 0.000173 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24307 | -| time_elapsed | 132237 | -| total_timesteps | 3111296 | -| train/ | | -| approx_kl | 1.4513944 | -| clip_fraction | 0.779 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.000241 | -| learning_rate | 0.0003 | -| loss | 0.504 | -| n_updates | 243060 | -| policy_gradient_loss | 0.198 | -| std | 0.00603 | -| value_loss | 0.000103 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24308 | -| time_elapsed | 132243 | -| total_timesteps | 3111424 | -| train/ | | -| approx_kl | 0.0743184 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0138 | -| learning_rate | 0.0003 | -| loss | 0.0717 | -| n_updates | 243070 | -| policy_gradient_loss | 0.00656 | -| std | 0.00603 | -| value_loss | 5.69e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24309 | -| time_elapsed | 132248 | -| total_timesteps | 3111552 | -| train/ | | -| approx_kl | 0.4605456 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00969 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 243080 | -| policy_gradient_loss | 0.0555 | -| std | 0.00603 | -| value_loss | 1.3e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24310 | -| time_elapsed | 132252 | -| total_timesteps | 3111680 | -| train/ | | -| approx_kl | 0.06094019 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 243090 | -| policy_gradient_loss | 0.0197 | -| std | 0.00603 | -| value_loss | 9.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24311 | -| time_elapsed | 132257 | -| total_timesteps | 3111808 | -| train/ | | -| approx_kl | 0.009946949 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0708 | -| learning_rate | 0.0003 | -| loss | -0.0034 | -| n_updates | 243100 | -| policy_gradient_loss | 0.00749 | -| std | 0.00603 | -| value_loss | 6.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.994 | -| time/ | | -| fps | 23 | -| iterations | 24312 | -| time_elapsed | 132263 | -| total_timesteps | 3111936 | -| train/ | | -| approx_kl | 0.108313486 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 243110 | -| policy_gradient_loss | 0.0249 | -| std | 0.00603 | -| value_loss | 4.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24313 | -| time_elapsed | 132269 | -| total_timesteps | 3112064 | -| train/ | | -| approx_kl | 0.053418804 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.0389 | -| n_updates | 243120 | -| policy_gradient_loss | 0.0204 | -| std | 0.00603 | -| value_loss | 2.66e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24314 | -| time_elapsed | 132282 | -| total_timesteps | 3112192 | -| train/ | | -| approx_kl | 0.11468777 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.937 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 243130 | -| policy_gradient_loss | 0.0227 | -| std | 0.00604 | -| value_loss | 0.000895 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24315 | -| time_elapsed | 132289 | -| total_timesteps | 3112320 | -| train/ | | -| approx_kl | 0.28490314 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00324 | -| learning_rate | 0.0003 | -| loss | 0.0867 | -| n_updates | 243140 | -| policy_gradient_loss | 0.017 | -| std | 0.00604 | -| value_loss | 2.14e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24316 | -| time_elapsed | 132294 | -| total_timesteps | 3112448 | -| train/ | | -| approx_kl | 0.017695729 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00355 | -| learning_rate | 0.0003 | -| loss | -0.00692 | -| n_updates | 243150 | -| policy_gradient_loss | 0.0326 | -| std | 0.00604 | -| value_loss | 6.59e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24317 | -| time_elapsed | 132299 | -| total_timesteps | 3112576 | -| train/ | | -| approx_kl | 0.14512083 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.0734 | -| n_updates | 243160 | -| policy_gradient_loss | 0.0371 | -| std | 0.00604 | -| value_loss | 3.36e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24318 | -| time_elapsed | 132303 | -| total_timesteps | 3112704 | -| train/ | | -| approx_kl | 1.6302336e-05 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.071 | -| learning_rate | 0.0003 | -| loss | -7.6e-05 | -| n_updates | 243170 | -| policy_gradient_loss | 0.028 | -| std | 0.00604 | -| value_loss | 1.99e-07 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24319 | -| time_elapsed | 132308 | -| total_timesteps | 3112832 | -| train/ | | -| approx_kl | 0.677143 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0788 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 243180 | -| policy_gradient_loss | 0.076 | -| std | 0.00604 | -| value_loss | 2.69e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24320 | -| time_elapsed | 132314 | -| total_timesteps | 3112960 | -| train/ | | -| approx_kl | 0.045712728 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 243190 | -| policy_gradient_loss | 0.019 | -| std | 0.00603 | -| value_loss | 1.39e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24321 | -| time_elapsed | 132318 | -| total_timesteps | 3113088 | -| train/ | | -| approx_kl | 0.010429403 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.52 | -| learning_rate | 0.0003 | -| loss | -0.00706 | -| n_updates | 243200 | -| policy_gradient_loss | 0.00788 | -| std | 0.00602 | -| value_loss | 2.94e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24322 | -| time_elapsed | 132328 | -| total_timesteps | 3113216 | -| train/ | | -| approx_kl | 0.07432834 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 243210 | -| policy_gradient_loss | 0.00524 | -| std | 0.00602 | -| value_loss | 0.0035 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24323 | -| time_elapsed | 132334 | -| total_timesteps | 3113344 | -| train/ | | -| approx_kl | 0.03454698 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.92 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 243220 | -| policy_gradient_loss | 0.0244 | -| std | 0.00601 | -| value_loss | 1.06e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24324 | -| time_elapsed | 132339 | -| total_timesteps | 3113472 | -| train/ | | -| approx_kl | 0.35830182 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 243230 | -| policy_gradient_loss | 0.182 | -| std | 0.00602 | -| value_loss | 8.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24325 | -| time_elapsed | 132343 | -| total_timesteps | 3113600 | -| train/ | | -| approx_kl | 0.23267943 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 243240 | -| policy_gradient_loss | 0.137 | -| std | 0.00602 | -| value_loss | 7.57e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24326 | -| time_elapsed | 132348 | -| total_timesteps | 3113728 | -| train/ | | -| approx_kl | 0.03847788 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | 0.00337 | -| n_updates | 243250 | -| policy_gradient_loss | 0.0265 | -| std | 0.00602 | -| value_loss | 6.06e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24327 | -| time_elapsed | 132353 | -| total_timesteps | 3113856 | -| train/ | | -| approx_kl | 0.1698426 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.063 | -| n_updates | 243260 | -| policy_gradient_loss | 0.0201 | -| std | 0.00602 | -| value_loss | 4.15e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24328 | -| time_elapsed | 132358 | -| total_timesteps | 3113984 | -| train/ | | -| approx_kl | 0.021739649 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 243270 | -| policy_gradient_loss | -0.00676 | -| std | 0.00602 | -| value_loss | 3.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24329 | -| time_elapsed | 132363 | -| total_timesteps | 3114112 | -| train/ | | -| approx_kl | 0.01571393 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.00497 | -| n_updates | 243280 | -| policy_gradient_loss | 0.00236 | -| std | 0.00602 | -| value_loss | 2.1e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24330 | -| time_elapsed | 132374 | -| total_timesteps | 3114240 | -| train/ | | -| approx_kl | 0.014322622 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 243290 | -| policy_gradient_loss | -0.00482 | -| std | 0.00602 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24331 | -| time_elapsed | 132378 | -| total_timesteps | 3114368 | -| train/ | | -| approx_kl | 0.017904576 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 243300 | -| policy_gradient_loss | 0.0272 | -| std | 0.00602 | -| value_loss | 1.2e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24332 | -| time_elapsed | 132384 | -| total_timesteps | 3114496 | -| train/ | | -| approx_kl | 0.025327615 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00743 | -| learning_rate | 0.0003 | -| loss | -0.00856 | -| n_updates | 243310 | -| policy_gradient_loss | 0.0255 | -| std | 0.00602 | -| value_loss | 2.88e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24333 | -| time_elapsed | 132389 | -| total_timesteps | 3114624 | -| train/ | | -| approx_kl | 0.305013 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 243320 | -| policy_gradient_loss | 0.144 | -| std | 0.00602 | -| value_loss | 1.54e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24334 | -| time_elapsed | 132394 | -| total_timesteps | 3114752 | -| train/ | | -| approx_kl | 0.22933891 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 243330 | -| policy_gradient_loss | 0.135 | -| std | 0.00602 | -| value_loss | 9.12e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24335 | -| time_elapsed | 132398 | -| total_timesteps | 3114880 | -| train/ | | -| approx_kl | 0.2535446 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 243340 | -| policy_gradient_loss | 0.211 | -| std | 0.00602 | -| value_loss | 6.59e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24336 | -| time_elapsed | 132404 | -| total_timesteps | 3115008 | -| train/ | | -| approx_kl | 0.045526903 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 243350 | -| policy_gradient_loss | 0.0397 | -| std | 0.00602 | -| value_loss | 6.34e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24337 | -| time_elapsed | 132418 | -| total_timesteps | 3115136 | -| train/ | | -| approx_kl | 0.02070588 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | -0.0176 | -| n_updates | 243360 | -| policy_gradient_loss | -0.0126 | -| std | 0.00602 | -| value_loss | 0.000312 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24338 | -| time_elapsed | 132426 | -| total_timesteps | 3115264 | -| train/ | | -| approx_kl | 0.12887342 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 243370 | -| policy_gradient_loss | 0.0459 | -| std | 0.00602 | -| value_loss | 4.48e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24339 | -| time_elapsed | 132431 | -| total_timesteps | 3115392 | -| train/ | | -| approx_kl | 0.31047934 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -2.52 | -| learning_rate | 0.0003 | -| loss | 0.0868 | -| n_updates | 243380 | -| policy_gradient_loss | 0.0394 | -| std | 0.00602 | -| value_loss | 3.63e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24340 | -| time_elapsed | 132437 | -| total_timesteps | 3115520 | -| train/ | | -| approx_kl | 0.0025773249 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | -0.000867 | -| n_updates | 243390 | -| policy_gradient_loss | 0.0119 | -| std | 0.00603 | -| value_loss | 2.21e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24341 | -| time_elapsed | 132443 | -| total_timesteps | 3115648 | -| train/ | | -| approx_kl | 0.07883362 | -| clip_fraction | 0.582 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 243400 | -| policy_gradient_loss | 0.064 | -| std | 0.00603 | -| value_loss | 4.44e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24342 | -| time_elapsed | 132448 | -| total_timesteps | 3115776 | -| train/ | | -| approx_kl | 3.1059608e-07 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00843 | -| learning_rate | 0.0003 | -| loss | -0.000101 | -| n_updates | 243410 | -| policy_gradient_loss | 0.105 | -| std | 0.00603 | -| value_loss | 1.71e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24343 | -| time_elapsed | 132454 | -| total_timesteps | 3115904 | -| train/ | | -| approx_kl | 0.17105003 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 243420 | -| policy_gradient_loss | 0.173 | -| std | 0.00603 | -| value_loss | 9.51e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24344 | -| time_elapsed | 132459 | -| total_timesteps | 3116032 | -| train/ | | -| approx_kl | 0.012519467 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 243430 | -| policy_gradient_loss | 0.0347 | -| std | 0.00603 | -| value_loss | 5.33e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24345 | -| time_elapsed | 132468 | -| total_timesteps | 3116160 | -| train/ | | -| approx_kl | 0.11545989 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 243440 | -| policy_gradient_loss | -0.00826 | -| std | 0.00603 | -| value_loss | 0.0002 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24346 | -| time_elapsed | 132473 | -| total_timesteps | 3116288 | -| train/ | | -| approx_kl | 0.49431473 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0839 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 243450 | -| policy_gradient_loss | 0.0382 | -| std | 0.00603 | -| value_loss | 3.75e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24347 | -| time_elapsed | 132478 | -| total_timesteps | 3116416 | -| train/ | | -| approx_kl | 0.010549008 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | 0.00152 | -| n_updates | 243460 | -| policy_gradient_loss | 0.0138 | -| std | 0.00603 | -| value_loss | 2.46e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24348 | -| time_elapsed | 132481 | -| total_timesteps | 3116544 | -| train/ | | -| approx_kl | 0.08413786 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.0353 | -| n_updates | 243470 | -| policy_gradient_loss | 0.0133 | -| std | 0.00604 | -| value_loss | 1.34e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24349 | -| time_elapsed | 132487 | -| total_timesteps | 3116672 | -| train/ | | -| approx_kl | 0.05388469 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 243480 | -| policy_gradient_loss | 0.0178 | -| std | 0.00604 | -| value_loss | 8.22e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24350 | -| time_elapsed | 132492 | -| total_timesteps | 3116800 | -| train/ | | -| approx_kl | 0.058537476 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 243490 | -| policy_gradient_loss | 0.00927 | -| std | 0.00604 | -| value_loss | 5.92e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24351 | -| time_elapsed | 132497 | -| total_timesteps | 3116928 | -| train/ | | -| approx_kl | 0.009388271 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.000392 | -| n_updates | 243500 | -| policy_gradient_loss | 0.00493 | -| std | 0.00604 | -| value_loss | 4.16e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24352 | -| time_elapsed | 132503 | -| total_timesteps | 3117056 | -| train/ | | -| approx_kl | 0.015683787 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.0107 | -| n_updates | 243510 | -| policy_gradient_loss | 0.0129 | -| std | 0.00601 | -| value_loss | 4.25e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24353 | -| time_elapsed | 132510 | -| total_timesteps | 3117184 | -| train/ | | -| approx_kl | 0.023584934 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.808 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 243520 | -| policy_gradient_loss | -0.0163 | -| std | 0.00599 | -| value_loss | 0.00515 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24354 | -| time_elapsed | 132515 | -| total_timesteps | 3117312 | -| train/ | | -| approx_kl | 0.004890163 | -| clip_fraction | 0.176 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.391 | -| learning_rate | 0.0003 | -| loss | 0.00181 | -| n_updates | 243530 | -| policy_gradient_loss | 0.00902 | -| std | 0.00597 | -| value_loss | 2.16e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24355 | -| time_elapsed | 132518 | -| total_timesteps | 3117440 | -| train/ | | -| approx_kl | 0.06349803 | -| clip_fraction | 0.594 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0898 | -| learning_rate | 0.0003 | -| loss | -0.0278 | -| n_updates | 243540 | -| policy_gradient_loss | 0.0564 | -| std | 0.00597 | -| value_loss | 1.45e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24356 | -| time_elapsed | 132523 | -| total_timesteps | 3117568 | -| train/ | | -| approx_kl | 8.176174e-05 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0197 | -| learning_rate | 0.0003 | -| loss | 0.000729 | -| n_updates | 243550 | -| policy_gradient_loss | 0.0983 | -| std | 0.00597 | -| value_loss | 8.93e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24357 | -| time_elapsed | 132528 | -| total_timesteps | 3117696 | -| train/ | | -| approx_kl | 2.0354924 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.67 | -| n_updates | 243560 | -| policy_gradient_loss | 0.284 | -| std | 0.00597 | -| value_loss | 4.81e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24358 | -| time_elapsed | 132532 | -| total_timesteps | 3117824 | -| train/ | | -| approx_kl | 0.16753086 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0938 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 243570 | -| policy_gradient_loss | 0.0673 | -| std | 0.00597 | -| value_loss | 3.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24359 | -| time_elapsed | 132536 | -| total_timesteps | 3117952 | -| train/ | | -| approx_kl | 0.13431492 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.0872 | -| n_updates | 243580 | -| policy_gradient_loss | 0.0576 | -| std | 0.00597 | -| value_loss | 5.01e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24360 | -| time_elapsed | 132541 | -| total_timesteps | 3118080 | -| train/ | | -| approx_kl | 0.04198576 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 243590 | -| policy_gradient_loss | 0.091 | -| std | 0.00597 | -| value_loss | 1.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24361 | -| time_elapsed | 132553 | -| total_timesteps | 3118208 | -| train/ | | -| approx_kl | 0.040494718 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.00093 | -| n_updates | 243600 | -| policy_gradient_loss | -0.000836 | -| std | 0.00597 | -| value_loss | 0.00379 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24362 | -| time_elapsed | 132557 | -| total_timesteps | 3118336 | -| train/ | | -| approx_kl | 0.28302953 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 243610 | -| policy_gradient_loss | 0.172 | -| std | 0.00597 | -| value_loss | 4.73e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24363 | -| time_elapsed | 132562 | -| total_timesteps | 3118464 | -| train/ | | -| approx_kl | 0.056841195 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00258 | -| learning_rate | 0.0003 | -| loss | -0.00354 | -| n_updates | 243620 | -| policy_gradient_loss | 0.0256 | -| std | 0.00597 | -| value_loss | 1.17e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24364 | -| time_elapsed | 132566 | -| total_timesteps | 3118592 | -| train/ | | -| approx_kl | 0.0014637765 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00348 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 243630 | -| policy_gradient_loss | 0.0359 | -| std | 0.00597 | -| value_loss | 3.87e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24365 | -| time_elapsed | 132572 | -| total_timesteps | 3118720 | -| train/ | | -| approx_kl | 0.46781558 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 243640 | -| policy_gradient_loss | 0.048 | -| std | 0.00597 | -| value_loss | 2.59e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24366 | -| time_elapsed | 132578 | -| total_timesteps | 3118848 | -| train/ | | -| approx_kl | 0.011149399 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0636 | -| learning_rate | 0.0003 | -| loss | 0.000613 | -| n_updates | 243650 | -| policy_gradient_loss | 0.0134 | -| std | 0.00597 | -| value_loss | 1.92e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 24367 | -| time_elapsed | 132583 | -| total_timesteps | 3118976 | -| train/ | | -| approx_kl | 0.09645768 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.0431 | -| n_updates | 243660 | -| policy_gradient_loss | 0.0174 | -| std | 0.00597 | -| value_loss | 1.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24368 | -| time_elapsed | 132586 | -| total_timesteps | 3119104 | -| train/ | | -| approx_kl | 0.056943603 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | -0.00036 | -| n_updates | 243670 | -| policy_gradient_loss | 0.00242 | -| std | 0.00597 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24369 | -| time_elapsed | 132598 | -| total_timesteps | 3119232 | -| train/ | | -| approx_kl | 0.001350041 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 243680 | -| policy_gradient_loss | -0.00626 | -| std | 0.00597 | -| value_loss | 0.00173 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24370 | -| time_elapsed | 132603 | -| total_timesteps | 3119360 | -| train/ | | -| approx_kl | 0.0035508056 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00731 | -| learning_rate | 0.0003 | -| loss | -0.00878 | -| n_updates | 243690 | -| policy_gradient_loss | 0.0145 | -| std | 0.00597 | -| value_loss | 8.64e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24371 | -| time_elapsed | 132607 | -| total_timesteps | 3119488 | -| train/ | | -| approx_kl | 0.051731467 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.043 | -| n_updates | 243700 | -| policy_gradient_loss | 0.173 | -| std | 0.00597 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24372 | -| time_elapsed | 132612 | -| total_timesteps | 3119616 | -| train/ | | -| approx_kl | 0.014415652 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 243710 | -| policy_gradient_loss | 0.0312 | -| std | 0.00597 | -| value_loss | 1.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24373 | -| time_elapsed | 132618 | -| total_timesteps | 3119744 | -| train/ | | -| approx_kl | 0.26542178 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 243720 | -| policy_gradient_loss | 0.0289 | -| std | 0.00597 | -| value_loss | 9.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24374 | -| time_elapsed | 132622 | -| total_timesteps | 3119872 | -| train/ | | -| approx_kl | 0.02372443 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.00459 | -| n_updates | 243730 | -| policy_gradient_loss | 0.0281 | -| std | 0.00597 | -| value_loss | 6.76e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24375 | -| time_elapsed | 132628 | -| total_timesteps | 3120000 | -| train/ | | -| approx_kl | 0.2948438 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 243740 | -| policy_gradient_loss | 0.105 | -| std | 0.00597 | -| value_loss | 3.81e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24376 | -| time_elapsed | 132633 | -| total_timesteps | 3120128 | -| train/ | | -| approx_kl | 0.05918451 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00703 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 243750 | -| policy_gradient_loss | 0.0283 | -| std | 0.00598 | -| value_loss | 2.41e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24377 | -| time_elapsed | 132647 | -| total_timesteps | 3120256 | -| train/ | | -| approx_kl | 0.30460608 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.099 | -| n_updates | 243760 | -| policy_gradient_loss | 0.0208 | -| std | 0.00598 | -| value_loss | 6.64e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24378 | -| time_elapsed | 132653 | -| total_timesteps | 3120384 | -| train/ | | -| approx_kl | 0.032107998 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 243770 | -| policy_gradient_loss | 0.0039 | -| std | 0.00597 | -| value_loss | 8.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24379 | -| time_elapsed | 132658 | -| total_timesteps | 3120512 | -| train/ | | -| approx_kl | 0.024165612 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.00589 | -| n_updates | 243780 | -| policy_gradient_loss | 0.033 | -| std | 0.00597 | -| value_loss | 1.91e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24380 | -| time_elapsed | 132663 | -| total_timesteps | 3120640 | -| train/ | | -| approx_kl | 0.1417006 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0874 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 243790 | -| policy_gradient_loss | 0.0364 | -| std | 0.00598 | -| value_loss | 1.28e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24381 | -| time_elapsed | 132668 | -| total_timesteps | 3120768 | -| train/ | | -| approx_kl | 0.00019494817 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0833 | -| learning_rate | 0.0003 | -| loss | -0.000575 | -| n_updates | 243800 | -| policy_gradient_loss | 0.0378 | -| std | 0.00598 | -| value_loss | 8.55e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24382 | -| time_elapsed | 132673 | -| total_timesteps | 3120896 | -| train/ | | -| approx_kl | 0.19371636 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.0682 | -| n_updates | 243810 | -| policy_gradient_loss | 0.0218 | -| std | 0.00597 | -| value_loss | 7.57e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24383 | -| time_elapsed | 132678 | -| total_timesteps | 3121024 | -| train/ | | -| approx_kl | 0.0313858 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 243820 | -| policy_gradient_loss | 0.0369 | -| std | 0.00597 | -| value_loss | 3.89e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24384 | -| time_elapsed | 132691 | -| total_timesteps | 3121152 | -| train/ | | -| approx_kl | 0.02880017 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.93 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 243830 | -| policy_gradient_loss | -0.00163 | -| std | 0.00597 | -| value_loss | 0.00139 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24385 | -| time_elapsed | 132696 | -| total_timesteps | 3121280 | -| train/ | | -| approx_kl | 0.18560609 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.489 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 243840 | -| policy_gradient_loss | 0.135 | -| std | 0.00597 | -| value_loss | 4.5e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24386 | -| time_elapsed | 132701 | -| total_timesteps | 3121408 | -| train/ | | -| approx_kl | 0.20955116 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 243850 | -| policy_gradient_loss | 0.193 | -| std | 0.00597 | -| value_loss | 8.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24387 | -| time_elapsed | 132706 | -| total_timesteps | 3121536 | -| train/ | | -| approx_kl | 0.031171417 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 243860 | -| policy_gradient_loss | 0.0266 | -| std | 0.00597 | -| value_loss | 6.38e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24388 | -| time_elapsed | 132712 | -| total_timesteps | 3121664 | -| train/ | | -| approx_kl | 0.1992295 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 243870 | -| policy_gradient_loss | 0.0299 | -| std | 0.00597 | -| value_loss | 3.59e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24389 | -| time_elapsed | 132717 | -| total_timesteps | 3121792 | -| train/ | | -| approx_kl | 0.02604003 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.00474 | -| n_updates | 243880 | -| policy_gradient_loss | 0.0345 | -| std | 0.00597 | -| value_loss | 1.81e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24390 | -| time_elapsed | 132721 | -| total_timesteps | 3121920 | -| train/ | | -| approx_kl | 0.3983702 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 243890 | -| policy_gradient_loss | 0.149 | -| std | 0.00598 | -| value_loss | 1.29e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24391 | -| time_elapsed | 132726 | -| total_timesteps | 3122048 | -| train/ | | -| approx_kl | 0.27266368 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 243900 | -| policy_gradient_loss | 0.138 | -| std | 0.00598 | -| value_loss | 6.91e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24392 | -| time_elapsed | 132734 | -| total_timesteps | 3122176 | -| train/ | | -| approx_kl | 0.015484736 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 243910 | -| policy_gradient_loss | 0.00758 | -| std | 0.00598 | -| value_loss | 0.00402 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24393 | -| time_elapsed | 132739 | -| total_timesteps | 3122304 | -| train/ | | -| approx_kl | 0.27325332 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.778 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 243920 | -| policy_gradient_loss | 0.081 | -| std | 0.00598 | -| value_loss | 9.57e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24394 | -| time_elapsed | 132744 | -| total_timesteps | 3122432 | -| train/ | | -| approx_kl | 0.3278351 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.681 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 243930 | -| policy_gradient_loss | 0.0348 | -| std | 0.00598 | -| value_loss | 1.53e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24395 | -| time_elapsed | 132749 | -| total_timesteps | 3122560 | -| train/ | | -| approx_kl | 0.6946628 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | 0.0979 | -| n_updates | 243940 | -| policy_gradient_loss | 0.045 | -| std | 0.00598 | -| value_loss | 2.81e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24396 | -| time_elapsed | 132753 | -| total_timesteps | 3122688 | -| train/ | | -| approx_kl | 0.047350135 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 243950 | -| policy_gradient_loss | 0.0121 | -| std | 0.00598 | -| value_loss | 1.8e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24397 | -| time_elapsed | 132759 | -| total_timesteps | 3122816 | -| train/ | | -| approx_kl | 0.06745401 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.00374 | -| n_updates | 243960 | -| policy_gradient_loss | 0.00123 | -| std | 0.00598 | -| value_loss | 1.32e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 24398 | -| time_elapsed | 132763 | -| total_timesteps | 3122944 | -| train/ | | -| approx_kl | 0.014159573 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.045 | -| learning_rate | 0.0003 | -| loss | -0.00938 | -| n_updates | 243970 | -| policy_gradient_loss | 0.00737 | -| std | 0.00598 | -| value_loss | 9.65e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24399 | -| time_elapsed | 132768 | -| total_timesteps | 3123072 | -| train/ | | -| approx_kl | 0.09835646 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.0676 | -| n_updates | 243980 | -| policy_gradient_loss | 0.0283 | -| std | 0.00598 | -| value_loss | 5.79e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24400 | -| time_elapsed | 132779 | -| total_timesteps | 3123200 | -| train/ | | -| approx_kl | 0.034540534 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.389 | -| learning_rate | 0.0003 | -| loss | -0.0314 | -| n_updates | 243990 | -| policy_gradient_loss | -0.0199 | -| std | 0.00598 | -| value_loss | 0.002 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24401 | -| time_elapsed | 132784 | -| total_timesteps | 3123328 | -| train/ | | -| approx_kl | 0.10595657 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.286 | -| learning_rate | 0.0003 | -| loss | 0.0891 | -| n_updates | 244000 | -| policy_gradient_loss | 0.16 | -| std | 0.00598 | -| value_loss | 7.09e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24402 | -| time_elapsed | 132789 | -| total_timesteps | 3123456 | -| train/ | | -| approx_kl | 0.12578294 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00428 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 244010 | -| policy_gradient_loss | 0.145 | -| std | 0.00598 | -| value_loss | 1.65e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24403 | -| time_elapsed | 132794 | -| total_timesteps | 3123584 | -| train/ | | -| approx_kl | 0.17054512 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00956 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 244020 | -| policy_gradient_loss | 0.159 | -| std | 0.00598 | -| value_loss | 6.81e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24404 | -| time_elapsed | 132798 | -| total_timesteps | 3123712 | -| train/ | | -| approx_kl | 0.14585282 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0794 | -| n_updates | 244030 | -| policy_gradient_loss | 0.132 | -| std | 0.00598 | -| value_loss | 5.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24405 | -| time_elapsed | 132803 | -| total_timesteps | 3123840 | -| train/ | | -| approx_kl | 0.16045126 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.0938 | -| n_updates | 244040 | -| policy_gradient_loss | 0.11 | -| std | 0.00598 | -| value_loss | 1.51e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24406 | -| time_elapsed | 132808 | -| total_timesteps | 3123968 | -| train/ | | -| approx_kl | 0.03196689 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0773 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 244050 | -| policy_gradient_loss | 0.0316 | -| std | 0.00598 | -| value_loss | 9.85e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24407 | -| time_elapsed | 132813 | -| total_timesteps | 3124096 | -| train/ | | -| approx_kl | 0.70076877 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 244060 | -| policy_gradient_loss | 0.0825 | -| std | 0.00598 | -| value_loss | 8.25e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24408 | -| time_elapsed | 132828 | -| total_timesteps | 3124224 | -| train/ | | -| approx_kl | 0.021968033 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.699 | -| learning_rate | 0.0003 | -| loss | 0.00212 | -| n_updates | 244070 | -| policy_gradient_loss | 0.00917 | -| std | 0.00598 | -| value_loss | 0.00976 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24409 | -| time_elapsed | 132834 | -| total_timesteps | 3124352 | -| train/ | | -| approx_kl | 0.0067078397 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.398 | -| learning_rate | 0.0003 | -| loss | -0.00944 | -| n_updates | 244080 | -| policy_gradient_loss | 0.0076 | -| std | 0.00598 | -| value_loss | 0.000152 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24410 | -| time_elapsed | 132839 | -| total_timesteps | 3124480 | -| train/ | | -| approx_kl | 0.0013420172 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00516 | -| learning_rate | 0.0003 | -| loss | 0.00673 | -| n_updates | 244090 | -| policy_gradient_loss | 0.00364 | -| std | 0.00598 | -| value_loss | 8.13e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24411 | -| time_elapsed | 132845 | -| total_timesteps | 3124608 | -| train/ | | -| approx_kl | 0.062275596 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0827 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 244100 | -| policy_gradient_loss | 0.017 | -| std | 0.00598 | -| value_loss | 6.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24412 | -| time_elapsed | 132850 | -| total_timesteps | 3124736 | -| train/ | | -| approx_kl | 0.013203366 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 244110 | -| policy_gradient_loss | 0.0128 | -| std | 0.00599 | -| value_loss | 3.86e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24413 | -| time_elapsed | 132855 | -| total_timesteps | 3124864 | -| train/ | | -| approx_kl | 0.09721727 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0761 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 244120 | -| policy_gradient_loss | 0.00708 | -| std | 0.00599 | -| value_loss | 2.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24414 | -| time_elapsed | 132860 | -| total_timesteps | 3124992 | -| train/ | | -| approx_kl | 0.014956076 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 244130 | -| policy_gradient_loss | 0.011 | -| std | 0.00599 | -| value_loss | 1.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24415 | -| time_elapsed | 132865 | -| total_timesteps | 3125120 | -| train/ | | -| approx_kl | 0.000771421 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.00443 | -| n_updates | 244140 | -| policy_gradient_loss | 0.00433 | -| std | 0.00599 | -| value_loss | 1.43e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24416 | -| time_elapsed | 132877 | -| total_timesteps | 3125248 | -| train/ | | -| approx_kl | 0.037243325 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | -0.0275 | -| n_updates | 244150 | -| policy_gradient_loss | 0.00572 | -| std | 0.00599 | -| value_loss | 0.000388 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24417 | -| time_elapsed | 132881 | -| total_timesteps | 3125376 | -| train/ | | -| approx_kl | 0.23891447 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 244160 | -| policy_gradient_loss | 0.0627 | -| std | 0.00599 | -| value_loss | 4.34e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24418 | -| time_elapsed | 132886 | -| total_timesteps | 3125504 | -| train/ | | -| approx_kl | 0.0026906612 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.099 | -| learning_rate | 0.0003 | -| loss | 0.0067 | -| n_updates | 244170 | -| policy_gradient_loss | 0.0126 | -| std | 0.00598 | -| value_loss | 4.42e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24419 | -| time_elapsed | 132889 | -| total_timesteps | 3125632 | -| train/ | | -| approx_kl | 0.0012529553 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.00382 | -| n_updates | 244180 | -| policy_gradient_loss | 0.0184 | -| std | 0.00598 | -| value_loss | 1.38e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24420 | -| time_elapsed | 132895 | -| total_timesteps | 3125760 | -| train/ | | -| approx_kl | 0.006670596 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.00316 | -| n_updates | 244190 | -| policy_gradient_loss | 0.0124 | -| std | 0.00596 | -| value_loss | 4.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24421 | -| time_elapsed | 132900 | -| total_timesteps | 3125888 | -| train/ | | -| approx_kl | 0.0059404834 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00159 | -| learning_rate | 0.0003 | -| loss | -0.00102 | -| n_updates | 244200 | -| policy_gradient_loss | 0.0112 | -| std | 0.00594 | -| value_loss | 2.36e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24422 | -| time_elapsed | 132904 | -| total_timesteps | 3126016 | -| train/ | | -| approx_kl | 0.08849162 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 244210 | -| policy_gradient_loss | 0.0109 | -| std | 0.00594 | -| value_loss | 2.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24423 | -| time_elapsed | 132915 | -| total_timesteps | 3126144 | -| train/ | | -| approx_kl | 0.020149797 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.917 | -| learning_rate | 0.0003 | -| loss | 0.025 | -| n_updates | 244220 | -| policy_gradient_loss | -0.000523 | -| std | 0.00594 | -| value_loss | 0.000729 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24424 | -| time_elapsed | 132920 | -| total_timesteps | 3126272 | -| train/ | | -| approx_kl | 0.2854992 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | 0.0519 | -| n_updates | 244230 | -| policy_gradient_loss | 0.0395 | -| std | 0.00594 | -| value_loss | 0.000635 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24425 | -| time_elapsed | 132925 | -| total_timesteps | 3126400 | -| train/ | | -| approx_kl | 0.008492331 | -| clip_fraction | 0.582 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 244240 | -| policy_gradient_loss | 0.104 | -| std | 0.00594 | -| value_loss | 5.5e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24426 | -| time_elapsed | 132932 | -| total_timesteps | 3126528 | -| train/ | | -| approx_kl | 0.010353885 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 244250 | -| policy_gradient_loss | 0.027 | -| std | 0.00594 | -| value_loss | 4.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24427 | -| time_elapsed | 132936 | -| total_timesteps | 3126656 | -| train/ | | -| approx_kl | 0.23582248 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0817 | -| learning_rate | 0.0003 | -| loss | 0.0783 | -| n_updates | 244260 | -| policy_gradient_loss | 0.0163 | -| std | 0.00594 | -| value_loss | 2.65e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24428 | -| time_elapsed | 132941 | -| total_timesteps | 3126784 | -| train/ | | -| approx_kl | 0.0037656599 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0846 | -| learning_rate | 0.0003 | -| loss | 0.00913 | -| n_updates | 244270 | -| policy_gradient_loss | 0.0228 | -| std | 0.00594 | -| value_loss | 1.74e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24429 | -| time_elapsed | 132945 | -| total_timesteps | 3126912 | -| train/ | | -| approx_kl | 0.0014882032 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | -0.00773 | -| n_updates | 244280 | -| policy_gradient_loss | 0.0106 | -| std | 0.00594 | -| value_loss | 1.16e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24430 | -| time_elapsed | 132950 | -| total_timesteps | 3127040 | -| train/ | | -| approx_kl | 0.01679292 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 244290 | -| policy_gradient_loss | 0.0333 | -| std | 0.00594 | -| value_loss | 7.31e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24431 | -| time_elapsed | 132960 | -| total_timesteps | 3127168 | -| train/ | | -| approx_kl | 0.007789216 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.00888 | -| n_updates | 244300 | -| policy_gradient_loss | 0.031 | -| std | 0.00594 | -| value_loss | 0.00235 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24432 | -| time_elapsed | 132965 | -| total_timesteps | 3127296 | -| train/ | | -| approx_kl | 0.010629265 | -| clip_fraction | 0.589 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.0202 | -| n_updates | 244310 | -| policy_gradient_loss | 0.119 | -| std | 0.00594 | -| value_loss | 1.11e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24433 | -| time_elapsed | 132969 | -| total_timesteps | 3127424 | -| train/ | | -| approx_kl | 0.097389646 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0947 | -| n_updates | 244320 | -| policy_gradient_loss | 0.134 | -| std | 0.00594 | -| value_loss | 2.68e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24434 | -| time_elapsed | 132974 | -| total_timesteps | 3127552 | -| train/ | | -| approx_kl | 0.017535783 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.021 | -| learning_rate | 0.0003 | -| loss | -0.00638 | -| n_updates | 244330 | -| policy_gradient_loss | 0.0277 | -| std | 0.00594 | -| value_loss | 1.73e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24435 | -| time_elapsed | 132979 | -| total_timesteps | 3127680 | -| train/ | | -| approx_kl | 0.23723693 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0903 | -| n_updates | 244340 | -| policy_gradient_loss | 0.0248 | -| std | 0.00594 | -| value_loss | 1.11e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24436 | -| time_elapsed | 132984 | -| total_timesteps | 3127808 | -| train/ | | -| approx_kl | 0.027072087 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.00985 | -| n_updates | 244350 | -| policy_gradient_loss | 0.0391 | -| std | 0.00594 | -| value_loss | 7.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24437 | -| time_elapsed | 132988 | -| total_timesteps | 3127936 | -| train/ | | -| approx_kl | 0.16509885 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0442 | -| n_updates | 244360 | -| policy_gradient_loss | 0.027 | -| std | 0.00594 | -| value_loss | 6.05e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24438 | -| time_elapsed | 132994 | -| total_timesteps | 3128064 | -| train/ | | -| approx_kl | 0.17920296 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.0777 | -| n_updates | 244370 | -| policy_gradient_loss | 0.028 | -| std | 0.00594 | -| value_loss | 4.07e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24439 | -| time_elapsed | 133002 | -| total_timesteps | 3128192 | -| train/ | | -| approx_kl | 0.0052879513 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.922 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 244380 | -| policy_gradient_loss | -0.0136 | -| std | 0.00594 | -| value_loss | 0.0015 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24440 | -| time_elapsed | 133006 | -| total_timesteps | 3128320 | -| train/ | | -| approx_kl | 0.29061142 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 244390 | -| policy_gradient_loss | 0.137 | -| std | 0.00594 | -| value_loss | 1.83e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24441 | -| time_elapsed | 133012 | -| total_timesteps | 3128448 | -| train/ | | -| approx_kl | 0.0025050594 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00943 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 244400 | -| policy_gradient_loss | 0.095 | -| std | 0.00594 | -| value_loss | 9.23e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24442 | -| time_elapsed | 133017 | -| total_timesteps | 3128576 | -| train/ | | -| approx_kl | 0.04065419 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 244410 | -| policy_gradient_loss | 0.0598 | -| std | 0.00594 | -| value_loss | 6.5e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24443 | -| time_elapsed | 133022 | -| total_timesteps | 3128704 | -| train/ | | -| approx_kl | 0.40167466 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0458 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 244420 | -| policy_gradient_loss | 0.164 | -| std | 0.00594 | -| value_loss | 4.83e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24444 | -| time_elapsed | 133027 | -| total_timesteps | 3128832 | -| train/ | | -| approx_kl | 0.2992205 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.191 | -| n_updates | 244430 | -| policy_gradient_loss | 0.171 | -| std | 0.00594 | -| value_loss | 3.14e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.996 | -| time/ | | -| fps | 23 | -| iterations | 24445 | -| time_elapsed | 133032 | -| total_timesteps | 3128960 | -| train/ | | -| approx_kl | 0.057447243 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 244440 | -| policy_gradient_loss | 0.0356 | -| std | 0.00594 | -| value_loss | 2.49e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24446 | -| time_elapsed | 133036 | -| total_timesteps | 3129088 | -| train/ | | -| approx_kl | 0.0014918866 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.00035 | -| n_updates | 244450 | -| policy_gradient_loss | 0.0413 | -| std | 0.00593 | -| value_loss | 1.16e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24447 | -| time_elapsed | 133048 | -| total_timesteps | 3129216 | -| train/ | | -| approx_kl | 0.14041078 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 244460 | -| policy_gradient_loss | -0.00425 | -| std | 0.00593 | -| value_loss | 0.00068 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24448 | -| time_elapsed | 133053 | -| total_timesteps | 3129344 | -| train/ | | -| approx_kl | 0.008870577 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 244470 | -| policy_gradient_loss | 0.0248 | -| std | 0.00593 | -| value_loss | 8.6e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24449 | -| time_elapsed | 133057 | -| total_timesteps | 3129472 | -| train/ | | -| approx_kl | 0.02022068 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00142 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 244480 | -| policy_gradient_loss | 0.044 | -| std | 0.00592 | -| value_loss | 3.13e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24450 | -| time_elapsed | 133061 | -| total_timesteps | 3129600 | -| train/ | | -| approx_kl | 0.40857264 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -87.5 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 244490 | -| policy_gradient_loss | 0.0924 | -| std | 0.00592 | -| value_loss | 6.93e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24451 | -| time_elapsed | 133066 | -| total_timesteps | 3129728 | -| train/ | | -| approx_kl | 0.054756112 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.968 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 244500 | -| policy_gradient_loss | 0.0222 | -| std | 0.00592 | -| value_loss | 5.89e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24452 | -| time_elapsed | 133071 | -| total_timesteps | 3129856 | -| train/ | | -| approx_kl | 0.0030304594 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 244510 | -| policy_gradient_loss | 0.0114 | -| std | 0.00593 | -| value_loss | 1.76e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.999 | -| time/ | | -| fps | 23 | -| iterations | 24453 | -| time_elapsed | 133077 | -| total_timesteps | 3129984 | -| train/ | | -| approx_kl | 0.27658308 | -| clip_fraction | 0.746 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.203 | -| n_updates | 244520 | -| policy_gradient_loss | 0.133 | -| std | 0.00593 | -| value_loss | 8.42e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24454 | -| time_elapsed | 133082 | -| total_timesteps | 3130112 | -| train/ | | -| approx_kl | 0.20082062 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0986 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 244530 | -| policy_gradient_loss | 0.118 | -| std | 0.00593 | -| value_loss | 4.8e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24455 | -| time_elapsed | 133093 | -| total_timesteps | 3130240 | -| train/ | | -| approx_kl | 0.038107414 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -2.18 | -| learning_rate | 0.0003 | -| loss | -0.0284 | -| n_updates | 244540 | -| policy_gradient_loss | -0.0168 | -| std | 0.00593 | -| value_loss | 0.00452 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24456 | -| time_elapsed | 133098 | -| total_timesteps | 3130368 | -| train/ | | -| approx_kl | 0.006723018 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.332 | -| learning_rate | 0.0003 | -| loss | -0.00392 | -| n_updates | 244550 | -| policy_gradient_loss | 0.0143 | -| std | 0.00593 | -| value_loss | 1.67e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24457 | -| time_elapsed | 133104 | -| total_timesteps | 3130496 | -| train/ | | -| approx_kl | 0.12292337 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.0717 | -| n_updates | 244560 | -| policy_gradient_loss | 0.027 | -| std | 0.00593 | -| value_loss | 9.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24458 | -| time_elapsed | 133109 | -| total_timesteps | 3130624 | -| train/ | | -| approx_kl | 0.053628232 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0581 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 244570 | -| policy_gradient_loss | 0.0105 | -| std | 0.00593 | -| value_loss | 7.52e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24459 | -| time_elapsed | 133114 | -| total_timesteps | 3130752 | -| train/ | | -| approx_kl | 0.079420716 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 244580 | -| policy_gradient_loss | 0.0129 | -| std | 0.00593 | -| value_loss | 5.05e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24460 | -| time_elapsed | 133120 | -| total_timesteps | 3130880 | -| train/ | | -| approx_kl | 0.014929274 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 244590 | -| policy_gradient_loss | 0.00727 | -| std | 0.00593 | -| value_loss | 3.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24461 | -| time_elapsed | 133125 | -| total_timesteps | 3131008 | -| train/ | | -| approx_kl | 0.042121463 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.0538 | -| n_updates | 244600 | -| policy_gradient_loss | 0.116 | -| std | 0.00593 | -| value_loss | 2.46e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24462 | -| time_elapsed | 133137 | -| total_timesteps | 3131136 | -| train/ | | -| approx_kl | 0.07827562 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.00694 | -| n_updates | 244610 | -| policy_gradient_loss | 0.00798 | -| std | 0.00594 | -| value_loss | 0.000199 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24463 | -| time_elapsed | 133141 | -| total_timesteps | 3131264 | -| train/ | | -| approx_kl | 0.001907303 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0231 | -| learning_rate | 0.0003 | -| loss | 0.00559 | -| n_updates | 244620 | -| policy_gradient_loss | 0.132 | -| std | 0.00594 | -| value_loss | 0.0218 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24464 | -| time_elapsed | 133147 | -| total_timesteps | 3131392 | -| train/ | | -| approx_kl | 2.1138883 | -| clip_fraction | 0.742 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | 0.357 | -| n_updates | 244630 | -| policy_gradient_loss | 0.22 | -| std | 0.00594 | -| value_loss | 0.000374 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24465 | -| time_elapsed | 133153 | -| total_timesteps | 3131520 | -| train/ | | -| approx_kl | 0.04062621 | -| clip_fraction | 0.617 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00741 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 244640 | -| policy_gradient_loss | 0.075 | -| std | 0.00594 | -| value_loss | 3.34e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24466 | -| time_elapsed | 133159 | -| total_timesteps | 3131648 | -| train/ | | -| approx_kl | 0.11402429 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | 0.0794 | -| n_updates | 244650 | -| policy_gradient_loss | 0.0404 | -| std | 0.00595 | -| value_loss | 8.08e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24467 | -| time_elapsed | 133165 | -| total_timesteps | 3131776 | -| train/ | | -| approx_kl | 0.11665035 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 244660 | -| policy_gradient_loss | 0.0194 | -| std | 0.00595 | -| value_loss | 4.95e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.991 | -| time/ | | -| fps | 23 | -| iterations | 24468 | -| time_elapsed | 133170 | -| total_timesteps | 3131904 | -| train/ | | -| approx_kl | 0.3175217 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0971 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 244670 | -| policy_gradient_loss | 0.0197 | -| std | 0.00594 | -| value_loss | 2.84e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24469 | -| time_elapsed | 133176 | -| total_timesteps | 3132032 | -| train/ | | -| approx_kl | 0.06431776 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 244680 | -| policy_gradient_loss | 0.0353 | -| std | 0.00593 | -| value_loss | 2.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24470 | -| time_elapsed | 133187 | -| total_timesteps | 3132160 | -| train/ | | -| approx_kl | 0.071009584 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.555 | -| learning_rate | 0.0003 | -| loss | -0.0285 | -| n_updates | 244690 | -| policy_gradient_loss | -0.0179 | -| std | 0.00593 | -| value_loss | 0.00166 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24471 | -| time_elapsed | 133192 | -| total_timesteps | 3132288 | -| train/ | | -| approx_kl | 0.00039148005 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0599 | -| learning_rate | 0.0003 | -| loss | 0.00291 | -| n_updates | 244700 | -| policy_gradient_loss | 0.00711 | -| std | 0.00592 | -| value_loss | 1.23e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24472 | -| time_elapsed | 133196 | -| total_timesteps | 3132416 | -| train/ | | -| approx_kl | 0.07436239 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0995 | -| learning_rate | 0.0003 | -| loss | 0.0408 | -| n_updates | 244710 | -| policy_gradient_loss | 0.0185 | -| std | 0.00592 | -| value_loss | 7.01e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24473 | -| time_elapsed | 133200 | -| total_timesteps | 3132544 | -| train/ | | -| approx_kl | 0.048246175 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00267 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 244720 | -| policy_gradient_loss | 0.017 | -| std | 0.00591 | -| value_loss | 7.2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24474 | -| time_elapsed | 133204 | -| total_timesteps | 3132672 | -| train/ | | -| approx_kl | 0.07064338 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 244730 | -| policy_gradient_loss | 0.0112 | -| std | 0.0059 | -| value_loss | 5.82e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24475 | -| time_elapsed | 133207 | -| total_timesteps | 3132800 | -| train/ | | -| approx_kl | 0.015660338 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.523 | -| learning_rate | 0.0003 | -| loss | 0.00121 | -| n_updates | 244740 | -| policy_gradient_loss | 0.0147 | -| std | 0.0059 | -| value_loss | 2.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 24476 | -| time_elapsed | 133211 | -| total_timesteps | 3132928 | -| train/ | | -| approx_kl | 0.08689247 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00233 | -| learning_rate | 0.0003 | -| loss | 0.0499 | -| n_updates | 244750 | -| policy_gradient_loss | 0.0202 | -| std | 0.0059 | -| value_loss | 6.42e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24477 | -| time_elapsed | 133215 | -| total_timesteps | 3133056 | -| train/ | | -| approx_kl | 0.059021514 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0839 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 244760 | -| policy_gradient_loss | 0.0116 | -| std | 0.00589 | -| value_loss | 6.95e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24478 | -| time_elapsed | 133223 | -| total_timesteps | 3133184 | -| train/ | | -| approx_kl | 0.05525582 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.965 | -| learning_rate | 0.0003 | -| loss | -0.0042 | -| n_updates | 244770 | -| policy_gradient_loss | -0.00708 | -| std | 0.00589 | -| value_loss | 0.000284 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24479 | -| time_elapsed | 133228 | -| total_timesteps | 3133312 | -| train/ | | -| approx_kl | 0.5184345 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.87 | -| learning_rate | 0.0003 | -| loss | 0.0421 | -| n_updates | 244780 | -| policy_gradient_loss | -0.000741 | -| std | 0.00589 | -| value_loss | 1.91e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24480 | -| time_elapsed | 133234 | -| total_timesteps | 3133440 | -| train/ | | -| approx_kl | 0.084088326 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0149 | -| learning_rate | 0.0003 | -| loss | 0.0578 | -| n_updates | 244790 | -| policy_gradient_loss | 0.0126 | -| std | 0.00589 | -| value_loss | 7.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24481 | -| time_elapsed | 133239 | -| total_timesteps | 3133568 | -| train/ | | -| approx_kl | 0.27479288 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.46 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 244800 | -| policy_gradient_loss | 0.0104 | -| std | 0.00589 | -| value_loss | 6.03e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24482 | -| time_elapsed | 133244 | -| total_timesteps | 3133696 | -| train/ | | -| approx_kl | 0.02293669 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | -0.0125 | -| n_updates | 244810 | -| policy_gradient_loss | 0.0319 | -| std | 0.00589 | -| value_loss | 3.39e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24483 | -| time_elapsed | 133250 | -| total_timesteps | 3133824 | -| train/ | | -| approx_kl | 0.33765054 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.195 | -| n_updates | 244820 | -| policy_gradient_loss | 0.181 | -| std | 0.00589 | -| value_loss | 2.71e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.992 | -| time/ | | -| fps | 23 | -| iterations | 24484 | -| time_elapsed | 133256 | -| total_timesteps | 3133952 | -| train/ | | -| approx_kl | 0.0522533 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.00179 | -| n_updates | 244830 | -| policy_gradient_loss | 0.0251 | -| std | 0.00589 | -| value_loss | 2.22e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24485 | -| time_elapsed | 133262 | -| total_timesteps | 3134080 | -| train/ | | -| approx_kl | 0.7335068 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.281 | -| n_updates | 244840 | -| policy_gradient_loss | 0.0769 | -| std | 0.00589 | -| value_loss | 9.92e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24486 | -| time_elapsed | 133271 | -| total_timesteps | 3134208 | -| train/ | | -| approx_kl | 0.013619635 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 244850 | -| policy_gradient_loss | -0.0106 | -| std | 0.00589 | -| value_loss | 0.00273 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24487 | -| time_elapsed | 133278 | -| total_timesteps | 3134336 | -| train/ | | -| approx_kl | 0.10616316 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.544 | -| learning_rate | 0.0003 | -| loss | 0.0495 | -| n_updates | 244860 | -| policy_gradient_loss | 0.0246 | -| std | 0.00588 | -| value_loss | 3.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24488 | -| time_elapsed | 133282 | -| total_timesteps | 3134464 | -| train/ | | -| approx_kl | 0.050799888 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 244870 | -| policy_gradient_loss | 0.0465 | -| std | 0.00588 | -| value_loss | 4.5e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24489 | -| time_elapsed | 133287 | -| total_timesteps | 3134592 | -| train/ | | -| approx_kl | 0.158818 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -3.79 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 244880 | -| policy_gradient_loss | 0.0225 | -| std | 0.00588 | -| value_loss | 1.88e-07 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24490 | -| time_elapsed | 133292 | -| total_timesteps | 3134720 | -| train/ | | -| approx_kl | 0.17789587 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0176 | -| learning_rate | 0.0003 | -| loss | 0.0825 | -| n_updates | 244890 | -| policy_gradient_loss | 0.0277 | -| std | 0.00588 | -| value_loss | 1.88e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24491 | -| time_elapsed | 133297 | -| total_timesteps | 3134848 | -| train/ | | -| approx_kl | 0.020210575 | -| clip_fraction | 0.165 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | -0.00309 | -| n_updates | 244900 | -| policy_gradient_loss | -0.00121 | -| std | 0.00588 | -| value_loss | 1.27e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 24492 | -| time_elapsed | 133302 | -| total_timesteps | 3134976 | -| train/ | | -| approx_kl | 0.04047289 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.00404 | -| n_updates | 244910 | -| policy_gradient_loss | 0.0363 | -| std | 0.00588 | -| value_loss | 9.58e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24493 | -| time_elapsed | 133306 | -| total_timesteps | 3135104 | -| train/ | | -| approx_kl | 0.16206555 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.068 | -| n_updates | 244920 | -| policy_gradient_loss | 0.0358 | -| std | 0.00588 | -| value_loss | 6.88e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24494 | -| time_elapsed | 133319 | -| total_timesteps | 3135232 | -| train/ | | -| approx_kl | 0.6092752 | -| clip_fraction | 0.546 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | 0.0916 | -| n_updates | 244930 | -| policy_gradient_loss | 0.0381 | -| std | 0.00588 | -| value_loss | 0.00169 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24495 | -| time_elapsed | 133323 | -| total_timesteps | 3135360 | -| train/ | | -| approx_kl | 0.007062323 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | -0.00151 | -| n_updates | 244940 | -| policy_gradient_loss | 0.0138 | -| std | 0.00588 | -| value_loss | 1.04e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24496 | -| time_elapsed | 133329 | -| total_timesteps | 3135488 | -| train/ | | -| approx_kl | 0.11015795 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00786 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 244950 | -| policy_gradient_loss | 0.00856 | -| std | 0.00588 | -| value_loss | 1.43e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24497 | -| time_elapsed | 133334 | -| total_timesteps | 3135616 | -| train/ | | -| approx_kl | 0.05258009 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 244960 | -| policy_gradient_loss | 0.0141 | -| std | 0.00588 | -| value_loss | 8.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24498 | -| time_elapsed | 133339 | -| total_timesteps | 3135744 | -| train/ | | -| approx_kl | 0.075210646 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0381 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 244970 | -| policy_gradient_loss | 0.00716 | -| std | 0.00588 | -| value_loss | 5.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 24499 | -| time_elapsed | 133344 | -| total_timesteps | 3135872 | -| train/ | | -| approx_kl | 0.057349384 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | -0.00831 | -| n_updates | 244980 | -| policy_gradient_loss | -0.00337 | -| std | 0.00589 | -| value_loss | 4.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24500 | -| time_elapsed | 133349 | -| total_timesteps | 3136000 | -| train/ | | -| approx_kl | 0.08419046 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 244990 | -| policy_gradient_loss | 0.0119 | -| std | 0.00589 | -| value_loss | 3.57e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24501 | -| time_elapsed | 133354 | -| total_timesteps | 3136128 | -| train/ | | -| approx_kl | 0.013026409 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00405 | -| learning_rate | 0.0003 | -| loss | 0.00225 | -| n_updates | 245000 | -| policy_gradient_loss | 0.0125 | -| std | 0.00589 | -| value_loss | 1.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24502 | -| time_elapsed | 133364 | -| total_timesteps | 3136256 | -| train/ | | -| approx_kl | 0.022506407 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 245010 | -| policy_gradient_loss | -0.0107 | -| std | 0.00589 | -| value_loss | 0.000161 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24503 | -| time_elapsed | 133369 | -| total_timesteps | 3136384 | -| train/ | | -| approx_kl | 0.7588003 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.283 | -| n_updates | 245020 | -| policy_gradient_loss | 0.0821 | -| std | 0.00589 | -| value_loss | 5.47e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24504 | -| time_elapsed | 133375 | -| total_timesteps | 3136512 | -| train/ | | -| approx_kl | 0.010103772 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 245030 | -| policy_gradient_loss | 0.0128 | -| std | 0.00589 | -| value_loss | 7.26e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24505 | -| time_elapsed | 133380 | -| total_timesteps | 3136640 | -| train/ | | -| approx_kl | 0.0018925355 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.284 | -| learning_rate | 0.0003 | -| loss | -0.00266 | -| n_updates | 245040 | -| policy_gradient_loss | 0.0118 | -| std | 0.00589 | -| value_loss | 8.76e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24506 | -| time_elapsed | 133386 | -| total_timesteps | 3136768 | -| train/ | | -| approx_kl | 3.2216776e-05 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 245050 | -| policy_gradient_loss | 0.0657 | -| std | 0.00589 | -| value_loss | 7.62e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 24507 | -| time_elapsed | 133391 | -| total_timesteps | 3136896 | -| train/ | | -| approx_kl | 0.32735047 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 245060 | -| policy_gradient_loss | 0.09 | -| std | 0.00589 | -| value_loss | 3.95e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24508 | -| time_elapsed | 133396 | -| total_timesteps | 3137024 | -| train/ | | -| approx_kl | 0.38263154 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0525 | -| learning_rate | 0.0003 | -| loss | 0.192 | -| n_updates | 245070 | -| policy_gradient_loss | 0.0486 | -| std | 0.00588 | -| value_loss | 2.8e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24509 | -| time_elapsed | 133410 | -| total_timesteps | 3137152 | -| train/ | | -| approx_kl | 0.10765384 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.396 | -| learning_rate | 0.0003 | -| loss | -0.0265 | -| n_updates | 245080 | -| policy_gradient_loss | -0.00694 | -| std | 0.00588 | -| value_loss | 0.00177 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24510 | -| time_elapsed | 133414 | -| total_timesteps | 3137280 | -| train/ | | -| approx_kl | 0.27353877 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.483 | -| learning_rate | 0.0003 | -| loss | 0.069 | -| n_updates | 245090 | -| policy_gradient_loss | 0.0339 | -| std | 0.00588 | -| value_loss | 5.61e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24511 | -| time_elapsed | 133419 | -| total_timesteps | 3137408 | -| train/ | | -| approx_kl | 2.5679357e-05 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00173 | -| learning_rate | 0.0003 | -| loss | -0.000247 | -| n_updates | 245100 | -| policy_gradient_loss | 0.0329 | -| std | 0.00589 | -| value_loss | 1.2e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24512 | -| time_elapsed | 133425 | -| total_timesteps | 3137536 | -| train/ | | -| approx_kl | 0.7284194 | -| clip_fraction | 0.572 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.241 | -| n_updates | 245110 | -| policy_gradient_loss | 0.08 | -| std | 0.00589 | -| value_loss | 7.63e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24513 | -| time_elapsed | 133431 | -| total_timesteps | 3137664 | -| train/ | | -| approx_kl | 0.018197743 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.00656 | -| n_updates | 245120 | -| policy_gradient_loss | 0.0119 | -| std | 0.00589 | -| value_loss | 5.69e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24514 | -| time_elapsed | 133437 | -| total_timesteps | 3137792 | -| train/ | | -| approx_kl | 0.12083338 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0846 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 245130 | -| policy_gradient_loss | 0.00943 | -| std | 0.00589 | -| value_loss | 3.43e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 24515 | -| time_elapsed | 133442 | -| total_timesteps | 3137920 | -| train/ | | -| approx_kl | 0.0658843 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 245140 | -| policy_gradient_loss | 0.00881 | -| std | 0.00589 | -| value_loss | 2.71e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24516 | -| time_elapsed | 133447 | -| total_timesteps | 3138048 | -| train/ | | -| approx_kl | 0.08798407 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.000687 | -| n_updates | 245150 | -| policy_gradient_loss | 0.000678 | -| std | 0.00589 | -| value_loss | 2.04e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24517 | -| time_elapsed | 133455 | -| total_timesteps | 3138176 | -| train/ | | -| approx_kl | 0.2560466 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00492 | -| n_updates | 245160 | -| policy_gradient_loss | -0.0163 | -| std | 0.00589 | -| value_loss | 0.00223 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24518 | -| time_elapsed | 133460 | -| total_timesteps | 3138304 | -| train/ | | -| approx_kl | 0.37813875 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.227 | -| learning_rate | 0.0003 | -| loss | 0.0996 | -| n_updates | 245170 | -| policy_gradient_loss | 0.049 | -| std | 0.00589 | -| value_loss | 7.23e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24519 | -| time_elapsed | 133464 | -| total_timesteps | 3138432 | -| train/ | | -| approx_kl | 0.0012235311 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0604 | -| learning_rate | 0.0003 | -| loss | -0.0025 | -| n_updates | 245180 | -| policy_gradient_loss | 0.0149 | -| std | 0.00589 | -| value_loss | 1.77e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24520 | -| time_elapsed | 133469 | -| total_timesteps | 3138560 | -| train/ | | -| approx_kl | 0.12713815 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 245190 | -| policy_gradient_loss | 0.0796 | -| std | 0.00589 | -| value_loss | 1.55e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24521 | -| time_elapsed | 133473 | -| total_timesteps | 3138688 | -| train/ | | -| approx_kl | 0.19371372 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 245200 | -| policy_gradient_loss | 0.0479 | -| std | 0.0059 | -| value_loss | 1.17e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24522 | -| time_elapsed | 133477 | -| total_timesteps | 3138816 | -| train/ | | -| approx_kl | 0.179141 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 245210 | -| policy_gradient_loss | 0.0181 | -| std | 0.0059 | -| value_loss | 4.08e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24523 | -| time_elapsed | 133481 | -| total_timesteps | 3138944 | -| train/ | | -| approx_kl | 0.25828952 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.0903 | -| n_updates | 245220 | -| policy_gradient_loss | 0.0146 | -| std | 0.0059 | -| value_loss | 3.12e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24524 | -| time_elapsed | 133485 | -| total_timesteps | 3139072 | -| train/ | | -| approx_kl | 0.055367637 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | 0.0954 | -| n_updates | 245230 | -| policy_gradient_loss | 0.0473 | -| std | 0.0059 | -| value_loss | 4.15e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24525 | -| time_elapsed | 133492 | -| total_timesteps | 3139200 | -| train/ | | -| approx_kl | 0.0072857183 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | -0.0303 | -| n_updates | 245240 | -| policy_gradient_loss | 0.0165 | -| std | 0.00589 | -| value_loss | 0.00379 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24526 | -| time_elapsed | 133497 | -| total_timesteps | 3139328 | -| train/ | | -| approx_kl | 0.02946229 | -| clip_fraction | 0.599 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 245250 | -| policy_gradient_loss | 0.0831 | -| std | 0.0059 | -| value_loss | 4.42e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24527 | -| time_elapsed | 133500 | -| total_timesteps | 3139456 | -| train/ | | -| approx_kl | 0.0017935238 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00609 | -| learning_rate | 0.0003 | -| loss | 0.00157 | -| n_updates | 245260 | -| policy_gradient_loss | 0.15 | -| std | 0.00589 | -| value_loss | 3.51e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24528 | -| time_elapsed | 133507 | -| total_timesteps | 3139584 | -| train/ | | -| approx_kl | 0.024616376 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0343 | -| learning_rate | 0.0003 | -| loss | 0.0339 | -| n_updates | 245270 | -| policy_gradient_loss | 0.0514 | -| std | 0.00589 | -| value_loss | 1.94e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24529 | -| time_elapsed | 133512 | -| total_timesteps | 3139712 | -| train/ | | -| approx_kl | 0.3604592 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 245280 | -| policy_gradient_loss | 0.153 | -| std | 0.00589 | -| value_loss | 1.36e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24530 | -| time_elapsed | 133515 | -| total_timesteps | 3139840 | -| train/ | | -| approx_kl | 0.2844429 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 245290 | -| policy_gradient_loss | 0.168 | -| std | 0.00589 | -| value_loss | 1.05e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24531 | -| time_elapsed | 133521 | -| total_timesteps | 3139968 | -| train/ | | -| approx_kl | 0.19556485 | -| clip_fraction | 0.733 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 245300 | -| policy_gradient_loss | 0.167 | -| std | 0.00589 | -| value_loss | 6.62e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24532 | -| time_elapsed | 133526 | -| total_timesteps | 3140096 | -| train/ | | -| approx_kl | 0.034501597 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | 0.0037 | -| n_updates | 245310 | -| policy_gradient_loss | 0.0248 | -| std | 0.00589 | -| value_loss | 5.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24533 | -| time_elapsed | 133535 | -| total_timesteps | 3140224 | -| train/ | | -| approx_kl | 0.02483397 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | -0.0268 | -| n_updates | 245320 | -| policy_gradient_loss | -0.0164 | -| std | 0.00589 | -| value_loss | 0.00304 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24534 | -| time_elapsed | 133540 | -| total_timesteps | 3140352 | -| train/ | | -| approx_kl | 0.006837196 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00142 | -| learning_rate | 0.0003 | -| loss | 0.0162 | -| n_updates | 245330 | -| policy_gradient_loss | 0.0078 | -| std | 0.00589 | -| value_loss | 7.22e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24535 | -| time_elapsed | 133545 | -| total_timesteps | 3140480 | -| train/ | | -| approx_kl | 0.081761554 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00658 | -| learning_rate | 0.0003 | -| loss | 0.053 | -| n_updates | 245340 | -| policy_gradient_loss | 0.0233 | -| std | 0.00589 | -| value_loss | 1.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24536 | -| time_elapsed | 133549 | -| total_timesteps | 3140608 | -| train/ | | -| approx_kl | 0.057413455 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0717 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 245350 | -| policy_gradient_loss | 0.0182 | -| std | 0.0059 | -| value_loss | 6.92e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24537 | -| time_elapsed | 133554 | -| total_timesteps | 3140736 | -| train/ | | -| approx_kl | 0.08692309 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | 0.0479 | -| n_updates | 245360 | -| policy_gradient_loss | 0.0216 | -| std | 0.0059 | -| value_loss | 4.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24538 | -| time_elapsed | 133558 | -| total_timesteps | 3140864 | -| train/ | | -| approx_kl | 0.012371764 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 245370 | -| policy_gradient_loss | 0.0079 | -| std | 0.0059 | -| value_loss | 2.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24539 | -| time_elapsed | 133563 | -| total_timesteps | 3140992 | -| train/ | | -| approx_kl | 0.017146774 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.00664 | -| n_updates | 245380 | -| policy_gradient_loss | 0.0276 | -| std | 0.00587 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24540 | -| time_elapsed | 133568 | -| total_timesteps | 3141120 | -| train/ | | -| approx_kl | 0.17631799 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 245390 | -| policy_gradient_loss | 0.134 | -| std | 0.00585 | -| value_loss | 1.88e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24541 | -| time_elapsed | 133581 | -| total_timesteps | 3141248 | -| train/ | | -| approx_kl | 0.22675818 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | 0.0598 | -| n_updates | 245400 | -| policy_gradient_loss | 0.0282 | -| std | 0.00584 | -| value_loss | 0.00129 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24542 | -| time_elapsed | 133585 | -| total_timesteps | 3141376 | -| train/ | | -| approx_kl | 0.033717457 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.052 | -| n_updates | 245410 | -| policy_gradient_loss | 0.0279 | -| std | 0.00584 | -| value_loss | 2.06e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24543 | -| time_elapsed | 133589 | -| total_timesteps | 3141504 | -| train/ | | -| approx_kl | 0.35022473 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0143 | -| learning_rate | 0.0003 | -| loss | 0.191 | -| n_updates | 245420 | -| policy_gradient_loss | 0.199 | -| std | 0.00584 | -| value_loss | 2.37e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24544 | -| time_elapsed | 133594 | -| total_timesteps | 3141632 | -| train/ | | -| approx_kl | 0.21494351 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 245430 | -| policy_gradient_loss | 0.149 | -| std | 0.00584 | -| value_loss | 1.82e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24545 | -| time_elapsed | 133599 | -| total_timesteps | 3141760 | -| train/ | | -| approx_kl | 0.1967961 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 245440 | -| policy_gradient_loss | 0.136 | -| std | 0.00584 | -| value_loss | 1.39e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 24546 | -| time_elapsed | 133604 | -| total_timesteps | 3141888 | -| train/ | | -| approx_kl | 0.19883701 | -| clip_fraction | 0.75 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 245450 | -| policy_gradient_loss | 0.189 | -| std | 0.00584 | -| value_loss | 1.16e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24547 | -| time_elapsed | 133610 | -| total_timesteps | 3142016 | -| train/ | | -| approx_kl | 0.03924179 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 245460 | -| policy_gradient_loss | 0.0359 | -| std | 0.00584 | -| value_loss | 9.06e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24548 | -| time_elapsed | 133621 | -| total_timesteps | 3142144 | -| train/ | | -| approx_kl | 0.101994015 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | -0.00738 | -| n_updates | 245470 | -| policy_gradient_loss | -0.0036 | -| std | 0.00584 | -| value_loss | 0.00064 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24549 | -| time_elapsed | 133626 | -| total_timesteps | 3142272 | -| train/ | | -| approx_kl | 0.01833613 | -| clip_fraction | 0.583 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.585 | -| learning_rate | 0.0003 | -| loss | -0.0306 | -| n_updates | 245480 | -| policy_gradient_loss | 0.0749 | -| std | 0.00584 | -| value_loss | 1.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24550 | -| time_elapsed | 133631 | -| total_timesteps | 3142400 | -| train/ | | -| approx_kl | 0.032908734 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0792 | -| learning_rate | 0.0003 | -| loss | 0.0857 | -| n_updates | 245490 | -| policy_gradient_loss | 0.0957 | -| std | 0.00584 | -| value_loss | 1.14e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24551 | -| time_elapsed | 133637 | -| total_timesteps | 3142528 | -| train/ | | -| approx_kl | 0.7640714 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0713 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 245500 | -| policy_gradient_loss | 0.0578 | -| std | 0.00585 | -| value_loss | 8.45e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24552 | -| time_elapsed | 133642 | -| total_timesteps | 3142656 | -| train/ | | -| approx_kl | 0.17085147 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0165 | -| learning_rate | 0.0003 | -| loss | 0.0952 | -| n_updates | 245510 | -| policy_gradient_loss | 0.0549 | -| std | 0.00585 | -| value_loss | 1.55e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24553 | -| time_elapsed | 133647 | -| total_timesteps | 3142784 | -| train/ | | -| approx_kl | 0.008487964 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.014 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 245520 | -| policy_gradient_loss | -0.00353 | -| std | 0.00585 | -| value_loss | 2.44e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24554 | -| time_elapsed | 133652 | -| total_timesteps | 3142912 | -| train/ | | -| approx_kl | 0.00024392316 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 245530 | -| policy_gradient_loss | 0.00715 | -| std | 0.00585 | -| value_loss | 1.31e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24555 | -| time_elapsed | 133656 | -| total_timesteps | 3143040 | -| train/ | | -| approx_kl | 0.091586836 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.067 | -| n_updates | 245540 | -| policy_gradient_loss | 0.145 | -| std | 0.00585 | -| value_loss | 1.06e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24556 | -| time_elapsed | 133668 | -| total_timesteps | 3143168 | -| train/ | | -| approx_kl | 0.47476086 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.643 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 245550 | -| policy_gradient_loss | 0.0652 | -| std | 0.00585 | -| value_loss | 0.011 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24557 | -| time_elapsed | 133672 | -| total_timesteps | 3143296 | -| train/ | | -| approx_kl | 0.20551914 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.711 | -| learning_rate | 0.0003 | -| loss | 0.0857 | -| n_updates | 245560 | -| policy_gradient_loss | 0.0245 | -| std | 0.00585 | -| value_loss | 0.000375 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24558 | -| time_elapsed | 133676 | -| total_timesteps | 3143424 | -| train/ | | -| approx_kl | 0.018908253 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 245570 | -| policy_gradient_loss | -0.00141 | -| std | 0.00585 | -| value_loss | 4.64e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24559 | -| time_elapsed | 133681 | -| total_timesteps | 3143552 | -| train/ | | -| approx_kl | 0.014875604 | -| clip_fraction | 0.118 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.00277 | -| n_updates | 245580 | -| policy_gradient_loss | 0.00107 | -| std | 0.00585 | -| value_loss | 2.14e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24560 | -| time_elapsed | 133686 | -| total_timesteps | 3143680 | -| train/ | | -| approx_kl | 0.017626954 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0521 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 245590 | -| policy_gradient_loss | -0.00134 | -| std | 0.00585 | -| value_loss | 1.54e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24561 | -| time_elapsed | 133690 | -| total_timesteps | 3143808 | -| train/ | | -| approx_kl | 0.035396565 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 245600 | -| policy_gradient_loss | 0.0522 | -| std | 0.00585 | -| value_loss | 9.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24562 | -| time_elapsed | 133695 | -| total_timesteps | 3143936 | -| train/ | | -| approx_kl | 0.39037865 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 245610 | -| policy_gradient_loss | 0.154 | -| std | 0.00585 | -| value_loss | 7.18e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24563 | -| time_elapsed | 133699 | -| total_timesteps | 3144064 | -| train/ | | -| approx_kl | 0.056542546 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 245620 | -| policy_gradient_loss | 0.0288 | -| std | 0.00585 | -| value_loss | 5.34e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24564 | -| time_elapsed | 133706 | -| total_timesteps | 3144192 | -| train/ | | -| approx_kl | 0.0221531 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.833 | -| learning_rate | 0.0003 | -| loss | 0.00927 | -| n_updates | 245630 | -| policy_gradient_loss | 0.00211 | -| std | 0.00585 | -| value_loss | 0.00353 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24565 | -| time_elapsed | 133711 | -| total_timesteps | 3144320 | -| train/ | | -| approx_kl | 0.11174354 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 245640 | -| policy_gradient_loss | 0.0354 | -| std | 0.00584 | -| value_loss | 2.16e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24566 | -| time_elapsed | 133717 | -| total_timesteps | 3144448 | -| train/ | | -| approx_kl | 1.6611535e-05 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.000766 | -| n_updates | 245650 | -| policy_gradient_loss | 0.0329 | -| std | 0.00584 | -| value_loss | 3.39e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24567 | -| time_elapsed | 133722 | -| total_timesteps | 3144576 | -| train/ | | -| approx_kl | 0.00044071767 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | 0.000735 | -| n_updates | 245660 | -| policy_gradient_loss | 0.0335 | -| std | 0.00584 | -| value_loss | 3.72e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24568 | -| time_elapsed | 133726 | -| total_timesteps | 3144704 | -| train/ | | -| approx_kl | 0.0012126644 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | -0.00206 | -| n_updates | 245670 | -| policy_gradient_loss | 0.0341 | -| std | 0.00584 | -| value_loss | 2.76e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24569 | -| time_elapsed | 133732 | -| total_timesteps | 3144832 | -| train/ | | -| approx_kl | 0.6154555 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 245680 | -| policy_gradient_loss | 0.0637 | -| std | 0.00584 | -| value_loss | 2.11e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 24570 | -| time_elapsed | 133737 | -| total_timesteps | 3144960 | -| train/ | | -| approx_kl | 0.0074770125 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 245690 | -| policy_gradient_loss | 0.00738 | -| std | 0.00584 | -| value_loss | 1.56e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24571 | -| time_elapsed | 133741 | -| total_timesteps | 3145088 | -| train/ | | -| approx_kl | 0.091270104 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 245700 | -| policy_gradient_loss | 0.000101 | -| std | 0.00584 | -| value_loss | 1.09e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24572 | -| time_elapsed | 133750 | -| total_timesteps | 3145216 | -| train/ | | -| approx_kl | 0.036252346 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.867 | -| learning_rate | 0.0003 | -| loss | -0.0273 | -| n_updates | 245710 | -| policy_gradient_loss | -0.00699 | -| std | 0.00584 | -| value_loss | 0.00272 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24573 | -| time_elapsed | 133756 | -| total_timesteps | 3145344 | -| train/ | | -| approx_kl | 1.5476253e-05 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.000809 | -| learning_rate | 0.0003 | -| loss | -0.000151 | -| n_updates | 245720 | -| policy_gradient_loss | 0.0375 | -| std | 0.00584 | -| value_loss | 1.11e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24574 | -| time_elapsed | 133761 | -| total_timesteps | 3145472 | -| train/ | | -| approx_kl | 0.5738148 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 245730 | -| policy_gradient_loss | 0.0664 | -| std | 0.00584 | -| value_loss | 1.81e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24575 | -| time_elapsed | 133765 | -| total_timesteps | 3145600 | -| train/ | | -| approx_kl | 0.009705019 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | -0.00698 | -| n_updates | 245740 | -| policy_gradient_loss | 0.00977 | -| std | 0.00584 | -| value_loss | 1.52e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24576 | -| time_elapsed | 133770 | -| total_timesteps | 3145728 | -| train/ | | -| approx_kl | 0.0015251599 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0362 | -| learning_rate | 0.0003 | -| loss | 0.00684 | -| n_updates | 245750 | -| policy_gradient_loss | 0.00913 | -| std | 0.00584 | -| value_loss | 1.18e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24577 | -| time_elapsed | 133775 | -| total_timesteps | 3145856 | -| train/ | | -| approx_kl | 0.07228754 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 245760 | -| policy_gradient_loss | 0.0123 | -| std | 0.00584 | -| value_loss | 7.03e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24578 | -| time_elapsed | 133780 | -| total_timesteps | 3145984 | -| train/ | | -| approx_kl | 0.010917418 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 245770 | -| policy_gradient_loss | 0.00479 | -| std | 0.00584 | -| value_loss | 5.52e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24579 | -| time_elapsed | 133784 | -| total_timesteps | 3146112 | -| train/ | | -| approx_kl | 0.0028810147 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | -0.00264 | -| n_updates | 245780 | -| policy_gradient_loss | 0.0097 | -| std | 0.00584 | -| value_loss | 3.19e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24580 | -| time_elapsed | 133796 | -| total_timesteps | 3146240 | -| train/ | | -| approx_kl | 0.24508768 | -| clip_fraction | 0.754 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.62 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 245790 | -| policy_gradient_loss | 0.0301 | -| std | 0.00584 | -| value_loss | 0.00329 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24581 | -| time_elapsed | 133800 | -| total_timesteps | 3146368 | -| train/ | | -| approx_kl | 0.019394577 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -7.53 | -| learning_rate | 0.0003 | -| loss | 0.00472 | -| n_updates | 245800 | -| policy_gradient_loss | 0.0186 | -| std | 0.00585 | -| value_loss | 6.51e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24582 | -| time_elapsed | 133805 | -| total_timesteps | 3146496 | -| train/ | | -| approx_kl | 0.05763352 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00108 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 245810 | -| policy_gradient_loss | 0.0453 | -| std | 0.00586 | -| value_loss | 1.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24583 | -| time_elapsed | 133811 | -| total_timesteps | 3146624 | -| train/ | | -| approx_kl | 0.50483894 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00662 | -| learning_rate | 0.0003 | -| loss | 0.252 | -| n_updates | 245820 | -| policy_gradient_loss | 0.152 | -| std | 0.00586 | -| value_loss | 1.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24584 | -| time_elapsed | 133816 | -| total_timesteps | 3146752 | -| train/ | | -| approx_kl | 0.22031985 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00838 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 245830 | -| policy_gradient_loss | 0.125 | -| std | 0.00586 | -| value_loss | 7.92e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24585 | -| time_elapsed | 133822 | -| total_timesteps | 3146880 | -| train/ | | -| approx_kl | 0.19972138 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 245840 | -| policy_gradient_loss | 0.139 | -| std | 0.00586 | -| value_loss | 5.72e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24586 | -| time_elapsed | 133827 | -| total_timesteps | 3147008 | -| train/ | | -| approx_kl | 0.044772856 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 245850 | -| policy_gradient_loss | 0.0396 | -| std | 0.00586 | -| value_loss | 3.98e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24587 | -| time_elapsed | 133840 | -| total_timesteps | 3147136 | -| train/ | | -| approx_kl | 0.014852487 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 245860 | -| policy_gradient_loss | -0.00442 | -| std | 0.00586 | -| value_loss | 0.000115 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24588 | -| time_elapsed | 133846 | -| total_timesteps | 3147264 | -| train/ | | -| approx_kl | 0.0032860278 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0907 | -| learning_rate | 0.0003 | -| loss | -0.00758 | -| n_updates | 245870 | -| policy_gradient_loss | 0.0223 | -| std | 0.00586 | -| value_loss | 0.00268 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24589 | -| time_elapsed | 133851 | -| total_timesteps | 3147392 | -| train/ | | -| approx_kl | 0.0004771063 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | -0.00155 | -| n_updates | 245880 | -| policy_gradient_loss | 0.0376 | -| std | 0.00586 | -| value_loss | 7.38e-05 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24590 | -| time_elapsed | 133855 | -| total_timesteps | 3147520 | -| train/ | | -| approx_kl | 0.922229 | -| clip_fraction | 0.578 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 245890 | -| policy_gradient_loss | 0.0682 | -| std | 0.00587 | -| value_loss | 4.64e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24591 | -| time_elapsed | 133861 | -| total_timesteps | 3147648 | -| train/ | | -| approx_kl | 0.017761104 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | -0.00749 | -| n_updates | 245900 | -| policy_gradient_loss | 0.0102 | -| std | 0.00587 | -| value_loss | 3.59e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24592 | -| time_elapsed | 133866 | -| total_timesteps | 3147776 | -| train/ | | -| approx_kl | 0.10818095 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.00864 | -| n_updates | 245910 | -| policy_gradient_loss | -0.00196 | -| std | 0.00587 | -| value_loss | 2.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 24593 | -| time_elapsed | 133870 | -| total_timesteps | 3147904 | -| train/ | | -| approx_kl | 0.053057186 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 245920 | -| policy_gradient_loss | 0.0139 | -| std | 0.00587 | -| value_loss | 1.75e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24594 | -| time_elapsed | 133875 | -| total_timesteps | 3148032 | -| train/ | | -| approx_kl | 0.0092387805 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | -0.00714 | -| n_updates | 245930 | -| policy_gradient_loss | 0.00914 | -| std | 0.00587 | -| value_loss | 1.14e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24595 | -| time_elapsed | 133884 | -| total_timesteps | 3148160 | -| train/ | | -| approx_kl | 0.018100087 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 245940 | -| policy_gradient_loss | -0.001 | -| std | 0.00587 | -| value_loss | 0.000417 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24596 | -| time_elapsed | 133888 | -| total_timesteps | 3148288 | -| train/ | | -| approx_kl | 0.05364758 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0193 | -| learning_rate | 0.0003 | -| loss | 0.0281 | -| n_updates | 245950 | -| policy_gradient_loss | 0.0161 | -| std | 0.00587 | -| value_loss | 3.28e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24597 | -| time_elapsed | 133892 | -| total_timesteps | 3148416 | -| train/ | | -| approx_kl | 0.008160607 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0082 | -| learning_rate | 0.0003 | -| loss | -0.0157 | -| n_updates | 245960 | -| policy_gradient_loss | 0.00665 | -| std | 0.00587 | -| value_loss | 8.99e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24598 | -| time_elapsed | 133896 | -| total_timesteps | 3148544 | -| train/ | | -| approx_kl | 0.0025878 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | -0.00843 | -| n_updates | 245970 | -| policy_gradient_loss | 0.0129 | -| std | 0.00587 | -| value_loss | 7.8e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24599 | -| time_elapsed | 133903 | -| total_timesteps | 3148672 | -| train/ | | -| approx_kl | 0.051013514 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | 0.0599 | -| n_updates | 245980 | -| policy_gradient_loss | 0.113 | -| std | 0.00586 | -| value_loss | 4.43e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24600 | -| time_elapsed | 133907 | -| total_timesteps | 3148800 | -| train/ | | -| approx_kl | 0.012448493 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 245990 | -| policy_gradient_loss | 0.0285 | -| std | 0.00586 | -| value_loss | 1.55e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24601 | -| time_elapsed | 133912 | -| total_timesteps | 3148928 | -| train/ | | -| approx_kl | 3.0407682e-07 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -7.67e-05 | -| n_updates | 246000 | -| policy_gradient_loss | 0.0284 | -| std | 0.00586 | -| value_loss | 1.78e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24602 | -| time_elapsed | 133916 | -| total_timesteps | 3149056 | -| train/ | | -| approx_kl | 1.0024998 | -| clip_fraction | 0.564 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.429 | -| n_updates | 246010 | -| policy_gradient_loss | 0.11 | -| std | 0.00586 | -| value_loss | 4.3e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24603 | -| time_elapsed | 133925 | -| total_timesteps | 3149184 | -| train/ | | -| approx_kl | 0.027007561 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.304 | -| learning_rate | 0.0003 | -| loss | -0.0298 | -| n_updates | 246020 | -| policy_gradient_loss | -0.00785 | -| std | 0.00586 | -| value_loss | 0.0017 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24604 | -| time_elapsed | 133931 | -| total_timesteps | 3149312 | -| train/ | | -| approx_kl | 0.27316093 | -| clip_fraction | 0.6 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.939 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 246030 | -| policy_gradient_loss | 0.0819 | -| std | 0.00586 | -| value_loss | 3.43e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24605 | -| time_elapsed | 133936 | -| total_timesteps | 3149440 | -| train/ | | -| approx_kl | 0.0070234383 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0692 | -| learning_rate | 0.0003 | -| loss | 0.00884 | -| n_updates | 246040 | -| policy_gradient_loss | 0.0135 | -| std | 0.00586 | -| value_loss | 4.57e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24606 | -| time_elapsed | 133942 | -| total_timesteps | 3149568 | -| train/ | | -| approx_kl | 0.0050927345 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00321 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 246050 | -| policy_gradient_loss | 0.00942 | -| std | 0.00586 | -| value_loss | 1.68e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24607 | -| time_elapsed | 133948 | -| total_timesteps | 3149696 | -| train/ | | -| approx_kl | 0.10195297 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0633 | -| n_updates | 246060 | -| policy_gradient_loss | 0.0249 | -| std | 0.00586 | -| value_loss | 1.22e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24608 | -| time_elapsed | 133953 | -| total_timesteps | 3149824 | -| train/ | | -| approx_kl | 0.046987332 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 246070 | -| policy_gradient_loss | 0.0109 | -| std | 0.00586 | -| value_loss | 7.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24609 | -| time_elapsed | 133957 | -| total_timesteps | 3149952 | -| train/ | | -| approx_kl | 0.007478209 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | -0.000857 | -| n_updates | 246080 | -| policy_gradient_loss | 0.00624 | -| std | 0.00586 | -| value_loss | 4.67e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24610 | -| time_elapsed | 133963 | -| total_timesteps | 3150080 | -| train/ | | -| approx_kl | 0.0016670693 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.068 | -| learning_rate | 0.0003 | -| loss | 0.00965 | -| n_updates | 246090 | -| policy_gradient_loss | 0.00659 | -| std | 0.00586 | -| value_loss | 3.73e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24611 | -| time_elapsed | 133973 | -| total_timesteps | 3150208 | -| train/ | | -| approx_kl | 0.028485235 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.0249 | -| n_updates | 246100 | -| policy_gradient_loss | -0.0132 | -| std | 0.00586 | -| value_loss | 0.00278 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24612 | -| time_elapsed | 133978 | -| total_timesteps | 3150336 | -| train/ | | -| approx_kl | 0.17706893 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.327 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 246110 | -| policy_gradient_loss | 0.126 | -| std | 0.00586 | -| value_loss | 3.39e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24613 | -| time_elapsed | 133982 | -| total_timesteps | 3150464 | -| train/ | | -| approx_kl | 0.036014184 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0238 | -| learning_rate | 0.0003 | -| loss | -0.0045 | -| n_updates | 246120 | -| policy_gradient_loss | 0.034 | -| std | 0.00586 | -| value_loss | 6.12e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24614 | -| time_elapsed | 133987 | -| total_timesteps | 3150592 | -| train/ | | -| approx_kl | 0.657041 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00332 | -| learning_rate | 0.0003 | -| loss | 0.202 | -| n_updates | 246130 | -| policy_gradient_loss | 0.0681 | -| std | 0.00586 | -| value_loss | 2.65e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24615 | -| time_elapsed | 133992 | -| total_timesteps | 3150720 | -| train/ | | -| approx_kl | 0.013871029 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0249 | -| learning_rate | 0.0003 | -| loss | 0.00251 | -| n_updates | 246140 | -| policy_gradient_loss | 0.0093 | -| std | 0.00586 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24616 | -| time_elapsed | 133997 | -| total_timesteps | 3150848 | -| train/ | | -| approx_kl | 0.0009128079 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.067 | -| learning_rate | 0.0003 | -| loss | 0.00882 | -| n_updates | 246150 | -| policy_gradient_loss | 0.0014 | -| std | 0.00586 | -| value_loss | 9.99e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 24617 | -| time_elapsed | 134002 | -| total_timesteps | 3150976 | -| train/ | | -| approx_kl | 0.0067400523 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -0.00753 | -| n_updates | 246160 | -| policy_gradient_loss | 0.00504 | -| std | 0.00586 | -| value_loss | 6.87e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24618 | -| time_elapsed | 134007 | -| total_timesteps | 3151104 | -| train/ | | -| approx_kl | 0.03985016 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.0486 | -| n_updates | 246170 | -| policy_gradient_loss | 0.103 | -| std | 0.00587 | -| value_loss | 8.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24619 | -| time_elapsed | 134019 | -| total_timesteps | 3151232 | -| train/ | | -| approx_kl | 0.59124964 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 246180 | -| policy_gradient_loss | 0.0478 | -| std | 0.00587 | -| value_loss | 0.000198 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24620 | -| time_elapsed | 134023 | -| total_timesteps | 3151360 | -| train/ | | -| approx_kl | 0.003909126 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0661 | -| learning_rate | 0.0003 | -| loss | -0.0134 | -| n_updates | 246190 | -| policy_gradient_loss | 0.0209 | -| std | 0.00587 | -| value_loss | 1.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24621 | -| time_elapsed | 134028 | -| total_timesteps | 3151488 | -| train/ | | -| approx_kl | 0.123660915 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | 0.0388 | -| n_updates | 246200 | -| policy_gradient_loss | 0.0389 | -| std | 0.00587 | -| value_loss | 1.31e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24622 | -| time_elapsed | 134033 | -| total_timesteps | 3151616 | -| train/ | | -| approx_kl | 0.35620925 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 246210 | -| policy_gradient_loss | 0.155 | -| std | 0.00587 | -| value_loss | 8.76e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24623 | -| time_elapsed | 134038 | -| total_timesteps | 3151744 | -| train/ | | -| approx_kl | 0.2374236 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 246220 | -| policy_gradient_loss | 0.157 | -| std | 0.00587 | -| value_loss | 6.15e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.97 | -| time/ | | -| fps | 23 | -| iterations | 24624 | -| time_elapsed | 134042 | -| total_timesteps | 3151872 | -| train/ | | -| approx_kl | 0.04022003 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0925 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 246230 | -| policy_gradient_loss | 0.0265 | -| std | 0.00587 | -| value_loss | 3.44e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24625 | -| time_elapsed | 134046 | -| total_timesteps | 3152000 | -| train/ | | -| approx_kl | 0.20525551 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0925 | -| learning_rate | 0.0003 | -| loss | 0.0816 | -| n_updates | 246240 | -| policy_gradient_loss | 0.0228 | -| std | 0.00587 | -| value_loss | 1.66e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24626 | -| time_elapsed | 134052 | -| total_timesteps | 3152128 | -| train/ | | -| approx_kl | 0.029898189 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00674 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 246250 | -| policy_gradient_loss | 0.0354 | -| std | 0.00587 | -| value_loss | 6.79e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24627 | -| time_elapsed | 134064 | -| total_timesteps | 3152256 | -| train/ | | -| approx_kl | 0.09014869 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 246260 | -| policy_gradient_loss | 0.00905 | -| std | 0.00587 | -| value_loss | 0.00116 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24628 | -| time_elapsed | 134069 | -| total_timesteps | 3152384 | -| train/ | | -| approx_kl | 0.060033835 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 246270 | -| policy_gradient_loss | 0.024 | -| std | 0.00587 | -| value_loss | 7.7e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24629 | -| time_elapsed | 134075 | -| total_timesteps | 3152512 | -| train/ | | -| approx_kl | 0.3265516 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0126 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 246280 | -| policy_gradient_loss | 0.128 | -| std | 0.00587 | -| value_loss | 6.86e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24630 | -| time_elapsed | 134082 | -| total_timesteps | 3152640 | -| train/ | | -| approx_kl | 0.07417927 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0564 | -| n_updates | 246290 | -| policy_gradient_loss | 0.0387 | -| std | 0.00587 | -| value_loss | 1.01e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24631 | -| time_elapsed | 134087 | -| total_timesteps | 3152768 | -| train/ | | -| approx_kl | 0.00052457536 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.000291 | -| n_updates | 246300 | -| policy_gradient_loss | 0.0365 | -| std | 0.00587 | -| value_loss | 4.5e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 24632 | -| time_elapsed | 134093 | -| total_timesteps | 3152896 | -| train/ | | -| approx_kl | 0.26619345 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 246310 | -| policy_gradient_loss | 0.0302 | -| std | 0.00587 | -| value_loss | 8.33e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24633 | -| time_elapsed | 134099 | -| total_timesteps | 3153024 | -| train/ | | -| approx_kl | 0.024846774 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 246320 | -| policy_gradient_loss | 0.0209 | -| std | 0.00587 | -| value_loss | 2.19e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24634 | -| time_elapsed | 134112 | -| total_timesteps | 3153152 | -| train/ | | -| approx_kl | 0.014113715 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.114 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 246330 | -| policy_gradient_loss | -0.000324 | -| std | 0.00587 | -| value_loss | 0.00199 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24635 | -| time_elapsed | 134117 | -| total_timesteps | 3153280 | -| train/ | | -| approx_kl | 0.03119051 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 246340 | -| policy_gradient_loss | 0.0159 | -| std | 0.00587 | -| value_loss | 1.19e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24636 | -| time_elapsed | 134122 | -| total_timesteps | 3153408 | -| train/ | | -| approx_kl | 0.014634221 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 246350 | -| policy_gradient_loss | -0.000265 | -| std | 0.00587 | -| value_loss | 8.03e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24637 | -| time_elapsed | 134128 | -| total_timesteps | 3153536 | -| train/ | | -| approx_kl | 0.16226195 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0632 | -| n_updates | 246360 | -| policy_gradient_loss | 0.0457 | -| std | 0.00587 | -| value_loss | 6.38e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24638 | -| time_elapsed | 134132 | -| total_timesteps | 3153664 | -| train/ | | -| approx_kl | 0.05572402 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.062 | -| learning_rate | 0.0003 | -| loss | -0.0196 | -| n_updates | 246370 | -| policy_gradient_loss | 0.0656 | -| std | 0.00587 | -| value_loss | 3.4e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24639 | -| time_elapsed | 134136 | -| total_timesteps | 3153792 | -| train/ | | -| approx_kl | 0.3540958 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 246380 | -| policy_gradient_loss | 0.0517 | -| std | 0.00587 | -| value_loss | 2.61e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 24640 | -| time_elapsed | 134142 | -| total_timesteps | 3153920 | -| train/ | | -| approx_kl | 0.09085178 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 246390 | -| policy_gradient_loss | 0.0755 | -| std | 0.00587 | -| value_loss | 1.5e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24641 | -| time_elapsed | 134147 | -| total_timesteps | 3154048 | -| train/ | | -| approx_kl | 0.34146628 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 246400 | -| policy_gradient_loss | 0.061 | -| std | 0.00587 | -| value_loss | 1.08e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24642 | -| time_elapsed | 134155 | -| total_timesteps | 3154176 | -| train/ | | -| approx_kl | 0.009512793 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.829 | -| learning_rate | 0.0003 | -| loss | -0.0244 | -| n_updates | 246410 | -| policy_gradient_loss | 0.0159 | -| std | 0.00587 | -| value_loss | 0.00276 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24643 | -| time_elapsed | 134158 | -| total_timesteps | 3154304 | -| train/ | | -| approx_kl | 0.028720234 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00781 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 246420 | -| policy_gradient_loss | 0.0395 | -| std | 0.00587 | -| value_loss | 0.000149 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24644 | -| time_elapsed | 134162 | -| total_timesteps | 3154432 | -| train/ | | -| approx_kl | 0.52376866 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.235 | -| n_updates | 246430 | -| policy_gradient_loss | 0.148 | -| std | 0.00587 | -| value_loss | 4.03e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24645 | -| time_elapsed | 134166 | -| total_timesteps | 3154560 | -| train/ | | -| approx_kl | 0.31238222 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00972 | -| learning_rate | 0.0003 | -| loss | 0.197 | -| n_updates | 246440 | -| policy_gradient_loss | 0.148 | -| std | 0.00587 | -| value_loss | 8.67e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24646 | -| time_elapsed | 134171 | -| total_timesteps | 3154688 | -| train/ | | -| approx_kl | 0.046110343 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.00369 | -| n_updates | 246450 | -| policy_gradient_loss | 0.0224 | -| std | 0.00587 | -| value_loss | 5.92e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24647 | -| time_elapsed | 134176 | -| total_timesteps | 3154816 | -| train/ | | -| approx_kl | 0.5884721 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0991 | -| n_updates | 246460 | -| policy_gradient_loss | 0.0475 | -| std | 0.00587 | -| value_loss | 4.36e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.969 | -| time/ | | -| fps | 23 | -| iterations | 24648 | -| time_elapsed | 134181 | -| total_timesteps | 3154944 | -| train/ | | -| approx_kl | 0.01424048 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | -0.000601 | -| n_updates | 246470 | -| policy_gradient_loss | 0.00872 | -| std | 0.00587 | -| value_loss | 2.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24649 | -| time_elapsed | 134184 | -| total_timesteps | 3155072 | -| train/ | | -| approx_kl | 0.096152656 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0495 | -| n_updates | 246480 | -| policy_gradient_loss | 0.0199 | -| std | 0.00588 | -| value_loss | 1.73e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24650 | -| time_elapsed | 134192 | -| total_timesteps | 3155200 | -| train/ | | -| approx_kl | 0.033920914 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.927 | -| learning_rate | 0.0003 | -| loss | 0.056 | -| n_updates | 246490 | -| policy_gradient_loss | 0.0208 | -| std | 0.00587 | -| value_loss | 0.00105 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24651 | -| time_elapsed | 134198 | -| total_timesteps | 3155328 | -| train/ | | -| approx_kl | 0.19455358 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | 0.0866 | -| n_updates | 246500 | -| policy_gradient_loss | 0.0199 | -| std | 0.00587 | -| value_loss | 4.89e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24652 | -| time_elapsed | 134203 | -| total_timesteps | 3155456 | -| train/ | | -| approx_kl | 0.06812221 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 246510 | -| policy_gradient_loss | 0.0436 | -| std | 0.00587 | -| value_loss | 1.12e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24653 | -| time_elapsed | 134208 | -| total_timesteps | 3155584 | -| train/ | | -| approx_kl | 0.41427246 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.225 | -| n_updates | 246520 | -| policy_gradient_loss | 0.195 | -| std | 0.00587 | -| value_loss | 7.59e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24654 | -| time_elapsed | 134212 | -| total_timesteps | 3155712 | -| train/ | | -| approx_kl | 0.06349322 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.041 | -| n_updates | 246530 | -| policy_gradient_loss | 0.0298 | -| std | 0.00587 | -| value_loss | 1.22e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24655 | -| time_elapsed | 134218 | -| total_timesteps | 3155840 | -| train/ | | -| approx_kl | 0.00213697 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 1.05e-05 | -| n_updates | 246540 | -| policy_gradient_loss | 0.0258 | -| std | 0.00587 | -| value_loss | 9.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24656 | -| time_elapsed | 134223 | -| total_timesteps | 3155968 | -| train/ | | -| approx_kl | 0.24464057 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00702 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 246550 | -| policy_gradient_loss | 0.0655 | -| std | 0.00588 | -| value_loss | 3.3e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24657 | -| time_elapsed | 134228 | -| total_timesteps | 3156096 | -| train/ | | -| approx_kl | 0.0023488305 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0183 | -| learning_rate | 0.0003 | -| loss | 0.00586 | -| n_updates | 246560 | -| policy_gradient_loss | 0.0185 | -| std | 0.00588 | -| value_loss | 2.89e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24658 | -| time_elapsed | 134238 | -| total_timesteps | 3156224 | -| train/ | | -| approx_kl | 0.015304089 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.84 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 246570 | -| policy_gradient_loss | -0.0155 | -| std | 0.00588 | -| value_loss | 0.00346 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24659 | -| time_elapsed | 134244 | -| total_timesteps | 3156352 | -| train/ | | -| approx_kl | 0.011496334 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -7.6 | -| learning_rate | 0.0003 | -| loss | 0.00216 | -| n_updates | 246580 | -| policy_gradient_loss | 0.0053 | -| std | 0.00588 | -| value_loss | 6.3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24660 | -| time_elapsed | 134249 | -| total_timesteps | 3156480 | -| train/ | | -| approx_kl | 0.04731481 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.25 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 246590 | -| policy_gradient_loss | 0.0561 | -| std | 0.00588 | -| value_loss | 9.18e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24661 | -| time_elapsed | 134254 | -| total_timesteps | 3156608 | -| train/ | | -| approx_kl | 0.16788873 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00247 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 246600 | -| policy_gradient_loss | 0.0686 | -| std | 0.00589 | -| value_loss | 5.21e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24662 | -| time_elapsed | 134259 | -| total_timesteps | 3156736 | -| train/ | | -| approx_kl | 0.05462567 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0926 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 246610 | -| policy_gradient_loss | 0.0502 | -| std | 0.00589 | -| value_loss | 3.62e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24663 | -| time_elapsed | 134265 | -| total_timesteps | 3156864 | -| train/ | | -| approx_kl | 1.1221948 | -| clip_fraction | 0.764 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.358 | -| n_updates | 246620 | -| policy_gradient_loss | 0.224 | -| std | 0.00589 | -| value_loss | 3.03e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24664 | -| time_elapsed | 134269 | -| total_timesteps | 3156992 | -| train/ | | -| approx_kl | 0.046030626 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0269 | -| learning_rate | 0.0003 | -| loss | 0.00506 | -| n_updates | 246630 | -| policy_gradient_loss | -0.00444 | -| std | 0.00589 | -| value_loss | 2.16e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24665 | -| time_elapsed | 134273 | -| total_timesteps | 3157120 | -| train/ | | -| approx_kl | 0.024887495 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 246640 | -| policy_gradient_loss | 0.044 | -| std | 0.00589 | -| value_loss | 1.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24666 | -| time_elapsed | 134286 | -| total_timesteps | 3157248 | -| train/ | | -| approx_kl | 0.53232384 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | 0.084 | -| n_updates | 246650 | -| policy_gradient_loss | 0.0731 | -| std | 0.00588 | -| value_loss | 0.00243 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24667 | -| time_elapsed | 134291 | -| total_timesteps | 3157376 | -| train/ | | -| approx_kl | 0.5870095 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.322 | -| n_updates | 246660 | -| policy_gradient_loss | 0.203 | -| std | 0.00588 | -| value_loss | 6.97e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24668 | -| time_elapsed | 134296 | -| total_timesteps | 3157504 | -| train/ | | -| approx_kl | 0.41121897 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.259 | -| n_updates | 246670 | -| policy_gradient_loss | 0.207 | -| std | 0.00589 | -| value_loss | 1.6e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24669 | -| time_elapsed | 134301 | -| total_timesteps | 3157632 | -| train/ | | -| approx_kl | 0.24447718 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00545 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 246680 | -| policy_gradient_loss | 0.187 | -| std | 0.00588 | -| value_loss | 9.08e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24670 | -| time_elapsed | 134306 | -| total_timesteps | 3157760 | -| train/ | | -| approx_kl | 0.14378284 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | 0.0888 | -| n_updates | 246690 | -| policy_gradient_loss | 0.115 | -| std | 0.00589 | -| value_loss | 6.68e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24671 | -| time_elapsed | 134312 | -| total_timesteps | 3157888 | -| train/ | | -| approx_kl | 0.19215485 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 246700 | -| policy_gradient_loss | 0.143 | -| std | 0.00589 | -| value_loss | 5.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24672 | -| time_elapsed | 134318 | -| total_timesteps | 3158016 | -| train/ | | -| approx_kl | 0.035904285 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 246710 | -| policy_gradient_loss | 0.0312 | -| std | 0.00589 | -| value_loss | 4.03e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24673 | -| time_elapsed | 134329 | -| total_timesteps | 3158144 | -| train/ | | -| approx_kl | 0.21713123 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.813 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 246720 | -| policy_gradient_loss | 0.00591 | -| std | 0.00589 | -| value_loss | 0.00447 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24674 | -| time_elapsed | 134334 | -| total_timesteps | 3158272 | -| train/ | | -| approx_kl | 0.034490008 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0075 | -| n_updates | 246730 | -| policy_gradient_loss | 0.00105 | -| std | 0.00588 | -| value_loss | 0.00111 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24675 | -| time_elapsed | 134338 | -| total_timesteps | 3158400 | -| train/ | | -| approx_kl | 0.02393457 | -| clip_fraction | 0.174 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00727 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 246740 | -| policy_gradient_loss | 0.00771 | -| std | 0.00588 | -| value_loss | 7.44e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24676 | -| time_elapsed | 134343 | -| total_timesteps | 3158528 | -| train/ | | -| approx_kl | 0.028496547 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 246750 | -| policy_gradient_loss | 0.0338 | -| std | 0.00588 | -| value_loss | 3.1e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24677 | -| time_elapsed | 134349 | -| total_timesteps | 3158656 | -| train/ | | -| approx_kl | 0.12824783 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | 0.0651 | -| n_updates | 246760 | -| policy_gradient_loss | 0.0323 | -| std | 0.00588 | -| value_loss | 2.19e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24678 | -| time_elapsed | 134355 | -| total_timesteps | 3158784 | -| train/ | | -| approx_kl | 0.78569937 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 246770 | -| policy_gradient_loss | 0.0507 | -| std | 0.00588 | -| value_loss | 1.66e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 24679 | -| time_elapsed | 134361 | -| total_timesteps | 3158912 | -| train/ | | -| approx_kl | 0.04627884 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 246780 | -| policy_gradient_loss | 0.00965 | -| std | 0.00588 | -| value_loss | 9.11e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24680 | -| time_elapsed | 134366 | -| total_timesteps | 3159040 | -| train/ | | -| approx_kl | 0.0077933725 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 246790 | -| policy_gradient_loss | 0.00386 | -| std | 0.00588 | -| value_loss | 7.25e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24681 | -| time_elapsed | 134374 | -| total_timesteps | 3159168 | -| train/ | | -| approx_kl | 0.9925913 | -| clip_fraction | 0.766 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.725 | -| learning_rate | 0.0003 | -| loss | 0.086 | -| n_updates | 246800 | -| policy_gradient_loss | 0.0485 | -| std | 0.00588 | -| value_loss | 0.00259 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24682 | -| time_elapsed | 134379 | -| total_timesteps | 3159296 | -| train/ | | -| approx_kl | 0.0038894145 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.47 | -| learning_rate | 0.0003 | -| loss | -0.00754 | -| n_updates | 246810 | -| policy_gradient_loss | 0.0181 | -| std | 0.00588 | -| value_loss | 2.6e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24683 | -| time_elapsed | 134384 | -| total_timesteps | 3159424 | -| train/ | | -| approx_kl | 0.10566956 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.000107 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 246820 | -| policy_gradient_loss | 0.016 | -| std | 0.00588 | -| value_loss | 3.45e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24684 | -| time_elapsed | 134387 | -| total_timesteps | 3159552 | -| train/ | | -| approx_kl | 0.05061693 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.89 | -| learning_rate | 0.0003 | -| loss | 0.00865 | -| n_updates | 246830 | -| policy_gradient_loss | 0.0248 | -| std | 0.00588 | -| value_loss | 3.82e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24685 | -| time_elapsed | 134392 | -| total_timesteps | 3159680 | -| train/ | | -| approx_kl | 0.0040795817 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | -0.000248 | -| n_updates | 246840 | -| policy_gradient_loss | 0.027 | -| std | 0.00588 | -| value_loss | 6.25e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24686 | -| time_elapsed | 134397 | -| total_timesteps | 3159808 | -| train/ | | -| approx_kl | 0.061733976 | -| clip_fraction | 0.468 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | 0.046 | -| n_updates | 246850 | -| policy_gradient_loss | 0.0859 | -| std | 0.00588 | -| value_loss | 6.26e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24687 | -| time_elapsed | 134402 | -| total_timesteps | 3159936 | -| train/ | | -| approx_kl | 0.0045898366 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | -0.00381 | -| n_updates | 246860 | -| policy_gradient_loss | 0.0989 | -| std | 0.00588 | -| value_loss | 3.6e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24688 | -| time_elapsed | 134407 | -| total_timesteps | 3160064 | -| train/ | | -| approx_kl | 0.008514866 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | -0.00695 | -| n_updates | 246870 | -| policy_gradient_loss | 0.0234 | -| std | 0.00588 | -| value_loss | 1.5e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24689 | -| time_elapsed | 134417 | -| total_timesteps | 3160192 | -| train/ | | -| approx_kl | 0.010532921 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.833 | -| learning_rate | 0.0003 | -| loss | -0.00301 | -| n_updates | 246880 | -| policy_gradient_loss | 0.0358 | -| std | 0.00587 | -| value_loss | 0.00382 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24690 | -| time_elapsed | 134423 | -| total_timesteps | 3160320 | -| train/ | | -| approx_kl | 0.016407609 | -| clip_fraction | 0.592 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.00679 | -| n_updates | 246890 | -| policy_gradient_loss | 0.0946 | -| std | 0.00586 | -| value_loss | 8.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24691 | -| time_elapsed | 134428 | -| total_timesteps | 3160448 | -| train/ | | -| approx_kl | 0.012636946 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | -0.0124 | -| n_updates | 246900 | -| policy_gradient_loss | 0.00418 | -| std | 0.00585 | -| value_loss | 1.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24692 | -| time_elapsed | 134432 | -| total_timesteps | 3160576 | -| train/ | | -| approx_kl | 0.05687594 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 246910 | -| policy_gradient_loss | 0.0666 | -| std | 0.00585 | -| value_loss | 4.12e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24693 | -| time_elapsed | 134437 | -| total_timesteps | 3160704 | -| train/ | | -| approx_kl | 0.19901885 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0896 | -| n_updates | 246920 | -| policy_gradient_loss | 0.0513 | -| std | 0.00585 | -| value_loss | 3.73e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24694 | -| time_elapsed | 134441 | -| total_timesteps | 3160832 | -| train/ | | -| approx_kl | 0.046421632 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 246930 | -| policy_gradient_loss | 0.0746 | -| std | 0.00585 | -| value_loss | 2.32e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24695 | -| time_elapsed | 134445 | -| total_timesteps | 3160960 | -| train/ | | -| approx_kl | 0.331703 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | 0.0753 | -| n_updates | 246940 | -| policy_gradient_loss | 0.0442 | -| std | 0.00585 | -| value_loss | 2.06e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24696 | -| time_elapsed | 134451 | -| total_timesteps | 3161088 | -| train/ | | -| approx_kl | 0.001140479 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 246950 | -| policy_gradient_loss | 0.0168 | -| std | 0.00585 | -| value_loss | 1.18e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24697 | -| time_elapsed | 134458 | -| total_timesteps | 3161216 | -| train/ | | -| approx_kl | 0.050361298 | -| clip_fraction | 0.622 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 246960 | -| policy_gradient_loss | 0.0413 | -| std | 0.00585 | -| value_loss | 0.00151 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24698 | -| time_elapsed | 134463 | -| total_timesteps | 3161344 | -| train/ | | -| approx_kl | 0.010389533 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 246970 | -| policy_gradient_loss | 0.0358 | -| std | 0.00585 | -| value_loss | 1.1e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24699 | -| time_elapsed | 134467 | -| total_timesteps | 3161472 | -| train/ | | -| approx_kl | 0.047224402 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 246980 | -| policy_gradient_loss | 0.0768 | -| std | 0.00585 | -| value_loss | 8.64e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24700 | -| time_elapsed | 134473 | -| total_timesteps | 3161600 | -| train/ | | -| approx_kl | 0.20458063 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | 0.0797 | -| n_updates | 246990 | -| policy_gradient_loss | 0.0448 | -| std | 0.00585 | -| value_loss | 4.48e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24701 | -| time_elapsed | 134477 | -| total_timesteps | 3161728 | -| train/ | | -| approx_kl | 0.055799264 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 247000 | -| policy_gradient_loss | 0.0855 | -| std | 0.00585 | -| value_loss | 2.71e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24702 | -| time_elapsed | 134481 | -| total_timesteps | 3161856 | -| train/ | | -| approx_kl | 0.115234256 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0751 | -| learning_rate | 0.0003 | -| loss | 0.0689 | -| n_updates | 247010 | -| policy_gradient_loss | 0.0361 | -| std | 0.00585 | -| value_loss | 4.21e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24703 | -| time_elapsed | 134484 | -| total_timesteps | 3161984 | -| train/ | | -| approx_kl | 0.10604418 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.206 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 247020 | -| policy_gradient_loss | 0.0649 | -| std | 0.00585 | -| value_loss | 4.49e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24704 | -| time_elapsed | 134489 | -| total_timesteps | 3162112 | -| train/ | | -| approx_kl | 0.2498799 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 247030 | -| policy_gradient_loss | 0.0493 | -| std | 0.00585 | -| value_loss | 3.27e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24705 | -| time_elapsed | 134501 | -| total_timesteps | 3162240 | -| train/ | | -| approx_kl | 0.021038136 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 247040 | -| policy_gradient_loss | 0.0547 | -| std | 0.00585 | -| value_loss | 0.00236 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24706 | -| time_elapsed | 134506 | -| total_timesteps | 3162368 | -| train/ | | -| approx_kl | 0.00038992707 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.148 | -| learning_rate | 0.0003 | -| loss | 0.000308 | -| n_updates | 247050 | -| policy_gradient_loss | 0.035 | -| std | 0.00585 | -| value_loss | 3.8e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24707 | -| time_elapsed | 134510 | -| total_timesteps | 3162496 | -| train/ | | -| approx_kl | 0.03424185 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 247060 | -| policy_gradient_loss | 0.00972 | -| std | 0.00586 | -| value_loss | 0.000155 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24708 | -| time_elapsed | 134515 | -| total_timesteps | 3162624 | -| train/ | | -| approx_kl | 0.050785314 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -11.1 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 247070 | -| policy_gradient_loss | 0.0278 | -| std | 0.00587 | -| value_loss | 3.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24709 | -| time_elapsed | 134520 | -| total_timesteps | 3162752 | -| train/ | | -| approx_kl | 0.020649068 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0723 | -| learning_rate | 0.0003 | -| loss | -0.00306 | -| n_updates | 247080 | -| policy_gradient_loss | 0.0159 | -| std | 0.00587 | -| value_loss | 4.86e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 24710 | -| time_elapsed | 134524 | -| total_timesteps | 3162880 | -| train/ | | -| approx_kl | 0.2202426 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 247090 | -| policy_gradient_loss | 0.0565 | -| std | 0.00587 | -| value_loss | 3.44e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24711 | -| time_elapsed | 134529 | -| total_timesteps | 3163008 | -| train/ | | -| approx_kl | 0.06429925 | -| clip_fraction | 0.611 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.0419 | -| n_updates | 247100 | -| policy_gradient_loss | 0.0759 | -| std | 0.00587 | -| value_loss | 1.82e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24712 | -| time_elapsed | 134541 | -| total_timesteps | 3163136 | -| train/ | | -| approx_kl | 0.061526988 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 247110 | -| policy_gradient_loss | -0.0215 | -| std | 0.00587 | -| value_loss | 0.000166 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24713 | -| time_elapsed | 134546 | -| total_timesteps | 3163264 | -| train/ | | -| approx_kl | 0.005168706 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.851 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 247120 | -| policy_gradient_loss | -0.00502 | -| std | 0.00587 | -| value_loss | 2.89e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24714 | -| time_elapsed | 134551 | -| total_timesteps | 3163392 | -| train/ | | -| approx_kl | 7.886998e-05 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00359 | -| learning_rate | 0.0003 | -| loss | 0.000267 | -| n_updates | 247130 | -| policy_gradient_loss | 0.0089 | -| std | 0.00588 | -| value_loss | 1.86e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24715 | -| time_elapsed | 134554 | -| total_timesteps | 3163520 | -| train/ | | -| approx_kl | 0.080510765 | -| clip_fraction | 0.604 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 247140 | -| policy_gradient_loss | 0.0708 | -| std | 0.00588 | -| value_loss | 1.65e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24716 | -| time_elapsed | 134557 | -| total_timesteps | 3163648 | -| train/ | | -| approx_kl | 0.31757748 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 247150 | -| policy_gradient_loss | 0.0599 | -| std | 0.00588 | -| value_loss | 5.11e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24717 | -| time_elapsed | 134562 | -| total_timesteps | 3163776 | -| train/ | | -| approx_kl | 0.0017160978 | -| clip_fraction | 0.2 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00811 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 247160 | -| policy_gradient_loss | 0.0148 | -| std | 0.00588 | -| value_loss | 2.4e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 24718 | -| time_elapsed | 134566 | -| total_timesteps | 3163904 | -| train/ | | -| approx_kl | 1.2229197e-05 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0544 | -| learning_rate | 0.0003 | -| loss | -0.000539 | -| n_updates | 247170 | -| policy_gradient_loss | 0.00736 | -| std | 0.00589 | -| value_loss | 2.13e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24719 | -| time_elapsed | 134570 | -| total_timesteps | 3164032 | -| train/ | | -| approx_kl | 0.00029449165 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 247180 | -| policy_gradient_loss | 0.0116 | -| std | 0.00589 | -| value_loss | 1.09e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24720 | -| time_elapsed | 134579 | -| total_timesteps | 3164160 | -| train/ | | -| approx_kl | 0.013924659 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 247190 | -| policy_gradient_loss | 0.0302 | -| std | 0.00589 | -| value_loss | 0.000791 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24721 | -| time_elapsed | 134584 | -| total_timesteps | 3164288 | -| train/ | | -| approx_kl | 0.042751648 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.82 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 247200 | -| policy_gradient_loss | 0.067 | -| std | 0.00589 | -| value_loss | 3.47e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24722 | -| time_elapsed | 134588 | -| total_timesteps | 3164416 | -| train/ | | -| approx_kl | 0.01623055 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00501 | -| learning_rate | 0.0003 | -| loss | -0.000956 | -| n_updates | 247210 | -| policy_gradient_loss | 0.0203 | -| std | 0.00589 | -| value_loss | 3.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24723 | -| time_elapsed | 134593 | -| total_timesteps | 3164544 | -| train/ | | -| approx_kl | 0.17414002 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0718 | -| n_updates | 247220 | -| policy_gradient_loss | 0.0131 | -| std | 0.00589 | -| value_loss | 1.56e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24724 | -| time_elapsed | 134597 | -| total_timesteps | 3164672 | -| train/ | | -| approx_kl | 0.0039217845 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.00544 | -| n_updates | 247230 | -| policy_gradient_loss | 0.0277 | -| std | 0.00589 | -| value_loss | 1.14e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24725 | -| time_elapsed | 134602 | -| total_timesteps | 3164800 | -| train/ | | -| approx_kl | 0.61746895 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0708 | -| learning_rate | 0.0003 | -| loss | 0.358 | -| n_updates | 247240 | -| policy_gradient_loss | 0.21 | -| std | 0.00589 | -| value_loss | 6.41e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 24726 | -| time_elapsed | 134607 | -| total_timesteps | 3164928 | -| train/ | | -| approx_kl | 0.09922034 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 247250 | -| policy_gradient_loss | 0.0287 | -| std | 0.00589 | -| value_loss | 5.5e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24727 | -| time_elapsed | 134612 | -| total_timesteps | 3165056 | -| train/ | | -| approx_kl | 0.004256595 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.00219 | -| n_updates | 247260 | -| policy_gradient_loss | 0.034 | -| std | 0.00589 | -| value_loss | 2.88e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24728 | -| time_elapsed | 134617 | -| total_timesteps | 3165184 | -| train/ | | -| approx_kl | 0.015171139 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.665 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 247270 | -| policy_gradient_loss | 0.000821 | -| std | 0.00588 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24729 | -| time_elapsed | 134619 | -| total_timesteps | 3165312 | -| train/ | | -| approx_kl | 0.0014015906 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0523 | -| learning_rate | 0.0003 | -| loss | 0.00555 | -| n_updates | 247280 | -| policy_gradient_loss | 0.0318 | -| std | 0.00588 | -| value_loss | 1.92e-06 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24730 | -| time_elapsed | 134622 | -| total_timesteps | 3165440 | -| train/ | | -| approx_kl | 0.574221 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.487 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 247290 | -| policy_gradient_loss | 0.0473 | -| std | 0.00589 | -| value_loss | 3.6e-07 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24731 | -| time_elapsed | 134625 | -| total_timesteps | 3165568 | -| train/ | | -| approx_kl | 7.9469755e-05 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | -0.0026 | -| n_updates | 247300 | -| policy_gradient_loss | -0.00386 | -| std | 0.00589 | -| value_loss | 3.14e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24732 | -| time_elapsed | 134629 | -| total_timesteps | 3165696 | -| train/ | | -| approx_kl | 0.069585875 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 247310 | -| policy_gradient_loss | 0.0104 | -| std | 0.00589 | -| value_loss | 1.45e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24733 | -| time_elapsed | 134634 | -| total_timesteps | 3165824 | -| train/ | | -| approx_kl | 0.0409718 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.00679 | -| n_updates | 247320 | -| policy_gradient_loss | 0.00322 | -| std | 0.00589 | -| value_loss | 1.1e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24734 | -| time_elapsed | 134638 | -| total_timesteps | 3165952 | -| train/ | | -| approx_kl | 0.049061976 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 247330 | -| policy_gradient_loss | 0.016 | -| std | 0.00589 | -| value_loss | 6.72e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24735 | -| time_elapsed | 134644 | -| total_timesteps | 3166080 | -| train/ | | -| approx_kl | 0.008320333 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 247340 | -| policy_gradient_loss | 0.00829 | -| std | 0.00589 | -| value_loss | 7.13e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24736 | -| time_elapsed | 134654 | -| total_timesteps | 3166208 | -| train/ | | -| approx_kl | 0.025906593 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 247350 | -| policy_gradient_loss | -0.0259 | -| std | 0.00589 | -| value_loss | 0.00252 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24737 | -| time_elapsed | 134660 | -| total_timesteps | 3166336 | -| train/ | | -| approx_kl | 0.043658257 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | -1.55e-05 | -| n_updates | 247360 | -| policy_gradient_loss | 0.00377 | -| std | 0.00589 | -| value_loss | 1.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24738 | -| time_elapsed | 134666 | -| total_timesteps | 3166464 | -| train/ | | -| approx_kl | 0.008077406 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0079 | -| learning_rate | 0.0003 | -| loss | -0.0011 | -| n_updates | 247370 | -| policy_gradient_loss | 0.00981 | -| std | 0.00589 | -| value_loss | 1.21e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24739 | -| time_elapsed | 134671 | -| total_timesteps | 3166592 | -| train/ | | -| approx_kl | 0.083043315 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00315 | -| n_updates | 247380 | -| policy_gradient_loss | 0.0245 | -| std | 0.00589 | -| value_loss | 9.55e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24740 | -| time_elapsed | 134677 | -| total_timesteps | 3166720 | -| train/ | | -| approx_kl | 1.1204346 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.32 | -| n_updates | 247390 | -| policy_gradient_loss | 0.221 | -| std | 0.00589 | -| value_loss | 4.68e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24741 | -| time_elapsed | 134682 | -| total_timesteps | 3166848 | -| train/ | | -| approx_kl | 0.008946111 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 247400 | -| policy_gradient_loss | 0.0271 | -| std | 0.00589 | -| value_loss | 3.9e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24742 | -| time_elapsed | 134686 | -| total_timesteps | 3166976 | -| train/ | | -| approx_kl | 0.15814812 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.0641 | -| n_updates | 247410 | -| policy_gradient_loss | 0.0227 | -| std | 0.00589 | -| value_loss | 2.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24743 | -| time_elapsed | 134692 | -| total_timesteps | 3167104 | -| train/ | | -| approx_kl | 0.027938187 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 247420 | -| policy_gradient_loss | 0.0373 | -| std | 0.00589 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24744 | -| time_elapsed | 134702 | -| total_timesteps | 3167232 | -| train/ | | -| approx_kl | 0.017331325 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 247430 | -| policy_gradient_loss | -0.00864 | -| std | 0.00589 | -| value_loss | 0.000122 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24745 | -| time_elapsed | 134707 | -| total_timesteps | 3167360 | -| train/ | | -| approx_kl | 0.00010305224 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0503 | -| learning_rate | 0.0003 | -| loss | -0.00134 | -| n_updates | 247440 | -| policy_gradient_loss | 0.0269 | -| std | 0.00589 | -| value_loss | 1.42e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24746 | -| time_elapsed | 134713 | -| total_timesteps | 3167488 | -| train/ | | -| approx_kl | 0.6573975 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 247450 | -| policy_gradient_loss | 0.0616 | -| std | 0.00589 | -| value_loss | 1.09e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24747 | -| time_elapsed | 134717 | -| total_timesteps | 3167616 | -| train/ | | -| approx_kl | 0.01216583 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.000758 | -| n_updates | 247460 | -| policy_gradient_loss | 0.00961 | -| std | 0.00589 | -| value_loss | 7.57e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24748 | -| time_elapsed | 134723 | -| total_timesteps | 3167744 | -| train/ | | -| approx_kl | 0.00077497493 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.00318 | -| n_updates | 247470 | -| policy_gradient_loss | 0.0048 | -| std | 0.00589 | -| value_loss | 5.06e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.962 | -| time/ | | -| fps | 23 | -| iterations | 24749 | -| time_elapsed | 134729 | -| total_timesteps | 3167872 | -| train/ | | -| approx_kl | 0.0047397474 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.000792 | -| n_updates | 247480 | -| policy_gradient_loss | 0.0102 | -| std | 0.00587 | -| value_loss | 3.37e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24750 | -| time_elapsed | 134733 | -| total_timesteps | 3168000 | -| train/ | | -| approx_kl | 0.078110084 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.56 | -| learning_rate | 0.0003 | -| loss | 0.00976 | -| n_updates | 247490 | -| policy_gradient_loss | 0.00077 | -| std | 0.00586 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24751 | -| time_elapsed | 134738 | -| total_timesteps | 3168128 | -| train/ | | -| approx_kl | 0.013640726 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0132 | -| learning_rate | 0.0003 | -| loss | -0.00176 | -| n_updates | 247500 | -| policy_gradient_loss | 0.0063 | -| std | 0.00586 | -| value_loss | 1.34e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24752 | -| time_elapsed | 134748 | -| total_timesteps | 3168256 | -| train/ | | -| approx_kl | 0.0951324 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 247510 | -| policy_gradient_loss | 0.0112 | -| std | 0.00586 | -| value_loss | 0.00085 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24753 | -| time_elapsed | 134752 | -| total_timesteps | 3168384 | -| train/ | | -| approx_kl | 0.12696177 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 247520 | -| policy_gradient_loss | 0.037 | -| std | 0.00586 | -| value_loss | 4.84e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24754 | -| time_elapsed | 134757 | -| total_timesteps | 3168512 | -| train/ | | -| approx_kl | 0.21112143 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0129 | -| learning_rate | 0.0003 | -| loss | 0.0808 | -| n_updates | 247530 | -| policy_gradient_loss | 0.0325 | -| std | 0.00586 | -| value_loss | 3.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24755 | -| time_elapsed | 134760 | -| total_timesteps | 3168640 | -| train/ | | -| approx_kl | 0.010745324 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0329 | -| learning_rate | 0.0003 | -| loss | 0.00306 | -| n_updates | 247540 | -| policy_gradient_loss | 0.0242 | -| std | 0.00585 | -| value_loss | 1.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24756 | -| time_elapsed | 134764 | -| total_timesteps | 3168768 | -| train/ | | -| approx_kl | 0.24435307 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | 0.0914 | -| n_updates | 247550 | -| policy_gradient_loss | 0.0244 | -| std | 0.00585 | -| value_loss | 1.07e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 24757 | -| time_elapsed | 134767 | -| total_timesteps | 3168896 | -| train/ | | -| approx_kl | 0.02735477 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00589 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 247560 | -| policy_gradient_loss | 0.0468 | -| std | 0.00585 | -| value_loss | 2.92e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24758 | -| time_elapsed | 134773 | -| total_timesteps | 3169024 | -| train/ | | -| approx_kl | 0.09582394 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.0575 | -| n_updates | 247570 | -| policy_gradient_loss | 0.0282 | -| std | 0.00585 | -| value_loss | 2.28e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24759 | -| time_elapsed | 134783 | -| total_timesteps | 3169152 | -| train/ | | -| approx_kl | 0.13005598 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.23 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 247580 | -| policy_gradient_loss | -0.0216 | -| std | 0.00584 | -| value_loss | 0.00335 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24760 | -| time_elapsed | 134789 | -| total_timesteps | 3169280 | -| train/ | | -| approx_kl | 0.00864898 | -| clip_fraction | 0.579 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.504 | -| learning_rate | 0.0003 | -| loss | 0.00491 | -| n_updates | 247590 | -| policy_gradient_loss | 0.158 | -| std | 0.00583 | -| value_loss | 1.57e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24761 | -| time_elapsed | 134794 | -| total_timesteps | 3169408 | -| train/ | | -| approx_kl | 0.013878627 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 247600 | -| policy_gradient_loss | 0.0305 | -| std | 0.00583 | -| value_loss | 1.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24762 | -| time_elapsed | 134799 | -| total_timesteps | 3169536 | -| train/ | | -| approx_kl | 0.29324597 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.716 | -| learning_rate | 0.0003 | -| loss | 0.058 | -| n_updates | 247610 | -| policy_gradient_loss | 0.075 | -| std | 0.00583 | -| value_loss | 9.59e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24763 | -| time_elapsed | 134805 | -| total_timesteps | 3169664 | -| train/ | | -| approx_kl | 0.06628968 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.000289 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 247620 | -| policy_gradient_loss | 0.0175 | -| std | 0.00583 | -| value_loss | 3.81e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24764 | -| time_elapsed | 134811 | -| total_timesteps | 3169792 | -| train/ | | -| approx_kl | 0.18507221 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00649 | -| learning_rate | 0.0003 | -| loss | 0.0786 | -| n_updates | 247630 | -| policy_gradient_loss | 0.021 | -| std | 0.00583 | -| value_loss | 2.31e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 24765 | -| time_elapsed | 134816 | -| total_timesteps | 3169920 | -| train/ | | -| approx_kl | 0.019101853 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.00724 | -| n_updates | 247640 | -| policy_gradient_loss | 0.00312 | -| std | 0.00583 | -| value_loss | 1.52e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24766 | -| time_elapsed | 134821 | -| total_timesteps | 3170048 | -| train/ | | -| approx_kl | 0.0130083 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 247650 | -| policy_gradient_loss | -0.00277 | -| std | 0.00583 | -| value_loss | 1.23e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24767 | -| time_elapsed | 134830 | -| total_timesteps | 3170176 | -| train/ | | -| approx_kl | 0.011136558 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.714 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 247660 | -| policy_gradient_loss | -0.00412 | -| std | 0.00583 | -| value_loss | 0.00175 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24768 | -| time_elapsed | 134835 | -| total_timesteps | 3170304 | -| train/ | | -| approx_kl | 0.021584995 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.00217 | -| n_updates | 247670 | -| policy_gradient_loss | 0.0319 | -| std | 0.00583 | -| value_loss | 6.15e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24769 | -| time_elapsed | 134840 | -| total_timesteps | 3170432 | -| train/ | | -| approx_kl | 0.4525924 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0156 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 247680 | -| policy_gradient_loss | 0.15 | -| std | 0.00584 | -| value_loss | 6.95e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24770 | -| time_elapsed | 134844 | -| total_timesteps | 3170560 | -| train/ | | -| approx_kl | 0.05828109 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.0291 | -| n_updates | 247690 | -| policy_gradient_loss | 0.0305 | -| std | 0.00584 | -| value_loss | 4.34e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24771 | -| time_elapsed | 134850 | -| total_timesteps | 3170688 | -| train/ | | -| approx_kl | 0.0009652497 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.000802 | -| n_updates | 247700 | -| policy_gradient_loss | 0.0427 | -| std | 0.00584 | -| value_loss | 2.45e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24772 | -| time_elapsed | 134853 | -| total_timesteps | 3170816 | -| train/ | | -| approx_kl | 0.5984105 | -| clip_fraction | 0.534 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.214 | -| n_updates | 247710 | -| policy_gradient_loss | 0.0698 | -| std | 0.00584 | -| value_loss | 2.74e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 24773 | -| time_elapsed | 134858 | -| total_timesteps | 3170944 | -| train/ | | -| approx_kl | 0.014684323 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0189 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 247720 | -| policy_gradient_loss | 0.0111 | -| std | 0.00584 | -| value_loss | 1.64e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24774 | -| time_elapsed | 134863 | -| total_timesteps | 3171072 | -| train/ | | -| approx_kl | 0.09390865 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.054 | -| n_updates | 247730 | -| policy_gradient_loss | 0.0226 | -| std | 0.00584 | -| value_loss | 9.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24775 | -| time_elapsed | 134870 | -| total_timesteps | 3171200 | -| train/ | | -| approx_kl | 0.03857118 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.616 | -| learning_rate | 0.0003 | -| loss | -0.0204 | -| n_updates | 247740 | -| policy_gradient_loss | -0.00787 | -| std | 0.00584 | -| value_loss | 0.00118 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24776 | -| time_elapsed | 134876 | -| total_timesteps | 3171328 | -| train/ | | -| approx_kl | 0.0012982883 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.000926 | -| learning_rate | 0.0003 | -| loss | -0.00854 | -| n_updates | 247750 | -| policy_gradient_loss | 0.0231 | -| std | 0.00584 | -| value_loss | 2.15e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24777 | -| time_elapsed | 134882 | -| total_timesteps | 3171456 | -| train/ | | -| approx_kl | 0.56527245 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 247760 | -| policy_gradient_loss | 0.0464 | -| std | 0.00584 | -| value_loss | 6.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24778 | -| time_elapsed | 134887 | -| total_timesteps | 3171584 | -| train/ | | -| approx_kl | 0.012667569 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.00128 | -| n_updates | 247770 | -| policy_gradient_loss | 0.00938 | -| std | 0.00584 | -| value_loss | 4.43e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24779 | -| time_elapsed | 134891 | -| total_timesteps | 3171712 | -| train/ | | -| approx_kl | 0.08072831 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 247780 | -| policy_gradient_loss | 0.00624 | -| std | 0.00584 | -| value_loss | 3.42e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24780 | -| time_elapsed | 134895 | -| total_timesteps | 3171840 | -| train/ | | -| approx_kl | 0.070881404 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0442 | -| n_updates | 247790 | -| policy_gradient_loss | 0.023 | -| std | 0.00584 | -| value_loss | 2.35e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.947 | -| time/ | | -| fps | 23 | -| iterations | 24781 | -| time_elapsed | 134899 | -| total_timesteps | 3171968 | -| train/ | | -| approx_kl | 0.010174101 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 247800 | -| policy_gradient_loss | 0.0103 | -| std | 0.00584 | -| value_loss | 1.39e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24782 | -| time_elapsed | 134904 | -| total_timesteps | 3172096 | -| train/ | | -| approx_kl | 0.0848099 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 247810 | -| policy_gradient_loss | 0.0119 | -| std | 0.00584 | -| value_loss | 9.52e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24783 | -| time_elapsed | 134914 | -| total_timesteps | 3172224 | -| train/ | | -| approx_kl | 0.030917779 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 247820 | -| policy_gradient_loss | 0.00644 | -| std | 0.00584 | -| value_loss | 0.00104 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24784 | -| time_elapsed | 134919 | -| total_timesteps | 3172352 | -| train/ | | -| approx_kl | 0.0035479763 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0678 | -| learning_rate | 0.0003 | -| loss | -0.00551 | -| n_updates | 247830 | -| policy_gradient_loss | 0.0111 | -| std | 0.00583 | -| value_loss | 5.28e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24785 | -| time_elapsed | 134924 | -| total_timesteps | 3172480 | -| train/ | | -| approx_kl | 0.045172818 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0146 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 247840 | -| policy_gradient_loss | 0.0961 | -| std | 0.00584 | -| value_loss | 1.43e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24786 | -| time_elapsed | 134927 | -| total_timesteps | 3172608 | -| train/ | | -| approx_kl | 0.014509546 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.00387 | -| n_updates | 247850 | -| policy_gradient_loss | 0.0368 | -| std | 0.00584 | -| value_loss | 1.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24787 | -| time_elapsed | 134931 | -| total_timesteps | 3172736 | -| train/ | | -| approx_kl | 0.89373076 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | 0.329 | -| n_updates | 247860 | -| policy_gradient_loss | 0.0977 | -| std | 0.00584 | -| value_loss | 7.78e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24788 | -| time_elapsed | 134936 | -| total_timesteps | 3172864 | -| train/ | | -| approx_kl | 0.051723693 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00141 | -| n_updates | 247870 | -| policy_gradient_loss | 0.00109 | -| std | 0.00584 | -| value_loss | 7.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 24789 | -| time_elapsed | 134941 | -| total_timesteps | 3172992 | -| train/ | | -| approx_kl | 0.058733903 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 247880 | -| policy_gradient_loss | 0.0149 | -| std | 0.00584 | -| value_loss | 4.54e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24790 | -| time_elapsed | 134947 | -| total_timesteps | 3173120 | -| train/ | | -| approx_kl | 0.009224532 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 247890 | -| policy_gradient_loss | 0.00676 | -| std | 0.00583 | -| value_loss | 2.8e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24791 | -| time_elapsed | 134959 | -| total_timesteps | 3173248 | -| train/ | | -| approx_kl | 0.04479763 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 247900 | -| policy_gradient_loss | 0.0018 | -| std | 0.00583 | -| value_loss | 0.000375 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24792 | -| time_elapsed | 134965 | -| total_timesteps | 3173376 | -| train/ | | -| approx_kl | 0.7016791 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.254 | -| n_updates | 247910 | -| policy_gradient_loss | 0.0791 | -| std | 0.00583 | -| value_loss | 4.46e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24793 | -| time_elapsed | 134969 | -| total_timesteps | 3173504 | -| train/ | | -| approx_kl | 0.051016487 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 247920 | -| policy_gradient_loss | 0.0128 | -| std | 0.00583 | -| value_loss | 5.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24794 | -| time_elapsed | 134973 | -| total_timesteps | 3173632 | -| train/ | | -| approx_kl | 0.009855914 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0811 | -| learning_rate | 0.0003 | -| loss | -0.00406 | -| n_updates | 247930 | -| policy_gradient_loss | 0.00672 | -| std | 0.00583 | -| value_loss | 2.1e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24795 | -| time_elapsed | 134976 | -| total_timesteps | 3173760 | -| train/ | | -| approx_kl | 0.0012005414 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | 0.00643 | -| n_updates | 247940 | -| policy_gradient_loss | 0.00372 | -| std | 0.00583 | -| value_loss | 1.46e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 24796 | -| time_elapsed | 134979 | -| total_timesteps | 3173888 | -| train/ | | -| approx_kl | 0.05776041 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.0129 | -| n_updates | 247950 | -| policy_gradient_loss | 0.00462 | -| std | 0.00583 | -| value_loss | 9.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24797 | -| time_elapsed | 134983 | -| total_timesteps | 3174016 | -| train/ | | -| approx_kl | 0.05271367 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 247960 | -| policy_gradient_loss | 0.00957 | -| std | 0.00583 | -| value_loss | 6.98e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24798 | -| time_elapsed | 134996 | -| total_timesteps | 3174144 | -| train/ | | -| approx_kl | 0.05236758 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 247970 | -| policy_gradient_loss | -0.00429 | -| std | 0.00583 | -| value_loss | 0.000814 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24799 | -| time_elapsed | 135001 | -| total_timesteps | 3174272 | -| train/ | | -| approx_kl | 0.0059522213 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.118 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 247980 | -| policy_gradient_loss | 0.0122 | -| std | 0.00584 | -| value_loss | 8.49e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24800 | -| time_elapsed | 135007 | -| total_timesteps | 3174400 | -| train/ | | -| approx_kl | 0.06741456 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 247990 | -| policy_gradient_loss | 0.00645 | -| std | 0.00584 | -| value_loss | 4.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24801 | -| time_elapsed | 135013 | -| total_timesteps | 3174528 | -| train/ | | -| approx_kl | 0.014775135 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | -0.00636 | -| n_updates | 248000 | -| policy_gradient_loss | 0.00991 | -| std | 0.00585 | -| value_loss | 3.28e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24802 | -| time_elapsed | 135017 | -| total_timesteps | 3174656 | -| train/ | | -| approx_kl | 0.0022290368 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0262 | -| learning_rate | 0.0003 | -| loss | 0.000167 | -| n_updates | 248010 | -| policy_gradient_loss | 0.00585 | -| std | 0.00584 | -| value_loss | 2.86e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24803 | -| time_elapsed | 135022 | -| total_timesteps | 3174784 | -| train/ | | -| approx_kl | 0.0787284 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.209 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 248020 | -| policy_gradient_loss | 0.0343 | -| std | 0.00584 | -| value_loss | 3.05e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.948 | -| time/ | | -| fps | 23 | -| iterations | 24804 | -| time_elapsed | 135027 | -| total_timesteps | 3174912 | -| train/ | | -| approx_kl | 0.17176493 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 248030 | -| policy_gradient_loss | 0.078 | -| std | 0.00584 | -| value_loss | 1.81e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24805 | -| time_elapsed | 135031 | -| total_timesteps | 3175040 | -| train/ | | -| approx_kl | 2.7649105e-05 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 6.84e-05 | -| n_updates | 248040 | -| policy_gradient_loss | 0.0111 | -| std | 0.00584 | -| value_loss | 8.19e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24806 | -| time_elapsed | 135038 | -| total_timesteps | 3175168 | -| train/ | | -| approx_kl | 0.016694494 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.88 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 248050 | -| policy_gradient_loss | -0.0107 | -| std | 0.00584 | -| value_loss | 0.00204 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24807 | -| time_elapsed | 135043 | -| total_timesteps | 3175296 | -| train/ | | -| approx_kl | 0.0015250142 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.549 | -| learning_rate | 0.0003 | -| loss | -0.0047 | -| n_updates | 248060 | -| policy_gradient_loss | 0.0365 | -| std | 0.00584 | -| value_loss | 1.33e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24808 | -| time_elapsed | 135048 | -| total_timesteps | 3175424 | -| train/ | | -| approx_kl | 0.21215066 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0967 | -| n_updates | 248070 | -| policy_gradient_loss | 0.0273 | -| std | 0.00584 | -| value_loss | 3.25e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24809 | -| time_elapsed | 135055 | -| total_timesteps | 3175552 | -| train/ | | -| approx_kl | 0.02664515 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 248080 | -| policy_gradient_loss | 0.0393 | -| std | 0.00584 | -| value_loss | 8.48e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24810 | -| time_elapsed | 135059 | -| total_timesteps | 3175680 | -| train/ | | -| approx_kl | 0.37807745 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 248090 | -| policy_gradient_loss | 0.15 | -| std | 0.00584 | -| value_loss | 4.99e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24811 | -| time_elapsed | 135064 | -| total_timesteps | 3175808 | -| train/ | | -| approx_kl | 0.178866 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 248100 | -| policy_gradient_loss | 0.141 | -| std | 0.00585 | -| value_loss | 3.32e-07 | --------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.949 | -| time/ | | -| fps | 23 | -| iterations | 24812 | -| time_elapsed | 135069 | -| total_timesteps | 3175936 | -| train/ | | -| approx_kl | 0.1544843 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 248110 | -| policy_gradient_loss | 0.145 | -| std | 0.00585 | -| value_loss | 2.03e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24813 | -| time_elapsed | 135074 | -| total_timesteps | 3176064 | -| train/ | | -| approx_kl | 0.13129987 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0402 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 248120 | -| policy_gradient_loss | 0.111 | -| std | 0.00585 | -| value_loss | 1.58e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24814 | -| time_elapsed | 135081 | -| total_timesteps | 3176192 | -| train/ | | -| approx_kl | 0.17921418 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 248130 | -| policy_gradient_loss | 0.0261 | -| std | 0.00585 | -| value_loss | 0.000431 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24815 | -| time_elapsed | 135087 | -| total_timesteps | 3176320 | -| train/ | | -| approx_kl | 0.040523462 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -4.07 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 248140 | -| policy_gradient_loss | 0.0141 | -| std | 0.00585 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24816 | -| time_elapsed | 135093 | -| total_timesteps | 3176448 | -| train/ | | -| approx_kl | 0.75306785 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -8.77 | -| learning_rate | 0.0003 | -| loss | 0.247 | -| n_updates | 248150 | -| policy_gradient_loss | 0.07 | -| std | 0.00585 | -| value_loss | 1.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24817 | -| time_elapsed | 135098 | -| total_timesteps | 3176576 | -| train/ | | -| approx_kl | 0.015224988 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.00492 | -| n_updates | 248160 | -| policy_gradient_loss | 0.012 | -| std | 0.00585 | -| value_loss | 2.25e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24818 | -| time_elapsed | 135103 | -| total_timesteps | 3176704 | -| train/ | | -| approx_kl | 0.074495584 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.516 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 248170 | -| policy_gradient_loss | 0.00608 | -| std | 0.00585 | -| value_loss | 1.16e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24819 | -| time_elapsed | 135107 | -| total_timesteps | 3176832 | -| train/ | | -| approx_kl | 0.047094688 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0996 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 248180 | -| policy_gradient_loss | 0.0156 | -| std | 0.00585 | -| value_loss | 6.65e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 24820 | -| time_elapsed | 135112 | -| total_timesteps | 3176960 | -| train/ | | -| approx_kl | 0.010672996 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.00299 | -| n_updates | 248190 | -| policy_gradient_loss | 0.0122 | -| std | 0.00584 | -| value_loss | 4.08e-11 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24821 | -| time_elapsed | 135116 | -| total_timesteps | 3177088 | -| train/ | | -| approx_kl | 0.0012114551 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0753 | -| learning_rate | 0.0003 | -| loss | 0.00198 | -| n_updates | 248200 | -| policy_gradient_loss | 0.011 | -| std | 0.00584 | -| value_loss | 3.85e-11 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24822 | -| time_elapsed | 135124 | -| total_timesteps | 3177216 | -| train/ | | -| approx_kl | 0.11265187 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.97 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 248210 | -| policy_gradient_loss | 0.00351 | -| std | 0.00584 | -| value_loss | 0.000161 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24823 | -| time_elapsed | 135129 | -| total_timesteps | 3177344 | -| train/ | | -| approx_kl | 0.007417961 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0984 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 248220 | -| policy_gradient_loss | 0.0438 | -| std | 0.00584 | -| value_loss | 5.47e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24824 | -| time_elapsed | 135132 | -| total_timesteps | 3177472 | -| train/ | | -| approx_kl | 0.34395102 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0138 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 248230 | -| policy_gradient_loss | 0.205 | -| std | 0.00583 | -| value_loss | 5.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24825 | -| time_elapsed | 135137 | -| total_timesteps | 3177600 | -| train/ | | -| approx_kl | 0.27721518 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 248240 | -| policy_gradient_loss | 0.158 | -| std | 0.00583 | -| value_loss | 3.69e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24826 | -| time_elapsed | 135141 | -| total_timesteps | 3177728 | -| train/ | | -| approx_kl | 0.20641725 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.171 | -| n_updates | 248250 | -| policy_gradient_loss | 0.177 | -| std | 0.00584 | -| value_loss | 3.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24827 | -| time_elapsed | 135145 | -| total_timesteps | 3177856 | -| train/ | | -| approx_kl | 0.041161187 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.00818 | -| n_updates | 248260 | -| policy_gradient_loss | 0.0352 | -| std | 0.00584 | -| value_loss | 2.56e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.939 | -| time/ | | -| fps | 23 | -| iterations | 24828 | -| time_elapsed | 135150 | -| total_timesteps | 3177984 | -| train/ | | -| approx_kl | 0.20611897 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0994 | -| n_updates | 248270 | -| policy_gradient_loss | 0.0275 | -| std | 0.00583 | -| value_loss | 4.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24829 | -| time_elapsed | 135154 | -| total_timesteps | 3178112 | -| train/ | | -| approx_kl | 0.025594283 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | 0.00922 | -| n_updates | 248280 | -| policy_gradient_loss | 0.0309 | -| std | 0.00583 | -| value_loss | 1.87e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24830 | -| time_elapsed | 135163 | -| total_timesteps | 3178240 | -| train/ | | -| approx_kl | 0.9421634 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.841 | -| learning_rate | 0.0003 | -| loss | 0.0648 | -| n_updates | 248290 | -| policy_gradient_loss | 0.0727 | -| std | 0.00583 | -| value_loss | 0.000681 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24831 | -| time_elapsed | 135169 | -| total_timesteps | 3178368 | -| train/ | | -| approx_kl | 0.13429797 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.0627 | -| n_updates | 248300 | -| policy_gradient_loss | 0.0174 | -| std | 0.00584 | -| value_loss | 1.92e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24832 | -| time_elapsed | 135174 | -| total_timesteps | 3178496 | -| train/ | | -| approx_kl | 0.11605293 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0705 | -| n_updates | 248310 | -| policy_gradient_loss | 0.0369 | -| std | 0.00585 | -| value_loss | 1.71e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24833 | -| time_elapsed | 135177 | -| total_timesteps | 3178624 | -| train/ | | -| approx_kl | 0.0006664358 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00988 | -| learning_rate | 0.0003 | -| loss | 0.00154 | -| n_updates | 248320 | -| policy_gradient_loss | 0.0292 | -| std | 0.00587 | -| value_loss | 5.7e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24834 | -| time_elapsed | 135181 | -| total_timesteps | 3178752 | -| train/ | | -| approx_kl | 0.7795094 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00869 | -| learning_rate | 0.0003 | -| loss | 0.201 | -| n_updates | 248330 | -| policy_gradient_loss | 0.0722 | -| std | 0.00587 | -| value_loss | 4.1e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 24835 | -| time_elapsed | 135185 | -| total_timesteps | 3178880 | -| train/ | | -| approx_kl | 0.05609562 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.01 | -| learning_rate | 0.0003 | -| loss | 0.00807 | -| n_updates | 248340 | -| policy_gradient_loss | 0.00457 | -| std | 0.00587 | -| value_loss | 7.26e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24836 | -| time_elapsed | 135189 | -| total_timesteps | 3179008 | -| train/ | | -| approx_kl | 0.009499283 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.199 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 248350 | -| policy_gradient_loss | 0.00833 | -| std | 0.00587 | -| value_loss | 6.54e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24837 | -| time_elapsed | 135200 | -| total_timesteps | 3179136 | -| train/ | | -| approx_kl | 0.03565098 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 248360 | -| policy_gradient_loss | 0.0134 | -| std | 0.00587 | -| value_loss | 3.94e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24838 | -| time_elapsed | 135205 | -| total_timesteps | 3179264 | -| train/ | | -| approx_kl | 0.10990879 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.58 | -| learning_rate | 0.0003 | -| loss | 0.0664 | -| n_updates | 248370 | -| policy_gradient_loss | 0.0332 | -| std | 0.00587 | -| value_loss | 2.01e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24839 | -| time_elapsed | 135210 | -| total_timesteps | 3179392 | -| train/ | | -| approx_kl | 0.0525295 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00655 | -| learning_rate | 0.0003 | -| loss | 0.0214 | -| n_updates | 248380 | -| policy_gradient_loss | 0.0493 | -| std | 0.00587 | -| value_loss | 4.31e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24840 | -| time_elapsed | 135214 | -| total_timesteps | 3179520 | -| train/ | | -| approx_kl | 0.18299885 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00149 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 248390 | -| policy_gradient_loss | 0.0712 | -| std | 0.00587 | -| value_loss | 1.05e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24841 | -| time_elapsed | 135219 | -| total_timesteps | 3179648 | -| train/ | | -| approx_kl | 0.23563457 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 248400 | -| policy_gradient_loss | 0.04 | -| std | 0.00587 | -| value_loss | 6.71e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24842 | -| time_elapsed | 135223 | -| total_timesteps | 3179776 | -| train/ | | -| approx_kl | 0.0011408366 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.00487 | -| n_updates | 248410 | -| policy_gradient_loss | 0.0339 | -| std | 0.00587 | -| value_loss | 4.03e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24843 | -| time_elapsed | 135228 | -| total_timesteps | 3179904 | -| train/ | | -| approx_kl | 0.00012681913 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0397 | -| learning_rate | 0.0003 | -| loss | 0.00388 | -| n_updates | 248420 | -| policy_gradient_loss | -0.00259 | -| std | 0.00587 | -| value_loss | 8.96e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24844 | -| time_elapsed | 135233 | -| total_timesteps | 3180032 | -| train/ | | -| approx_kl | 0.21174257 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.315 | -| learning_rate | 0.0003 | -| loss | 0.0907 | -| n_updates | 248430 | -| policy_gradient_loss | 0.122 | -| std | 0.00587 | -| value_loss | 5.01e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24845 | -| time_elapsed | 135244 | -| total_timesteps | 3180160 | -| train/ | | -| approx_kl | 0.24485303 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.775 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 248440 | -| policy_gradient_loss | 0.16 | -| std | 0.00587 | -| value_loss | 0.00485 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24846 | -| time_elapsed | 135248 | -| total_timesteps | 3180288 | -| train/ | | -| approx_kl | 0.043294597 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.58 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 248450 | -| policy_gradient_loss | 0.0313 | -| std | 0.00587 | -| value_loss | 8.91e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24847 | -| time_elapsed | 135253 | -| total_timesteps | 3180416 | -| train/ | | -| approx_kl | 0.68668777 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0135 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 248460 | -| policy_gradient_loss | 0.0553 | -| std | 0.00587 | -| value_loss | 2.8e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24848 | -| time_elapsed | 135257 | -| total_timesteps | 3180544 | -| train/ | | -| approx_kl | 0.06603198 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.0236 | -| n_updates | 248470 | -| policy_gradient_loss | 0.0133 | -| std | 0.00587 | -| value_loss | 1.55e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24849 | -| time_elapsed | 135263 | -| total_timesteps | 3180672 | -| train/ | | -| approx_kl | 0.010356588 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -0.00587 | -| n_updates | 248480 | -| policy_gradient_loss | 0.00929 | -| std | 0.00587 | -| value_loss | 1.06e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24850 | -| time_elapsed | 135268 | -| total_timesteps | 3180800 | -| train/ | | -| approx_kl | 0.09498612 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | -0.00705 | -| n_updates | 248490 | -| policy_gradient_loss | 0.0158 | -| std | 0.00588 | -| value_loss | 7.65e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24851 | -| time_elapsed | 135273 | -| total_timesteps | 3180928 | -| train/ | | -| approx_kl | 0.9594874 | -| clip_fraction | 0.759 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.311 | -| n_updates | 248500 | -| policy_gradient_loss | 0.188 | -| std | 0.00587 | -| value_loss | 1.22e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24852 | -| time_elapsed | 135277 | -| total_timesteps | 3181056 | -| train/ | | -| approx_kl | 0.006444126 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.179 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 248510 | -| policy_gradient_loss | 0.025 | -| std | 0.00587 | -| value_loss | 1.58e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24853 | -| time_elapsed | 135286 | -| total_timesteps | 3181184 | -| train/ | | -| approx_kl | 0.05649484 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.891 | -| learning_rate | 0.0003 | -| loss | -0.0237 | -| n_updates | 248520 | -| policy_gradient_loss | -0.0153 | -| std | 0.00587 | -| value_loss | 0.000472 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24854 | -| time_elapsed | 135291 | -| total_timesteps | 3181312 | -| train/ | | -| approx_kl | 0.083208084 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.559 | -| learning_rate | 0.0003 | -| loss | 0.0576 | -| n_updates | 248530 | -| policy_gradient_loss | 0.0399 | -| std | 0.00588 | -| value_loss | 1.31e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24855 | -| time_elapsed | 135296 | -| total_timesteps | 3181440 | -| train/ | | -| approx_kl | 0.20416556 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.488 | -| learning_rate | 0.0003 | -| loss | 0.0565 | -| n_updates | 248540 | -| policy_gradient_loss | 0.024 | -| std | 0.00588 | -| value_loss | 5.71e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24856 | -| time_elapsed | 135299 | -| total_timesteps | 3181568 | -| train/ | | -| approx_kl | 0.033244662 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0796 | -| learning_rate | 0.0003 | -| loss | 0.000152 | -| n_updates | 248550 | -| policy_gradient_loss | 0.0376 | -| std | 0.00588 | -| value_loss | 3.82e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24857 | -| time_elapsed | 135303 | -| total_timesteps | 3181696 | -| train/ | | -| approx_kl | 0.37732562 | -| clip_fraction | 0.75 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 248560 | -| policy_gradient_loss | 0.202 | -| std | 0.00588 | -| value_loss | 9.99e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24858 | -| time_elapsed | 135308 | -| total_timesteps | 3181824 | -| train/ | | -| approx_kl | 0.05964205 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.277 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 248570 | -| policy_gradient_loss | 0.0271 | -| std | 0.00588 | -| value_loss | 8.76e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 24859 | -| time_elapsed | 135312 | -| total_timesteps | 3181952 | -| train/ | | -| approx_kl | 0.0015814216 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0891 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 248580 | -| policy_gradient_loss | 0.0299 | -| std | 0.00588 | -| value_loss | 3.71e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24860 | -| time_elapsed | 135316 | -| total_timesteps | 3182080 | -| train/ | | -| approx_kl | 0.0007535503 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 248590 | -| policy_gradient_loss | 0.0326 | -| std | 0.00588 | -| value_loss | 2.14e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24861 | -| time_elapsed | 135323 | -| total_timesteps | 3182208 | -| train/ | | -| approx_kl | 0.020358663 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | 0.00554 | -| n_updates | 248600 | -| policy_gradient_loss | -0.00252 | -| std | 0.00588 | -| value_loss | 0.00429 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24862 | -| time_elapsed | 135326 | -| total_timesteps | 3182336 | -| train/ | | -| approx_kl | 0.092746854 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.208 | -| learning_rate | 0.0003 | -| loss | 0.0614 | -| n_updates | 248610 | -| policy_gradient_loss | 0.0276 | -| std | 0.00588 | -| value_loss | 5.26e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24863 | -| time_elapsed | 135330 | -| total_timesteps | 3182464 | -| train/ | | -| approx_kl | 0.052465845 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00379 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 248620 | -| policy_gradient_loss | 0.0167 | -| std | 0.00588 | -| value_loss | 2.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24864 | -| time_elapsed | 135335 | -| total_timesteps | 3182592 | -| train/ | | -| approx_kl | 0.062732324 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 248630 | -| policy_gradient_loss | 0.0102 | -| std | 0.00588 | -| value_loss | 2.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24865 | -| time_elapsed | 135339 | -| total_timesteps | 3182720 | -| train/ | | -| approx_kl | 0.010516904 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00269 | -| learning_rate | 0.0003 | -| loss | -0.00943 | -| n_updates | 248640 | -| policy_gradient_loss | 0.00619 | -| std | 0.00588 | -| value_loss | 6.77e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24866 | -| time_elapsed | 135344 | -| total_timesteps | 3182848 | -| train/ | | -| approx_kl | 0.0004502721 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | 0.000602 | -| n_updates | 248650 | -| policy_gradient_loss | 0.044 | -| std | 0.00587 | -| value_loss | 3.88e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24867 | -| time_elapsed | 135349 | -| total_timesteps | 3182976 | -| train/ | | -| approx_kl | 0.23163714 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.146 | -| n_updates | 248660 | -| policy_gradient_loss | 0.0737 | -| std | 0.00587 | -| value_loss | 3.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24868 | -| time_elapsed | 135353 | -| total_timesteps | 3183104 | -| train/ | | -| approx_kl | 0.01708877 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0387 | -| n_updates | 248670 | -| policy_gradient_loss | 0.00276 | -| std | 0.00587 | -| value_loss | 2.66e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24869 | -| time_elapsed | 135363 | -| total_timesteps | 3183232 | -| train/ | | -| approx_kl | 0.0023498656 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 248680 | -| policy_gradient_loss | 0.0151 | -| std | 0.00587 | -| value_loss | 0.00172 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24870 | -| time_elapsed | 135369 | -| total_timesteps | 3183360 | -| train/ | | -| approx_kl | 0.00940221 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | 0.00759 | -| n_updates | 248690 | -| policy_gradient_loss | 0.0119 | -| std | 0.00587 | -| value_loss | 8.95e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24871 | -| time_elapsed | 135374 | -| total_timesteps | 3183488 | -| train/ | | -| approx_kl | 0.0920683 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.0572 | -| n_updates | 248700 | -| policy_gradient_loss | 0.0247 | -| std | 0.00587 | -| value_loss | 3.05e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24872 | -| time_elapsed | 135377 | -| total_timesteps | 3183616 | -| train/ | | -| approx_kl | 0.06239048 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | 0.0473 | -| n_updates | 248710 | -| policy_gradient_loss | 0.0238 | -| std | 0.00587 | -| value_loss | 3.16e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24873 | -| time_elapsed | 135383 | -| total_timesteps | 3183744 | -| train/ | | -| approx_kl | 0.07259681 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 248720 | -| policy_gradient_loss | 0.0104 | -| std | 0.00587 | -| value_loss | 9.84e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24874 | -| time_elapsed | 135388 | -| total_timesteps | 3183872 | -| train/ | | -| approx_kl | 0.011495743 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 248730 | -| policy_gradient_loss | 0.00916 | -| std | 0.00587 | -| value_loss | 1.53e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24875 | -| time_elapsed | 135393 | -| total_timesteps | 3184000 | -| train/ | | -| approx_kl | 0.082997106 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.0464 | -| n_updates | 248740 | -| policy_gradient_loss | 0.0188 | -| std | 0.00587 | -| value_loss | 9.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24876 | -| time_elapsed | 135397 | -| total_timesteps | 3184128 | -| train/ | | -| approx_kl | 0.048244312 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00655 | -| learning_rate | 0.0003 | -| loss | 0.00662 | -| n_updates | 248750 | -| policy_gradient_loss | 0.00437 | -| std | 0.00586 | -| value_loss | 5.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24877 | -| time_elapsed | 135408 | -| total_timesteps | 3184256 | -| train/ | | -| approx_kl | 0.030433469 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.00207 | -| n_updates | 248760 | -| policy_gradient_loss | 0.00239 | -| std | 0.00586 | -| value_loss | 2.54e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24878 | -| time_elapsed | 135413 | -| total_timesteps | 3184384 | -| train/ | | -| approx_kl | 0.011719389 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00345 | -| learning_rate | 0.0003 | -| loss | 0.00194 | -| n_updates | 248770 | -| policy_gradient_loss | 0.0124 | -| std | 0.00586 | -| value_loss | 7.68e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24879 | -| time_elapsed | 135419 | -| total_timesteps | 3184512 | -| train/ | | -| approx_kl | 0.0015475643 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00929 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 248780 | -| policy_gradient_loss | 0.00385 | -| std | 0.00586 | -| value_loss | 3.48e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24880 | -| time_elapsed | 135424 | -| total_timesteps | 3184640 | -| train/ | | -| approx_kl | 0.06731728 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0309 | -| learning_rate | 0.0003 | -| loss | 0.0398 | -| n_updates | 248790 | -| policy_gradient_loss | 0.0177 | -| std | 0.00586 | -| value_loss | 1.99e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24881 | -| time_elapsed | 135428 | -| total_timesteps | 3184768 | -| train/ | | -| approx_kl | 0.062801205 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 248800 | -| policy_gradient_loss | 0.0124 | -| std | 0.00586 | -| value_loss | 1.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24882 | -| time_elapsed | 135433 | -| total_timesteps | 3184896 | -| train/ | | -| approx_kl | 0.015734108 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | -0.00503 | -| n_updates | 248810 | -| policy_gradient_loss | 0.0167 | -| std | 0.00586 | -| value_loss | 1.04e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24883 | -| time_elapsed | 135437 | -| total_timesteps | 3185024 | -| train/ | | -| approx_kl | 0.0031200196 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 3.15e-05 | -| n_updates | 248820 | -| policy_gradient_loss | 0.0151 | -| std | 0.00587 | -| value_loss | 6.34e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24884 | -| time_elapsed | 135448 | -| total_timesteps | 3185152 | -| train/ | | -| approx_kl | 0.23408931 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.532 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 248830 | -| policy_gradient_loss | 0.0235 | -| std | 0.00587 | -| value_loss | 0.0219 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24885 | -| time_elapsed | 135452 | -| total_timesteps | 3185280 | -| train/ | | -| approx_kl | 0.00022877334 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.828 | -| learning_rate | 0.0003 | -| loss | 0.00016 | -| n_updates | 248840 | -| policy_gradient_loss | 0.0333 | -| std | 0.00587 | -| value_loss | 0.000384 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24886 | -| time_elapsed | 135455 | -| total_timesteps | 3185408 | -| train/ | | -| approx_kl | 0.712837 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0152 | -| learning_rate | 0.0003 | -| loss | 0.23 | -| n_updates | 248850 | -| policy_gradient_loss | 0.0708 | -| std | 0.00587 | -| value_loss | 0.000207 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24887 | -| time_elapsed | 135460 | -| total_timesteps | 3185536 | -| train/ | | -| approx_kl | 0.058740236 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.587 | -| learning_rate | 0.0003 | -| loss | -0.00989 | -| n_updates | 248860 | -| policy_gradient_loss | -0.00363 | -| std | 0.00587 | -| value_loss | 7.11e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24888 | -| time_elapsed | 135463 | -| total_timesteps | 3185664 | -| train/ | | -| approx_kl | 0.07854095 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.0523 | -| n_updates | 248870 | -| policy_gradient_loss | 0.0248 | -| std | 0.00587 | -| value_loss | 4.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24889 | -| time_elapsed | 135468 | -| total_timesteps | 3185792 | -| train/ | | -| approx_kl | 0.013862626 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 248880 | -| policy_gradient_loss | 0.0133 | -| std | 0.00588 | -| value_loss | 2.97e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24890 | -| time_elapsed | 135471 | -| total_timesteps | 3185920 | -| train/ | | -| approx_kl | 0.086561546 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 248890 | -| policy_gradient_loss | -0.0122 | -| std | 0.00588 | -| value_loss | 2.42e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24891 | -| time_elapsed | 135476 | -| total_timesteps | 3186048 | -| train/ | | -| approx_kl | 0.014056449 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | -0.0212 | -| n_updates | 248900 | -| policy_gradient_loss | 0.00161 | -| std | 0.00588 | -| value_loss | 1.7e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24892 | -| time_elapsed | 135482 | -| total_timesteps | 3186176 | -| train/ | | -| approx_kl | 0.04757692 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.134 | -| learning_rate | 0.0003 | -| loss | -0.0292 | -| n_updates | 248910 | -| policy_gradient_loss | -0.0106 | -| std | 0.00588 | -| value_loss | 0.00196 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24893 | -| time_elapsed | 135488 | -| total_timesteps | 3186304 | -| train/ | | -| approx_kl | 0.181748 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -6.94 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 248920 | -| policy_gradient_loss | 0.0487 | -| std | 0.00588 | -| value_loss | 1.66e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24894 | -| time_elapsed | 135493 | -| total_timesteps | 3186432 | -| train/ | | -| approx_kl | 0.010531584 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 248930 | -| policy_gradient_loss | 0.0141 | -| std | 0.00588 | -| value_loss | 7e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24895 | -| time_elapsed | 135499 | -| total_timesteps | 3186560 | -| train/ | | -| approx_kl | 0.0041831695 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00876 | -| learning_rate | 0.0003 | -| loss | -0.00598 | -| n_updates | 248940 | -| policy_gradient_loss | 0.00705 | -| std | 0.00588 | -| value_loss | 3.84e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24896 | -| time_elapsed | 135505 | -| total_timesteps | 3186688 | -| train/ | | -| approx_kl | 0.0021592937 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0227 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 248950 | -| policy_gradient_loss | 0.00267 | -| std | 0.00588 | -| value_loss | 1.15e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24897 | -| time_elapsed | 135509 | -| total_timesteps | 3186816 | -| train/ | | -| approx_kl | 0.006064369 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00754 | -| learning_rate | 0.0003 | -| loss | -0.00502 | -| n_updates | 248960 | -| policy_gradient_loss | 0.0103 | -| std | 0.00588 | -| value_loss | 2.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 24898 | -| time_elapsed | 135514 | -| total_timesteps | 3186944 | -| train/ | | -| approx_kl | 0.049152628 | -| clip_fraction | 0.648 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 248970 | -| policy_gradient_loss | 0.131 | -| std | 0.00588 | -| value_loss | 2.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24899 | -| time_elapsed | 135517 | -| total_timesteps | 3187072 | -| train/ | | -| approx_kl | 0.10388992 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | 0.0821 | -| n_updates | 248980 | -| policy_gradient_loss | 0.0877 | -| std | 0.00588 | -| value_loss | 1.33e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24900 | -| time_elapsed | 135526 | -| total_timesteps | 3187200 | -| train/ | | -| approx_kl | 0.0023330958 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.973 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 248990 | -| policy_gradient_loss | 0.0182 | -| std | 0.00588 | -| value_loss | 0.000319 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24901 | -| time_elapsed | 135530 | -| total_timesteps | 3187328 | -| train/ | | -| approx_kl | 0.017544076 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.964 | -| learning_rate | 0.0003 | -| loss | 0.0022 | -| n_updates | 249000 | -| policy_gradient_loss | 0.0267 | -| std | 0.00588 | -| value_loss | 4.91e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24902 | -| time_elapsed | 135536 | -| total_timesteps | 3187456 | -| train/ | | -| approx_kl | 0.2034537 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | 0.0664 | -| n_updates | 249010 | -| policy_gradient_loss | 0.0354 | -| std | 0.00588 | -| value_loss | 1.11e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24903 | -| time_elapsed | 135541 | -| total_timesteps | 3187584 | -| train/ | | -| approx_kl | 0.08371658 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.512 | -| learning_rate | 0.0003 | -| loss | 0.0445 | -| n_updates | 249020 | -| policy_gradient_loss | 0.0724 | -| std | 0.00588 | -| value_loss | 4.21e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24904 | -| time_elapsed | 135548 | -| total_timesteps | 3187712 | -| train/ | | -| approx_kl | 0.24056828 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 249030 | -| policy_gradient_loss | 0.0524 | -| std | 0.00587 | -| value_loss | 1.96e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24905 | -| time_elapsed | 135553 | -| total_timesteps | 3187840 | -| train/ | | -| approx_kl | 0.0039737984 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 249040 | -| policy_gradient_loss | 0.0196 | -| std | 0.00587 | -| value_loss | 1.1e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.924 | -| time/ | | -| fps | 23 | -| iterations | 24906 | -| time_elapsed | 135557 | -| total_timesteps | 3187968 | -| train/ | | -| approx_kl | 0.026169822 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.0252 | -| n_updates | 249050 | -| policy_gradient_loss | 0.106 | -| std | 0.00587 | -| value_loss | 1.12e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24907 | -| time_elapsed | 135561 | -| total_timesteps | 3188096 | -| train/ | | -| approx_kl | 0.095812246 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0236 | -| learning_rate | 0.0003 | -| loss | 0.0702 | -| n_updates | 249060 | -| policy_gradient_loss | 0.0339 | -| std | 0.00587 | -| value_loss | 5.76e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24908 | -| time_elapsed | 135571 | -| total_timesteps | 3188224 | -| train/ | | -| approx_kl | 0.042285163 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | 0.000983 | -| n_updates | 249070 | -| policy_gradient_loss | 0.0249 | -| std | 0.00587 | -| value_loss | 0.00461 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24909 | -| time_elapsed | 135576 | -| total_timesteps | 3188352 | -| train/ | | -| approx_kl | 0.1653095 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 249080 | -| policy_gradient_loss | 0.0585 | -| std | 0.00588 | -| value_loss | 1.55e-05 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24910 | -| time_elapsed | 135582 | -| total_timesteps | 3188480 | -| train/ | | -| approx_kl | 0.036621 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00954 | -| learning_rate | 0.0003 | -| loss | 0.0297 | -| n_updates | 249090 | -| policy_gradient_loss | 0.0229 | -| std | 0.00589 | -| value_loss | 2.18e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24911 | -| time_elapsed | 135587 | -| total_timesteps | 3188608 | -| train/ | | -| approx_kl | 0.026492814 | -| clip_fraction | 0.611 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.00472 | -| n_updates | 249100 | -| policy_gradient_loss | 0.0704 | -| std | 0.0059 | -| value_loss | 2.3e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24912 | -| time_elapsed | 135593 | -| total_timesteps | 3188736 | -| train/ | | -| approx_kl | 0.016748019 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00323 | -| n_updates | 249110 | -| policy_gradient_loss | 0.022 | -| std | 0.0059 | -| value_loss | 3.18e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24913 | -| time_elapsed | 135598 | -| total_timesteps | 3188864 | -| train/ | | -| approx_kl | 0.21789113 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.091 | -| n_updates | 249120 | -| policy_gradient_loss | 0.017 | -| std | 0.0059 | -| value_loss | 1.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 24914 | -| time_elapsed | 135602 | -| total_timesteps | 3188992 | -| train/ | | -| approx_kl | 0.007920494 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.0007 | -| n_updates | 249130 | -| policy_gradient_loss | 0.0307 | -| std | 0.00591 | -| value_loss | 9.21e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24915 | -| time_elapsed | 135607 | -| total_timesteps | 3189120 | -| train/ | | -| approx_kl | 0.027155992 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00413 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 249140 | -| policy_gradient_loss | 0.00407 | -| std | 0.00592 | -| value_loss | 2.61e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24916 | -| time_elapsed | 135618 | -| total_timesteps | 3189248 | -| train/ | | -| approx_kl | 0.3659448 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 249150 | -| policy_gradient_loss | 0.00193 | -| std | 0.00592 | -| value_loss | 7.39e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24917 | -| time_elapsed | 135623 | -| total_timesteps | 3189376 | -| train/ | | -| approx_kl | 0.03795889 | -| clip_fraction | 0.602 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.00755 | -| n_updates | 249160 | -| policy_gradient_loss | 0.0815 | -| std | 0.00592 | -| value_loss | 2.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24918 | -| time_elapsed | 135627 | -| total_timesteps | 3189504 | -| train/ | | -| approx_kl | 0.020726023 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00113 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 249170 | -| policy_gradient_loss | 0.0251 | -| std | 0.00592 | -| value_loss | 8.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24919 | -| time_elapsed | 135632 | -| total_timesteps | 3189632 | -| train/ | | -| approx_kl | 0.04871989 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 249180 | -| policy_gradient_loss | 0.0737 | -| std | 0.00591 | -| value_loss | 1.89e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24920 | -| time_elapsed | 135637 | -| total_timesteps | 3189760 | -| train/ | | -| approx_kl | 0.006805553 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0368 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 249190 | -| policy_gradient_loss | 0.106 | -| std | 0.00591 | -| value_loss | 9.21e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24921 | -| time_elapsed | 135641 | -| total_timesteps | 3189888 | -| train/ | | -| approx_kl | 0.009786007 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00938 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 249200 | -| policy_gradient_loss | 0.0236 | -| std | 0.0059 | -| value_loss | 9.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24922 | -| time_elapsed | 135645 | -| total_timesteps | 3190016 | -| train/ | | -| approx_kl | 0.051965795 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 249210 | -| policy_gradient_loss | 0.0783 | -| std | 0.0059 | -| value_loss | 4.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24923 | -| time_elapsed | 135658 | -| total_timesteps | 3190144 | -| train/ | | -| approx_kl | 0.024694083 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | 0.00906 | -| n_updates | 249220 | -| policy_gradient_loss | 0.087 | -| std | 0.00589 | -| value_loss | 0.00467 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24924 | -| time_elapsed | 135662 | -| total_timesteps | 3190272 | -| train/ | | -| approx_kl | 0.0061998568 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | -0.000533 | -| n_updates | 249230 | -| policy_gradient_loss | 0.0538 | -| std | 0.00588 | -| value_loss | 0.00125 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24925 | -| time_elapsed | 135667 | -| total_timesteps | 3190400 | -| train/ | | -| approx_kl | 0.19886152 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00875 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 249240 | -| policy_gradient_loss | 0.512 | -| std | 0.00588 | -| value_loss | 1.61e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24926 | -| time_elapsed | 135673 | -| total_timesteps | 3190528 | -| train/ | | -| approx_kl | 0.09024065 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.217 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 249250 | -| policy_gradient_loss | 0.0346 | -| std | 0.00588 | -| value_loss | 9.26e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24927 | -| time_elapsed | 135678 | -| total_timesteps | 3190656 | -| train/ | | -| approx_kl | 0.46548036 | -| clip_fraction | 0.758 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0846 | -| learning_rate | 0.0003 | -| loss | 0.244 | -| n_updates | 249260 | -| policy_gradient_loss | 0.171 | -| std | 0.00588 | -| value_loss | 7.43e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24928 | -| time_elapsed | 135683 | -| total_timesteps | 3190784 | -| train/ | | -| approx_kl | 0.077259414 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.0242 | -| n_updates | 249270 | -| policy_gradient_loss | 0.0301 | -| std | 0.00588 | -| value_loss | 5.85e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 24929 | -| time_elapsed | 135689 | -| total_timesteps | 3190912 | -| train/ | | -| approx_kl | 0.18464985 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.0935 | -| n_updates | 249280 | -| policy_gradient_loss | 0.0282 | -| std | 0.00588 | -| value_loss | 3.31e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24930 | -| time_elapsed | 135694 | -| total_timesteps | 3191040 | -| train/ | | -| approx_kl | 0.03307773 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0578 | -| learning_rate | 0.0003 | -| loss | -0.00233 | -| n_updates | 249290 | -| policy_gradient_loss | 0.0332 | -| std | 0.00588 | -| value_loss | 2.59e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24931 | -| time_elapsed | 135703 | -| total_timesteps | 3191168 | -| train/ | | -| approx_kl | 0.022159949 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0444 | -| learning_rate | 0.0003 | -| loss | -0.0178 | -| n_updates | 249300 | -| policy_gradient_loss | 0.00705 | -| std | 0.00588 | -| value_loss | 0.002 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24932 | -| time_elapsed | 135707 | -| total_timesteps | 3191296 | -| train/ | | -| approx_kl | 0.08263673 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.214 | -| learning_rate | 0.0003 | -| loss | 0.0779 | -| n_updates | 249310 | -| policy_gradient_loss | 0.0421 | -| std | 0.00589 | -| value_loss | 4.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24933 | -| time_elapsed | 135712 | -| total_timesteps | 3191424 | -| train/ | | -| approx_kl | 0.09118803 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.0643 | -| n_updates | 249320 | -| policy_gradient_loss | 0.0379 | -| std | 0.00587 | -| value_loss | 3.8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24934 | -| time_elapsed | 135716 | -| total_timesteps | 3191552 | -| train/ | | -| approx_kl | 0.43498737 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00453 | -| learning_rate | 0.0003 | -| loss | 0.253 | -| n_updates | 249330 | -| policy_gradient_loss | 0.0853 | -| std | 0.00585 | -| value_loss | 5.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24935 | -| time_elapsed | 135721 | -| total_timesteps | 3191680 | -| train/ | | -| approx_kl | 0.068126835 | -| clip_fraction | 0.636 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 249340 | -| policy_gradient_loss | 0.108 | -| std | 0.00585 | -| value_loss | 9.39e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24936 | -| time_elapsed | 135727 | -| total_timesteps | 3191808 | -| train/ | | -| approx_kl | 0.00049422076 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.00426 | -| n_updates | 249350 | -| policy_gradient_loss | 0.0896 | -| std | 0.00585 | -| value_loss | 1.85e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24937 | -| time_elapsed | 135732 | -| total_timesteps | 3191936 | -| train/ | | -| approx_kl | 0.14824165 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.537 | -| learning_rate | 0.0003 | -| loss | 0.0902 | -| n_updates | 249360 | -| policy_gradient_loss | 0.161 | -| std | 0.00585 | -| value_loss | 1.15e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24938 | -| time_elapsed | 135737 | -| total_timesteps | 3192064 | -| train/ | | -| approx_kl | 0.106747285 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.701 | -| learning_rate | 0.0003 | -| loss | 0.0496 | -| n_updates | 249370 | -| policy_gradient_loss | 0.0423 | -| std | 0.00585 | -| value_loss | 3.86e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24939 | -| time_elapsed | 135746 | -| total_timesteps | 3192192 | -| train/ | | -| approx_kl | 0.036077127 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.731 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 249380 | -| policy_gradient_loss | -0.00799 | -| std | 0.00585 | -| value_loss | 0.00092 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24940 | -| time_elapsed | 135751 | -| total_timesteps | 3192320 | -| train/ | | -| approx_kl | 0.03120436 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.884 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 249390 | -| policy_gradient_loss | 0.00726 | -| std | 0.00585 | -| value_loss | 7.31e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24941 | -| time_elapsed | 135756 | -| total_timesteps | 3192448 | -| train/ | | -| approx_kl | 0.028600633 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0148 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 249400 | -| policy_gradient_loss | 0.0757 | -| std | 0.00584 | -| value_loss | 2.38e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24942 | -| time_elapsed | 135761 | -| total_timesteps | 3192576 | -| train/ | | -| approx_kl | 0.34146836 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 249410 | -| policy_gradient_loss | 0.154 | -| std | 0.00584 | -| value_loss | 2.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24943 | -| time_elapsed | 135764 | -| total_timesteps | 3192704 | -| train/ | | -| approx_kl | 0.24756813 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0146 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 249420 | -| policy_gradient_loss | 0.161 | -| std | 0.00583 | -| value_loss | 5.11e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24944 | -| time_elapsed | 135769 | -| total_timesteps | 3192832 | -| train/ | | -| approx_kl | 0.18083616 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00697 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 249430 | -| policy_gradient_loss | 0.158 | -| std | 0.00584 | -| value_loss | 1.55e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 24945 | -| time_elapsed | 135773 | -| total_timesteps | 3192960 | -| train/ | | -| approx_kl | 0.12019884 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 249440 | -| policy_gradient_loss | 0.0957 | -| std | 0.00584 | -| value_loss | 1.17e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24946 | -| time_elapsed | 135776 | -| total_timesteps | 3193088 | -| train/ | | -| approx_kl | 0.1618233 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 249450 | -| policy_gradient_loss | 0.124 | -| std | 0.00584 | -| value_loss | 9.21e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24947 | -| time_elapsed | 135785 | -| total_timesteps | 3193216 | -| train/ | | -| approx_kl | 0.09547904 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.0201 | -| n_updates | 249460 | -| policy_gradient_loss | -0.0143 | -| std | 0.00584 | -| value_loss | 0.00098 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24948 | -| time_elapsed | 135788 | -| total_timesteps | 3193344 | -| train/ | | -| approx_kl | 0.02731555 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 249470 | -| policy_gradient_loss | 0.0185 | -| std | 0.00584 | -| value_loss | 1.16e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24949 | -| time_elapsed | 135793 | -| total_timesteps | 3193472 | -| train/ | | -| approx_kl | 0.18894987 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 249480 | -| policy_gradient_loss | 0.0322 | -| std | 0.00584 | -| value_loss | 7.93e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24950 | -| time_elapsed | 135797 | -| total_timesteps | 3193600 | -| train/ | | -| approx_kl | 0.0014332375 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0852 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 249490 | -| policy_gradient_loss | 0.00531 | -| std | 0.00583 | -| value_loss | 4.05e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24951 | -| time_elapsed | 135802 | -| total_timesteps | 3193728 | -| train/ | | -| approx_kl | 0.20561782 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0585 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 249500 | -| policy_gradient_loss | 0.138 | -| std | 0.00583 | -| value_loss | 2.52e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24952 | -| time_elapsed | 135807 | -| total_timesteps | 3193856 | -| train/ | | -| approx_kl | 0.04487109 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.0055 | -| n_updates | 249510 | -| policy_gradient_loss | 0.0318 | -| std | 0.00583 | -| value_loss | 2.23e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24953 | -| time_elapsed | 135812 | -| total_timesteps | 3193984 | -| train/ | | -| approx_kl | 0.0015913742 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.00125 | -| n_updates | 249520 | -| policy_gradient_loss | 0.0323 | -| std | 0.00584 | -| value_loss | 1.27e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24954 | -| time_elapsed | 135818 | -| total_timesteps | 3194112 | -| train/ | | -| approx_kl | 4.174048e-05 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | 6.29e-05 | -| n_updates | 249530 | -| policy_gradient_loss | 0.0275 | -| std | 0.00584 | -| value_loss | 2.69e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24955 | -| time_elapsed | 135830 | -| total_timesteps | 3194240 | -| train/ | | -| approx_kl | 0.072447404 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.218 | -| learning_rate | 0.0003 | -| loss | -0.0185 | -| n_updates | 249540 | -| policy_gradient_loss | -0.0133 | -| std | 0.00583 | -| value_loss | 0.00186 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24956 | -| time_elapsed | 135835 | -| total_timesteps | 3194368 | -| train/ | | -| approx_kl | 0.017796908 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0181 | -| learning_rate | 0.0003 | -| loss | 0.00122 | -| n_updates | 249550 | -| policy_gradient_loss | 0.0292 | -| std | 0.00583 | -| value_loss | 1.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24957 | -| time_elapsed | 135839 | -| total_timesteps | 3194496 | -| train/ | | -| approx_kl | 0.045314938 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0654 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 249560 | -| policy_gradient_loss | 0.0823 | -| std | 0.00583 | -| value_loss | 6.38e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24958 | -| time_elapsed | 135843 | -| total_timesteps | 3194624 | -| train/ | | -| approx_kl | 0.08103666 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 249570 | -| policy_gradient_loss | 0.00825 | -| std | 0.00582 | -| value_loss | 6.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24959 | -| time_elapsed | 135848 | -| total_timesteps | 3194752 | -| train/ | | -| approx_kl | 0.020547144 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | -0.000409 | -| n_updates | 249580 | -| policy_gradient_loss | 0.0854 | -| std | 0.00582 | -| value_loss | 2.56e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 24960 | -| time_elapsed | 135853 | -| total_timesteps | 3194880 | -| train/ | | -| approx_kl | 0.012283318 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.186 | -| learning_rate | 0.0003 | -| loss | -0.00758 | -| n_updates | 249590 | -| policy_gradient_loss | 0.0164 | -| std | 0.00582 | -| value_loss | 4.37e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24961 | -| time_elapsed | 135858 | -| total_timesteps | 3195008 | -| train/ | | -| approx_kl | 0.06392808 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.00327 | -| n_updates | 249600 | -| policy_gradient_loss | 0.0531 | -| std | 0.00582 | -| value_loss | 3.77e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24962 | -| time_elapsed | 135869 | -| total_timesteps | 3195136 | -| train/ | | -| approx_kl | 0.008576481 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.00501 | -| n_updates | 249610 | -| policy_gradient_loss | 0.00424 | -| std | 0.00582 | -| value_loss | 0.00389 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24963 | -| time_elapsed | 135873 | -| total_timesteps | 3195264 | -| train/ | | -| approx_kl | 0.5565692 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.489 | -| learning_rate | 0.0003 | -| loss | 0.184 | -| n_updates | 249620 | -| policy_gradient_loss | 0.111 | -| std | 0.00582 | -| value_loss | 4.22e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24964 | -| time_elapsed | 135876 | -| total_timesteps | 3195392 | -| train/ | | -| approx_kl | 0.1072908 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.0519 | -| n_updates | 249630 | -| policy_gradient_loss | 0.0389 | -| std | 0.00582 | -| value_loss | 1.02e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24965 | -| time_elapsed | 135881 | -| total_timesteps | 3195520 | -| train/ | | -| approx_kl | 0.1808497 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0229 | -| learning_rate | 0.0003 | -| loss | 0.0848 | -| n_updates | 249640 | -| policy_gradient_loss | 0.0277 | -| std | 0.00582 | -| value_loss | 4.91e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24966 | -| time_elapsed | 135886 | -| total_timesteps | 3195648 | -| train/ | | -| approx_kl | 0.03111092 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0537 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 249650 | -| policy_gradient_loss | 0.0378 | -| std | 0.00582 | -| value_loss | 3.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24967 | -| time_elapsed | 135893 | -| total_timesteps | 3195776 | -| train/ | | -| approx_kl | 0.15267174 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0875 | -| n_updates | 249660 | -| policy_gradient_loss | 0.0416 | -| std | 0.00582 | -| value_loss | 2.19e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.927 | -| time/ | | -| fps | 23 | -| iterations | 24968 | -| time_elapsed | 135898 | -| total_timesteps | 3195904 | -| train/ | | -| approx_kl | 0.63383836 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0663 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 249670 | -| policy_gradient_loss | 0.0495 | -| std | 0.00582 | -| value_loss | 5.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24969 | -| time_elapsed | 135903 | -| total_timesteps | 3196032 | -| train/ | | -| approx_kl | 0.016207334 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -4.33 | -| learning_rate | 0.0003 | -| loss | 0.000258 | -| n_updates | 249680 | -| policy_gradient_loss | 0.00282 | -| std | 0.00583 | -| value_loss | 1.5e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24970 | -| time_elapsed | 135915 | -| total_timesteps | 3196160 | -| train/ | | -| approx_kl | 0.01070212 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.92 | -| learning_rate | 0.0003 | -| loss | -0.0214 | -| n_updates | 249690 | -| policy_gradient_loss | -0.00822 | -| std | 0.00583 | -| value_loss | 0.000421 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24971 | -| time_elapsed | 135919 | -| total_timesteps | 3196288 | -| train/ | | -| approx_kl | 0.006376558 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | -0.00533 | -| n_updates | 249700 | -| policy_gradient_loss | 0.0396 | -| std | 0.00583 | -| value_loss | 1.63e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24972 | -| time_elapsed | 135924 | -| total_timesteps | 3196416 | -| train/ | | -| approx_kl | 0.65243405 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 249710 | -| policy_gradient_loss | 0.0675 | -| std | 0.00583 | -| value_loss | 7.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24973 | -| time_elapsed | 135929 | -| total_timesteps | 3196544 | -| train/ | | -| approx_kl | 0.011303354 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | -0.00132 | -| n_updates | 249720 | -| policy_gradient_loss | 0.0101 | -| std | 0.00583 | -| value_loss | 4.66e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24974 | -| time_elapsed | 135934 | -| total_timesteps | 3196672 | -| train/ | | -| approx_kl | 0.0016077454 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.00896 | -| n_updates | 249730 | -| policy_gradient_loss | 0.01 | -| std | 0.00583 | -| value_loss | 4.1e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24975 | -| time_elapsed | 135939 | -| total_timesteps | 3196800 | -| train/ | | -| approx_kl | 0.007730219 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | -0.00556 | -| n_updates | 249740 | -| policy_gradient_loss | 0.00958 | -| std | 0.00583 | -| value_loss | 2.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24976 | -| time_elapsed | 135945 | -| total_timesteps | 3196928 | -| train/ | | -| approx_kl | 0.08141766 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.0401 | -| n_updates | 249750 | -| policy_gradient_loss | 0.0162 | -| std | 0.00583 | -| value_loss | 1.6e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24977 | -| time_elapsed | 135949 | -| total_timesteps | 3197056 | -| train/ | | -| approx_kl | 0.047381006 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | 0.0326 | -| n_updates | 249760 | -| policy_gradient_loss | 0.017 | -| std | 0.00583 | -| value_loss | 9.92e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24978 | -| time_elapsed | 135957 | -| total_timesteps | 3197184 | -| train/ | | -| approx_kl | 0.02762893 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | -0.0175 | -| n_updates | 249770 | -| policy_gradient_loss | -0.00501 | -| std | 0.00583 | -| value_loss | 0.00116 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24979 | -| time_elapsed | 135963 | -| total_timesteps | 3197312 | -| train/ | | -| approx_kl | 0.21995331 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.106 | -| n_updates | 249780 | -| policy_gradient_loss | 0.0462 | -| std | 0.00583 | -| value_loss | 0.000122 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24980 | -| time_elapsed | 135967 | -| total_timesteps | 3197440 | -| train/ | | -| approx_kl | 0.06746577 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0135 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 249790 | -| policy_gradient_loss | 0.0821 | -| std | 0.00583 | -| value_loss | 1.29e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24981 | -| time_elapsed | 135971 | -| total_timesteps | 3197568 | -| train/ | | -| approx_kl | 0.0040603704 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 249800 | -| policy_gradient_loss | 0.114 | -| std | 0.00583 | -| value_loss | 8.96e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24982 | -| time_elapsed | 135975 | -| total_timesteps | 3197696 | -| train/ | | -| approx_kl | 0.010105077 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 249810 | -| policy_gradient_loss | 0.015 | -| std | 0.00582 | -| value_loss | 8.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24983 | -| time_elapsed | 135979 | -| total_timesteps | 3197824 | -| train/ | | -| approx_kl | 0.17718813 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 249820 | -| policy_gradient_loss | 0.0136 | -| std | 0.00582 | -| value_loss | 8.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 24984 | -| time_elapsed | 135984 | -| total_timesteps | 3197952 | -| train/ | | -| approx_kl | 0.006932652 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.202 | -| learning_rate | 0.0003 | -| loss | 0.00708 | -| n_updates | 249830 | -| policy_gradient_loss | 0.0192 | -| std | 0.00583 | -| value_loss | 2.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24985 | -| time_elapsed | 135987 | -| total_timesteps | 3198080 | -| train/ | | -| approx_kl | 0.026781753 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 249840 | -| policy_gradient_loss | 0.00383 | -| std | 0.00582 | -| value_loss | 9.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24986 | -| time_elapsed | 135996 | -| total_timesteps | 3198208 | -| train/ | | -| approx_kl | 0.007859452 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 249850 | -| policy_gradient_loss | -0.00787 | -| std | 0.00581 | -| value_loss | 0.000773 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24987 | -| time_elapsed | 136000 | -| total_timesteps | 3198336 | -| train/ | | -| approx_kl | 0.29450095 | -| clip_fraction | 0.744 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0159 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 249860 | -| policy_gradient_loss | 0.2 | -| std | 0.00581 | -| value_loss | 3.74e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24988 | -| time_elapsed | 136003 | -| total_timesteps | 3198464 | -| train/ | | -| approx_kl | 0.22118662 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 249870 | -| policy_gradient_loss | 0.147 | -| std | 0.0058 | -| value_loss | 2.09e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24989 | -| time_elapsed | 136008 | -| total_timesteps | 3198592 | -| train/ | | -| approx_kl | 0.21424434 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.00848 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 249880 | -| policy_gradient_loss | 0.181 | -| std | 0.0058 | -| value_loss | 1.4e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24990 | -| time_elapsed | 136011 | -| total_timesteps | 3198720 | -| train/ | | -| approx_kl | 0.18736413 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0228 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 249890 | -| policy_gradient_loss | 0.169 | -| std | 0.0058 | -| value_loss | 1.14e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24991 | -| time_elapsed | 136016 | -| total_timesteps | 3198848 | -| train/ | | -| approx_kl | 0.05346035 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 249900 | -| policy_gradient_loss | 0.0467 | -| std | 0.0058 | -| value_loss | 7.31e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 24992 | -| time_elapsed | 136020 | -| total_timesteps | 3198976 | -| train/ | | -| approx_kl | 0.0005923719 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.00215 | -| n_updates | 249910 | -| policy_gradient_loss | 0.0396 | -| std | 0.00581 | -| value_loss | 4.77e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24993 | -| time_elapsed | 136024 | -| total_timesteps | 3199104 | -| train/ | | -| approx_kl | 0.5592201 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 249920 | -| policy_gradient_loss | 0.065 | -| std | 0.00581 | -| value_loss | 3.61e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24994 | -| time_elapsed | 136034 | -| total_timesteps | 3199232 | -| train/ | | -| approx_kl | 0.015199197 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.738 | -| learning_rate | 0.0003 | -| loss | -0.00547 | -| n_updates | 249930 | -| policy_gradient_loss | 0.0046 | -| std | 0.00581 | -| value_loss | 0.00763 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24995 | -| time_elapsed | 136040 | -| total_timesteps | 3199360 | -| train/ | | -| approx_kl | 0.0035733706 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | -0.000971 | -| n_updates | 249940 | -| policy_gradient_loss | 0.0106 | -| std | 0.00581 | -| value_loss | 5.81e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24996 | -| time_elapsed | 136045 | -| total_timesteps | 3199488 | -| train/ | | -| approx_kl | 0.0004538591 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.667 | -| learning_rate | 0.0003 | -| loss | 0.00103 | -| n_updates | 249950 | -| policy_gradient_loss | 0.0311 | -| std | 0.00581 | -| value_loss | 0.00271 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24997 | -| time_elapsed | 136049 | -| total_timesteps | 3199616 | -| train/ | | -| approx_kl | 0.8964982 | -| clip_fraction | 0.784 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.554 | -| learning_rate | 0.0003 | -| loss | 0.345 | -| n_updates | 249960 | -| policy_gradient_loss | 0.201 | -| std | 0.00581 | -| value_loss | 3.63e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24998 | -| time_elapsed | 136054 | -| total_timesteps | 3199744 | -| train/ | | -| approx_kl | 0.031230746 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.00895 | -| n_updates | 249970 | -| policy_gradient_loss | 0.000739 | -| std | 0.00581 | -| value_loss | 2.52e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.935 | -| time/ | | -| fps | 23 | -| iterations | 24999 | -| time_elapsed | 136059 | -| total_timesteps | 3199872 | -| train/ | | -| approx_kl | 0.022173759 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.0134 | -| n_updates | 249980 | -| policy_gradient_loss | 0.00508 | -| std | 0.00581 | -| value_loss | 1.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25000 | -| time_elapsed | 136063 | -| total_timesteps | 3200000 | -| train/ | | -| approx_kl | 0.033655368 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 249990 | -| policy_gradient_loss | 0.0157 | -| std | 0.00581 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25001 | -| time_elapsed | 136069 | -| total_timesteps | 3200128 | -| train/ | | -| approx_kl | 0.30972633 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00479 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 250000 | -| policy_gradient_loss | 0.139 | -| std | 0.00581 | -| value_loss | 6.9e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25002 | -| time_elapsed | 136081 | -| total_timesteps | 3200256 | -| train/ | | -| approx_kl | 0.020295572 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.95 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 250010 | -| policy_gradient_loss | 0.0327 | -| std | 0.00581 | -| value_loss | 0.000787 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25003 | -| time_elapsed | 136085 | -| total_timesteps | 3200384 | -| train/ | | -| approx_kl | 0.10190813 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -74.5 | -| learning_rate | 0.0003 | -| loss | 0.0489 | -| n_updates | 250020 | -| policy_gradient_loss | 0.00853 | -| std | 0.00581 | -| value_loss | 4.35e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25004 | -| time_elapsed | 136090 | -| total_timesteps | 3200512 | -| train/ | | -| approx_kl | 0.5394929 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.614 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 250030 | -| policy_gradient_loss | 0.0583 | -| std | 0.00581 | -| value_loss | 5.59e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25005 | -| time_elapsed | 136095 | -| total_timesteps | 3200640 | -| train/ | | -| approx_kl | 0.08728359 | -| clip_fraction | 0.623 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 250040 | -| policy_gradient_loss | 0.0617 | -| std | 0.00581 | -| value_loss | 1.67e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25006 | -| time_elapsed | 136099 | -| total_timesteps | 3200768 | -| train/ | | -| approx_kl | 3.1700358e-05 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.000194 | -| n_updates | 250050 | -| policy_gradient_loss | 0.0915 | -| std | 0.00581 | -| value_loss | 1.07e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25007 | -| time_elapsed | 136104 | -| total_timesteps | 3200896 | -| train/ | | -| approx_kl | 0.1610049 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0549 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 250060 | -| policy_gradient_loss | 0.229 | -| std | 0.00582 | -| value_loss | 7.17e-09 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25008 | -| time_elapsed | 136109 | -| total_timesteps | 3201024 | -| train/ | | -| approx_kl | 0.0150358565 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 250070 | -| policy_gradient_loss | 0.0368 | -| std | 0.00582 | -| value_loss | 4.94e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25009 | -| time_elapsed | 136117 | -| total_timesteps | 3201152 | -| train/ | | -| approx_kl | 0.04898544 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -6.9 | -| learning_rate | 0.0003 | -| loss | -0.0292 | -| n_updates | 250080 | -| policy_gradient_loss | -0.0118 | -| std | 0.00582 | -| value_loss | 0.00501 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25010 | -| time_elapsed | 136121 | -| total_timesteps | 3201280 | -| train/ | | -| approx_kl | 0.003170509 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.446 | -| learning_rate | 0.0003 | -| loss | -0.00982 | -| n_updates | 250090 | -| policy_gradient_loss | 0.0288 | -| std | 0.00582 | -| value_loss | 9.17e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25011 | -| time_elapsed | 136126 | -| total_timesteps | 3201408 | -| train/ | | -| approx_kl | 0.7147991 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 250100 | -| policy_gradient_loss | 0.0705 | -| std | 0.00582 | -| value_loss | 1.1e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25012 | -| time_elapsed | 136131 | -| total_timesteps | 3201536 | -| train/ | | -| approx_kl | 0.07167375 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.00984 | -| learning_rate | 0.0003 | -| loss | 0.0483 | -| n_updates | 250110 | -| policy_gradient_loss | 0.0222 | -| std | 0.00582 | -| value_loss | 4.53e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25013 | -| time_elapsed | 136136 | -| total_timesteps | 3201664 | -| train/ | | -| approx_kl | 0.0099174585 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | -0.000368 | -| n_updates | 250120 | -| policy_gradient_loss | 0.0115 | -| std | 0.00582 | -| value_loss | 3.21e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25014 | -| time_elapsed | 136140 | -| total_timesteps | 3201792 | -| train/ | | -| approx_kl | 0.09802601 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 250130 | -| policy_gradient_loss | 0.000724 | -| std | 0.00582 | -| value_loss | 2.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25015 | -| time_elapsed | 136145 | -| total_timesteps | 3201920 | -| train/ | | -| approx_kl | 0.05046419 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 250140 | -| policy_gradient_loss | 0.00733 | -| std | 0.00582 | -| value_loss | 2.03e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25016 | -| time_elapsed | 136151 | -| total_timesteps | 3202048 | -| train/ | | -| approx_kl | 0.009304365 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | -0.0077 | -| n_updates | 250150 | -| policy_gradient_loss | 0.00842 | -| std | 0.00582 | -| value_loss | 1.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25017 | -| time_elapsed | 136160 | -| total_timesteps | 3202176 | -| train/ | | -| approx_kl | 0.029688554 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0848 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 250160 | -| policy_gradient_loss | 0.00673 | -| std | 0.00582 | -| value_loss | 0.0174 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25018 | -| time_elapsed | 136166 | -| total_timesteps | 3202304 | -| train/ | | -| approx_kl | 0.2523885 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.597 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 250170 | -| policy_gradient_loss | 0.0379 | -| std | 0.00582 | -| value_loss | 0.000239 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25019 | -| time_elapsed | 136171 | -| total_timesteps | 3202432 | -| train/ | | -| approx_kl | 0.20879674 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 250180 | -| policy_gradient_loss | 0.0338 | -| std | 0.00582 | -| value_loss | 2.91e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25020 | -| time_elapsed | 136176 | -| total_timesteps | 3202560 | -| train/ | | -| approx_kl | 0.023751091 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 250190 | -| policy_gradient_loss | 0.00684 | -| std | 0.00583 | -| value_loss | 6.52e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25021 | -| time_elapsed | 136181 | -| total_timesteps | 3202688 | -| train/ | | -| approx_kl | 0.008830309 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00118 | -| n_updates | 250200 | -| policy_gradient_loss | 0.00108 | -| std | 0.00582 | -| value_loss | 5.84e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25022 | -| time_elapsed | 136185 | -| total_timesteps | 3202816 | -| train/ | | -| approx_kl | 0.012292684 | -| clip_fraction | 0.104 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.00728 | -| learning_rate | 0.0003 | -| loss | 0.00578 | -| n_updates | 250210 | -| policy_gradient_loss | 0.00407 | -| std | 0.00582 | -| value_loss | 3.21e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25023 | -| time_elapsed | 136190 | -| total_timesteps | 3202944 | -| train/ | | -| approx_kl | 0.01380055 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0647 | -| learning_rate | 0.0003 | -| loss | -0.000398 | -| n_updates | 250220 | -| policy_gradient_loss | 0.000189 | -| std | 0.00582 | -| value_loss | 2.21e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25024 | -| time_elapsed | 136194 | -| total_timesteps | 3203072 | -| train/ | | -| approx_kl | 0.047028605 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.00655 | -| n_updates | 250230 | -| policy_gradient_loss | 0.0425 | -| std | 0.00582 | -| value_loss | 1.86e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25025 | -| time_elapsed | 136201 | -| total_timesteps | 3203200 | -| train/ | | -| approx_kl | 0.19277391 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.783 | -| learning_rate | 0.0003 | -| loss | 0.0501 | -| n_updates | 250240 | -| policy_gradient_loss | 0.019 | -| std | 0.00582 | -| value_loss | 0.00374 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25026 | -| time_elapsed | 136206 | -| total_timesteps | 3203328 | -| train/ | | -| approx_kl | 0.0066050817 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 250250 | -| policy_gradient_loss | 0.0393 | -| std | 0.00582 | -| value_loss | 3.96e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25027 | -| time_elapsed | 136211 | -| total_timesteps | 3203456 | -| train/ | | -| approx_kl | 0.33950782 | -| clip_fraction | 0.759 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00888 | -| learning_rate | 0.0003 | -| loss | 0.231 | -| n_updates | 250260 | -| policy_gradient_loss | 0.159 | -| std | 0.00581 | -| value_loss | 0.000142 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25028 | -| time_elapsed | 136217 | -| total_timesteps | 3203584 | -| train/ | | -| approx_kl | 0.06548557 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -32.4 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 250270 | -| policy_gradient_loss | 0.0179 | -| std | 0.00581 | -| value_loss | 1.19e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25029 | -| time_elapsed | 136222 | -| total_timesteps | 3203712 | -| train/ | | -| approx_kl | 0.7389818 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.312 | -| n_updates | 250280 | -| policy_gradient_loss | 0.0936 | -| std | 0.00581 | -| value_loss | 1.11e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25030 | -| time_elapsed | 136226 | -| total_timesteps | 3203840 | -| train/ | | -| approx_kl | 0.014859497 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0225 | -| learning_rate | 0.0003 | -| loss | -0.00197 | -| n_updates | 250290 | -| policy_gradient_loss | 0.0098 | -| std | 0.00581 | -| value_loss | 2.87e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 25031 | -| time_elapsed | 136230 | -| total_timesteps | 3203968 | -| train/ | | -| approx_kl | 0.0034558936 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00366 | -| n_updates | 250300 | -| policy_gradient_loss | 0.0104 | -| std | 0.00581 | -| value_loss | 1.8e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25032 | -| time_elapsed | 136234 | -| total_timesteps | 3204096 | -| train/ | | -| approx_kl | 0.049388595 | -| clip_fraction | 0.666 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0564 | -| learning_rate | 0.0003 | -| loss | 0.0321 | -| n_updates | 250310 | -| policy_gradient_loss | 0.102 | -| std | 0.00581 | -| value_loss | 1.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25033 | -| time_elapsed | 136242 | -| total_timesteps | 3204224 | -| train/ | | -| approx_kl | 0.063318014 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 250320 | -| policy_gradient_loss | 0.0356 | -| std | 0.00581 | -| value_loss | 0.0017 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25034 | -| time_elapsed | 136248 | -| total_timesteps | 3204352 | -| train/ | | -| approx_kl | 0.0014207796 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -1.75 | -| learning_rate | 0.0003 | -| loss | 0.00887 | -| n_updates | 250330 | -| policy_gradient_loss | 0.0082 | -| std | 0.00582 | -| value_loss | 1.6e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25035 | -| time_elapsed | 136253 | -| total_timesteps | 3204480 | -| train/ | | -| approx_kl | 0.0011815233 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.00778 | -| learning_rate | 0.0003 | -| loss | -0.00063 | -| n_updates | 250340 | -| policy_gradient_loss | 0.0119 | -| std | 0.00582 | -| value_loss | 7.47e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25036 | -| time_elapsed | 136258 | -| total_timesteps | 3204608 | -| train/ | | -| approx_kl | 0.12841281 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -1.15 | -| learning_rate | 0.0003 | -| loss | 0.0467 | -| n_updates | 250350 | -| policy_gradient_loss | 0.0134 | -| std | 0.00583 | -| value_loss | 1.19e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25037 | -| time_elapsed | 136263 | -| total_timesteps | 3204736 | -| train/ | | -| approx_kl | 0.3583191 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0121 | -| learning_rate | 0.0003 | -| loss | 0.229 | -| n_updates | 250360 | -| policy_gradient_loss | 0.0445 | -| std | 0.00583 | -| value_loss | 1.67e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25038 | -| time_elapsed | 136268 | -| total_timesteps | 3204864 | -| train/ | | -| approx_kl | 0.21471614 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 250370 | -| policy_gradient_loss | 0.0334 | -| std | 0.00583 | -| value_loss | 9.16e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 25039 | -| time_elapsed | 136274 | -| total_timesteps | 3204992 | -| train/ | | -| approx_kl | 0.03250643 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.211 | -| learning_rate | 0.0003 | -| loss | 0.00978 | -| n_updates | 250380 | -| policy_gradient_loss | 0.0362 | -| std | 0.00583 | -| value_loss | 2.37e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25040 | -| time_elapsed | 136280 | -| total_timesteps | 3205120 | -| train/ | | -| approx_kl | 0.35913116 | -| clip_fraction | 0.739 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.223 | -| n_updates | 250390 | -| policy_gradient_loss | 0.17 | -| std | 0.00583 | -| value_loss | 1.39e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25041 | -| time_elapsed | 136291 | -| total_timesteps | 3205248 | -| train/ | | -| approx_kl | 0.09442437 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 250400 | -| policy_gradient_loss | 0.0315 | -| std | 0.00583 | -| value_loss | 0.00204 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25042 | -| time_elapsed | 136295 | -| total_timesteps | 3205376 | -| train/ | | -| approx_kl | 0.19049433 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 250410 | -| policy_gradient_loss | 0.0301 | -| std | 0.00583 | -| value_loss | 1.63e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25043 | -| time_elapsed | 136299 | -| total_timesteps | 3205504 | -| train/ | | -| approx_kl | 0.017428363 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00447 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 250420 | -| policy_gradient_loss | -0.00662 | -| std | 0.00583 | -| value_loss | 2.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25044 | -| time_elapsed | 136304 | -| total_timesteps | 3205632 | -| train/ | | -| approx_kl | 0.014034085 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0214 | -| learning_rate | 0.0003 | -| loss | -0.00632 | -| n_updates | 250430 | -| policy_gradient_loss | -0.00318 | -| std | 0.00583 | -| value_loss | 1.08e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25045 | -| time_elapsed | 136310 | -| total_timesteps | 3205760 | -| train/ | | -| approx_kl | 0.019156033 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | 0.00955 | -| n_updates | 250440 | -| policy_gradient_loss | 0.00512 | -| std | 0.00584 | -| value_loss | 7.66e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25046 | -| time_elapsed | 136315 | -| total_timesteps | 3205888 | -| train/ | | -| approx_kl | 0.035854608 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 250450 | -| policy_gradient_loss | 0.0428 | -| std | 0.00585 | -| value_loss | 1.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25047 | -| time_elapsed | 136321 | -| total_timesteps | 3206016 | -| train/ | | -| approx_kl | 0.33538094 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00718 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 250460 | -| policy_gradient_loss | 0.132 | -| std | 0.00586 | -| value_loss | 4.8e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25048 | -| time_elapsed | 136333 | -| total_timesteps | 3206144 | -| train/ | | -| approx_kl | 0.025420595 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.866 | -| learning_rate | 0.0003 | -| loss | -0.00214 | -| n_updates | 250470 | -| policy_gradient_loss | 0.0128 | -| std | 0.00586 | -| value_loss | 0.00298 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25049 | -| time_elapsed | 136338 | -| total_timesteps | 3206272 | -| train/ | | -| approx_kl | 0.025923684 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00708 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 250480 | -| policy_gradient_loss | 0.026 | -| std | 0.00586 | -| value_loss | 5.9e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25050 | -| time_elapsed | 136343 | -| total_timesteps | 3206400 | -| train/ | | -| approx_kl | 0.19510305 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 250490 | -| policy_gradient_loss | 0.0636 | -| std | 0.00586 | -| value_loss | 2.01e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25051 | -| time_elapsed | 136347 | -| total_timesteps | 3206528 | -| train/ | | -| approx_kl | 0.012456803 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.00654 | -| n_updates | 250500 | -| policy_gradient_loss | 0.0148 | -| std | 0.00586 | -| value_loss | 4.67e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25052 | -| time_elapsed | 136352 | -| total_timesteps | 3206656 | -| train/ | | -| approx_kl | 0.08915302 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 250510 | -| policy_gradient_loss | 0.0135 | -| std | 0.00585 | -| value_loss | 0.00046 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25053 | -| time_elapsed | 136356 | -| total_timesteps | 3206784 | -| train/ | | -| approx_kl | 0.053630576 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0191 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 250520 | -| policy_gradient_loss | 0.0184 | -| std | 0.00585 | -| value_loss | 2.65e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.945 | -| time/ | | -| fps | 23 | -| iterations | 25054 | -| time_elapsed | 136361 | -| total_timesteps | 3206912 | -| train/ | | -| approx_kl | 0.0097862985 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | -0.00291 | -| n_updates | 250530 | -| policy_gradient_loss | 0.00907 | -| std | 0.00585 | -| value_loss | 2.11e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25055 | -| time_elapsed | 136365 | -| total_timesteps | 3207040 | -| train/ | | -| approx_kl | 0.08659033 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 250540 | -| policy_gradient_loss | 0.00941 | -| std | 0.00585 | -| value_loss | 1.57e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25056 | -| time_elapsed | 136374 | -| total_timesteps | 3207168 | -| train/ | | -| approx_kl | 0.01475174 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.794 | -| learning_rate | 0.0003 | -| loss | -0.0237 | -| n_updates | 250550 | -| policy_gradient_loss | -0.0159 | -| std | 0.00586 | -| value_loss | 0.00598 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25057 | -| time_elapsed | 136379 | -| total_timesteps | 3207296 | -| train/ | | -| approx_kl | 0.0010765754 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00201 | -| learning_rate | 0.0003 | -| loss | -0.000693 | -| n_updates | 250560 | -| policy_gradient_loss | 0.0173 | -| std | 0.00586 | -| value_loss | 1.24e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25058 | -| time_elapsed | 136384 | -| total_timesteps | 3207424 | -| train/ | | -| approx_kl | 0.20175897 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0663 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 250570 | -| policy_gradient_loss | 0.0339 | -| std | 0.00586 | -| value_loss | 7.97e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25059 | -| time_elapsed | 136388 | -| total_timesteps | 3207552 | -| train/ | | -| approx_kl | 0.95731133 | -| clip_fraction | 0.583 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.266 | -| n_updates | 250580 | -| policy_gradient_loss | 0.0815 | -| std | 0.00587 | -| value_loss | 3.02e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25060 | -| time_elapsed | 136392 | -| total_timesteps | 3207680 | -| train/ | | -| approx_kl | 0.011288509 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0856 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 250590 | -| policy_gradient_loss | 0.0047 | -| std | 0.00587 | -| value_loss | 2.51e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25061 | -| time_elapsed | 136397 | -| total_timesteps | 3207808 | -| train/ | | -| approx_kl | 0.09925208 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.0487 | -| n_updates | 250600 | -| policy_gradient_loss | 0.0204 | -| std | 0.00587 | -| value_loss | 1.51e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 25062 | -| time_elapsed | 136401 | -| total_timesteps | 3207936 | -| train/ | | -| approx_kl | 0.015885811 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0762 | -| learning_rate | 0.0003 | -| loss | -0.00747 | -| n_updates | 250610 | -| policy_gradient_loss | 0.00855 | -| std | 0.00587 | -| value_loss | 1.15e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25063 | -| time_elapsed | 136405 | -| total_timesteps | 3208064 | -| train/ | | -| approx_kl | 0.09790971 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.062 | -| n_updates | 250620 | -| policy_gradient_loss | 0.0268 | -| std | 0.00587 | -| value_loss | 7.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25064 | -| time_elapsed | 136415 | -| total_timesteps | 3208192 | -| train/ | | -| approx_kl | 0.07747021 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | -0.00573 | -| n_updates | 250630 | -| policy_gradient_loss | 0.00351 | -| std | 0.00587 | -| value_loss | 0.00206 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25065 | -| time_elapsed | 136419 | -| total_timesteps | 3208320 | -| train/ | | -| approx_kl | 0.005126978 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.00139 | -| n_updates | 250640 | -| policy_gradient_loss | 0.0129 | -| std | 0.00585 | -| value_loss | 9.44e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25066 | -| time_elapsed | 136423 | -| total_timesteps | 3208448 | -| train/ | | -| approx_kl | 0.052357487 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -3.55 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 250650 | -| policy_gradient_loss | 0.0169 | -| std | 0.00583 | -| value_loss | 2.86e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25067 | -| time_elapsed | 136427 | -| total_timesteps | 3208576 | -| train/ | | -| approx_kl | 1.0685073 | -| clip_fraction | 0.76 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -6.5 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 250660 | -| policy_gradient_loss | 0.113 | -| std | 0.00583 | -| value_loss | 6.75e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25068 | -| time_elapsed | 136431 | -| total_timesteps | 3208704 | -| train/ | | -| approx_kl | 9.366637e-05 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00488 | -| learning_rate | 0.0003 | -| loss | 0.000436 | -| n_updates | 250670 | -| policy_gradient_loss | 0.0257 | -| std | 0.00583 | -| value_loss | 5.87e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25069 | -| time_elapsed | 136434 | -| total_timesteps | 3208832 | -| train/ | | -| approx_kl | 0.096688956 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | 0.0231 | -| n_updates | 250680 | -| policy_gradient_loss | 0.0311 | -| std | 0.00583 | -| value_loss | 1.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25070 | -| time_elapsed | 136438 | -| total_timesteps | 3208960 | -| train/ | | -| approx_kl | 0.40264904 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.194 | -| n_updates | 250690 | -| policy_gradient_loss | 0.174 | -| std | 0.00583 | -| value_loss | 2.44e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25071 | -| time_elapsed | 136443 | -| total_timesteps | 3209088 | -| train/ | | -| approx_kl | 0.06572388 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00109 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 250700 | -| policy_gradient_loss | 0.0349 | -| std | 0.00583 | -| value_loss | 7.29e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25072 | -| time_elapsed | 136453 | -| total_timesteps | 3209216 | -| train/ | | -| approx_kl | 0.037251547 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.921 | -| learning_rate | 0.0003 | -| loss | -0.029 | -| n_updates | 250710 | -| policy_gradient_loss | -0.0207 | -| std | 0.00583 | -| value_loss | 0.000468 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25073 | -| time_elapsed | 136457 | -| total_timesteps | 3209344 | -| train/ | | -| approx_kl | 0.0070406883 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.00622 | -| n_updates | 250720 | -| policy_gradient_loss | 0.0125 | -| std | 0.00582 | -| value_loss | 4.51e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25074 | -| time_elapsed | 136462 | -| total_timesteps | 3209472 | -| train/ | | -| approx_kl | 0.0044252286 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0097 | -| learning_rate | 0.0003 | -| loss | -0.00713 | -| n_updates | 250730 | -| policy_gradient_loss | 0.00732 | -| std | 0.00582 | -| value_loss | 1.63e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25075 | -| time_elapsed | 136467 | -| total_timesteps | 3209600 | -| train/ | | -| approx_kl | 0.043097932 | -| clip_fraction | 0.651 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.334 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 250740 | -| policy_gradient_loss | 0.0797 | -| std | 0.00582 | -| value_loss | 2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25076 | -| time_elapsed | 136471 | -| total_timesteps | 3209728 | -| train/ | | -| approx_kl | 0.122876465 | -| clip_fraction | 0.675 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.758 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 250750 | -| policy_gradient_loss | 0.0955 | -| std | 0.00582 | -| value_loss | 9.79e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25077 | -| time_elapsed | 136475 | -| total_timesteps | 3209856 | -| train/ | | -| approx_kl | 0.022890951 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.00582 | -| n_updates | 250760 | -| policy_gradient_loss | 0.0302 | -| std | 0.00582 | -| value_loss | 4.29e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.961 | -| time/ | | -| fps | 23 | -| iterations | 25078 | -| time_elapsed | 136480 | -| total_timesteps | 3209984 | -| train/ | | -| approx_kl | 0.6964639 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 250770 | -| policy_gradient_loss | 0.0724 | -| std | 0.00582 | -| value_loss | 2.52e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25079 | -| time_elapsed | 136485 | -| total_timesteps | 3210112 | -| train/ | | -| approx_kl | 0.05462632 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.055 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 250780 | -| policy_gradient_loss | 0.0064 | -| std | 0.00582 | -| value_loss | 2.02e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25080 | -| time_elapsed | 136498 | -| total_timesteps | 3210240 | -| train/ | | -| approx_kl | 0.03522776 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.871 | -| learning_rate | 0.0003 | -| loss | -0.0263 | -| n_updates | 250790 | -| policy_gradient_loss | -0.0172 | -| std | 0.00582 | -| value_loss | 0.0031 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25081 | -| time_elapsed | 136503 | -| total_timesteps | 3210368 | -| train/ | | -| approx_kl | 0.09266539 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 250800 | -| policy_gradient_loss | 0.0116 | -| std | 0.00583 | -| value_loss | 2.38e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25082 | -| time_elapsed | 136508 | -| total_timesteps | 3210496 | -| train/ | | -| approx_kl | 0.013068565 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | -4.94e-05 | -| n_updates | 250810 | -| policy_gradient_loss | 0.00984 | -| std | 0.00583 | -| value_loss | 3.44e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25083 | -| time_elapsed | 136512 | -| total_timesteps | 3210624 | -| train/ | | -| approx_kl | 0.11123426 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0114 | -| learning_rate | 0.0003 | -| loss | 0.0743 | -| n_updates | 250820 | -| policy_gradient_loss | 0.0317 | -| std | 0.00582 | -| value_loss | 1.45e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25084 | -| time_elapsed | 136517 | -| total_timesteps | 3210752 | -| train/ | | -| approx_kl | 0.016117234 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.00945 | -| n_updates | 250830 | -| policy_gradient_loss | 0.0145 | -| std | 0.00582 | -| value_loss | 9.53e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.964 | -| time/ | | -| fps | 23 | -| iterations | 25085 | -| time_elapsed | 136521 | -| total_timesteps | 3210880 | -| train/ | | -| approx_kl | 0.0037242551 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.00638 | -| n_updates | 250840 | -| policy_gradient_loss | 0.0106 | -| std | 0.00582 | -| value_loss | 4.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25086 | -| time_elapsed | 136524 | -| total_timesteps | 3211008 | -| train/ | | -| approx_kl | 0.055134427 | -| clip_fraction | 0.657 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | 0.057 | -| n_updates | 250850 | -| policy_gradient_loss | 0.141 | -| std | 0.00582 | -| value_loss | 3.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25087 | -| time_elapsed | 136535 | -| total_timesteps | 3211136 | -| train/ | | -| approx_kl | 0.06779428 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.473 | -| learning_rate | 0.0003 | -| loss | -0.0251 | -| n_updates | 250860 | -| policy_gradient_loss | -0.0169 | -| std | 0.00582 | -| value_loss | 0.00293 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25088 | -| time_elapsed | 136540 | -| total_timesteps | 3211264 | -| train/ | | -| approx_kl | 0.002487096 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.717 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 250870 | -| policy_gradient_loss | 0.0081 | -| std | 0.00582 | -| value_loss | 2.55e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25089 | -| time_elapsed | 136544 | -| total_timesteps | 3211392 | -| train/ | | -| approx_kl | 0.16265935 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.00174 | -| n_updates | 250880 | -| policy_gradient_loss | -0.0147 | -| std | 0.00583 | -| value_loss | 4.21e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25090 | -| time_elapsed | 136550 | -| total_timesteps | 3211520 | -| train/ | | -| approx_kl | 0.0295422 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0677 | -| learning_rate | 0.0003 | -| loss | -0.00612 | -| n_updates | 250890 | -| policy_gradient_loss | 0.002 | -| std | 0.00583 | -| value_loss | 8.99e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25091 | -| time_elapsed | 136554 | -| total_timesteps | 3211648 | -| train/ | | -| approx_kl | 0.068883866 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.00687 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 250900 | -| policy_gradient_loss | 0.0164 | -| std | 0.00584 | -| value_loss | 3.29e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25092 | -| time_elapsed | 136559 | -| total_timesteps | 3211776 | -| train/ | | -| approx_kl | 0.057308227 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | 0.00624 | -| n_updates | 250910 | -| policy_gradient_loss | 0.00358 | -| std | 0.00585 | -| value_loss | 1.01e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 25093 | -| time_elapsed | 136563 | -| total_timesteps | 3211904 | -| train/ | | -| approx_kl | 0.009686114 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0061 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 250920 | -| policy_gradient_loss | 0.0116 | -| std | 0.00585 | -| value_loss | 2.4e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25094 | -| time_elapsed | 136568 | -| total_timesteps | 3212032 | -| train/ | | -| approx_kl | 0.0012311926 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 250930 | -| policy_gradient_loss | 0.00364 | -| std | 0.00585 | -| value_loss | 1.76e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25095 | -| time_elapsed | 136578 | -| total_timesteps | 3212160 | -| train/ | | -| approx_kl | 0.011424409 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.722 | -| learning_rate | 0.0003 | -| loss | -0.0238 | -| n_updates | 250940 | -| policy_gradient_loss | -0.0154 | -| std | 0.00585 | -| value_loss | 0.0011 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25096 | -| time_elapsed | 136583 | -| total_timesteps | 3212288 | -| train/ | | -| approx_kl | 0.0022802623 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.127 | -| learning_rate | 0.0003 | -| loss | -0.00724 | -| n_updates | 250950 | -| policy_gradient_loss | 0.037 | -| std | 0.00586 | -| value_loss | 2.39e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25097 | -| time_elapsed | 136587 | -| total_timesteps | 3212416 | -| train/ | | -| approx_kl | 1.0859994 | -| clip_fraction | 0.782 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00407 | -| learning_rate | 0.0003 | -| loss | 0.546 | -| n_updates | 250960 | -| policy_gradient_loss | 0.273 | -| std | 0.00586 | -| value_loss | 5.23e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25098 | -| time_elapsed | 136592 | -| total_timesteps | 3212544 | -| train/ | | -| approx_kl | 0.013714868 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00957 | -| n_updates | 250970 | -| policy_gradient_loss | 0.0229 | -| std | 0.00586 | -| value_loss | 3.93e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25099 | -| time_elapsed | 136597 | -| total_timesteps | 3212672 | -| train/ | | -| approx_kl | 0.3372076 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0223 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 250980 | -| policy_gradient_loss | 0.172 | -| std | 0.00586 | -| value_loss | 2.1e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25100 | -| time_elapsed | 136601 | -| total_timesteps | 3212800 | -| train/ | | -| approx_kl | 0.051661357 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | 0.0222 | -| n_updates | 250990 | -| policy_gradient_loss | 0.0305 | -| std | 0.00586 | -| value_loss | 1.87e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.96 | -| time/ | | -| fps | 23 | -| iterations | 25101 | -| time_elapsed | 136605 | -| total_timesteps | 3212928 | -| train/ | | -| approx_kl | 0.7605639 | -| clip_fraction | 0.519 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 251000 | -| policy_gradient_loss | 0.0485 | -| std | 0.00586 | -| value_loss | 1.46e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25102 | -| time_elapsed | 136611 | -| total_timesteps | 3213056 | -| train/ | | -| approx_kl | 0.042769317 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 251010 | -| policy_gradient_loss | 0.0121 | -| std | 0.00589 | -| value_loss | 9.37e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25103 | -| time_elapsed | 136617 | -| total_timesteps | 3213184 | -| train/ | | -| approx_kl | 0.12517682 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.987 | -| learning_rate | 0.0003 | -| loss | 0.0334 | -| n_updates | 251020 | -| policy_gradient_loss | 0.0182 | -| std | 0.0059 | -| value_loss | 0.000167 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25104 | -| time_elapsed | 136623 | -| total_timesteps | 3213312 | -| train/ | | -| approx_kl | 0.20305295 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.667 | -| learning_rate | 0.0003 | -| loss | 0.0527 | -| n_updates | 251030 | -| policy_gradient_loss | 0.0178 | -| std | 0.00591 | -| value_loss | 2.8e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25105 | -| time_elapsed | 136626 | -| total_timesteps | 3213440 | -| train/ | | -| approx_kl | 0.0016421182 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0144 | -| learning_rate | 0.0003 | -| loss | -0.00638 | -| n_updates | 251040 | -| policy_gradient_loss | 0.0303 | -| std | 0.0059 | -| value_loss | 2.62e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25106 | -| time_elapsed | 136631 | -| total_timesteps | 3213568 | -| train/ | | -| approx_kl | 0.053847585 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -13 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 251050 | -| policy_gradient_loss | -0.0105 | -| std | 0.0059 | -| value_loss | 4.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25107 | -| time_elapsed | 136635 | -| total_timesteps | 3213696 | -| train/ | | -| approx_kl | 0.13214229 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.71 | -| learning_rate | 0.0003 | -| loss | 0.0385 | -| n_updates | 251060 | -| policy_gradient_loss | 0.0737 | -| std | 0.00591 | -| value_loss | 5.36e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25108 | -| time_elapsed | 136640 | -| total_timesteps | 3213824 | -| train/ | | -| approx_kl | 0.17171253 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 251070 | -| policy_gradient_loss | 0.143 | -| std | 0.00591 | -| value_loss | 3.17e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25109 | -| time_elapsed | 136644 | -| total_timesteps | 3213952 | -| train/ | | -| approx_kl | 0.15464224 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 251080 | -| policy_gradient_loss | 0.128 | -| std | 0.00591 | -| value_loss | 2.32e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25110 | -| time_elapsed | 136649 | -| total_timesteps | 3214080 | -| train/ | | -| approx_kl | 0.029530682 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.00106 | -| n_updates | 251090 | -| policy_gradient_loss | 0.0241 | -| std | 0.00591 | -| value_loss | 1.74e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25111 | -| time_elapsed | 136657 | -| total_timesteps | 3214208 | -| train/ | | -| approx_kl | 0.62183845 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.683 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 251100 | -| policy_gradient_loss | 0.0562 | -| std | 0.00592 | -| value_loss | 0.0115 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25112 | -| time_elapsed | 136661 | -| total_timesteps | 3214336 | -| train/ | | -| approx_kl | 0.09659532 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.342 | -| learning_rate | 0.0003 | -| loss | 0.041 | -| n_updates | 251110 | -| policy_gradient_loss | 0.0159 | -| std | 0.00592 | -| value_loss | 9.61e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25113 | -| time_elapsed | 136666 | -| total_timesteps | 3214464 | -| train/ | | -| approx_kl | 0.038311668 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00149 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 251120 | -| policy_gradient_loss | 0.0123 | -| std | 0.00592 | -| value_loss | 7.45e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25114 | -| time_elapsed | 136670 | -| total_timesteps | 3214592 | -| train/ | | -| approx_kl | 0.06359212 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0841 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 251130 | -| policy_gradient_loss | 0.0152 | -| std | 0.00593 | -| value_loss | 4.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25115 | -| time_elapsed | 136674 | -| total_timesteps | 3214720 | -| train/ | | -| approx_kl | 0.012113143 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 251140 | -| policy_gradient_loss | 0.00999 | -| std | 0.00593 | -| value_loss | 3.22e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25116 | -| time_elapsed | 136679 | -| total_timesteps | 3214848 | -| train/ | | -| approx_kl | 0.0008050869 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.00416 | -| n_updates | 251150 | -| policy_gradient_loss | 0.00229 | -| std | 0.00593 | -| value_loss | 1.52e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25117 | -| time_elapsed | 136684 | -| total_timesteps | 3214976 | -| train/ | | -| approx_kl | 0.060050968 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0697 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 251160 | -| policy_gradient_loss | 0.0137 | -| std | 0.00593 | -| value_loss | 9.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25118 | -| time_elapsed | 136690 | -| total_timesteps | 3215104 | -| train/ | | -| approx_kl | 0.011715028 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.063 | -| learning_rate | 0.0003 | -| loss | -0.00087 | -| n_updates | 251170 | -| policy_gradient_loss | 0.0109 | -| std | 0.00593 | -| value_loss | 7.02e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25119 | -| time_elapsed | 136700 | -| total_timesteps | 3215232 | -| train/ | | -| approx_kl | 0.014321019 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.863 | -| learning_rate | 0.0003 | -| loss | -0.00664 | -| n_updates | 251180 | -| policy_gradient_loss | 5.7e-05 | -| std | 0.00593 | -| value_loss | 0.003 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25120 | -| time_elapsed | 136705 | -| total_timesteps | 3215360 | -| train/ | | -| approx_kl | 0.0016224054 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -6.74 | -| learning_rate | 0.0003 | -| loss | 0.00279 | -| n_updates | 251190 | -| policy_gradient_loss | 0.00976 | -| std | 0.00593 | -| value_loss | 4.39e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25121 | -| time_elapsed | 136710 | -| total_timesteps | 3215488 | -| train/ | | -| approx_kl | 0.07488039 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0692 | -| learning_rate | 0.0003 | -| loss | -0.0023 | -| n_updates | 251200 | -| policy_gradient_loss | -0.00331 | -| std | 0.00593 | -| value_loss | 1.46e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25122 | -| time_elapsed | 136715 | -| total_timesteps | 3215616 | -| train/ | | -| approx_kl | 0.009488817 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | -0.00618 | -| n_updates | 251210 | -| policy_gradient_loss | 0.00685 | -| std | 0.00593 | -| value_loss | 9.97e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25123 | -| time_elapsed | 136720 | -| total_timesteps | 3215744 | -| train/ | | -| approx_kl | 0.003783341 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.000195 | -| n_updates | 251220 | -| policy_gradient_loss | 0.0153 | -| std | 0.00593 | -| value_loss | 6.53e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25124 | -| time_elapsed | 136726 | -| total_timesteps | 3215872 | -| train/ | | -| approx_kl | 0.07945326 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.0399 | -| n_updates | 251230 | -| policy_gradient_loss | 0.0139 | -| std | 0.00592 | -| value_loss | 4.98e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25125 | -| time_elapsed | 136731 | -| total_timesteps | 3216000 | -| train/ | | -| approx_kl | 0.012818044 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.00613 | -| n_updates | 251240 | -| policy_gradient_loss | 0.0113 | -| std | 0.00592 | -| value_loss | 2.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25126 | -| time_elapsed | 136735 | -| total_timesteps | 3216128 | -| train/ | | -| approx_kl | 0.079202384 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00873 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 251250 | -| policy_gradient_loss | 0.00761 | -| std | 0.00592 | -| value_loss | 1.28e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25127 | -| time_elapsed | 136746 | -| total_timesteps | 3216256 | -| train/ | | -| approx_kl | 0.030524367 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.918 | -| learning_rate | 0.0003 | -| loss | -0.0255 | -| n_updates | 251260 | -| policy_gradient_loss | 0.00487 | -| std | 0.00592 | -| value_loss | 0.00143 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25128 | -| time_elapsed | 136752 | -| total_timesteps | 3216384 | -| train/ | | -| approx_kl | 0.23042402 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 251270 | -| policy_gradient_loss | 0.0684 | -| std | 0.00592 | -| value_loss | 3.1e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25129 | -| time_elapsed | 136757 | -| total_timesteps | 3216512 | -| train/ | | -| approx_kl | 0.24575236 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00442 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 251280 | -| policy_gradient_loss | 0.0397 | -| std | 0.00592 | -| value_loss | 1.78e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25130 | -| time_elapsed | 136761 | -| total_timesteps | 3216640 | -| train/ | | -| approx_kl | 0.19870564 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0633 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 251290 | -| policy_gradient_loss | 0.0249 | -| std | 0.00592 | -| value_loss | 5.26e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25131 | -| time_elapsed | 136766 | -| total_timesteps | 3216768 | -| train/ | | -| approx_kl | 0.031316213 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0016 | -| learning_rate | 0.0003 | -| loss | 0.00484 | -| n_updates | 251300 | -| policy_gradient_loss | 0.035 | -| std | 0.00592 | -| value_loss | 2.02e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.952 | -| time/ | | -| fps | 23 | -| iterations | 25132 | -| time_elapsed | 136770 | -| total_timesteps | 3216896 | -| train/ | | -| approx_kl | 6.2366016e-06 | -| clip_fraction | 0.0383 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.000406 | -| n_updates | 251310 | -| policy_gradient_loss | 0.00103 | -| std | 0.0059 | -| value_loss | 2.52e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25133 | -| time_elapsed | 136773 | -| total_timesteps | 3217024 | -| train/ | | -| approx_kl | 0.05108787 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0946 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 251320 | -| policy_gradient_loss | 0.0396 | -| std | 0.00589 | -| value_loss | 1.14e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25134 | -| time_elapsed | 136783 | -| total_timesteps | 3217152 | -| train/ | | -| approx_kl | 0.31676653 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.596 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 251330 | -| policy_gradient_loss | 0.135 | -| std | 0.00589 | -| value_loss | 0.0108 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25135 | -| time_elapsed | 136786 | -| total_timesteps | 3217280 | -| train/ | | -| approx_kl | 0.059548013 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 251340 | -| policy_gradient_loss | 0.022 | -| std | 0.00589 | -| value_loss | 9.08e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25136 | -| time_elapsed | 136789 | -| total_timesteps | 3217408 | -| train/ | | -| approx_kl | 0.17617033 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | 0.0663 | -| n_updates | 251350 | -| policy_gradient_loss | 0.0224 | -| std | 0.00589 | -| value_loss | 1.92e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25137 | -| time_elapsed | 136793 | -| total_timesteps | 3217536 | -| train/ | | -| approx_kl | 0.016526466 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.00164 | -| n_updates | 251360 | -| policy_gradient_loss | 0.000428 | -| std | 0.00589 | -| value_loss | 9.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25138 | -| time_elapsed | 136797 | -| total_timesteps | 3217664 | -| train/ | | -| approx_kl | 0.015787287 | -| clip_fraction | 0.12 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.00463 | -| n_updates | 251370 | -| policy_gradient_loss | 0.00211 | -| std | 0.00589 | -| value_loss | 5.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25139 | -| time_elapsed | 136803 | -| total_timesteps | 3217792 | -| train/ | | -| approx_kl | 0.028896037 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0891 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 251380 | -| policy_gradient_loss | 0.0363 | -| std | 0.00589 | -| value_loss | 3.82e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25140 | -| time_elapsed | 136807 | -| total_timesteps | 3217920 | -| train/ | | -| approx_kl | 0.34080082 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 251390 | -| policy_gradient_loss | 0.146 | -| std | 0.00589 | -| value_loss | 3.41e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25141 | -| time_elapsed | 136812 | -| total_timesteps | 3218048 | -| train/ | | -| approx_kl | 0.05754798 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0204 | -| n_updates | 251400 | -| policy_gradient_loss | 0.0241 | -| std | 0.00589 | -| value_loss | 2.26e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25142 | -| time_elapsed | 136819 | -| total_timesteps | 3218176 | -| train/ | | -| approx_kl | 0.01944313 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.86 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 251410 | -| policy_gradient_loss | -0.0105 | -| std | 0.00589 | -| value_loss | 0.00312 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25143 | -| time_elapsed | 136824 | -| total_timesteps | 3218304 | -| train/ | | -| approx_kl | 0.05753974 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00901 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 251420 | -| policy_gradient_loss | 0.0146 | -| std | 0.00589 | -| value_loss | 1.43e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25144 | -| time_elapsed | 136829 | -| total_timesteps | 3218432 | -| train/ | | -| approx_kl | 0.056203686 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0107 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 251430 | -| policy_gradient_loss | 0.0061 | -| std | 0.00588 | -| value_loss | 3.71e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25145 | -| time_elapsed | 136833 | -| total_timesteps | 3218560 | -| train/ | | -| approx_kl | 0.008195847 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 251440 | -| policy_gradient_loss | 0.00326 | -| std | 0.00588 | -| value_loss | 2.32e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25146 | -| time_elapsed | 136836 | -| total_timesteps | 3218688 | -| train/ | | -| approx_kl | 0.09314411 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.0516 | -| n_updates | 251450 | -| policy_gradient_loss | 0.0206 | -| std | 0.00588 | -| value_loss | 1.5e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25147 | -| time_elapsed | 136840 | -| total_timesteps | 3218816 | -| train/ | | -| approx_kl | 0.048970085 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 251460 | -| policy_gradient_loss | 0.0131 | -| std | 0.00588 | -| value_loss | 9.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25148 | -| time_elapsed | 136844 | -| total_timesteps | 3218944 | -| train/ | | -| approx_kl | 0.011130245 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.00251 | -| n_updates | 251470 | -| policy_gradient_loss | 0.0123 | -| std | 0.00587 | -| value_loss | 6.6e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25149 | -| time_elapsed | 136848 | -| total_timesteps | 3219072 | -| train/ | | -| approx_kl | 0.07464379 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | 0.0286 | -| n_updates | 251480 | -| policy_gradient_loss | 0.00943 | -| std | 0.00587 | -| value_loss | 1.56e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25150 | -| time_elapsed | 136857 | -| total_timesteps | 3219200 | -| train/ | | -| approx_kl | 0.04112679 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.00237 | -| n_updates | 251490 | -| policy_gradient_loss | 0.00245 | -| std | 0.00587 | -| value_loss | 0.000113 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25151 | -| time_elapsed | 136862 | -| total_timesteps | 3219328 | -| train/ | | -| approx_kl | 0.0022411528 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0088 | -| learning_rate | 0.0003 | -| loss | -0.00211 | -| n_updates | 251500 | -| policy_gradient_loss | 0.0112 | -| std | 0.00588 | -| value_loss | 1.12e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25152 | -| time_elapsed | 136867 | -| total_timesteps | 3219456 | -| train/ | | -| approx_kl | 9.309966e-06 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0828 | -| learning_rate | 0.0003 | -| loss | -0.000545 | -| n_updates | 251510 | -| policy_gradient_loss | 0.0431 | -| std | 0.00588 | -| value_loss | 4.39e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25153 | -| time_elapsed | 136872 | -| total_timesteps | 3219584 | -| train/ | | -| approx_kl | 0.20623788 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.125 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 251520 | -| policy_gradient_loss | 0.0751 | -| std | 0.00588 | -| value_loss | 2.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25154 | -| time_elapsed | 136877 | -| total_timesteps | 3219712 | -| train/ | | -| approx_kl | 0.27637583 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0972 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 251530 | -| policy_gradient_loss | 0.0385 | -| std | 0.00588 | -| value_loss | 1.29e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25155 | -| time_elapsed | 136882 | -| total_timesteps | 3219840 | -| train/ | | -| approx_kl | 0.6898542 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0863 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 251540 | -| policy_gradient_loss | 0.0613 | -| std | 0.00588 | -| value_loss | 9.63e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.953 | -| time/ | | -| fps | 23 | -| iterations | 25156 | -| time_elapsed | 136887 | -| total_timesteps | 3219968 | -| train/ | | -| approx_kl | 0.0447002 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.022 | -| n_updates | 251550 | -| policy_gradient_loss | 0.0117 | -| std | 0.00589 | -| value_loss | 6.22e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25157 | -| time_elapsed | 136891 | -| total_timesteps | 3220096 | -| train/ | | -| approx_kl | 0.053266454 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0659 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 251560 | -| policy_gradient_loss | 0.00758 | -| std | 0.00588 | -| value_loss | 4.21e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25158 | -| time_elapsed | 136903 | -| total_timesteps | 3220224 | -| train/ | | -| approx_kl | 0.03687886 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.691 | -| learning_rate | 0.0003 | -| loss | 0.00905 | -| n_updates | 251570 | -| policy_gradient_loss | 0.00678 | -| std | 0.00588 | -| value_loss | 0.00891 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25159 | -| time_elapsed | 136907 | -| total_timesteps | 3220352 | -| train/ | | -| approx_kl | 0.008004826 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.295 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 251580 | -| policy_gradient_loss | 0.0122 | -| std | 0.00588 | -| value_loss | 0.000235 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25160 | -| time_elapsed | 136912 | -| total_timesteps | 3220480 | -| train/ | | -| approx_kl | 0.0015930543 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | 0.00934 | -| n_updates | 251590 | -| policy_gradient_loss | 0.00455 | -| std | 0.00589 | -| value_loss | 4.24e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25161 | -| time_elapsed | 136917 | -| total_timesteps | 3220608 | -| train/ | | -| approx_kl | 0.06316352 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | 0.0363 | -| n_updates | 251600 | -| policy_gradient_loss | 0.0163 | -| std | 0.00589 | -| value_loss | 1.82e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25162 | -| time_elapsed | 136921 | -| total_timesteps | 3220736 | -| train/ | | -| approx_kl | 0.014685795 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | 0.00642 | -| n_updates | 251610 | -| policy_gradient_loss | 0.0137 | -| std | 0.0059 | -| value_loss | 1.2e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25163 | -| time_elapsed | 136926 | -| total_timesteps | 3220864 | -| train/ | | -| approx_kl | 0.07264982 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0582 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 251620 | -| policy_gradient_loss | 0.00511 | -| std | 0.0059 | -| value_loss | 8.65e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.95 | -| time/ | | -| fps | 23 | -| iterations | 25164 | -| time_elapsed | 136931 | -| total_timesteps | 3220992 | -| train/ | | -| approx_kl | 0.012610785 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | -0.000683 | -| n_updates | 251630 | -| policy_gradient_loss | 0.00644 | -| std | 0.0059 | -| value_loss | 5.52e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25165 | -| time_elapsed | 136937 | -| total_timesteps | 3221120 | -| train/ | | -| approx_kl | 0.00082535995 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.00249 | -| n_updates | 251640 | -| policy_gradient_loss | 0.00605 | -| std | 0.0059 | -| value_loss | 3.81e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25166 | -| time_elapsed | 136952 | -| total_timesteps | 3221248 | -| train/ | | -| approx_kl | 0.045067288 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 251650 | -| policy_gradient_loss | -0.0117 | -| std | 0.0059 | -| value_loss | 0.000631 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25167 | -| time_elapsed | 136958 | -| total_timesteps | 3221376 | -| train/ | | -| approx_kl | 0.06621513 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.00559 | -| n_updates | 251660 | -| policy_gradient_loss | -0.000363 | -| std | 0.0059 | -| value_loss | 2.36e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25168 | -| time_elapsed | 136964 | -| total_timesteps | 3221504 | -| train/ | | -| approx_kl | 0.014809892 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.01 | -| learning_rate | 0.0003 | -| loss | -0.000628 | -| n_updates | 251670 | -| policy_gradient_loss | 0.00995 | -| std | 0.0059 | -| value_loss | 4.89e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25169 | -| time_elapsed | 136969 | -| total_timesteps | 3221632 | -| train/ | | -| approx_kl | 0.00087060034 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 251680 | -| policy_gradient_loss | 0.00478 | -| std | 0.0059 | -| value_loss | 3.26e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25170 | -| time_elapsed | 136974 | -| total_timesteps | 3221760 | -| train/ | | -| approx_kl | 0.076092966 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 251690 | -| policy_gradient_loss | 0.0131 | -| std | 0.0059 | -| value_loss | 1.73e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 25171 | -| time_elapsed | 136979 | -| total_timesteps | 3221888 | -| train/ | | -| approx_kl | 0.013306413 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0695 | -| learning_rate | 0.0003 | -| loss | -0.00872 | -| n_updates | 251700 | -| policy_gradient_loss | 0.00964 | -| std | 0.0059 | -| value_loss | 1.46e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25172 | -| time_elapsed | 136984 | -| total_timesteps | 3222016 | -| train/ | | -| approx_kl | 0.080703385 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.0435 | -| n_updates | 251710 | -| policy_gradient_loss | 0.0182 | -| std | 0.00591 | -| value_loss | 1.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25173 | -| time_elapsed | 136996 | -| total_timesteps | 3222144 | -| train/ | | -| approx_kl | 0.038905896 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 251720 | -| policy_gradient_loss | -0.00782 | -| std | 0.00592 | -| value_loss | 0.000115 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25174 | -| time_elapsed | 137002 | -| total_timesteps | 3222272 | -| train/ | | -| approx_kl | 0.17058344 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.26 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 251730 | -| policy_gradient_loss | 0.0515 | -| std | 0.00592 | -| value_loss | 2.94e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25175 | -| time_elapsed | 137007 | -| total_timesteps | 3222400 | -| train/ | | -| approx_kl | 0.006017178 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.325 | -| learning_rate | 0.0003 | -| loss | -0.00466 | -| n_updates | 251740 | -| policy_gradient_loss | 0.0107 | -| std | 0.00592 | -| value_loss | 1.6e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25176 | -| time_elapsed | 137012 | -| total_timesteps | 3222528 | -| train/ | | -| approx_kl | 0.0001139259 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | 0.00289 | -| n_updates | 251750 | -| policy_gradient_loss | -0.00561 | -| std | 0.00591 | -| value_loss | 2e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25177 | -| time_elapsed | 137017 | -| total_timesteps | 3222656 | -| train/ | | -| approx_kl | 0.09132191 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0173 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 251760 | -| policy_gradient_loss | 0.0828 | -| std | 0.00591 | -| value_loss | 1.12e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25178 | -| time_elapsed | 137022 | -| total_timesteps | 3222784 | -| train/ | | -| approx_kl | 0.06052434 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.0724 | -| n_updates | 251770 | -| policy_gradient_loss | 0.0295 | -| std | 0.00591 | -| value_loss | 8.69e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.951 | -| time/ | | -| fps | 23 | -| iterations | 25179 | -| time_elapsed | 137027 | -| total_timesteps | 3222912 | -| train/ | | -| approx_kl | 0.00065640314 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 251780 | -| policy_gradient_loss | 0.0933 | -| std | 0.00591 | -| value_loss | 6.66e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25180 | -| time_elapsed | 137030 | -| total_timesteps | 3223040 | -| train/ | | -| approx_kl | 0.105770364 | -| clip_fraction | 0.669 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | 0.0932 | -| n_updates | 251790 | -| policy_gradient_loss | 0.135 | -| std | 0.00591 | -| value_loss | 1.98e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25181 | -| time_elapsed | 137039 | -| total_timesteps | 3223168 | -| train/ | | -| approx_kl | 0.196138 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -4.6 | -| learning_rate | 0.0003 | -| loss | 0.00608 | -| n_updates | 251800 | -| policy_gradient_loss | -0.00514 | -| std | 0.00591 | -| value_loss | 0.00469 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25182 | -| time_elapsed | 137044 | -| total_timesteps | 3223296 | -| train/ | | -| approx_kl | 0.15674196 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0782 | -| n_updates | 251810 | -| policy_gradient_loss | 0.0428 | -| std | 0.00591 | -| value_loss | 4.67e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25183 | -| time_elapsed | 137048 | -| total_timesteps | 3223424 | -| train/ | | -| approx_kl | 0.041161135 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0049 | -| learning_rate | 0.0003 | -| loss | 0.0011 | -| n_updates | 251820 | -| policy_gradient_loss | 0.055 | -| std | 0.00592 | -| value_loss | 3.72e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25184 | -| time_elapsed | 137053 | -| total_timesteps | 3223552 | -| train/ | | -| approx_kl | 0.3240217 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 251830 | -| policy_gradient_loss | 0.048 | -| std | 0.00592 | -| value_loss | 2.51e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25185 | -| time_elapsed | 137057 | -| total_timesteps | 3223680 | -| train/ | | -| approx_kl | 0.09175783 | -| clip_fraction | 0.673 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 251840 | -| policy_gradient_loss | 0.111 | -| std | 0.00592 | -| value_loss | 2.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25186 | -| time_elapsed | 137061 | -| total_timesteps | 3223808 | -| train/ | | -| approx_kl | 0.023017494 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.014 | -| n_updates | 251850 | -| policy_gradient_loss | 0.00622 | -| std | 0.00592 | -| value_loss | 1.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 25187 | -| time_elapsed | 137065 | -| total_timesteps | 3223936 | -| train/ | | -| approx_kl | 0.033807468 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.0032 | -| n_updates | 251860 | -| policy_gradient_loss | 0.04 | -| std | 0.00592 | -| value_loss | 1.06e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25188 | -| time_elapsed | 137071 | -| total_timesteps | 3224064 | -| train/ | | -| approx_kl | 0.21702032 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | 0.0923 | -| n_updates | 251870 | -| policy_gradient_loss | 0.049 | -| std | 0.00592 | -| value_loss | 7.54e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25189 | -| time_elapsed | 137080 | -| total_timesteps | 3224192 | -| train/ | | -| approx_kl | 0.03448175 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.66 | -| learning_rate | 0.0003 | -| loss | -0.0247 | -| n_updates | 251880 | -| policy_gradient_loss | 0.0226 | -| std | 0.00592 | -| value_loss | 0.00291 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25190 | -| time_elapsed | 137085 | -| total_timesteps | 3224320 | -| train/ | | -| approx_kl | 0.009499976 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0876 | -| learning_rate | 0.0003 | -| loss | -0.000919 | -| n_updates | 251890 | -| policy_gradient_loss | 0.0264 | -| std | 0.00593 | -| value_loss | 6.58e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25191 | -| time_elapsed | 137090 | -| total_timesteps | 3224448 | -| train/ | | -| approx_kl | 0.14911582 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00901 | -| learning_rate | 0.0003 | -| loss | 0.0527 | -| n_updates | 251900 | -| policy_gradient_loss | 0.0119 | -| std | 0.00594 | -| value_loss | 2.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25192 | -| time_elapsed | 137095 | -| total_timesteps | 3224576 | -| train/ | | -| approx_kl | 0.23002595 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 251910 | -| policy_gradient_loss | 0.0165 | -| std | 0.00594 | -| value_loss | 4.82e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25193 | -| time_elapsed | 137100 | -| total_timesteps | 3224704 | -| train/ | | -| approx_kl | 0.06795286 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.468 | -| learning_rate | 0.0003 | -| loss | -0.0168 | -| n_updates | 251920 | -| policy_gradient_loss | 0.00264 | -| std | 0.00594 | -| value_loss | 4.13e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25194 | -| time_elapsed | 137105 | -| total_timesteps | 3224832 | -| train/ | | -| approx_kl | 0.039452597 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 251930 | -| policy_gradient_loss | 0.0209 | -| std | 0.00594 | -| value_loss | 1.85e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.954 | -| time/ | | -| fps | 23 | -| iterations | 25195 | -| time_elapsed | 137110 | -| total_timesteps | 3224960 | -| train/ | | -| approx_kl | 0.033314303 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | 0.00719 | -| n_updates | 251940 | -| policy_gradient_loss | 0.0366 | -| std | 0.00594 | -| value_loss | 1e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25196 | -| time_elapsed | 137115 | -| total_timesteps | 3225088 | -| train/ | | -| approx_kl | 0.06327531 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0592 | -| learning_rate | 0.0003 | -| loss | 0.0416 | -| n_updates | 251950 | -| policy_gradient_loss | 0.0301 | -| std | 0.00594 | -| value_loss | 1.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25197 | -| time_elapsed | 137128 | -| total_timesteps | 3225216 | -| train/ | | -| approx_kl | 0.02591721 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | -0.0301 | -| n_updates | 251960 | -| policy_gradient_loss | -0.0138 | -| std | 0.00594 | -| value_loss | 0.00414 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25198 | -| time_elapsed | 137132 | -| total_timesteps | 3225344 | -| train/ | | -| approx_kl | 0.004405149 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.298 | -| learning_rate | 0.0003 | -| loss | -0.00839 | -| n_updates | 251970 | -| policy_gradient_loss | 0.0322 | -| std | 0.00594 | -| value_loss | 1.92e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25199 | -| time_elapsed | 137136 | -| total_timesteps | 3225472 | -| train/ | | -| approx_kl | 0.5777097 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00953 | -| learning_rate | 0.0003 | -| loss | 0.19 | -| n_updates | 251980 | -| policy_gradient_loss | 0.0734 | -| std | 0.00594 | -| value_loss | 3.12e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25200 | -| time_elapsed | 137141 | -| total_timesteps | 3225600 | -| train/ | | -| approx_kl | 0.07025012 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 251990 | -| policy_gradient_loss | 0.0154 | -| std | 0.00594 | -| value_loss | 2.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25201 | -| time_elapsed | 137145 | -| total_timesteps | 3225728 | -| train/ | | -| approx_kl | 0.013508962 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | 0.00396 | -| n_updates | 252000 | -| policy_gradient_loss | 0.0179 | -| std | 0.00595 | -| value_loss | 1.38e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25202 | -| time_elapsed | 137149 | -| total_timesteps | 3225856 | -| train/ | | -| approx_kl | 0.0034004534 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 252010 | -| policy_gradient_loss | 0.0142 | -| std | 0.00595 | -| value_loss | 9.38e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 25203 | -| time_elapsed | 137154 | -| total_timesteps | 3225984 | -| train/ | | -| approx_kl | 3.6200508e-06 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 6.37e-05 | -| n_updates | 252020 | -| policy_gradient_loss | 0.0407 | -| std | 0.00594 | -| value_loss | 6.72e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25204 | -| time_elapsed | 137160 | -| total_timesteps | 3226112 | -| train/ | | -| approx_kl | 0.26082733 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0504 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 252030 | -| policy_gradient_loss | 0.0636 | -| std | 0.00594 | -| value_loss | 5.71e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25205 | -| time_elapsed | 137173 | -| total_timesteps | 3226240 | -| train/ | | -| approx_kl | 0.02338458 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 252040 | -| policy_gradient_loss | -0.00973 | -| std | 0.00594 | -| value_loss | 0.000892 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25206 | -| time_elapsed | 137178 | -| total_timesteps | 3226368 | -| train/ | | -| approx_kl | 0.0030088047 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | 0.00763 | -| n_updates | 252050 | -| policy_gradient_loss | 0.00911 | -| std | 0.00594 | -| value_loss | 1.44e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25207 | -| time_elapsed | 137182 | -| total_timesteps | 3226496 | -| train/ | | -| approx_kl | 0.06283568 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00967 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 252060 | -| policy_gradient_loss | 0.0101 | -| std | 0.00593 | -| value_loss | 7.58e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25208 | -| time_elapsed | 137188 | -| total_timesteps | 3226624 | -| train/ | | -| approx_kl | 0.06380214 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.034 | -| n_updates | 252070 | -| policy_gradient_loss | 0.0173 | -| std | 0.00593 | -| value_loss | 6.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25209 | -| time_elapsed | 137191 | -| total_timesteps | 3226752 | -| train/ | | -| approx_kl | 0.008663962 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | -0.000578 | -| n_updates | 252080 | -| policy_gradient_loss | 0.00739 | -| std | 0.00593 | -| value_loss | 3.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 25210 | -| time_elapsed | 137195 | -| total_timesteps | 3226880 | -| train/ | | -| approx_kl | 0.002672289 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.0063 | -| n_updates | 252090 | -| policy_gradient_loss | 0.00881 | -| std | 0.00592 | -| value_loss | 2.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25211 | -| time_elapsed | 137199 | -| total_timesteps | 3227008 | -| train/ | | -| approx_kl | 0.05151768 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | 0.0572 | -| n_updates | 252100 | -| policy_gradient_loss | 0.106 | -| std | 0.00593 | -| value_loss | 1.53e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25212 | -| time_elapsed | 137208 | -| total_timesteps | 3227136 | -| train/ | | -| approx_kl | 0.13490947 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 252110 | -| policy_gradient_loss | 0.000964 | -| std | 0.00593 | -| value_loss | 0.000199 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25213 | -| time_elapsed | 137212 | -| total_timesteps | 3227264 | -| train/ | | -| approx_kl | 0.2278461 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.649 | -| learning_rate | 0.0003 | -| loss | 0.0653 | -| n_updates | 252120 | -| policy_gradient_loss | 0.0188 | -| std | 0.00593 | -| value_loss | 1.75e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25214 | -| time_elapsed | 137218 | -| total_timesteps | 3227392 | -| train/ | | -| approx_kl | 0.019909576 | -| clip_fraction | 0.162 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0117 | -| learning_rate | 0.0003 | -| loss | -0.00031 | -| n_updates | 252130 | -| policy_gradient_loss | -0.000639 | -| std | 0.00593 | -| value_loss | 3.77e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25215 | -| time_elapsed | 137223 | -| total_timesteps | 3227520 | -| train/ | | -| approx_kl | 0.032512106 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0293 | -| learning_rate | 0.0003 | -| loss | 0.00929 | -| n_updates | 252140 | -| policy_gradient_loss | 0.0341 | -| std | 0.00594 | -| value_loss | 1.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25216 | -| time_elapsed | 137229 | -| total_timesteps | 3227648 | -| train/ | | -| approx_kl | 0.09289997 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 252150 | -| policy_gradient_loss | 0.0206 | -| std | 0.00594 | -| value_loss | 1.2e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25217 | -| time_elapsed | 137234 | -| total_timesteps | 3227776 | -| train/ | | -| approx_kl | 0.20162126 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 252160 | -| policy_gradient_loss | 0.0324 | -| std | 0.00594 | -| value_loss | 7.08e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.934 | -| time/ | | -| fps | 23 | -| iterations | 25218 | -| time_elapsed | 137237 | -| total_timesteps | 3227904 | -| train/ | | -| approx_kl | 0.0130348485 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.059 | -| learning_rate | 0.0003 | -| loss | -0.00515 | -| n_updates | 252170 | -| policy_gradient_loss | -0.0022 | -| std | 0.00594 | -| value_loss | 5.16e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25219 | -| time_elapsed | 137241 | -| total_timesteps | 3228032 | -| train/ | | -| approx_kl | 0.031577703 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 252180 | -| policy_gradient_loss | 0.0417 | -| std | 0.00593 | -| value_loss | 4.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25220 | -| time_elapsed | 137253 | -| total_timesteps | 3228160 | -| train/ | | -| approx_kl | 0.17342456 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.818 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 252190 | -| policy_gradient_loss | 0.0292 | -| std | 0.00593 | -| value_loss | 0.00468 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25221 | -| time_elapsed | 137258 | -| total_timesteps | 3228288 | -| train/ | | -| approx_kl | 0.53539383 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.384 | -| learning_rate | 0.0003 | -| loss | 0.184 | -| n_updates | 252200 | -| policy_gradient_loss | 0.0646 | -| std | 0.00593 | -| value_loss | 1.08e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25222 | -| time_elapsed | 137264 | -| total_timesteps | 3228416 | -| train/ | | -| approx_kl | 0.06282052 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.012 | -| learning_rate | 0.0003 | -| loss | 0.018 | -| n_updates | 252210 | -| policy_gradient_loss | 0.0087 | -| std | 0.00593 | -| value_loss | 3.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25223 | -| time_elapsed | 137269 | -| total_timesteps | 3228544 | -| train/ | | -| approx_kl | 0.05654678 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0256 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 252220 | -| policy_gradient_loss | 0.0187 | -| std | 0.00593 | -| value_loss | 1.71e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25224 | -| time_elapsed | 137274 | -| total_timesteps | 3228672 | -| train/ | | -| approx_kl | 0.01026108 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | -0.0239 | -| n_updates | 252230 | -| policy_gradient_loss | 0.00378 | -| std | 0.00594 | -| value_loss | 4.41e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25225 | -| time_elapsed | 137279 | -| total_timesteps | 3228800 | -| train/ | | -| approx_kl | 0.00027865265 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00105 | -| learning_rate | 0.0003 | -| loss | 0.00056 | -| n_updates | 252240 | -| policy_gradient_loss | 0.0346 | -| std | 0.00594 | -| value_loss | 1.03e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25226 | -| time_elapsed | 137283 | -| total_timesteps | 3228928 | -| train/ | | -| approx_kl | 0.25004154 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 252250 | -| policy_gradient_loss | 0.0662 | -| std | 0.00594 | -| value_loss | 1.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25227 | -| time_elapsed | 137288 | -| total_timesteps | 3229056 | -| train/ | | -| approx_kl | 0.001499414 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0151 | -| learning_rate | 0.0003 | -| loss | 0.000869 | -| n_updates | 252260 | -| policy_gradient_loss | 0.0149 | -| std | 0.00593 | -| value_loss | 6.59e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25228 | -| time_elapsed | 137298 | -| total_timesteps | 3229184 | -| train/ | | -| approx_kl | 0.049826294 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.513 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 252270 | -| policy_gradient_loss | -0.00148 | -| std | 0.00593 | -| value_loss | 0.00154 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25229 | -| time_elapsed | 137303 | -| total_timesteps | 3229312 | -| train/ | | -| approx_kl | 0.1852078 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.267 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 252280 | -| policy_gradient_loss | 0.0651 | -| std | 0.00593 | -| value_loss | 9.14e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25230 | -| time_elapsed | 137307 | -| total_timesteps | 3229440 | -| train/ | | -| approx_kl | 0.008376234 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.00983 | -| n_updates | 252290 | -| policy_gradient_loss | 0.00606 | -| std | 0.00593 | -| value_loss | 6.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25231 | -| time_elapsed | 137312 | -| total_timesteps | 3229568 | -| train/ | | -| approx_kl | 0.25663725 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0719 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 252300 | -| policy_gradient_loss | 0.036 | -| std | 0.00593 | -| value_loss | 4.74e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25232 | -| time_elapsed | 137316 | -| total_timesteps | 3229696 | -| train/ | | -| approx_kl | 0.15720667 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0481 | -| learning_rate | 0.0003 | -| loss | 0.0736 | -| n_updates | 252310 | -| policy_gradient_loss | 0.0224 | -| std | 0.00592 | -| value_loss | 4.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25233 | -| time_elapsed | 137321 | -| total_timesteps | 3229824 | -| train/ | | -| approx_kl | 0.013968833 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | -0.00604 | -| n_updates | 252320 | -| policy_gradient_loss | -0.00353 | -| std | 0.00592 | -| value_loss | 1.15e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.932 | -| time/ | | -| fps | 23 | -| iterations | 25234 | -| time_elapsed | 137325 | -| total_timesteps | 3229952 | -| train/ | | -| approx_kl | 0.014743743 | -| clip_fraction | 0.111 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0839 | -| learning_rate | 0.0003 | -| loss | 0.00453 | -| n_updates | 252330 | -| policy_gradient_loss | 0.00218 | -| std | 0.00593 | -| value_loss | 7.02e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25235 | -| time_elapsed | 137330 | -| total_timesteps | 3230080 | -| train/ | | -| approx_kl | 0.014903888 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 252340 | -| policy_gradient_loss | 0.00203 | -| std | 0.00593 | -| value_loss | 4.21e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25236 | -| time_elapsed | 137338 | -| total_timesteps | 3230208 | -| train/ | | -| approx_kl | 0.026723485 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.623 | -| learning_rate | 0.0003 | -| loss | -0.0219 | -| n_updates | 252350 | -| policy_gradient_loss | -0.0169 | -| std | 0.00593 | -| value_loss | 0.0013 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25237 | -| time_elapsed | 137345 | -| total_timesteps | 3230336 | -| train/ | | -| approx_kl | 0.079780206 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.0456 | -| n_updates | 252360 | -| policy_gradient_loss | 0.0259 | -| std | 0.00594 | -| value_loss | 1.11e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25238 | -| time_elapsed | 137350 | -| total_timesteps | 3230464 | -| train/ | | -| approx_kl | 0.2014255 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0111 | -| learning_rate | 0.0003 | -| loss | 0.0901 | -| n_updates | 252370 | -| policy_gradient_loss | 0.0313 | -| std | 0.00594 | -| value_loss | 3.83e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25239 | -| time_elapsed | 137355 | -| total_timesteps | 3230592 | -| train/ | | -| approx_kl | 0.02504424 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00749 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 252380 | -| policy_gradient_loss | 0.0337 | -| std | 0.00594 | -| value_loss | 3.92e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25240 | -| time_elapsed | 137359 | -| total_timesteps | 3230720 | -| train/ | | -| approx_kl | 0.30188122 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0136 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 252390 | -| policy_gradient_loss | 0.148 | -| std | 0.00594 | -| value_loss | 2.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25241 | -| time_elapsed | 137365 | -| total_timesteps | 3230848 | -| train/ | | -| approx_kl | 0.21585795 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0263 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 252400 | -| policy_gradient_loss | 0.138 | -| std | 0.00594 | -| value_loss | 1.11e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25242 | -| time_elapsed | 137371 | -| total_timesteps | 3230976 | -| train/ | | -| approx_kl | 0.038155522 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | 0.00833 | -| n_updates | 252410 | -| policy_gradient_loss | 0.028 | -| std | 0.00594 | -| value_loss | 8.77e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25243 | -| time_elapsed | 137375 | -| total_timesteps | 3231104 | -| train/ | | -| approx_kl | 0.0018167407 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.00235 | -| n_updates | 252420 | -| policy_gradient_loss | 0.0367 | -| std | 0.00594 | -| value_loss | 5.99e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25244 | -| time_elapsed | 137385 | -| total_timesteps | 3231232 | -| train/ | | -| approx_kl | 0.058070783 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.0356 | -| n_updates | 252430 | -| policy_gradient_loss | -0.023 | -| std | 0.00594 | -| value_loss | 0.000222 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25245 | -| time_elapsed | 137390 | -| total_timesteps | 3231360 | -| train/ | | -| approx_kl | 0.070764326 | -| clip_fraction | 0.638 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.45 | -| learning_rate | 0.0003 | -| loss | 0.0479 | -| n_updates | 252440 | -| policy_gradient_loss | 0.0925 | -| std | 0.00596 | -| value_loss | 1.09e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25246 | -| time_elapsed | 137395 | -| total_timesteps | 3231488 | -| train/ | | -| approx_kl | 0.23123722 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.79 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 252450 | -| policy_gradient_loss | 0.0954 | -| std | 0.00597 | -| value_loss | 3.69e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25247 | -| time_elapsed | 137400 | -| total_timesteps | 3231616 | -| train/ | | -| approx_kl | 0.0068827393 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.0112 | -| n_updates | 252460 | -| policy_gradient_loss | 0.0219 | -| std | 0.00597 | -| value_loss | 1.66e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25248 | -| time_elapsed | 137404 | -| total_timesteps | 3231744 | -| train/ | | -| approx_kl | 0.0025879215 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | -0.00491 | -| n_updates | 252470 | -| policy_gradient_loss | 0.026 | -| std | 0.00597 | -| value_loss | 1.16e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 25249 | -| time_elapsed | 137409 | -| total_timesteps | 3231872 | -| train/ | | -| approx_kl | 0.015492491 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0811 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 252480 | -| policy_gradient_loss | 0.021 | -| std | 0.00597 | -| value_loss | 6.24e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25250 | -| time_elapsed | 137413 | -| total_timesteps | 3232000 | -| train/ | | -| approx_kl | 0.0812599 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0574 | -| learning_rate | 0.0003 | -| loss | 0.0559 | -| n_updates | 252490 | -| policy_gradient_loss | 0.0201 | -| std | 0.00598 | -| value_loss | 3.94e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25251 | -| time_elapsed | 137417 | -| total_timesteps | 3232128 | -| train/ | | -| approx_kl | 0.035599932 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00742 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 252500 | -| policy_gradient_loss | 0.0159 | -| std | 0.00598 | -| value_loss | 2.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25252 | -| time_elapsed | 137430 | -| total_timesteps | 3232256 | -| train/ | | -| approx_kl | 0.037696168 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -5.69 | -| learning_rate | 0.0003 | -| loss | -0.00726 | -| n_updates | 252510 | -| policy_gradient_loss | 0.0179 | -| std | 0.00599 | -| value_loss | 0.00411 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25253 | -| time_elapsed | 137435 | -| total_timesteps | 3232384 | -| train/ | | -| approx_kl | 0.19193324 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.311 | -| learning_rate | 0.0003 | -| loss | 0.0892 | -| n_updates | 252520 | -| policy_gradient_loss | 0.0537 | -| std | 0.00599 | -| value_loss | 5.62e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25254 | -| time_elapsed | 137440 | -| total_timesteps | 3232512 | -| train/ | | -| approx_kl | 0.05811533 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0127 | -| learning_rate | 0.0003 | -| loss | 0.00287 | -| n_updates | 252530 | -| policy_gradient_loss | 0.0681 | -| std | 0.00599 | -| value_loss | 1.79e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25255 | -| time_elapsed | 137445 | -| total_timesteps | 3232640 | -| train/ | | -| approx_kl | 0.00025095185 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0131 | -| learning_rate | 0.0003 | -| loss | 0.000549 | -| n_updates | 252540 | -| policy_gradient_loss | 0.0938 | -| std | 0.00599 | -| value_loss | 8.6e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25256 | -| time_elapsed | 137450 | -| total_timesteps | 3232768 | -| train/ | | -| approx_kl | 7.1624417 | -| clip_fraction | 0.873 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.237 | -| n_updates | 252550 | -| policy_gradient_loss | 0.229 | -| std | 0.006 | -| value_loss | 1.48e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25257 | -| time_elapsed | 137455 | -| total_timesteps | 3232896 | -| train/ | | -| approx_kl | 0.008940248 | -| clip_fraction | 0.0828 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.0005 | -| n_updates | 252560 | -| policy_gradient_loss | 0.00101 | -| std | 0.00601 | -| value_loss | 5.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25258 | -| time_elapsed | 137460 | -| total_timesteps | 3233024 | -| train/ | | -| approx_kl | 0.011696901 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 252570 | -| policy_gradient_loss | -0.00594 | -| std | 0.00601 | -| value_loss | 1.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25259 | -| time_elapsed | 137470 | -| total_timesteps | 3233152 | -| train/ | | -| approx_kl | 0.010655239 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -3.06 | -| learning_rate | 0.0003 | -| loss | -0.0262 | -| n_updates | 252580 | -| policy_gradient_loss | -0.00685 | -| std | 0.00601 | -| value_loss | 0.00337 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25260 | -| time_elapsed | 137475 | -| total_timesteps | 3233280 | -| train/ | | -| approx_kl | 0.27004558 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.172 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 252590 | -| policy_gradient_loss | 0.131 | -| std | 0.00601 | -| value_loss | 2.95e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25261 | -| time_elapsed | 137479 | -| total_timesteps | 3233408 | -| train/ | | -| approx_kl | 0.04258838 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 252600 | -| policy_gradient_loss | 0.0256 | -| std | 0.00601 | -| value_loss | 8.57e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25262 | -| time_elapsed | 137482 | -| total_timesteps | 3233536 | -| train/ | | -| approx_kl | 0.0017138426 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00894 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 252610 | -| policy_gradient_loss | 0.0307 | -| std | 0.00602 | -| value_loss | 5.6e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25263 | -| time_elapsed | 137486 | -| total_timesteps | 3233664 | -| train/ | | -| approx_kl | 0.45808053 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 252620 | -| policy_gradient_loss | 0.0427 | -| std | 0.00602 | -| value_loss | 1.47e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25264 | -| time_elapsed | 137489 | -| total_timesteps | 3233792 | -| train/ | | -| approx_kl | 0.058297046 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 252630 | -| policy_gradient_loss | -0.00554 | -| std | 0.00603 | -| value_loss | 1.53e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.914 | -| time/ | | -| fps | 23 | -| iterations | 25265 | -| time_elapsed | 137493 | -| total_timesteps | 3233920 | -| train/ | | -| approx_kl | 0.046219956 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 252640 | -| policy_gradient_loss | 0.0096 | -| std | 0.00603 | -| value_loss | 2.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25266 | -| time_elapsed | 137498 | -| total_timesteps | 3234048 | -| train/ | | -| approx_kl | 0.009941658 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.000249 | -| n_updates | 252650 | -| policy_gradient_loss | 0.00651 | -| std | 0.00604 | -| value_loss | 8.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25267 | -| time_elapsed | 137507 | -| total_timesteps | 3234176 | -| train/ | | -| approx_kl | 0.27132645 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.693 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 252660 | -| policy_gradient_loss | 0.0373 | -| std | 0.00604 | -| value_loss | 0.00348 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25268 | -| time_elapsed | 137513 | -| total_timesteps | 3234304 | -| train/ | | -| approx_kl | 0.0017868704 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | -0.00326 | -| n_updates | 252670 | -| policy_gradient_loss | 0.0313 | -| std | 0.00604 | -| value_loss | 0.000171 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25269 | -| time_elapsed | 137519 | -| total_timesteps | 3234432 | -| train/ | | -| approx_kl | 0.17212735 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00701 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 252680 | -| policy_gradient_loss | 0.0271 | -| std | 0.00603 | -| value_loss | 6.43e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25270 | -| time_elapsed | 137523 | -| total_timesteps | 3234560 | -| train/ | | -| approx_kl | 0.030578032 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.489 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 252690 | -| policy_gradient_loss | 0.0361 | -| std | 0.00602 | -| value_loss | 1.87e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25271 | -| time_elapsed | 137528 | -| total_timesteps | 3234688 | -| train/ | | -| approx_kl | 0.3333195 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.613 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 252700 | -| policy_gradient_loss | 0.115 | -| std | 0.00602 | -| value_loss | 8.78e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25272 | -| time_elapsed | 137533 | -| total_timesteps | 3234816 | -| train/ | | -| approx_kl | 0.04994999 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 252710 | -| policy_gradient_loss | 0.0239 | -| std | 0.00602 | -| value_loss | 1.86e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 25273 | -| time_elapsed | 137536 | -| total_timesteps | 3234944 | -| train/ | | -| approx_kl | 0.13453911 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | 0.0592 | -| n_updates | 252720 | -| policy_gradient_loss | 0.0166 | -| std | 0.00602 | -| value_loss | 1.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25274 | -| time_elapsed | 137541 | -| total_timesteps | 3235072 | -| train/ | | -| approx_kl | 0.024874466 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 252730 | -| policy_gradient_loss | 0.0347 | -| std | 0.00602 | -| value_loss | 2.79e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25275 | -| time_elapsed | 137549 | -| total_timesteps | 3235200 | -| train/ | | -| approx_kl | 0.025758404 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.802 | -| learning_rate | 0.0003 | -| loss | -0.00256 | -| n_updates | 252740 | -| policy_gradient_loss | 0.00874 | -| std | 0.00602 | -| value_loss | 0.0047 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25276 | -| time_elapsed | 137553 | -| total_timesteps | 3235328 | -| train/ | | -| approx_kl | 0.062126428 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 252750 | -| policy_gradient_loss | 0.0241 | -| std | 0.00603 | -| value_loss | 1.75e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25277 | -| time_elapsed | 137556 | -| total_timesteps | 3235456 | -| train/ | | -| approx_kl | 0.14105056 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -72.9 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 252760 | -| policy_gradient_loss | 0.0164 | -| std | 0.00603 | -| value_loss | 9.8e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25278 | -| time_elapsed | 137561 | -| total_timesteps | 3235584 | -| train/ | | -| approx_kl | 0.45962536 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.02 | -| learning_rate | 0.0003 | -| loss | 0.0979 | -| n_updates | 252770 | -| policy_gradient_loss | 0.0727 | -| std | 0.00604 | -| value_loss | 3.15e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25279 | -| time_elapsed | 137566 | -| total_timesteps | 3235712 | -| train/ | | -| approx_kl | 0.05813072 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -54.7 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 252780 | -| policy_gradient_loss | 0.0131 | -| std | 0.00605 | -| value_loss | 3.83e-09 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25280 | -| time_elapsed | 137570 | -| total_timesteps | 3235840 | -| train/ | | -| approx_kl | 0.00025845878 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.00078 | -| n_updates | 252790 | -| policy_gradient_loss | 0.0392 | -| std | 0.00605 | -| value_loss | 3.37e-11 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 25281 | -| time_elapsed | 137574 | -| total_timesteps | 3235968 | -| train/ | | -| approx_kl | 0.00024386821 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.55 | -| learning_rate | 0.0003 | -| loss | 0.000618 | -| n_updates | 252800 | -| policy_gradient_loss | 0.0263 | -| std | 0.00605 | -| value_loss | 3.06e-12 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25282 | -| time_elapsed | 137579 | -| total_timesteps | 3236096 | -| train/ | | -| approx_kl | 0.69674987 | -| clip_fraction | 0.544 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.262 | -| learning_rate | 0.0003 | -| loss | 0.378 | -| n_updates | 252810 | -| policy_gradient_loss | 0.0958 | -| std | 0.00605 | -| value_loss | 1.14e-12 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25283 | -| time_elapsed | 137587 | -| total_timesteps | 3236224 | -| train/ | | -| approx_kl | 0.010422731 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.566 | -| learning_rate | 0.0003 | -| loss | -0.0292 | -| n_updates | 252820 | -| policy_gradient_loss | -0.0174 | -| std | 0.00604 | -| value_loss | 0.00117 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25284 | -| time_elapsed | 137591 | -| total_timesteps | 3236352 | -| train/ | | -| approx_kl | 0.0062528783 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.26 | -| learning_rate | 0.0003 | -| loss | 0.00935 | -| n_updates | 252830 | -| policy_gradient_loss | 0.0138 | -| std | 0.00604 | -| value_loss | 1.75e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25285 | -| time_elapsed | 137595 | -| total_timesteps | 3236480 | -| train/ | | -| approx_kl | 0.06340362 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0179 | -| learning_rate | 0.0003 | -| loss | 0.029 | -| n_updates | 252840 | -| policy_gradient_loss | 0.0118 | -| std | 0.00604 | -| value_loss | 1.35e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25286 | -| time_elapsed | 137601 | -| total_timesteps | 3236608 | -| train/ | | -| approx_kl | 0.050533768 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0263 | -| n_updates | 252850 | -| policy_gradient_loss | 0.0139 | -| std | 0.00604 | -| value_loss | 9.39e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25287 | -| time_elapsed | 137606 | -| total_timesteps | 3236736 | -| train/ | | -| approx_kl | 0.009449786 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0253 | -| learning_rate | 0.0003 | -| loss | 0.00118 | -| n_updates | 252860 | -| policy_gradient_loss | 0.0123 | -| std | 0.00604 | -| value_loss | 5.33e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25288 | -| time_elapsed | 137611 | -| total_timesteps | 3236864 | -| train/ | | -| approx_kl | 0.0010477342 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.00379 | -| n_updates | 252870 | -| policy_gradient_loss | 0.00623 | -| std | 0.00604 | -| value_loss | 4.26e-08 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25289 | -| time_elapsed | 137616 | -| total_timesteps | 3236992 | -| train/ | | -| approx_kl | 0.0061884704 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 252880 | -| policy_gradient_loss | 0.00795 | -| std | 0.00603 | -| value_loss | 2.31e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25290 | -| time_elapsed | 137620 | -| total_timesteps | 3237120 | -| train/ | | -| approx_kl | 0.07720425 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0499 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 252890 | -| policy_gradient_loss | 0.00193 | -| std | 0.00603 | -| value_loss | 2.02e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25291 | -| time_elapsed | 137632 | -| total_timesteps | 3237248 | -| train/ | | -| approx_kl | 0.031908847 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0201 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 252900 | -| policy_gradient_loss | 0.00442 | -| std | 0.00603 | -| value_loss | 0.00188 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25292 | -| time_elapsed | 137637 | -| total_timesteps | 3237376 | -| train/ | | -| approx_kl | 0.025605481 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.00903 | -| n_updates | 252910 | -| policy_gradient_loss | 0.033 | -| std | 0.00603 | -| value_loss | 7.52e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25293 | -| time_elapsed | 137643 | -| total_timesteps | 3237504 | -| train/ | | -| approx_kl | 0.28376454 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 252920 | -| policy_gradient_loss | 0.13 | -| std | 0.00603 | -| value_loss | 1.78e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25294 | -| time_elapsed | 137647 | -| total_timesteps | 3237632 | -| train/ | | -| approx_kl | 0.19444662 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0194 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 252930 | -| policy_gradient_loss | 0.132 | -| std | 0.00603 | -| value_loss | 1.14e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25295 | -| time_elapsed | 137652 | -| total_timesteps | 3237760 | -| train/ | | -| approx_kl | 0.17920037 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 252940 | -| policy_gradient_loss | 0.156 | -| std | 0.00603 | -| value_loss | 7.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25296 | -| time_elapsed | 137656 | -| total_timesteps | 3237888 | -| train/ | | -| approx_kl | 0.03469159 | -| clip_fraction | 0.426 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0275 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 252950 | -| policy_gradient_loss | 0.0321 | -| std | 0.00604 | -| value_loss | 7.18e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25297 | -| time_elapsed | 137661 | -| total_timesteps | 3238016 | -| train/ | | -| approx_kl | 0.60799897 | -| clip_fraction | 0.5 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 252960 | -| policy_gradient_loss | 0.0539 | -| std | 0.00604 | -| value_loss | 1.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25298 | -| time_elapsed | 137672 | -| total_timesteps | 3238144 | -| train/ | | -| approx_kl | 0.054374866 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 252970 | -| policy_gradient_loss | 0.00763 | -| std | 0.00604 | -| value_loss | 0.000663 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25299 | -| time_elapsed | 137676 | -| total_timesteps | 3238272 | -| train/ | | -| approx_kl | 0.05785945 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00571 | -| learning_rate | 0.0003 | -| loss | 0.0101 | -| n_updates | 252980 | -| policy_gradient_loss | 0.0047 | -| std | 0.00604 | -| value_loss | 4.37e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25300 | -| time_elapsed | 137680 | -| total_timesteps | 3238400 | -| train/ | | -| approx_kl | 0.056377195 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0292 | -| n_updates | 252990 | -| policy_gradient_loss | 0.0141 | -| std | 0.00604 | -| value_loss | 1.74e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25301 | -| time_elapsed | 137685 | -| total_timesteps | 3238528 | -| train/ | | -| approx_kl | 0.007949185 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 253000 | -| policy_gradient_loss | 0.00356 | -| std | 0.00604 | -| value_loss | 1.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25302 | -| time_elapsed | 137688 | -| total_timesteps | 3238656 | -| train/ | | -| approx_kl | 0.028069457 | -| clip_fraction | 0.59 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 253010 | -| policy_gradient_loss | 0.0695 | -| std | 0.00605 | -| value_loss | 7.51e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25303 | -| time_elapsed | 137692 | -| total_timesteps | 3238784 | -| train/ | | -| approx_kl | 0.09520596 | -| clip_fraction | 0.677 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0472 | -| learning_rate | 0.0003 | -| loss | 0.0866 | -| n_updates | 253020 | -| policy_gradient_loss | 0.131 | -| std | 0.00605 | -| value_loss | 4.74e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.912 | -| time/ | | -| fps | 23 | -| iterations | 25304 | -| time_elapsed | 137696 | -| total_timesteps | 3238912 | -| train/ | | -| approx_kl | 0.025012877 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | -0.00881 | -| n_updates | 253030 | -| policy_gradient_loss | 0.0354 | -| std | 0.00605 | -| value_loss | 4.3e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25305 | -| time_elapsed | 137702 | -| total_timesteps | 3239040 | -| train/ | | -| approx_kl | 0.003605361 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 253040 | -| policy_gradient_loss | 0.0341 | -| std | 0.00605 | -| value_loss | 2.32e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25306 | -| time_elapsed | 137711 | -| total_timesteps | 3239168 | -| train/ | | -| approx_kl | 0.07409676 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.851 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 253050 | -| policy_gradient_loss | -0.00471 | -| std | 0.00604 | -| value_loss | 0.00277 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25307 | -| time_elapsed | 137716 | -| total_timesteps | 3239296 | -| train/ | | -| approx_kl | 0.6805559 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.215 | -| n_updates | 253060 | -| policy_gradient_loss | 0.0594 | -| std | 0.00604 | -| value_loss | 1.42e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25308 | -| time_elapsed | 137720 | -| total_timesteps | 3239424 | -| train/ | | -| approx_kl | 0.010175277 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 253070 | -| policy_gradient_loss | 0.00467 | -| std | 0.00604 | -| value_loss | 2.93e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25309 | -| time_elapsed | 137725 | -| total_timesteps | 3239552 | -| train/ | | -| approx_kl | 0.000721863 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.00329 | -| n_updates | 253080 | -| policy_gradient_loss | 0.0053 | -| std | 0.00603 | -| value_loss | 1.41e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25310 | -| time_elapsed | 137729 | -| total_timesteps | 3239680 | -| train/ | | -| approx_kl | 0.065524116 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 253090 | -| policy_gradient_loss | 0.00744 | -| std | 0.00603 | -| value_loss | 9.87e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25311 | -| time_elapsed | 137735 | -| total_timesteps | 3239808 | -| train/ | | -| approx_kl | 0.011024665 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0365 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 253100 | -| policy_gradient_loss | 0.00791 | -| std | 0.00603 | -| value_loss | 7.04e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.917 | -| time/ | | -| fps | 23 | -| iterations | 25312 | -| time_elapsed | 137738 | -| total_timesteps | 3239936 | -| train/ | | -| approx_kl | 0.085043825 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.043 | -| n_updates | 253110 | -| policy_gradient_loss | 0.0176 | -| std | 0.00602 | -| value_loss | 4.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25313 | -| time_elapsed | 137743 | -| total_timesteps | 3240064 | -| train/ | | -| approx_kl | 0.045891903 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 253120 | -| policy_gradient_loss | 0.0102 | -| std | 0.00601 | -| value_loss | 5.82e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25314 | -| time_elapsed | 137752 | -| total_timesteps | 3240192 | -| train/ | | -| approx_kl | 0.03591939 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 253130 | -| policy_gradient_loss | -0.0143 | -| std | 0.00601 | -| value_loss | 0.00409 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25315 | -| time_elapsed | 137756 | -| total_timesteps | 3240320 | -| train/ | | -| approx_kl | 0.0885601 | -| clip_fraction | 0.682 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | 0.0943 | -| n_updates | 253140 | -| policy_gradient_loss | 0.138 | -| std | 0.00601 | -| value_loss | 2.95e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25316 | -| time_elapsed | 137761 | -| total_timesteps | 3240448 | -| train/ | | -| approx_kl | 0.11938792 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00911 | -| learning_rate | 0.0003 | -| loss | 0.0835 | -| n_updates | 253150 | -| policy_gradient_loss | 0.127 | -| std | 0.00601 | -| value_loss | 2.75e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25317 | -| time_elapsed | 137767 | -| total_timesteps | 3240576 | -| train/ | | -| approx_kl | 0.15879457 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0277 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 253160 | -| policy_gradient_loss | 0.185 | -| std | 0.00602 | -| value_loss | 9.5e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25318 | -| time_elapsed | 137772 | -| total_timesteps | 3240704 | -| train/ | | -| approx_kl | 0.13312308 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.379 | -| learning_rate | 0.0003 | -| loss | 0.0941 | -| n_updates | 253170 | -| policy_gradient_loss | 0.13 | -| std | 0.00602 | -| value_loss | 5.8e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25319 | -| time_elapsed | 137777 | -| total_timesteps | 3240832 | -| train/ | | -| approx_kl | 0.03996072 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.095 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 253180 | -| policy_gradient_loss | 0.0429 | -| std | 0.00602 | -| value_loss | 1.38e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25320 | -| time_elapsed | 137783 | -| total_timesteps | 3240960 | -| train/ | | -| approx_kl | 0.51888573 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.422 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 253190 | -| policy_gradient_loss | 0.0394 | -| std | 0.00602 | -| value_loss | 7.68e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25321 | -| time_elapsed | 137787 | -| total_timesteps | 3241088 | -| train/ | | -| approx_kl | 0.011749169 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0977 | -| learning_rate | 0.0003 | -| loss | -0.00481 | -| n_updates | 253200 | -| policy_gradient_loss | 0.00699 | -| std | 0.00602 | -| value_loss | 2.92e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25322 | -| time_elapsed | 137796 | -| total_timesteps | 3241216 | -| train/ | | -| approx_kl | 0.033971794 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.0156 | -| n_updates | 253210 | -| policy_gradient_loss | -0.0152 | -| std | 0.00602 | -| value_loss | 0.000687 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25323 | -| time_elapsed | 137802 | -| total_timesteps | 3241344 | -| train/ | | -| approx_kl | 0.03129819 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0194 | -| n_updates | 253220 | -| policy_gradient_loss | 0.0498 | -| std | 0.00602 | -| value_loss | 1.46e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25324 | -| time_elapsed | 137807 | -| total_timesteps | 3241472 | -| train/ | | -| approx_kl | 0.11575038 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0141 | -| learning_rate | 0.0003 | -| loss | 0.0811 | -| n_updates | 253230 | -| policy_gradient_loss | 0.0375 | -| std | 0.00602 | -| value_loss | 2.95e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25325 | -| time_elapsed | 137811 | -| total_timesteps | 3241600 | -| train/ | | -| approx_kl | 0.00020895246 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | -0.000181 | -| n_updates | 253240 | -| policy_gradient_loss | 0.0371 | -| std | 0.00601 | -| value_loss | 1.09e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25326 | -| time_elapsed | 137815 | -| total_timesteps | 3241728 | -| train/ | | -| approx_kl | 0.0005392558 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.00275 | -| n_updates | 253250 | -| policy_gradient_loss | 0.0316 | -| std | 0.00599 | -| value_loss | 0.000183 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25327 | -| time_elapsed | 137819 | -| total_timesteps | 3241856 | -| train/ | | -| approx_kl | 0.0011284864 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00142 | -| n_updates | 253260 | -| policy_gradient_loss | 0.0394 | -| std | 0.00599 | -| value_loss | 6.08e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25328 | -| time_elapsed | 137824 | -| total_timesteps | 3241984 | -| train/ | | -| approx_kl | 0.0026340545 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | -0.00255 | -| n_updates | 253270 | -| policy_gradient_loss | 0.0329 | -| std | 0.00599 | -| value_loss | 4e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25329 | -| time_elapsed | 137829 | -| total_timesteps | 3242112 | -| train/ | | -| approx_kl | 0.4418773 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 253280 | -| policy_gradient_loss | 0.056 | -| std | 0.006 | -| value_loss | 2.72e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25330 | -| time_elapsed | 137841 | -| total_timesteps | 3242240 | -| train/ | | -| approx_kl | 0.0123836165 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | -0.0281 | -| n_updates | 253290 | -| policy_gradient_loss | -0.0146 | -| std | 0.006 | -| value_loss | 0.000488 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25331 | -| time_elapsed | 137846 | -| total_timesteps | 3242368 | -| train/ | | -| approx_kl | 0.05118861 | -| clip_fraction | 0.645 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0302 | -| n_updates | 253300 | -| policy_gradient_loss | 0.135 | -| std | 0.006 | -| value_loss | 2.42e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25332 | -| time_elapsed | 137851 | -| total_timesteps | 3242496 | -| train/ | | -| approx_kl | 0.117388494 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.273 | -| learning_rate | 0.0003 | -| loss | 0.0775 | -| n_updates | 253310 | -| policy_gradient_loss | 0.137 | -| std | 0.00601 | -| value_loss | 5.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25333 | -| time_elapsed | 137855 | -| total_timesteps | 3242624 | -| train/ | | -| approx_kl | 0.024607562 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.02 | -| learning_rate | 0.0003 | -| loss | 0.00341 | -| n_updates | 253320 | -| policy_gradient_loss | 0.0122 | -| std | 0.00601 | -| value_loss | 1.83e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25334 | -| time_elapsed | 137860 | -| total_timesteps | 3242752 | -| train/ | | -| approx_kl | 0.61279047 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.934 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 253330 | -| policy_gradient_loss | 0.0408 | -| std | 0.00602 | -| value_loss | 5.04e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25335 | -| time_elapsed | 137864 | -| total_timesteps | 3242880 | -| train/ | | -| approx_kl | 0.011418599 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0206 | -| learning_rate | 0.0003 | -| loss | -0.00411 | -| n_updates | 253340 | -| policy_gradient_loss | 0.00722 | -| std | 0.00602 | -| value_loss | 2.08e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25336 | -| time_elapsed | 137868 | -| total_timesteps | 3243008 | -| train/ | | -| approx_kl | 0.000847179 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0377 | -| learning_rate | 0.0003 | -| loss | 0.00575 | -| n_updates | 253350 | -| policy_gradient_loss | 0.00337 | -| std | 0.00602 | -| value_loss | 1.66e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25337 | -| time_elapsed | 137879 | -| total_timesteps | 3243136 | -| train/ | | -| approx_kl | 0.11089437 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 253360 | -| policy_gradient_loss | -0.00607 | -| std | 0.00602 | -| value_loss | 0.000542 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25338 | -| time_elapsed | 137884 | -| total_timesteps | 3243264 | -| train/ | | -| approx_kl | 0.0009323112 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.254 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 253370 | -| policy_gradient_loss | 0.0628 | -| std | 0.00602 | -| value_loss | 0.000258 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25339 | -| time_elapsed | 137888 | -| total_timesteps | 3243392 | -| train/ | | -| approx_kl | 0.10111914 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -5.38 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 253380 | -| policy_gradient_loss | 0.0201 | -| std | 0.00601 | -| value_loss | 1.87e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25340 | -| time_elapsed | 137893 | -| total_timesteps | 3243520 | -| train/ | | -| approx_kl | 0.006895762 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.191 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 253390 | -| policy_gradient_loss | 0.0151 | -| std | 0.006 | -| value_loss | 2.04e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25341 | -| time_elapsed | 137897 | -| total_timesteps | 3243648 | -| train/ | | -| approx_kl | 0.04315459 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.801 | -| learning_rate | 0.0003 | -| loss | -0.00528 | -| n_updates | 253400 | -| policy_gradient_loss | 0.031 | -| std | 0.00599 | -| value_loss | 2.92e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25342 | -| time_elapsed | 137901 | -| total_timesteps | 3243776 | -| train/ | | -| approx_kl | 0.8550819 | -| clip_fraction | 0.757 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.59 | -| learning_rate | 0.0003 | -| loss | 0.325 | -| n_updates | 253410 | -| policy_gradient_loss | 0.106 | -| std | 0.00599 | -| value_loss | 6.12e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.926 | -| time/ | | -| fps | 23 | -| iterations | 25343 | -| time_elapsed | 137907 | -| total_timesteps | 3243904 | -| train/ | | -| approx_kl | 0.04655532 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 253420 | -| policy_gradient_loss | -0.00842 | -| std | 0.00599 | -| value_loss | 8.69e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25344 | -| time_elapsed | 137913 | -| total_timesteps | 3244032 | -| train/ | | -| approx_kl | 0.01873577 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.00433 | -| n_updates | 253430 | -| policy_gradient_loss | -0.00355 | -| std | 0.00599 | -| value_loss | 6.06e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25345 | -| time_elapsed | 137925 | -| total_timesteps | 3244160 | -| train/ | | -| approx_kl | 0.012294864 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.754 | -| learning_rate | 0.0003 | -| loss | -0.00933 | -| n_updates | 253440 | -| policy_gradient_loss | 0.000538 | -| std | 0.00599 | -| value_loss | 0.00709 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25346 | -| time_elapsed | 137930 | -| total_timesteps | 3244288 | -| train/ | | -| approx_kl | 0.10520658 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.839 | -| learning_rate | 0.0003 | -| loss | 0.0494 | -| n_updates | 253450 | -| policy_gradient_loss | 0.0436 | -| std | 0.00599 | -| value_loss | 2.89e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25347 | -| time_elapsed | 137935 | -| total_timesteps | 3244416 | -| train/ | | -| approx_kl | 0.18667552 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 253460 | -| policy_gradient_loss | 0.0508 | -| std | 0.006 | -| value_loss | 2.38e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25348 | -| time_elapsed | 137939 | -| total_timesteps | 3244544 | -| train/ | | -| approx_kl | 0.0010823733 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 253470 | -| policy_gradient_loss | 0.0311 | -| std | 0.006 | -| value_loss | 1.81e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25349 | -| time_elapsed | 137944 | -| total_timesteps | 3244672 | -| train/ | | -| approx_kl | 0.73655206 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 253480 | -| policy_gradient_loss | 0.0591 | -| std | 0.006 | -| value_loss | 1.56e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25350 | -| time_elapsed | 137949 | -| total_timesteps | 3244800 | -| train/ | | -| approx_kl | 0.013780692 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 253490 | -| policy_gradient_loss | 0.00255 | -| std | 0.00601 | -| value_loss | 1.14e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.916 | -| time/ | | -| fps | 23 | -| iterations | 25351 | -| time_elapsed | 137954 | -| total_timesteps | 3244928 | -| train/ | | -| approx_kl | 0.0027821078 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | -0.00361 | -| n_updates | 253500 | -| policy_gradient_loss | 0.00754 | -| std | 0.00601 | -| value_loss | 6.35e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25352 | -| time_elapsed | 137958 | -| total_timesteps | 3245056 | -| train/ | | -| approx_kl | 0.048153445 | -| clip_fraction | 0.672 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 253510 | -| policy_gradient_loss | 0.145 | -| std | 0.00601 | -| value_loss | 5.48e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25353 | -| time_elapsed | 137964 | -| total_timesteps | 3245184 | -| train/ | | -| approx_kl | 0.0060949563 | -| clip_fraction | 0.36 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.00238 | -| n_updates | 253520 | -| policy_gradient_loss | -0.00296 | -| std | 0.006 | -| value_loss | 0.00381 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25354 | -| time_elapsed | 137969 | -| total_timesteps | 3245312 | -| train/ | | -| approx_kl | 0.096608855 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.419 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 253530 | -| policy_gradient_loss | 0.028 | -| std | 0.00599 | -| value_loss | 4.98e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25355 | -| time_elapsed | 137973 | -| total_timesteps | 3245440 | -| train/ | | -| approx_kl | 0.17055818 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0139 | -| learning_rate | 0.0003 | -| loss | 0.0476 | -| n_updates | 253540 | -| policy_gradient_loss | 0.0215 | -| std | 0.00599 | -| value_loss | 1.27e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25356 | -| time_elapsed | 137977 | -| total_timesteps | 3245568 | -| train/ | | -| approx_kl | 0.01415058 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0175 | -| learning_rate | 0.0003 | -| loss | 0.000781 | -| n_updates | 253550 | -| policy_gradient_loss | 0.000352 | -| std | 0.00599 | -| value_loss | 6.21e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25357 | -| time_elapsed | 137981 | -| total_timesteps | 3245696 | -| train/ | | -| approx_kl | 0.027741913 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 253560 | -| policy_gradient_loss | 0.0354 | -| std | 0.00599 | -| value_loss | 4.22e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25358 | -| time_elapsed | 137986 | -| total_timesteps | 3245824 | -| train/ | | -| approx_kl | 0.3238751 | -| clip_fraction | 0.758 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.248 | -| n_updates | 253570 | -| policy_gradient_loss | 0.159 | -| std | 0.00599 | -| value_loss | 3.71e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25359 | -| time_elapsed | 137989 | -| total_timesteps | 3245952 | -| train/ | | -| approx_kl | 0.18705058 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 253580 | -| policy_gradient_loss | 0.109 | -| std | 0.00599 | -| value_loss | 2.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25360 | -| time_elapsed | 137993 | -| total_timesteps | 3246080 | -| train/ | | -| approx_kl | 0.16424814 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 253590 | -| policy_gradient_loss | 0.144 | -| std | 0.00599 | -| value_loss | 1.88e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25361 | -| time_elapsed | 138001 | -| total_timesteps | 3246208 | -| train/ | | -| approx_kl | 0.0140743125 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.1 | -| learning_rate | 0.0003 | -| loss | -0.0265 | -| n_updates | 253600 | -| policy_gradient_loss | -0.00648 | -| std | 0.006 | -| value_loss | 0.00398 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25362 | -| time_elapsed | 138005 | -| total_timesteps | 3246336 | -| train/ | | -| approx_kl | 0.000114386436 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -6.13 | -| learning_rate | 0.0003 | -| loss | -0.000363 | -| n_updates | 253610 | -| policy_gradient_loss | 0.00867 | -| std | 0.00601 | -| value_loss | 2.31e-06 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25363 | -| time_elapsed | 138009 | -| total_timesteps | 3246464 | -| train/ | | -| approx_kl | 0.29332572 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.059 | -| n_updates | 253620 | -| policy_gradient_loss | 0.0124 | -| std | 0.00601 | -| value_loss | 1.82e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25364 | -| time_elapsed | 138015 | -| total_timesteps | 3246592 | -| train/ | | -| approx_kl | 0.017469872 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0086 | -| n_updates | 253630 | -| policy_gradient_loss | 0.0283 | -| std | 0.00602 | -| value_loss | 1.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25365 | -| time_elapsed | 138020 | -| total_timesteps | 3246720 | -| train/ | | -| approx_kl | 0.40119806 | -| clip_fraction | 0.752 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0618 | -| learning_rate | 0.0003 | -| loss | 0.279 | -| n_updates | 253640 | -| policy_gradient_loss | 0.221 | -| std | 0.00602 | -| value_loss | 8.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25366 | -| time_elapsed | 138025 | -| total_timesteps | 3246848 | -| train/ | | -| approx_kl | 0.056823097 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | 0.0361 | -| n_updates | 253650 | -| policy_gradient_loss | 0.0299 | -| std | 0.00603 | -| value_loss | 5.45e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25367 | -| time_elapsed | 138030 | -| total_timesteps | 3246976 | -| train/ | | -| approx_kl | 0.0008036378 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | 1.89e-05 | -| n_updates | 253660 | -| policy_gradient_loss | 0.0307 | -| std | 0.00603 | -| value_loss | 2.33e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25368 | -| time_elapsed | 138035 | -| total_timesteps | 3247104 | -| train/ | | -| approx_kl | 0.19006005 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0161 | -| learning_rate | 0.0003 | -| loss | 0.0944 | -| n_updates | 253670 | -| policy_gradient_loss | 0.0254 | -| std | 0.00605 | -| value_loss | 4.6e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25369 | -| time_elapsed | 138046 | -| total_timesteps | 3247232 | -| train/ | | -| approx_kl | 0.1117245 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 253680 | -| policy_gradient_loss | 0.0178 | -| std | 0.00606 | -| value_loss | 0.000596 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25370 | -| time_elapsed | 138052 | -| total_timesteps | 3247360 | -| train/ | | -| approx_kl | 0.5392679 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.76 | -| learning_rate | 0.0003 | -| loss | 0.143 | -| n_updates | 253690 | -| policy_gradient_loss | 0.0584 | -| std | 0.00606 | -| value_loss | 6.98e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25371 | -| time_elapsed | 138055 | -| total_timesteps | 3247488 | -| train/ | | -| approx_kl | 0.06197542 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00985 | -| learning_rate | 0.0003 | -| loss | 0.0144 | -| n_updates | 253700 | -| policy_gradient_loss | 0.00894 | -| std | 0.00606 | -| value_loss | 4.6e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25372 | -| time_elapsed | 138059 | -| total_timesteps | 3247616 | -| train/ | | -| approx_kl | 0.06415504 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0396 | -| learning_rate | 0.0003 | -| loss | 0.055 | -| n_updates | 253710 | -| policy_gradient_loss | 0.0262 | -| std | 0.00607 | -| value_loss | 3.67e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25373 | -| time_elapsed | 138064 | -| total_timesteps | 3247744 | -| train/ | | -| approx_kl | 0.04847467 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.066 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 253720 | -| policy_gradient_loss | 0.0143 | -| std | 0.00608 | -| value_loss | 5.89e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25374 | -| time_elapsed | 138069 | -| total_timesteps | 3247872 | -| train/ | | -| approx_kl | 0.059379775 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0118 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 253730 | -| policy_gradient_loss | 0.0156 | -| std | 0.00609 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25375 | -| time_elapsed | 138073 | -| total_timesteps | 3248000 | -| train/ | | -| approx_kl | 0.009929344 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | -0.00719 | -| n_updates | 253740 | -| policy_gradient_loss | 0.00574 | -| std | 0.00609 | -| value_loss | 1.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25376 | -| time_elapsed | 138077 | -| total_timesteps | 3248128 | -| train/ | | -| approx_kl | 0.08059161 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.005 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 253750 | -| policy_gradient_loss | 0.0243 | -| std | 0.00609 | -| value_loss | 6.21e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25377 | -| time_elapsed | 138087 | -| total_timesteps | 3248256 | -| train/ | | -| approx_kl | 1.0718645 | -| clip_fraction | 0.766 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.995 | -| learning_rate | 0.0003 | -| loss | 0.253 | -| n_updates | 253760 | -| policy_gradient_loss | 0.171 | -| std | 0.0061 | -| value_loss | 4.28e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25378 | -| time_elapsed | 138091 | -| total_timesteps | 3248384 | -| train/ | | -| approx_kl | 0.048274186 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00545 | -| learning_rate | 0.0003 | -| loss | 0.0497 | -| n_updates | 253770 | -| policy_gradient_loss | 0.00525 | -| std | 0.00609 | -| value_loss | 7.82e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25379 | -| time_elapsed | 138097 | -| total_timesteps | 3248512 | -| train/ | | -| approx_kl | 0.121558286 | -| clip_fraction | 0.609 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -11 | -| learning_rate | 0.0003 | -| loss | 0.0126 | -| n_updates | 253780 | -| policy_gradient_loss | 0.0136 | -| std | 0.00611 | -| value_loss | 1.06e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25380 | -| time_elapsed | 138101 | -| total_timesteps | 3248640 | -| train/ | | -| approx_kl | 0.085236885 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 253790 | -| policy_gradient_loss | -0.00125 | -| std | 0.00612 | -| value_loss | 6.14e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25381 | -| time_elapsed | 138106 | -| total_timesteps | 3248768 | -| train/ | | -| approx_kl | 0.3102409 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0188 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 253800 | -| policy_gradient_loss | 0.0399 | -| std | 0.00615 | -| value_loss | 1.62e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25382 | -| time_elapsed | 138110 | -| total_timesteps | 3248896 | -| train/ | | -| approx_kl | 0.5090285 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -2.53 | -| learning_rate | 0.0003 | -| loss | 0.0784 | -| n_updates | 253810 | -| policy_gradient_loss | 0.0249 | -| std | 0.00617 | -| value_loss | 1.5e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25383 | -| time_elapsed | 138115 | -| total_timesteps | 3249024 | -| train/ | | -| approx_kl | 0.010759702 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0146 | -| learning_rate | 0.0003 | -| loss | 0.00754 | -| n_updates | 253820 | -| policy_gradient_loss | 0.0114 | -| std | 0.00618 | -| value_loss | 1.35e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25384 | -| time_elapsed | 138126 | -| total_timesteps | 3249152 | -| train/ | | -| approx_kl | 0.04157018 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.719 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 253830 | -| policy_gradient_loss | 0.00207 | -| std | 0.00618 | -| value_loss | 0.00981 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25385 | -| time_elapsed | 138131 | -| total_timesteps | 3249280 | -| train/ | | -| approx_kl | 0.0148690585 | -| clip_fraction | 0.224 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.355 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 253840 | -| policy_gradient_loss | 0.00398 | -| std | 0.00619 | -| value_loss | 0.000136 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25386 | -| time_elapsed | 138135 | -| total_timesteps | 3249408 | -| train/ | | -| approx_kl | 0.0029112739 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00948 | -| learning_rate | 0.0003 | -| loss | -0.00454 | -| n_updates | 253850 | -| policy_gradient_loss | 0.00707 | -| std | 0.00618 | -| value_loss | 8.98e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25387 | -| time_elapsed | 138140 | -| total_timesteps | 3249536 | -| train/ | | -| approx_kl | 0.034957483 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0756 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 253860 | -| policy_gradient_loss | 0.0965 | -| std | 0.00618 | -| value_loss | 7.11e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25388 | -| time_elapsed | 138145 | -| total_timesteps | 3249664 | -| train/ | | -| approx_kl | 0.008803386 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | -0.00328 | -| n_updates | 253870 | -| policy_gradient_loss | 0.0194 | -| std | 0.00619 | -| value_loss | 4.12e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25389 | -| time_elapsed | 138150 | -| total_timesteps | 3249792 | -| train/ | | -| approx_kl | 0.24043044 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0675 | -| learning_rate | 0.0003 | -| loss | 0.0874 | -| n_updates | 253880 | -| policy_gradient_loss | 0.0228 | -| std | 0.00619 | -| value_loss | 3.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.919 | -| time/ | | -| fps | 23 | -| iterations | 25390 | -| time_elapsed | 138154 | -| total_timesteps | 3249920 | -| train/ | | -| approx_kl | 0.02301074 | -| clip_fraction | 0.464 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 253890 | -| policy_gradient_loss | 0.0434 | -| std | 0.00619 | -| value_loss | 4.42e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25391 | -| time_elapsed | 138158 | -| total_timesteps | 3250048 | -| train/ | | -| approx_kl | 0.09485079 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.0467 | -| n_updates | 253900 | -| policy_gradient_loss | 0.0228 | -| std | 0.0062 | -| value_loss | 9.43e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25392 | -| time_elapsed | 138166 | -| total_timesteps | 3250176 | -| train/ | | -| approx_kl | 0.11853446 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.721 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 253910 | -| policy_gradient_loss | -0.0185 | -| std | 0.0062 | -| value_loss | 0.00266 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25393 | -| time_elapsed | 138171 | -| total_timesteps | 3250304 | -| train/ | | -| approx_kl | 0.2556959 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.38 | -| learning_rate | 0.0003 | -| loss | 0.0778 | -| n_updates | 253920 | -| policy_gradient_loss | 0.0293 | -| std | 0.0062 | -| value_loss | 1.23e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25394 | -| time_elapsed | 138176 | -| total_timesteps | 3250432 | -| train/ | | -| approx_kl | 0.0010322277 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.00482 | -| n_updates | 253930 | -| policy_gradient_loss | 0.00236 | -| std | 0.0062 | -| value_loss | 4.36e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25395 | -| time_elapsed | 138181 | -| total_timesteps | 3250560 | -| train/ | | -| approx_kl | 0.06144964 | -| clip_fraction | 0.582 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 253940 | -| policy_gradient_loss | 0.0532 | -| std | 0.0062 | -| value_loss | 2.53e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25396 | -| time_elapsed | 138185 | -| total_timesteps | 3250688 | -| train/ | | -| approx_kl | 0.2636199 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 253950 | -| policy_gradient_loss | 0.0508 | -| std | 0.0062 | -| value_loss | 2.01e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25397 | -| time_elapsed | 138191 | -| total_timesteps | 3250816 | -| train/ | | -| approx_kl | 0.055342723 | -| clip_fraction | 0.598 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0418 | -| n_updates | 253960 | -| policy_gradient_loss | 0.0723 | -| std | 0.0062 | -| value_loss | 1.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 25398 | -| time_elapsed | 138196 | -| total_timesteps | 3250944 | -| train/ | | -| approx_kl | 0.05582284 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0809 | -| learning_rate | 0.0003 | -| loss | 0.0566 | -| n_updates | 253970 | -| policy_gradient_loss | 0.0365 | -| std | 0.0062 | -| value_loss | 8.35e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25399 | -| time_elapsed | 138201 | -| total_timesteps | 3251072 | -| train/ | | -| approx_kl | 0.29402432 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0839 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 253980 | -| policy_gradient_loss | 0.0618 | -| std | 0.0062 | -| value_loss | 4.46e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25400 | -| time_elapsed | 138209 | -| total_timesteps | 3251200 | -| train/ | | -| approx_kl | 0.21643463 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.702 | -| learning_rate | 0.0003 | -| loss | 0.0606 | -| n_updates | 253990 | -| policy_gradient_loss | -0.00192 | -| std | 0.0062 | -| value_loss | 0.00105 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25401 | -| time_elapsed | 138214 | -| total_timesteps | 3251328 | -| train/ | | -| approx_kl | 0.025341894 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.79 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 254000 | -| policy_gradient_loss | 0.0237 | -| std | 0.0062 | -| value_loss | 3.96e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25402 | -| time_elapsed | 138218 | -| total_timesteps | 3251456 | -| train/ | | -| approx_kl | 0.005582922 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -3.9 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 254010 | -| policy_gradient_loss | 0.00137 | -| std | 0.00621 | -| value_loss | 1.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25403 | -| time_elapsed | 138223 | -| total_timesteps | 3251584 | -| train/ | | -| approx_kl | 0.058041874 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.0065 | -| n_updates | 254020 | -| policy_gradient_loss | 0.00935 | -| std | 0.00621 | -| value_loss | 1.34e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25404 | -| time_elapsed | 138227 | -| total_timesteps | 3251712 | -| train/ | | -| approx_kl | 0.08272073 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0797 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 254030 | -| policy_gradient_loss | 0.0305 | -| std | 0.00622 | -| value_loss | 6.61e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25405 | -| time_elapsed | 138231 | -| total_timesteps | 3251840 | -| train/ | | -| approx_kl | 0.010766538 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.38 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 254040 | -| policy_gradient_loss | 0.0069 | -| std | 0.00624 | -| value_loss | 0.000636 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.923 | -| time/ | | -| fps | 23 | -| iterations | 25406 | -| time_elapsed | 138236 | -| total_timesteps | 3251968 | -| train/ | | -| approx_kl | 0.0009055971 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | 0.00406 | -| n_updates | 254050 | -| policy_gradient_loss | 0.00561 | -| std | 0.00624 | -| value_loss | 5.91e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25407 | -| time_elapsed | 138240 | -| total_timesteps | 3252096 | -| train/ | | -| approx_kl | 0.046707574 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 254060 | -| policy_gradient_loss | 0.00648 | -| std | 0.00625 | -| value_loss | 3.07e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25408 | -| time_elapsed | 138250 | -| total_timesteps | 3252224 | -| train/ | | -| approx_kl | 0.08851583 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.517 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 254070 | -| policy_gradient_loss | -0.00232 | -| std | 0.00625 | -| value_loss | 0.00146 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25409 | -| time_elapsed | 138256 | -| total_timesteps | 3252352 | -| train/ | | -| approx_kl | 0.007951182 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | 0.00435 | -| n_updates | 254080 | -| policy_gradient_loss | 0.00512 | -| std | 0.00625 | -| value_loss | 9.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25410 | -| time_elapsed | 138261 | -| total_timesteps | 3252480 | -| train/ | | -| approx_kl | 0.079533644 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0948 | -| learning_rate | 0.0003 | -| loss | 0.0495 | -| n_updates | 254090 | -| policy_gradient_loss | 0.0203 | -| std | 0.00624 | -| value_loss | 6.14e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25411 | -| time_elapsed | 138265 | -| total_timesteps | 3252608 | -| train/ | | -| approx_kl | 0.012852857 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0754 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 254100 | -| policy_gradient_loss | 0.00315 | -| std | 0.00624 | -| value_loss | 4.96e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25412 | -| time_elapsed | 138267 | -| total_timesteps | 3252736 | -| train/ | | -| approx_kl | 0.09195915 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0452 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 254110 | -| policy_gradient_loss | 0.00698 | -| std | 0.00624 | -| value_loss | 3.53e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25413 | -| time_elapsed | 138271 | -| total_timesteps | 3252864 | -| train/ | | -| approx_kl | 0.01072053 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 254120 | -| policy_gradient_loss | 0.00718 | -| std | 0.00623 | -| value_loss | 2.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.921 | -| time/ | | -| fps | 23 | -| iterations | 25414 | -| time_elapsed | 138275 | -| total_timesteps | 3252992 | -| train/ | | -| approx_kl | 0.047665782 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 254130 | -| policy_gradient_loss | 0.0431 | -| std | 0.00623 | -| value_loss | 2.27e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25415 | -| time_elapsed | 138278 | -| total_timesteps | 3253120 | -| train/ | | -| approx_kl | 0.97285455 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | 0.373 | -| n_updates | 254140 | -| policy_gradient_loss | 0.272 | -| std | 0.00623 | -| value_loss | 1.96e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25416 | -| time_elapsed | 138289 | -| total_timesteps | 3253248 | -| train/ | | -| approx_kl | 0.19226581 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | 0.0569 | -| n_updates | 254150 | -| policy_gradient_loss | 0.0112 | -| std | 0.00623 | -| value_loss | 0.00403 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25417 | -| time_elapsed | 138294 | -| total_timesteps | 3253376 | -| train/ | | -| approx_kl | 0.0015530647 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0035 | -| learning_rate | 0.0003 | -| loss | 0.00717 | -| n_updates | 254160 | -| policy_gradient_loss | 0.00776 | -| std | 0.00624 | -| value_loss | 8.21e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25418 | -| time_elapsed | 138299 | -| total_timesteps | 3253504 | -| train/ | | -| approx_kl | 0.014796926 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0064 | -| n_updates | 254170 | -| policy_gradient_loss | 0.0333 | -| std | 0.00624 | -| value_loss | 1.65e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25419 | -| time_elapsed | 138303 | -| total_timesteps | 3253632 | -| train/ | | -| approx_kl | 0.10677861 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 254180 | -| policy_gradient_loss | 0.0228 | -| std | 0.00624 | -| value_loss | 1.52e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25420 | -| time_elapsed | 138308 | -| total_timesteps | 3253760 | -| train/ | | -| approx_kl | 6.756559e-05 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.000115 | -| n_updates | 254190 | -| policy_gradient_loss | 0.0351 | -| std | 0.00624 | -| value_loss | 8.31e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.915 | -| time/ | | -| fps | 23 | -| iterations | 25421 | -| time_elapsed | 138313 | -| total_timesteps | 3253888 | -| train/ | | -| approx_kl | 0.6415938 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.179 | -| n_updates | 254200 | -| policy_gradient_loss | 0.0589 | -| std | 0.00623 | -| value_loss | 1.62e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25422 | -| time_elapsed | 138318 | -| total_timesteps | 3254016 | -| train/ | | -| approx_kl | 0.009609479 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00432 | -| learning_rate | 0.0003 | -| loss | -0.00859 | -| n_updates | 254210 | -| policy_gradient_loss | 0.00365 | -| std | 0.00623 | -| value_loss | 7.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25423 | -| time_elapsed | 138330 | -| total_timesteps | 3254144 | -| train/ | | -| approx_kl | 0.01121245 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 254220 | -| policy_gradient_loss | -0.00198 | -| std | 0.00623 | -| value_loss | 0.000863 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25424 | -| time_elapsed | 138334 | -| total_timesteps | 3254272 | -| train/ | | -| approx_kl | 0.0009498461 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 254230 | -| policy_gradient_loss | 0.00666 | -| std | 0.00622 | -| value_loss | 9.96e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25425 | -| time_elapsed | 138339 | -| total_timesteps | 3254400 | -| train/ | | -| approx_kl | 0.0063365097 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.85 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 254240 | -| policy_gradient_loss | -0.00194 | -| std | 0.00622 | -| value_loss | 8.38e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25426 | -| time_elapsed | 138344 | -| total_timesteps | 3254528 | -| train/ | | -| approx_kl | 0.026265386 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -50.9 | -| learning_rate | 0.0003 | -| loss | 0.00202 | -| n_updates | 254250 | -| policy_gradient_loss | 0.0107 | -| std | 0.00622 | -| value_loss | 4.96e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25427 | -| time_elapsed | 138349 | -| total_timesteps | 3254656 | -| train/ | | -| approx_kl | 0.7145428 | -| clip_fraction | 0.728 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.05 | -| learning_rate | 0.0003 | -| loss | 0.22 | -| n_updates | 254260 | -| policy_gradient_loss | 0.111 | -| std | 0.00623 | -| value_loss | 3.12e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25428 | -| time_elapsed | 138354 | -| total_timesteps | 3254784 | -| train/ | | -| approx_kl | 0.031423807 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -4.13 | -| learning_rate | 0.0003 | -| loss | 0.00209 | -| n_updates | 254270 | -| policy_gradient_loss | -0.00369 | -| std | 0.00623 | -| value_loss | 6.36e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 25429 | -| time_elapsed | 138359 | -| total_timesteps | 3254912 | -| train/ | | -| approx_kl | 0.01875123 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.492 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 254280 | -| policy_gradient_loss | 0.0231 | -| std | 0.00623 | -| value_loss | 4.03e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25430 | -| time_elapsed | 138364 | -| total_timesteps | 3255040 | -| train/ | | -| approx_kl | 0.11309465 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0746 | -| learning_rate | 0.0003 | -| loss | 0.0345 | -| n_updates | 254290 | -| policy_gradient_loss | 0.0206 | -| std | 0.00623 | -| value_loss | 3.31e-11 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25431 | -| time_elapsed | 138374 | -| total_timesteps | 3255168 | -| train/ | | -| approx_kl | 0.47666168 | -| clip_fraction | 0.518 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.914 | -| learning_rate | 0.0003 | -| loss | 0.031 | -| n_updates | 254300 | -| policy_gradient_loss | 0.0121 | -| std | 0.00623 | -| value_loss | 0.00141 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25432 | -| time_elapsed | 138379 | -| total_timesteps | 3255296 | -| train/ | | -| approx_kl | 0.07831835 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.952 | -| learning_rate | 0.0003 | -| loss | 0.0608 | -| n_updates | 254310 | -| policy_gradient_loss | 0.0257 | -| std | 0.00622 | -| value_loss | 1.92e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25433 | -| time_elapsed | 138385 | -| total_timesteps | 3255424 | -| train/ | | -| approx_kl | 0.052614324 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0415 | -| learning_rate | 0.0003 | -| loss | 0.023 | -| n_updates | 254320 | -| policy_gradient_loss | 0.0117 | -| std | 0.0062 | -| value_loss | 0.000112 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25434 | -| time_elapsed | 138390 | -| total_timesteps | 3255552 | -| train/ | | -| approx_kl | 0.009526232 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 254330 | -| policy_gradient_loss | 0.005 | -| std | 0.0062 | -| value_loss | 3.97e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25435 | -| time_elapsed | 138395 | -| total_timesteps | 3255680 | -| train/ | | -| approx_kl | 0.0738693 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 254340 | -| policy_gradient_loss | 0.0161 | -| std | 0.0062 | -| value_loss | 3.47e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25436 | -| time_elapsed | 138400 | -| total_timesteps | 3255808 | -| train/ | | -| approx_kl | 0.047095306 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.00655 | -| n_updates | 254350 | -| policy_gradient_loss | 0.00509 | -| std | 0.0062 | -| value_loss | 3.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25437 | -| time_elapsed | 138405 | -| total_timesteps | 3255936 | -| train/ | | -| approx_kl | 0.00774688 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.00429 | -| n_updates | 254360 | -| policy_gradient_loss | 0.00728 | -| std | 0.0062 | -| value_loss | 2.14e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25438 | -| time_elapsed | 138410 | -| total_timesteps | 3256064 | -| train/ | | -| approx_kl | 0.0011798926 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.00269 | -| n_updates | 254370 | -| policy_gradient_loss | 0.00658 | -| std | 0.0062 | -| value_loss | 1.54e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25439 | -| time_elapsed | 138418 | -| total_timesteps | 3256192 | -| train/ | | -| approx_kl | 0.012485158 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 254380 | -| policy_gradient_loss | -0.00239 | -| std | 0.0062 | -| value_loss | 0.00164 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25440 | -| time_elapsed | 138422 | -| total_timesteps | 3256320 | -| train/ | | -| approx_kl | 0.009950786 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0147 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 254390 | -| policy_gradient_loss | 0.012 | -| std | 0.0062 | -| value_loss | 7.4e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25441 | -| time_elapsed | 138426 | -| total_timesteps | 3256448 | -| train/ | | -| approx_kl | 0.0037590382 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00871 | -| learning_rate | 0.0003 | -| loss | -0.00129 | -| n_updates | 254400 | -| policy_gradient_loss | 0.0111 | -| std | 0.0062 | -| value_loss | 1.67e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25442 | -| time_elapsed | 138429 | -| total_timesteps | 3256576 | -| train/ | | -| approx_kl | 0.024681317 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 254410 | -| policy_gradient_loss | 0.0196 | -| std | 0.0062 | -| value_loss | 1.36e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25443 | -| time_elapsed | 138434 | -| total_timesteps | 3256704 | -| train/ | | -| approx_kl | 0.123918615 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 254420 | -| policy_gradient_loss | -0.00244 | -| std | 0.00619 | -| value_loss | 9e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25444 | -| time_elapsed | 138439 | -| total_timesteps | 3256832 | -| train/ | | -| approx_kl | 0.01934752 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.094 | -| learning_rate | 0.0003 | -| loss | 0.00738 | -| n_updates | 254430 | -| policy_gradient_loss | 0.00919 | -| std | 0.00618 | -| value_loss | 1.09e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.931 | -| time/ | | -| fps | 23 | -| iterations | 25445 | -| time_elapsed | 138443 | -| total_timesteps | 3256960 | -| train/ | | -| approx_kl | 0.0038942788 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.27 | -| learning_rate | 0.0003 | -| loss | -0.000612 | -| n_updates | 254440 | -| policy_gradient_loss | 0.00746 | -| std | 0.00618 | -| value_loss | 1.82e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25446 | -| time_elapsed | 138448 | -| total_timesteps | 3257088 | -| train/ | | -| approx_kl | 0.077415824 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0896 | -| learning_rate | 0.0003 | -| loss | 0.0423 | -| n_updates | 254450 | -| policy_gradient_loss | 0.0157 | -| std | 0.00618 | -| value_loss | 1.34e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25447 | -| time_elapsed | 138457 | -| total_timesteps | 3257216 | -| train/ | | -| approx_kl | 0.017578822 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -4.86 | -| learning_rate | 0.0003 | -| loss | -0.0275 | -| n_updates | 254460 | -| policy_gradient_loss | -0.00536 | -| std | 0.00617 | -| value_loss | 0.00405 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25448 | -| time_elapsed | 138463 | -| total_timesteps | 3257344 | -| train/ | | -| approx_kl | 0.9860738 | -| clip_fraction | 0.759 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.353 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 254470 | -| policy_gradient_loss | 0.136 | -| std | 0.00618 | -| value_loss | 2.6e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25449 | -| time_elapsed | 138468 | -| total_timesteps | 3257472 | -| train/ | | -| approx_kl | 0.029324228 | -| clip_fraction | 0.177 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00345 | -| learning_rate | 0.0003 | -| loss | -0.00761 | -| n_updates | 254480 | -| policy_gradient_loss | -0.00794 | -| std | 0.00618 | -| value_loss | 5.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25450 | -| time_elapsed | 138473 | -| total_timesteps | 3257600 | -| train/ | | -| approx_kl | 0.017582867 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 254490 | -| policy_gradient_loss | 0.0216 | -| std | 0.00618 | -| value_loss | 4.13e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25451 | -| time_elapsed | 138478 | -| total_timesteps | 3257728 | -| train/ | | -| approx_kl | 0.12893894 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0253 | -| n_updates | 254500 | -| policy_gradient_loss | 0.0182 | -| std | 0.00618 | -| value_loss | 3.43e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25452 | -| time_elapsed | 138484 | -| total_timesteps | 3257856 | -| train/ | | -| approx_kl | 0.0056259925 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 254510 | -| policy_gradient_loss | 0.0117 | -| std | 0.00618 | -| value_loss | 2.57e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 25453 | -| time_elapsed | 138488 | -| total_timesteps | 3257984 | -| train/ | | -| approx_kl | 0.059580922 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 254520 | -| policy_gradient_loss | 0.0196 | -| std | 0.00618 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25454 | -| time_elapsed | 138492 | -| total_timesteps | 3258112 | -| train/ | | -| approx_kl | 0.60148644 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0489 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 254530 | -| policy_gradient_loss | 0.0702 | -| std | 0.00618 | -| value_loss | 1.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25455 | -| time_elapsed | 138503 | -| total_timesteps | 3258240 | -| train/ | | -| approx_kl | 0.017358933 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.476 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 254540 | -| policy_gradient_loss | -0.00377 | -| std | 0.00618 | -| value_loss | 0.00159 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25456 | -| time_elapsed | 138508 | -| total_timesteps | 3258368 | -| train/ | | -| approx_kl | 0.23466381 | -| clip_fraction | 0.522 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -2.56 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 254550 | -| policy_gradient_loss | 0.0607 | -| std | 0.00618 | -| value_loss | 4.83e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25457 | -| time_elapsed | 138512 | -| total_timesteps | 3258496 | -| train/ | | -| approx_kl | 0.07569681 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0686 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 254560 | -| policy_gradient_loss | 0.0048 | -| std | 0.00618 | -| value_loss | 7.14e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25458 | -| time_elapsed | 138517 | -| total_timesteps | 3258624 | -| train/ | | -| approx_kl | 0.03906585 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00169 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 254570 | -| policy_gradient_loss | 0.0138 | -| std | 0.00618 | -| value_loss | 1.73e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25459 | -| time_elapsed | 138521 | -| total_timesteps | 3258752 | -| train/ | | -| approx_kl | 0.0071804835 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0805 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 254580 | -| policy_gradient_loss | 0.00675 | -| std | 0.00617 | -| value_loss | 1.32e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.93 | -| time/ | | -| fps | 23 | -| iterations | 25460 | -| time_elapsed | 138524 | -| total_timesteps | 3258880 | -| train/ | | -| approx_kl | 0.08351463 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 254590 | -| policy_gradient_loss | 0.00905 | -| std | 0.00617 | -| value_loss | 1.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25461 | -| time_elapsed | 138527 | -| total_timesteps | 3259008 | -| train/ | | -| approx_kl | 0.046616152 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.00879 | -| n_updates | 254600 | -| policy_gradient_loss | 0.00583 | -| std | 0.00617 | -| value_loss | 8.43e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25462 | -| time_elapsed | 138538 | -| total_timesteps | 3259136 | -| train/ | | -| approx_kl | 0.017021686 | -| clip_fraction | 0.207 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.789 | -| learning_rate | 0.0003 | -| loss | -0.0241 | -| n_updates | 254610 | -| policy_gradient_loss | -0.0154 | -| std | 0.00617 | -| value_loss | 0.00249 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25463 | -| time_elapsed | 138543 | -| total_timesteps | 3259264 | -| train/ | | -| approx_kl | 0.1299312 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.517 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 254620 | -| policy_gradient_loss | 0.00766 | -| std | 0.00616 | -| value_loss | 3.38e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25464 | -| time_elapsed | 138548 | -| total_timesteps | 3259392 | -| train/ | | -| approx_kl | 0.04436364 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 254630 | -| policy_gradient_loss | 0.0165 | -| std | 0.00616 | -| value_loss | 2.49e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25465 | -| time_elapsed | 138553 | -| total_timesteps | 3259520 | -| train/ | | -| approx_kl | 1.0181396 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.281 | -| n_updates | 254640 | -| policy_gradient_loss | 0.169 | -| std | 0.00616 | -| value_loss | 2.27e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25466 | -| time_elapsed | 138558 | -| total_timesteps | 3259648 | -| train/ | | -| approx_kl | 0.0013947212 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | 0.000545 | -| n_updates | 254650 | -| policy_gradient_loss | 0.00267 | -| std | 0.00616 | -| value_loss | 4.55e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25467 | -| time_elapsed | 138564 | -| total_timesteps | 3259776 | -| train/ | | -| approx_kl | 0.21934569 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0152 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 254660 | -| policy_gradient_loss | 0.0663 | -| std | 0.00617 | -| value_loss | 1.03e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25468 | -| time_elapsed | 138568 | -| total_timesteps | 3259904 | -| train/ | | -| approx_kl | 0.0034115398 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00655 | -| learning_rate | 0.0003 | -| loss | -0.0114 | -| n_updates | 254670 | -| policy_gradient_loss | 0.0902 | -| std | 0.00617 | -| value_loss | 2.34e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25469 | -| time_elapsed | 138573 | -| total_timesteps | 3260032 | -| train/ | | -| approx_kl | 0.13152558 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 254680 | -| policy_gradient_loss | 0.207 | -| std | 0.00617 | -| value_loss | 2.08e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25470 | -| time_elapsed | 138583 | -| total_timesteps | 3260160 | -| train/ | | -| approx_kl | 0.29694295 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.887 | -| learning_rate | 0.0003 | -| loss | 0.00762 | -| n_updates | 254690 | -| policy_gradient_loss | -0.00662 | -| std | 0.00617 | -| value_loss | 0.000462 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25471 | -| time_elapsed | 138589 | -| total_timesteps | 3260288 | -| train/ | | -| approx_kl | 0.006530011 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0183 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 254700 | -| policy_gradient_loss | -0.000926 | -| std | 0.00617 | -| value_loss | 5.89e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25472 | -| time_elapsed | 138594 | -| total_timesteps | 3260416 | -| train/ | | -| approx_kl | 0.00018827291 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00332 | -| learning_rate | 0.0003 | -| loss | 6.04e-05 | -| n_updates | 254710 | -| policy_gradient_loss | 0.0135 | -| std | 0.00617 | -| value_loss | 2.85e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25473 | -| time_elapsed | 138599 | -| total_timesteps | 3260544 | -| train/ | | -| approx_kl | 0.00042715808 | -| clip_fraction | 0.221 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0087 | -| learning_rate | 0.0003 | -| loss | -0.000289 | -| n_updates | 254720 | -| policy_gradient_loss | 0.0163 | -| std | 0.00617 | -| value_loss | 2.13e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25474 | -| time_elapsed | 138604 | -| total_timesteps | 3260672 | -| train/ | | -| approx_kl | 0.0842077 | -| clip_fraction | 0.611 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 254730 | -| policy_gradient_loss | 0.0581 | -| std | 0.00616 | -| value_loss | 9.97e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25475 | -| time_elapsed | 138608 | -| total_timesteps | 3260800 | -| train/ | | -| approx_kl | 0.02656228 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0159 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 254740 | -| policy_gradient_loss | 0.00632 | -| std | 0.00616 | -| value_loss | 3.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.918 | -| time/ | | -| fps | 23 | -| iterations | 25476 | -| time_elapsed | 138613 | -| total_timesteps | 3260928 | -| train/ | | -| approx_kl | 0.18355489 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00725 | -| learning_rate | 0.0003 | -| loss | 0.0765 | -| n_updates | 254750 | -| policy_gradient_loss | 0.0305 | -| std | 0.00616 | -| value_loss | 1.04e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25477 | -| time_elapsed | 138617 | -| total_timesteps | 3261056 | -| train/ | | -| approx_kl | 0.15708067 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0875 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 254760 | -| policy_gradient_loss | 0.0162 | -| std | 0.00617 | -| value_loss | 6.35e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25478 | -| time_elapsed | 138623 | -| total_timesteps | 3261184 | -| train/ | | -| approx_kl | 0.024637172 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0852 | -| learning_rate | 0.0003 | -| loss | -0.0229 | -| n_updates | 254770 | -| policy_gradient_loss | -0.00176 | -| std | 0.00617 | -| value_loss | 0.00186 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25479 | -| time_elapsed | 138629 | -| total_timesteps | 3261312 | -| train/ | | -| approx_kl | 2.0224135e-05 | -| clip_fraction | 0.374 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | -0.000379 | -| n_updates | 254780 | -| policy_gradient_loss | 0.0194 | -| std | 0.00618 | -| value_loss | 9.17e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25480 | -| time_elapsed | 138634 | -| total_timesteps | 3261440 | -| train/ | | -| approx_kl | 0.0015713326 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | -0.00109 | -| n_updates | 254790 | -| policy_gradient_loss | 0.0377 | -| std | 0.00618 | -| value_loss | 2.15e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25481 | -| time_elapsed | 138639 | -| total_timesteps | 3261568 | -| train/ | | -| approx_kl | 0.6266377 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 254800 | -| policy_gradient_loss | 0.0399 | -| std | 0.00619 | -| value_loss | 5.3e-07 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25482 | -| time_elapsed | 138644 | -| total_timesteps | 3261696 | -| train/ | | -| approx_kl | 2.3902394e-06 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | 3.45e-05 | -| n_updates | 254810 | -| policy_gradient_loss | 0.00574 | -| std | 0.00619 | -| value_loss | 1.4e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25483 | -| time_elapsed | 138648 | -| total_timesteps | 3261824 | -| train/ | | -| approx_kl | 0.009875739 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.938 | -| learning_rate | 0.0003 | -| loss | -0.00162 | -| n_updates | 254820 | -| policy_gradient_loss | 0.00579 | -| std | 0.0062 | -| value_loss | 1.87e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 25484 | -| time_elapsed | 138653 | -| total_timesteps | 3261952 | -| train/ | | -| approx_kl | 0.06719801 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 254830 | -| policy_gradient_loss | 0.0258 | -| std | 0.0062 | -| value_loss | 2.87e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25485 | -| time_elapsed | 138657 | -| total_timesteps | 3262080 | -| train/ | | -| approx_kl | 1.3250546 | -| clip_fraction | 0.766 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.4 | -| n_updates | 254840 | -| policy_gradient_loss | 0.202 | -| std | 0.0062 | -| value_loss | 1.9e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25486 | -| time_elapsed | 138668 | -| total_timesteps | 3262208 | -| train/ | | -| approx_kl | 0.07846099 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.978 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 254850 | -| policy_gradient_loss | -0.0135 | -| std | 0.0062 | -| value_loss | 0.000113 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25487 | -| time_elapsed | 138673 | -| total_timesteps | 3262336 | -| train/ | | -| approx_kl | 0.004947315 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00641 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 254860 | -| policy_gradient_loss | 0.02 | -| std | 0.0062 | -| value_loss | 1.54e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25488 | -| time_elapsed | 138678 | -| total_timesteps | 3262464 | -| train/ | | -| approx_kl | 0.012629296 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00939 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 254870 | -| policy_gradient_loss | 0.0338 | -| std | 0.0062 | -| value_loss | 3.16e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25489 | -| time_elapsed | 138683 | -| total_timesteps | 3262592 | -| train/ | | -| approx_kl | 0.05636735 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0562 | -| n_updates | 254880 | -| policy_gradient_loss | 0.0106 | -| std | 0.0062 | -| value_loss | 2.06e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25490 | -| time_elapsed | 138688 | -| total_timesteps | 3262720 | -| train/ | | -| approx_kl | 0.013436604 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.00804 | -| n_updates | 254890 | -| policy_gradient_loss | 0.0174 | -| std | 0.0062 | -| value_loss | 1.15e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25491 | -| time_elapsed | 138693 | -| total_timesteps | 3262848 | -| train/ | | -| approx_kl | 0.24207178 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0474 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 254900 | -| policy_gradient_loss | 0.0193 | -| std | 0.00619 | -| value_loss | 8.98e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 25492 | -| time_elapsed | 138698 | -| total_timesteps | 3262976 | -| train/ | | -| approx_kl | 0.0039357035 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 254910 | -| policy_gradient_loss | 0.0296 | -| std | 0.00619 | -| value_loss | 5.55e-10 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25493 | -| time_elapsed | 138702 | -| total_timesteps | 3263104 | -| train/ | | -| approx_kl | 0.0018274393 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0753 | -| learning_rate | 0.0003 | -| loss | -0.00582 | -| n_updates | 254920 | -| policy_gradient_loss | 0.0252 | -| std | 0.00619 | -| value_loss | 3.6e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25494 | -| time_elapsed | 138714 | -| total_timesteps | 3263232 | -| train/ | | -| approx_kl | 0.029599011 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.694 | -| learning_rate | 0.0003 | -| loss | -0.0269 | -| n_updates | 254930 | -| policy_gradient_loss | -0.0117 | -| std | 0.00619 | -| value_loss | 0.00217 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25495 | -| time_elapsed | 138718 | -| total_timesteps | 3263360 | -| train/ | | -| approx_kl | 0.08133313 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 254940 | -| policy_gradient_loss | 0.0278 | -| std | 0.00619 | -| value_loss | 2.47e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25496 | -| time_elapsed | 138724 | -| total_timesteps | 3263488 | -| train/ | | -| approx_kl | 0.7729294 | -| clip_fraction | 0.556 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 254950 | -| policy_gradient_loss | 0.0512 | -| std | 0.00619 | -| value_loss | 2.76e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25497 | -| time_elapsed | 138729 | -| total_timesteps | 3263616 | -| train/ | | -| approx_kl | 0.0465006 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.0125 | -| n_updates | 254960 | -| policy_gradient_loss | 0.00812 | -| std | 0.0062 | -| value_loss | 2.23e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25498 | -| time_elapsed | 138734 | -| total_timesteps | 3263744 | -| train/ | | -| approx_kl | 0.047644928 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.03 | -| learning_rate | 0.0003 | -| loss | 0.00788 | -| n_updates | 254970 | -| policy_gradient_loss | 0.00302 | -| std | 0.0062 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25499 | -| time_elapsed | 138738 | -| total_timesteps | 3263872 | -| train/ | | -| approx_kl | 0.053190447 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0291 | -| learning_rate | 0.0003 | -| loss | 0.0199 | -| n_updates | 254980 | -| policy_gradient_loss | 0.00973 | -| std | 0.0062 | -| value_loss | 1.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25500 | -| time_elapsed | 138743 | -| total_timesteps | 3264000 | -| train/ | | -| approx_kl | 0.058956333 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | 0.0261 | -| n_updates | 254990 | -| policy_gradient_loss | 0.0124 | -| std | 0.0062 | -| value_loss | 7.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25501 | -| time_elapsed | 138748 | -| total_timesteps | 3264128 | -| train/ | | -| approx_kl | 0.060705043 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00554 | -| learning_rate | 0.0003 | -| loss | 0.0379 | -| n_updates | 255000 | -| policy_gradient_loss | 0.0183 | -| std | 0.0062 | -| value_loss | 3.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25502 | -| time_elapsed | 138759 | -| total_timesteps | 3264256 | -| train/ | | -| approx_kl | 0.005123736 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.771 | -| learning_rate | 0.0003 | -| loss | -0.00344 | -| n_updates | 255010 | -| policy_gradient_loss | 0.000851 | -| std | 0.00619 | -| value_loss | 0.00218 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25503 | -| time_elapsed | 138764 | -| total_timesteps | 3264384 | -| train/ | | -| approx_kl | 0.0040726773 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.072 | -| learning_rate | 0.0003 | -| loss | -0.00148 | -| n_updates | 255020 | -| policy_gradient_loss | 0.00781 | -| std | 0.00619 | -| value_loss | 1.85e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25504 | -| time_elapsed | 138769 | -| total_timesteps | 3264512 | -| train/ | | -| approx_kl | 0.099379234 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0114 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 255030 | -| policy_gradient_loss | 0.00137 | -| std | 0.0062 | -| value_loss | 3.98e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25505 | -| time_elapsed | 138774 | -| total_timesteps | 3264640 | -| train/ | | -| approx_kl | 0.22025672 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 255040 | -| policy_gradient_loss | 0.0419 | -| std | 0.0062 | -| value_loss | 7.23e-08 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25506 | -| time_elapsed | 138780 | -| total_timesteps | 3264768 | -| train/ | | -| approx_kl | 0.654146 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0463 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 255050 | -| policy_gradient_loss | 0.0503 | -| std | 0.0062 | -| value_loss | 5.99e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25507 | -| time_elapsed | 138784 | -| total_timesteps | 3264896 | -| train/ | | -| approx_kl | 0.011758696 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.00135 | -| n_updates | 255060 | -| policy_gradient_loss | 0.00553 | -| std | 0.0062 | -| value_loss | 3.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25508 | -| time_elapsed | 138789 | -| total_timesteps | 3265024 | -| train/ | | -| approx_kl | 0.063438274 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0881 | -| learning_rate | 0.0003 | -| loss | 0.0585 | -| n_updates | 255070 | -| policy_gradient_loss | 0.0244 | -| std | 0.00619 | -| value_loss | 1.96e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25509 | -| time_elapsed | 138799 | -| total_timesteps | 3265152 | -| train/ | | -| approx_kl | 0.033827256 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.947 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 255080 | -| policy_gradient_loss | -0.00742 | -| std | 0.00618 | -| value_loss | 0.000597 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25510 | -| time_elapsed | 138802 | -| total_timesteps | 3265280 | -| train/ | | -| approx_kl | 0.062313654 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.963 | -| learning_rate | 0.0003 | -| loss | 0.00984 | -| n_updates | 255090 | -| policy_gradient_loss | 0.00546 | -| std | 0.00617 | -| value_loss | 7.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25511 | -| time_elapsed | 138807 | -| total_timesteps | 3265408 | -| train/ | | -| approx_kl | 0.020339876 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00816 | -| learning_rate | 0.0003 | -| loss | -0.00776 | -| n_updates | 255100 | -| policy_gradient_loss | 0.074 | -| std | 0.00617 | -| value_loss | 9.47e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25512 | -| time_elapsed | 138812 | -| total_timesteps | 3265536 | -| train/ | | -| approx_kl | 0.014684228 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0138 | -| learning_rate | 0.0003 | -| loss | -0.00847 | -| n_updates | 255110 | -| policy_gradient_loss | 0.0163 | -| std | 0.00617 | -| value_loss | 7.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25513 | -| time_elapsed | 138817 | -| total_timesteps | 3265664 | -| train/ | | -| approx_kl | 0.14926875 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.071 | -| n_updates | 255120 | -| policy_gradient_loss | 0.0118 | -| std | 0.00617 | -| value_loss | 3.83e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25514 | -| time_elapsed | 138821 | -| total_timesteps | 3265792 | -| train/ | | -| approx_kl | 0.007205126 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0479 | -| learning_rate | 0.0003 | -| loss | 0.00498 | -| n_updates | 255130 | -| policy_gradient_loss | 0.0227 | -| std | 0.00616 | -| value_loss | 2.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25515 | -| time_elapsed | 138826 | -| total_timesteps | 3265920 | -| train/ | | -| approx_kl | 0.016499303 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0789 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 255140 | -| policy_gradient_loss | 0.0194 | -| std | 0.00616 | -| value_loss | 1.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25516 | -| time_elapsed | 138831 | -| total_timesteps | 3266048 | -| train/ | | -| approx_kl | 0.11461153 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.0581 | -| n_updates | 255150 | -| policy_gradient_loss | 0.0303 | -| std | 0.00616 | -| value_loss | 1.08e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25517 | -| time_elapsed | 138840 | -| total_timesteps | 3266176 | -| train/ | | -| approx_kl | 0.10448607 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.963 | -| learning_rate | 0.0003 | -| loss | 0.00677 | -| n_updates | 255160 | -| policy_gradient_loss | 0.0161 | -| std | 0.00616 | -| value_loss | 0.000174 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25518 | -| time_elapsed | 138845 | -| total_timesteps | 3266304 | -| train/ | | -| approx_kl | 0.9479512 | -| clip_fraction | 0.78 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.905 | -| learning_rate | 0.0003 | -| loss | 0.253 | -| n_updates | 255170 | -| policy_gradient_loss | 0.107 | -| std | 0.00616 | -| value_loss | 9.98e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25519 | -| time_elapsed | 138850 | -| total_timesteps | 3266432 | -| train/ | | -| approx_kl | 0.026536655 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.873 | -| learning_rate | 0.0003 | -| loss | 0.0203 | -| n_updates | 255180 | -| policy_gradient_loss | 0.016 | -| std | 0.00613 | -| value_loss | 7.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25520 | -| time_elapsed | 138855 | -| total_timesteps | 3266560 | -| train/ | | -| approx_kl | 0.20624976 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -1.93 | -| learning_rate | 0.0003 | -| loss | 0.099 | -| n_updates | 255190 | -| policy_gradient_loss | 0.12 | -| std | 0.00611 | -| value_loss | 4.51e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25521 | -| time_elapsed | 138859 | -| total_timesteps | 3266688 | -| train/ | | -| approx_kl | 0.18308851 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0735 | -| learning_rate | 0.0003 | -| loss | 0.237 | -| n_updates | 255200 | -| policy_gradient_loss | 0.159 | -| std | 0.0061 | -| value_loss | 6.82e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25522 | -| time_elapsed | 138863 | -| total_timesteps | 3266816 | -| train/ | | -| approx_kl | 0.1656159 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00778 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 255210 | -| policy_gradient_loss | 0.108 | -| std | 0.00609 | -| value_loss | 3.19e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.889 | -| time/ | | -| fps | 23 | -| iterations | 25523 | -| time_elapsed | 138867 | -| total_timesteps | 3266944 | -| train/ | | -| approx_kl | 0.15767704 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.014 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 255220 | -| policy_gradient_loss | 0.186 | -| std | 0.00609 | -| value_loss | 2.18e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25524 | -| time_elapsed | 138873 | -| total_timesteps | 3267072 | -| train/ | | -| approx_kl | 0.1253566 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.0687 | -| n_updates | 255230 | -| policy_gradient_loss | 0.077 | -| std | 0.0061 | -| value_loss | 9.93e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25525 | -| time_elapsed | 138881 | -| total_timesteps | 3267200 | -| train/ | | -| approx_kl | 0.030854732 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | 0.00437 | -| n_updates | 255240 | -| policy_gradient_loss | 0.0325 | -| std | 0.0061 | -| value_loss | 0.00305 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25526 | -| time_elapsed | 138886 | -| total_timesteps | 3267328 | -| train/ | | -| approx_kl | 0.0023086816 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.299 | -| learning_rate | 0.0003 | -| loss | 0.000295 | -| n_updates | 255250 | -| policy_gradient_loss | 0.0353 | -| std | 0.00611 | -| value_loss | 1.55e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25527 | -| time_elapsed | 138891 | -| total_timesteps | 3267456 | -| train/ | | -| approx_kl | 0.0032697348 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -2.65 | -| learning_rate | 0.0003 | -| loss | -0.000511 | -| n_updates | 255260 | -| policy_gradient_loss | 0.0116 | -| std | 0.00614 | -| value_loss | 0.00246 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25528 | -| time_elapsed | 138894 | -| total_timesteps | 3267584 | -| train/ | | -| approx_kl | 5.9669837e-06 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.24 | -| learning_rate | 0.0003 | -| loss | 0.000197 | -| n_updates | 255270 | -| policy_gradient_loss | 0.0158 | -| std | 0.00615 | -| value_loss | 0.000158 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25529 | -| time_elapsed | 138898 | -| total_timesteps | 3267712 | -| train/ | | -| approx_kl | 0.068554886 | -| clip_fraction | 0.606 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | 0.0186 | -| n_updates | 255280 | -| policy_gradient_loss | 0.0511 | -| std | 0.00615 | -| value_loss | 0.000137 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25530 | -| time_elapsed | 138902 | -| total_timesteps | 3267840 | -| train/ | | -| approx_kl | 0.25436974 | -| clip_fraction | 0.432 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0157 | -| learning_rate | 0.0003 | -| loss | 0.107 | -| n_updates | 255290 | -| policy_gradient_loss | 0.0429 | -| std | 0.00615 | -| value_loss | 3.96e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25531 | -| time_elapsed | 138907 | -| total_timesteps | 3267968 | -| train/ | | -| approx_kl | 0.0015366906 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 255300 | -| policy_gradient_loss | 0.00953 | -| std | 0.00615 | -| value_loss | 2.39e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25532 | -| time_elapsed | 138912 | -| total_timesteps | 3268096 | -| train/ | | -| approx_kl | 0.095514454 | -| clip_fraction | 0.596 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 255310 | -| policy_gradient_loss | 0.0491 | -| std | 0.00615 | -| value_loss | 1.7e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25533 | -| time_elapsed | 138918 | -| total_timesteps | 3268224 | -| train/ | | -| approx_kl | 0.005764998 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | -0.0148 | -| n_updates | 255320 | -| policy_gradient_loss | 0.00859 | -| std | 0.00615 | -| value_loss | 0.00032 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25534 | -| time_elapsed | 138923 | -| total_timesteps | 3268352 | -| train/ | | -| approx_kl | 0.046893455 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0885 | -| learning_rate | 0.0003 | -| loss | 0.0195 | -| n_updates | 255330 | -| policy_gradient_loss | 0.0539 | -| std | 0.00615 | -| value_loss | 5.78e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25535 | -| time_elapsed | 138927 | -| total_timesteps | 3268480 | -| train/ | | -| approx_kl | 0.18473518 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 255340 | -| policy_gradient_loss | 0.0589 | -| std | 0.00615 | -| value_loss | 3.53e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25536 | -| time_elapsed | 138931 | -| total_timesteps | 3268608 | -| train/ | | -| approx_kl | 0.0040217405 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | -0.0165 | -| n_updates | 255350 | -| policy_gradient_loss | 0.00103 | -| std | 0.00615 | -| value_loss | 3.55e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25537 | -| time_elapsed | 138937 | -| total_timesteps | 3268736 | -| train/ | | -| approx_kl | 0.09723023 | -| clip_fraction | 0.595 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0244 | -| learning_rate | 0.0003 | -| loss | 0.0426 | -| n_updates | 255360 | -| policy_gradient_loss | 0.0746 | -| std | 0.00615 | -| value_loss | 2.88e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25538 | -| time_elapsed | 138942 | -| total_timesteps | 3268864 | -| train/ | | -| approx_kl | 2.747029e-05 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | -0.0005 | -| n_updates | 255370 | -| policy_gradient_loss | 0.117 | -| std | 0.00615 | -| value_loss | 2.03e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.884 | -| time/ | | -| fps | 23 | -| iterations | 25539 | -| time_elapsed | 138947 | -| total_timesteps | 3268992 | -| train/ | | -| approx_kl | 0.027596721 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0834 | -| learning_rate | 0.0003 | -| loss | 0.0178 | -| n_updates | 255380 | -| policy_gradient_loss | 0.0297 | -| std | 0.00615 | -| value_loss | 8.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25540 | -| time_elapsed | 138951 | -| total_timesteps | 3269120 | -| train/ | | -| approx_kl | 0.41714716 | -| clip_fraction | 0.746 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | 0.242 | -| n_updates | 255390 | -| policy_gradient_loss | 0.212 | -| std | 0.00615 | -| value_loss | 6.14e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25541 | -| time_elapsed | 138964 | -| total_timesteps | 3269248 | -| train/ | | -| approx_kl | 0.020395448 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.928 | -| learning_rate | 0.0003 | -| loss | -0.00396 | -| n_updates | 255400 | -| policy_gradient_loss | 0.0233 | -| std | 0.00615 | -| value_loss | 0.000582 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25542 | -| time_elapsed | 138967 | -| total_timesteps | 3269376 | -| train/ | | -| approx_kl | 0.20403121 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -12.8 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 255410 | -| policy_gradient_loss | 0.00551 | -| std | 0.00615 | -| value_loss | 5.08e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25543 | -| time_elapsed | 138972 | -| total_timesteps | 3269504 | -| train/ | | -| approx_kl | 0.021197826 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.724 | -| learning_rate | 0.0003 | -| loss | -0.00915 | -| n_updates | 255420 | -| policy_gradient_loss | 0.02 | -| std | 0.00615 | -| value_loss | 1.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25544 | -| time_elapsed | 138976 | -| total_timesteps | 3269632 | -| train/ | | -| approx_kl | 0.14915395 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 6.56e-06 | -| learning_rate | 0.0003 | -| loss | 0.0909 | -| n_updates | 255430 | -| policy_gradient_loss | 0.0431 | -| std | 0.00616 | -| value_loss | 6.01e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25545 | -| time_elapsed | 138981 | -| total_timesteps | 3269760 | -| train/ | | -| approx_kl | 0.17005081 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0585 | -| n_updates | 255440 | -| policy_gradient_loss | 0.0249 | -| std | 0.00616 | -| value_loss | 3.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.882 | -| time/ | | -| fps | 23 | -| iterations | 25546 | -| time_elapsed | 138984 | -| total_timesteps | 3269888 | -| train/ | | -| approx_kl | 0.012623717 | -| clip_fraction | 0.109 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.065 | -| learning_rate | 0.0003 | -| loss | -0.000875 | -| n_updates | 255450 | -| policy_gradient_loss | -0.000269 | -| std | 0.00616 | -| value_loss | 1.93e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25547 | -| time_elapsed | 138989 | -| total_timesteps | 3270016 | -| train/ | | -| approx_kl | 0.014128375 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0798 | -| learning_rate | 0.0003 | -| loss | 0.00611 | -| n_updates | 255460 | -| policy_gradient_loss | 0.00314 | -| std | 0.00617 | -| value_loss | 1.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25548 | -| time_elapsed | 139000 | -| total_timesteps | 3270144 | -| train/ | | -| approx_kl | 0.28832677 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.657 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 255470 | -| policy_gradient_loss | 0.00187 | -| std | 0.00617 | -| value_loss | 0.000907 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25549 | -| time_elapsed | 139005 | -| total_timesteps | 3270272 | -| train/ | | -| approx_kl | 0.00863494 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0276 | -| learning_rate | 0.0003 | -| loss | 0.00715 | -| n_updates | 255480 | -| policy_gradient_loss | 0.0317 | -| std | 0.00617 | -| value_loss | 6e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25550 | -| time_elapsed | 139010 | -| total_timesteps | 3270400 | -| train/ | | -| approx_kl | 0.6040381 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.525 | -| learning_rate | 0.0003 | -| loss | 0.24 | -| n_updates | 255490 | -| policy_gradient_loss | 0.148 | -| std | 0.00617 | -| value_loss | 5.88e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25551 | -| time_elapsed | 139012 | -| total_timesteps | 3270528 | -| train/ | | -| approx_kl | 0.06704827 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00561 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 255500 | -| policy_gradient_loss | 0.0265 | -| std | 0.00617 | -| value_loss | 1.1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25552 | -| time_elapsed | 139015 | -| total_timesteps | 3270656 | -| train/ | | -| approx_kl | 0.03802865 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | -0.029 | -| n_updates | 255510 | -| policy_gradient_loss | -0.0109 | -| std | 0.00617 | -| value_loss | 4.35e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25553 | -| time_elapsed | 139019 | -| total_timesteps | 3270784 | -| train/ | | -| approx_kl | 0.02263691 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 255520 | -| policy_gradient_loss | 0.0214 | -| std | 0.00617 | -| value_loss | 3.2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.888 | -| time/ | | -| fps | 23 | -| iterations | 25554 | -| time_elapsed | 139024 | -| total_timesteps | 3270912 | -| train/ | | -| approx_kl | 0.083884194 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 255530 | -| policy_gradient_loss | 0.0272 | -| std | 0.00617 | -| value_loss | 2.58e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25555 | -| time_elapsed | 139028 | -| total_timesteps | 3271040 | -| train/ | | -| approx_kl | 0.2732871 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 255540 | -| policy_gradient_loss | 0.0381 | -| std | 0.00617 | -| value_loss | 1.99e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25556 | -| time_elapsed | 139039 | -| total_timesteps | 3271168 | -| train/ | | -| approx_kl | 0.40270576 | -| clip_fraction | 0.54 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 255550 | -| policy_gradient_loss | 0.0493 | -| std | 0.00617 | -| value_loss | 0.00614 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25557 | -| time_elapsed | 139044 | -| total_timesteps | 3271296 | -| train/ | | -| approx_kl | 0.29048407 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.455 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 255560 | -| policy_gradient_loss | 0.0506 | -| std | 0.00617 | -| value_loss | 1.52e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25558 | -| time_elapsed | 139047 | -| total_timesteps | 3271424 | -| train/ | | -| approx_kl | 0.0006552418 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | 0.000491 | -| n_updates | 255570 | -| policy_gradient_loss | 0.0322 | -| std | 0.00616 | -| value_loss | 2.37e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25559 | -| time_elapsed | 139051 | -| total_timesteps | 3271552 | -| train/ | | -| approx_kl | 0.21630955 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | 0.0561 | -| n_updates | 255580 | -| policy_gradient_loss | 0.0139 | -| std | 0.00616 | -| value_loss | 8.64e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25560 | -| time_elapsed | 139056 | -| total_timesteps | 3271680 | -| train/ | | -| approx_kl | 0.024375582 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | -0.000269 | -| n_updates | 255590 | -| policy_gradient_loss | -0.00237 | -| std | 0.00616 | -| value_loss | 5.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25561 | -| time_elapsed | 139061 | -| total_timesteps | 3271808 | -| train/ | | -| approx_kl | 0.031302195 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 255600 | -| policy_gradient_loss | 0.0264 | -| std | 0.00616 | -| value_loss | 5.48e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.885 | -| time/ | | -| fps | 23 | -| iterations | 25562 | -| time_elapsed | 139065 | -| total_timesteps | 3271936 | -| train/ | | -| approx_kl | 0.017802445 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 255610 | -| policy_gradient_loss | 0.033 | -| std | 0.00618 | -| value_loss | 1.32e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25563 | -| time_elapsed | 139070 | -| total_timesteps | 3272064 | -| train/ | | -| approx_kl | 0.06175491 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -48 | -| learning_rate | 0.0003 | -| loss | 0.00441 | -| n_updates | 255620 | -| policy_gradient_loss | 0.0137 | -| std | 0.00619 | -| value_loss | 8.65e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25564 | -| time_elapsed | 139080 | -| total_timesteps | 3272192 | -| train/ | | -| approx_kl | 0.5332309 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.972 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 255630 | -| policy_gradient_loss | 0.158 | -| std | 0.00619 | -| value_loss | 0.000191 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25565 | -| time_elapsed | 139084 | -| total_timesteps | 3272320 | -| train/ | | -| approx_kl | 0.0686282 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 255640 | -| policy_gradient_loss | 0.0302 | -| std | 0.0062 | -| value_loss | 4.68e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25566 | -| time_elapsed | 139088 | -| total_timesteps | 3272448 | -| train/ | | -| approx_kl | 0.17718273 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00237 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 255650 | -| policy_gradient_loss | 0.0327 | -| std | 0.0062 | -| value_loss | 2.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25567 | -| time_elapsed | 139093 | -| total_timesteps | 3272576 | -| train/ | | -| approx_kl | 0.01800564 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.272 | -| learning_rate | 0.0003 | -| loss | -0.0179 | -| n_updates | 255660 | -| policy_gradient_loss | -0.0095 | -| std | 0.0062 | -| value_loss | 3.33e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25568 | -| time_elapsed | 139097 | -| total_timesteps | 3272704 | -| train/ | | -| approx_kl | 0.025656322 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0769 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 255670 | -| policy_gradient_loss | 0.0197 | -| std | 0.0062 | -| value_loss | 2.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25569 | -| time_elapsed | 139103 | -| total_timesteps | 3272832 | -| train/ | | -| approx_kl | 0.12251035 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0757 | -| n_updates | 255680 | -| policy_gradient_loss | 0.0363 | -| std | 0.0062 | -| value_loss | 1.98e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.895 | -| time/ | | -| fps | 23 | -| iterations | 25570 | -| time_elapsed | 139108 | -| total_timesteps | 3272960 | -| train/ | | -| approx_kl | 0.00022373162 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0378 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 255690 | -| policy_gradient_loss | 0.0357 | -| std | 0.0062 | -| value_loss | 1.57e-08 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25571 | -| time_elapsed | 139114 | -| total_timesteps | 3273088 | -| train/ | | -| approx_kl | 0.0006692838 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | 0.00268 | -| n_updates | 255700 | -| policy_gradient_loss | 0.0356 | -| std | 0.0062 | -| value_loss | 1.21e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25572 | -| time_elapsed | 139121 | -| total_timesteps | 3273216 | -| train/ | | -| approx_kl | 0.07233336 | -| clip_fraction | 0.18 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 255710 | -| policy_gradient_loss | -0.0155 | -| std | 0.0062 | -| value_loss | 0.00544 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25573 | -| time_elapsed | 139126 | -| total_timesteps | 3273344 | -| train/ | | -| approx_kl | 0.027024776 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.291 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 255720 | -| policy_gradient_loss | 0.0248 | -| std | 0.00621 | -| value_loss | 4.03e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25574 | -| time_elapsed | 139129 | -| total_timesteps | 3273472 | -| train/ | | -| approx_kl | 0.08984735 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.85 | -| learning_rate | 0.0003 | -| loss | 0.0658 | -| n_updates | 255730 | -| policy_gradient_loss | 0.0209 | -| std | 0.00621 | -| value_loss | 5.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25575 | -| time_elapsed | 139133 | -| total_timesteps | 3273600 | -| train/ | | -| approx_kl | 0.008515047 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | -0.000398 | -| n_updates | 255740 | -| policy_gradient_loss | 0.000743 | -| std | 0.00621 | -| value_loss | 1.68e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25576 | -| time_elapsed | 139137 | -| total_timesteps | 3273728 | -| train/ | | -| approx_kl | 0.013236351 | -| clip_fraction | 0.1 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.00792 | -| n_updates | 255750 | -| policy_gradient_loss | 0.00463 | -| std | 0.00621 | -| value_loss | 3.73e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25577 | -| time_elapsed | 139140 | -| total_timesteps | 3273856 | -| train/ | | -| approx_kl | 0.03208217 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0771 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 255760 | -| policy_gradient_loss | 0.0371 | -| std | 0.00622 | -| value_loss | 2.33e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.893 | -| time/ | | -| fps | 23 | -| iterations | 25578 | -| time_elapsed | 139144 | -| total_timesteps | 3273984 | -| train/ | | -| approx_kl | 0.3137576 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0294 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 255770 | -| policy_gradient_loss | 0.138 | -| std | 0.00622 | -| value_loss | 2.13e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25579 | -| time_elapsed | 139148 | -| total_timesteps | 3274112 | -| train/ | | -| approx_kl | 0.06004805 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 255780 | -| policy_gradient_loss | 0.03 | -| std | 0.00621 | -| value_loss | 1.08e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25580 | -| time_elapsed | 139157 | -| total_timesteps | 3274240 | -| train/ | | -| approx_kl | 0.018485961 | -| clip_fraction | 0.15 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.882 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 255790 | -| policy_gradient_loss | -0.00787 | -| std | 0.00621 | -| value_loss | 0.00067 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25581 | -| time_elapsed | 139163 | -| total_timesteps | 3274368 | -| train/ | | -| approx_kl | 0.00961045 | -| clip_fraction | 0.0938 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | -0.00329 | -| n_updates | 255800 | -| policy_gradient_loss | -0.000806 | -| std | 0.00621 | -| value_loss | 1.55e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25582 | -| time_elapsed | 139168 | -| total_timesteps | 3274496 | -| train/ | | -| approx_kl | 0.02901806 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0109 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 255810 | -| policy_gradient_loss | 0.0198 | -| std | 0.00621 | -| value_loss | 2.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25583 | -| time_elapsed | 139172 | -| total_timesteps | 3274624 | -| train/ | | -| approx_kl | 0.116504565 | -| clip_fraction | 0.322 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | 0.0406 | -| n_updates | 255820 | -| policy_gradient_loss | 0.0237 | -| std | 0.00621 | -| value_loss | 1.71e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25584 | -| time_elapsed | 139175 | -| total_timesteps | 3274752 | -| train/ | | -| approx_kl | 0.00029015122 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0247 | -| learning_rate | 0.0003 | -| loss | -0.000204 | -| n_updates | 255830 | -| policy_gradient_loss | 0.0392 | -| std | 0.00621 | -| value_loss | 7.43e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25585 | -| time_elapsed | 139180 | -| total_timesteps | 3274880 | -| train/ | | -| approx_kl | 0.28588438 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0791 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 255840 | -| policy_gradient_loss | 0.0393 | -| std | 0.00621 | -| value_loss | 7.67e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25586 | -| time_elapsed | 139185 | -| total_timesteps | 3275008 | -| train/ | | -| approx_kl | 0.01793256 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0391 | -| learning_rate | 0.0003 | -| loss | 0.00613 | -| n_updates | 255850 | -| policy_gradient_loss | 0.00229 | -| std | 0.0062 | -| value_loss | 4.26e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25587 | -| time_elapsed | 139195 | -| total_timesteps | 3275136 | -| train/ | | -| approx_kl | 0.6794714 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.836 | -| learning_rate | 0.0003 | -| loss | 0.0819 | -| n_updates | 255860 | -| policy_gradient_loss | 0.0104 | -| std | 0.0062 | -| value_loss | 0.00329 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25588 | -| time_elapsed | 139199 | -| total_timesteps | 3275264 | -| train/ | | -| approx_kl | 0.024871973 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.298 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 255870 | -| policy_gradient_loss | -0.00102 | -| std | 0.0062 | -| value_loss | 0.000142 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25589 | -| time_elapsed | 139203 | -| total_timesteps | 3275392 | -| train/ | | -| approx_kl | 0.08744714 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.0509 | -| n_updates | 255880 | -| policy_gradient_loss | 0.0231 | -| std | 0.0062 | -| value_loss | 1.46e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25590 | -| time_elapsed | 139208 | -| total_timesteps | 3275520 | -| train/ | | -| approx_kl | 0.0106472885 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00464 | -| learning_rate | 0.0003 | -| loss | 0.000992 | -| n_updates | 255890 | -| policy_gradient_loss | 0.00843 | -| std | 0.0062 | -| value_loss | 4.55e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25591 | -| time_elapsed | 139212 | -| total_timesteps | 3275648 | -| train/ | | -| approx_kl | 0.0026625944 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | -0.00432 | -| n_updates | 255900 | -| policy_gradient_loss | 0.0104 | -| std | 0.0062 | -| value_loss | 2.61e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25592 | -| time_elapsed | 139217 | -| total_timesteps | 3275776 | -| train/ | | -| approx_kl | 6.8447553e-06 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.053 | -| learning_rate | 0.0003 | -| loss | 0.000101 | -| n_updates | 255910 | -| policy_gradient_loss | 0.0414 | -| std | 0.0062 | -| value_loss | 1.61e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25593 | -| time_elapsed | 139222 | -| total_timesteps | 3275904 | -| train/ | | -| approx_kl | 0.9509137 | -| clip_fraction | 0.766 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0634 | -| learning_rate | 0.0003 | -| loss | 0.344 | -| n_updates | 255920 | -| policy_gradient_loss | 0.216 | -| std | 0.0062 | -| value_loss | 1.31e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25594 | -| time_elapsed | 139227 | -| total_timesteps | 3276032 | -| train/ | | -| approx_kl | 0.014471261 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 255930 | -| policy_gradient_loss | 0.0225 | -| std | 0.0062 | -| value_loss | 1.13e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25595 | -| time_elapsed | 139237 | -| total_timesteps | 3276160 | -| train/ | | -| approx_kl | 0.3580007 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0974 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 255940 | -| policy_gradient_loss | 0.0229 | -| std | 0.0062 | -| value_loss | 0.00203 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25596 | -| time_elapsed | 139241 | -| total_timesteps | 3276288 | -| train/ | | -| approx_kl | 0.114935875 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | 0.0653 | -| n_updates | 255950 | -| policy_gradient_loss | 0.0512 | -| std | 0.0062 | -| value_loss | 1.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25597 | -| time_elapsed | 139247 | -| total_timesteps | 3276416 | -| train/ | | -| approx_kl | 0.37773123 | -| clip_fraction | 0.746 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | 0.149 | -| n_updates | 255960 | -| policy_gradient_loss | 0.126 | -| std | 0.0062 | -| value_loss | 2.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25598 | -| time_elapsed | 139252 | -| total_timesteps | 3276544 | -| train/ | | -| approx_kl | 0.23640719 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 255970 | -| policy_gradient_loss | 0.136 | -| std | 0.0062 | -| value_loss | 7.52e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25599 | -| time_elapsed | 139256 | -| total_timesteps | 3276672 | -| train/ | | -| approx_kl | 0.0379531 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 255980 | -| policy_gradient_loss | 0.0226 | -| std | 0.0062 | -| value_loss | 5.04e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25600 | -| time_elapsed | 139260 | -| total_timesteps | 3276800 | -| train/ | | -| approx_kl | 0.73039055 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.233 | -| n_updates | 255990 | -| policy_gradient_loss | 0.0654 | -| std | 0.0062 | -| value_loss | 3.65e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25601 | -| time_elapsed | 139266 | -| total_timesteps | 3276928 | -| train/ | | -| approx_kl | 0.05440378 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 256000 | -| policy_gradient_loss | 0.0179 | -| std | 0.00621 | -| value_loss | 2.57e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25602 | -| time_elapsed | 139270 | -| total_timesteps | 3277056 | -| train/ | | -| approx_kl | 0.054934666 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0326 | -| n_updates | 256010 | -| policy_gradient_loss | 0.0153 | -| std | 0.0062 | -| value_loss | 1.27e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25603 | -| time_elapsed | 139280 | -| total_timesteps | 3277184 | -| train/ | | -| approx_kl | 0.010266768 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.919 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 256020 | -| policy_gradient_loss | 0.00839 | -| std | 0.0062 | -| value_loss | 0.00119 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25604 | -| time_elapsed | 139284 | -| total_timesteps | 3277312 | -| train/ | | -| approx_kl | 0.13503462 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.266 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 256030 | -| policy_gradient_loss | 0.0741 | -| std | 0.0062 | -| value_loss | 3.54e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25605 | -| time_elapsed | 139289 | -| total_timesteps | 3277440 | -| train/ | | -| approx_kl | 0.04157848 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0099 | -| n_updates | 256040 | -| policy_gradient_loss | 0.0414 | -| std | 0.0062 | -| value_loss | 9.39e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25606 | -| time_elapsed | 139295 | -| total_timesteps | 3277568 | -| train/ | | -| approx_kl | 1.1344014 | -| clip_fraction | 0.781 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00864 | -| learning_rate | 0.0003 | -| loss | 0.393 | -| n_updates | 256050 | -| policy_gradient_loss | 0.232 | -| std | 0.0062 | -| value_loss | 1.02e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25607 | -| time_elapsed | 139299 | -| total_timesteps | 3277696 | -| train/ | | -| approx_kl | 0.008831411 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.351 | -| learning_rate | 0.0003 | -| loss | -0.00397 | -| n_updates | 256060 | -| policy_gradient_loss | 0.0239 | -| std | 0.0062 | -| value_loss | 1.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25608 | -| time_elapsed | 139303 | -| total_timesteps | 3277824 | -| train/ | | -| approx_kl | 0.11880199 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.0636 | -| n_updates | 256070 | -| policy_gradient_loss | 0.0356 | -| std | 0.0062 | -| value_loss | 8.91e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.894 | -| time/ | | -| fps | 23 | -| iterations | 25609 | -| time_elapsed | 139308 | -| total_timesteps | 3277952 | -| train/ | | -| approx_kl | 0.0072540715 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 256080 | -| policy_gradient_loss | 0.0125 | -| std | 0.0062 | -| value_loss | 7.58e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25610 | -| time_elapsed | 139310 | -| total_timesteps | 3278080 | -| train/ | | -| approx_kl | 0.06830027 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.141 | -| learning_rate | 0.0003 | -| loss | 0.00583 | -| n_updates | 256090 | -| policy_gradient_loss | 0.023 | -| std | 0.0062 | -| value_loss | 2.65e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25611 | -| time_elapsed | 139319 | -| total_timesteps | 3278208 | -| train/ | | -| approx_kl | 0.38538325 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.32 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 256100 | -| policy_gradient_loss | 0.0127 | -| std | 0.0062 | -| value_loss | 0.00154 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25612 | -| time_elapsed | 139324 | -| total_timesteps | 3278336 | -| train/ | | -| approx_kl | 0.034700118 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.14 | -| learning_rate | 0.0003 | -| loss | 0.00482 | -| n_updates | 256110 | -| policy_gradient_loss | 0.0492 | -| std | 0.0062 | -| value_loss | 1.45e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25613 | -| time_elapsed | 139329 | -| total_timesteps | 3278464 | -| train/ | | -| approx_kl | 0.16434313 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0832 | -| learning_rate | 0.0003 | -| loss | 0.129 | -| n_updates | 256120 | -| policy_gradient_loss | 0.0782 | -| std | 0.0062 | -| value_loss | 2.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25614 | -| time_elapsed | 139334 | -| total_timesteps | 3278592 | -| train/ | | -| approx_kl | 0.043730803 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00189 | -| learning_rate | 0.0003 | -| loss | 0.0054 | -| n_updates | 256130 | -| policy_gradient_loss | 0.0215 | -| std | 0.0062 | -| value_loss | 7.23e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25615 | -| time_elapsed | 139337 | -| total_timesteps | 3278720 | -| train/ | | -| approx_kl | 0.12441298 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 256140 | -| policy_gradient_loss | 0.0543 | -| std | 0.0062 | -| value_loss | 5.37e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25616 | -| time_elapsed | 139343 | -| total_timesteps | 3278848 | -| train/ | | -| approx_kl | 0.054789424 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.0106 | -| n_updates | 256150 | -| policy_gradient_loss | 0.0368 | -| std | 0.0062 | -| value_loss | 4.56e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.898 | -| time/ | | -| fps | 23 | -| iterations | 25617 | -| time_elapsed | 139348 | -| total_timesteps | 3278976 | -| train/ | | -| approx_kl | 0.20463236 | -| clip_fraction | 0.563 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0318 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 256160 | -| policy_gradient_loss | 0.0984 | -| std | 0.0062 | -| value_loss | 3.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25618 | -| time_elapsed | 139352 | -| total_timesteps | 3279104 | -| train/ | | -| approx_kl | 0.05442667 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.00288 | -| n_updates | 256170 | -| policy_gradient_loss | 0.0241 | -| std | 0.0062 | -| value_loss | 2.65e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25619 | -| time_elapsed | 139363 | -| total_timesteps | 3279232 | -| train/ | | -| approx_kl | 0.06411101 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.8 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 256180 | -| policy_gradient_loss | 0.0806 | -| std | 0.0062 | -| value_loss | 0.00251 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25620 | -| time_elapsed | 139367 | -| total_timesteps | 3279360 | -| train/ | | -| approx_kl | 0.012063304 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.347 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 256190 | -| policy_gradient_loss | 0.0504 | -| std | 0.0062 | -| value_loss | 0.000166 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25621 | -| time_elapsed | 139373 | -| total_timesteps | 3279488 | -| train/ | | -| approx_kl | 0.40810528 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 256200 | -| policy_gradient_loss | 0.184 | -| std | 0.0062 | -| value_loss | 5.87e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25622 | -| time_elapsed | 139379 | -| total_timesteps | 3279616 | -| train/ | | -| approx_kl | 0.23783444 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00696 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 256210 | -| policy_gradient_loss | 0.201 | -| std | 0.0062 | -| value_loss | 2.67e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25623 | -| time_elapsed | 139382 | -| total_timesteps | 3279744 | -| train/ | | -| approx_kl | 0.040662024 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.17 | -| learning_rate | 0.0003 | -| loss | -0.0096 | -| n_updates | 256220 | -| policy_gradient_loss | 0.0284 | -| std | 0.0062 | -| value_loss | 1.18e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.896 | -| time/ | | -| fps | 23 | -| iterations | 25624 | -| time_elapsed | 139385 | -| total_timesteps | 3279872 | -| train/ | | -| approx_kl | 0.22506821 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0539 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 256230 | -| policy_gradient_loss | 0.0299 | -| std | 0.0062 | -| value_loss | 1.02e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25625 | -| time_elapsed | 139390 | -| total_timesteps | 3280000 | -| train/ | | -| approx_kl | 0.018285202 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.00548 | -| n_updates | 256240 | -| policy_gradient_loss | 0.00189 | -| std | 0.00619 | -| value_loss | 6.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25626 | -| time_elapsed | 139394 | -| total_timesteps | 3280128 | -| train/ | | -| approx_kl | 0.029481107 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00666 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 256250 | -| policy_gradient_loss | 0.0565 | -| std | 0.00619 | -| value_loss | 3.89e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25627 | -| time_elapsed | 139406 | -| total_timesteps | 3280256 | -| train/ | | -| approx_kl | 0.3130849 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.618 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 256260 | -| policy_gradient_loss | 0.111 | -| std | 0.00619 | -| value_loss | 0.00266 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25628 | -| time_elapsed | 139412 | -| total_timesteps | 3280384 | -| train/ | | -| approx_kl | 0.045047425 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 256270 | -| policy_gradient_loss | 0.0218 | -| std | 0.00619 | -| value_loss | 1.88e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25629 | -| time_elapsed | 139417 | -| total_timesteps | 3280512 | -| train/ | | -| approx_kl | 0.17819364 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00478 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 256280 | -| policy_gradient_loss | 0.0146 | -| std | 0.00619 | -| value_loss | 6.51e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25630 | -| time_elapsed | 139422 | -| total_timesteps | 3280640 | -| train/ | | -| approx_kl | 0.0154670235 | -| clip_fraction | 0.115 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | -0.00597 | -| n_updates | 256290 | -| policy_gradient_loss | -0.00367 | -| std | 0.00619 | -| value_loss | 2.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25631 | -| time_elapsed | 139427 | -| total_timesteps | 3280768 | -| train/ | | -| approx_kl | 0.016661685 | -| clip_fraction | 0.107 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.103 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 256300 | -| policy_gradient_loss | 0.00491 | -| std | 0.00619 | -| value_loss | 1.96e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.897 | -| time/ | | -| fps | 23 | -| iterations | 25632 | -| time_elapsed | 139430 | -| total_timesteps | 3280896 | -| train/ | | -| approx_kl | 0.034883086 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0935 | -| learning_rate | 0.0003 | -| loss | 0.0205 | -| n_updates | 256310 | -| policy_gradient_loss | 0.0427 | -| std | 0.0062 | -| value_loss | 3.56e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25633 | -| time_elapsed | 139435 | -| total_timesteps | 3281024 | -| train/ | | -| approx_kl | 0.32351357 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00485 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 256320 | -| policy_gradient_loss | 0.136 | -| std | 0.0062 | -| value_loss | 1.31e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25634 | -| time_elapsed | 139444 | -| total_timesteps | 3281152 | -| train/ | | -| approx_kl | 0.38168532 | -| clip_fraction | 0.68 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.823 | -| learning_rate | 0.0003 | -| loss | 0.0388 | -| n_updates | 256330 | -| policy_gradient_loss | 0.0305 | -| std | 0.00621 | -| value_loss | 0.00067 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25635 | -| time_elapsed | 139447 | -| total_timesteps | 3281280 | -| train/ | | -| approx_kl | 0.5311636 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.285 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 256340 | -| policy_gradient_loss | 0.115 | -| std | 0.00624 | -| value_loss | 8.3e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25636 | -| time_elapsed | 139452 | -| total_timesteps | 3281408 | -| train/ | | -| approx_kl | 0.073851876 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 256350 | -| policy_gradient_loss | 0.0151 | -| std | 0.00625 | -| value_loss | 3.29e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25637 | -| time_elapsed | 139455 | -| total_timesteps | 3281536 | -| train/ | | -| approx_kl | 0.00391071 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0145 | -| learning_rate | 0.0003 | -| loss | 0.000865 | -| n_updates | 256360 | -| policy_gradient_loss | 0.035 | -| std | 0.00625 | -| value_loss | 1.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25638 | -| time_elapsed | 139460 | -| total_timesteps | 3281664 | -| train/ | | -| approx_kl | 0.65963316 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.236 | -| learning_rate | 0.0003 | -| loss | 0.255 | -| n_updates | 256370 | -| policy_gradient_loss | 0.0875 | -| std | 0.00625 | -| value_loss | 3.85e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25639 | -| time_elapsed | 139464 | -| total_timesteps | 3281792 | -| train/ | | -| approx_kl | 0.058521125 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 256380 | -| policy_gradient_loss | 0.0129 | -| std | 0.00625 | -| value_loss | 2.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25640 | -| time_elapsed | 139469 | -| total_timesteps | 3281920 | -| train/ | | -| approx_kl | 0.010131346 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.00111 | -| n_updates | 256390 | -| policy_gradient_loss | 0.0103 | -| std | 0.00625 | -| value_loss | 1.49e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25641 | -| time_elapsed | 139472 | -| total_timesteps | 3282048 | -| train/ | | -| approx_kl | 0.002627654 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0552 | -| learning_rate | 0.0003 | -| loss | -0.000925 | -| n_updates | 256400 | -| policy_gradient_loss | 0.0112 | -| std | 0.00625 | -| value_loss | 9.19e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25642 | -| time_elapsed | 139479 | -| total_timesteps | 3282176 | -| train/ | | -| approx_kl | 0.015240604 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -5.35 | -| learning_rate | 0.0003 | -| loss | -0.019 | -| n_updates | 256410 | -| policy_gradient_loss | -0.0148 | -| std | 0.00625 | -| value_loss | 0.00379 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25643 | -| time_elapsed | 139484 | -| total_timesteps | 3282304 | -| train/ | | -| approx_kl | 0.001755408 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.117 | -| learning_rate | 0.0003 | -| loss | 0.0043 | -| n_updates | 256420 | -| policy_gradient_loss | 0.00327 | -| std | 0.00625 | -| value_loss | 9.49e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25644 | -| time_elapsed | 139489 | -| total_timesteps | 3282432 | -| train/ | | -| approx_kl | 0.0062488304 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0106 | -| learning_rate | 0.0003 | -| loss | -0.00545 | -| n_updates | 256430 | -| policy_gradient_loss | 0.0104 | -| std | 0.00625 | -| value_loss | 9.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25645 | -| time_elapsed | 139494 | -| total_timesteps | 3282560 | -| train/ | | -| approx_kl | 0.069550864 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00826 | -| n_updates | 256440 | -| policy_gradient_loss | -0.000127 | -| std | 0.00625 | -| value_loss | 8.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25646 | -| time_elapsed | 139499 | -| total_timesteps | 3282688 | -| train/ | | -| approx_kl | 0.04008931 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.034 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 256450 | -| policy_gradient_loss | 0.000601 | -| std | 0.00626 | -| value_loss | 6.05e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25647 | -| time_elapsed | 139504 | -| total_timesteps | 3282816 | -| train/ | | -| approx_kl | 4.942948e-05 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0344 | -| learning_rate | 0.0003 | -| loss | -0.0015 | -| n_updates | 256460 | -| policy_gradient_loss | -0.00191 | -| std | 0.00626 | -| value_loss | 4.54e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.89 | -| time/ | | -| fps | 23 | -| iterations | 25648 | -| time_elapsed | 139508 | -| total_timesteps | 3282944 | -| train/ | | -| approx_kl | 0.057690542 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 256470 | -| policy_gradient_loss | 0.0111 | -| std | 0.00627 | -| value_loss | 2.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25649 | -| time_elapsed | 139511 | -| total_timesteps | 3283072 | -| train/ | | -| approx_kl | 0.007846375 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.000399 | -| n_updates | 256480 | -| policy_gradient_loss | 0.00966 | -| std | 0.00628 | -| value_loss | 1.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25650 | -| time_elapsed | 139518 | -| total_timesteps | 3283200 | -| train/ | | -| approx_kl | 0.011499498 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | -0.0263 | -| n_updates | 256490 | -| policy_gradient_loss | 0.00433 | -| std | 0.00628 | -| value_loss | 2.41e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25651 | -| time_elapsed | 139522 | -| total_timesteps | 3283328 | -| train/ | | -| approx_kl | 0.5288665 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.222 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 256500 | -| policy_gradient_loss | 0.0338 | -| std | 0.00628 | -| value_loss | 2.17e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25652 | -| time_elapsed | 139527 | -| total_timesteps | 3283456 | -| train/ | | -| approx_kl | 0.053820856 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 256510 | -| policy_gradient_loss | 0.00162 | -| std | 0.00628 | -| value_loss | 4.9e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25653 | -| time_elapsed | 139530 | -| total_timesteps | 3283584 | -| train/ | | -| approx_kl | 0.009477744 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | -0.00863 | -| n_updates | 256520 | -| policy_gradient_loss | 0.00936 | -| std | 0.00628 | -| value_loss | 4.17e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25654 | -| time_elapsed | 139534 | -| total_timesteps | 3283712 | -| train/ | | -| approx_kl | 0.0021334896 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | -0.00161 | -| n_updates | 256530 | -| policy_gradient_loss | 0.00754 | -| std | 0.00628 | -| value_loss | 2.51e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25655 | -| time_elapsed | 139539 | -| total_timesteps | 3283840 | -| train/ | | -| approx_kl | 0.042714894 | -| clip_fraction | 0.641 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0849 | -| learning_rate | 0.0003 | -| loss | 0.0219 | -| n_updates | 256540 | -| policy_gradient_loss | 0.092 | -| std | 0.00628 | -| value_loss | 1.3e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25656 | -| time_elapsed | 139544 | -| total_timesteps | 3283968 | -| train/ | | -| approx_kl | 0.013305291 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0942 | -| learning_rate | 0.0003 | -| loss | 0.00108 | -| n_updates | 256550 | -| policy_gradient_loss | 0.0397 | -| std | 0.00628 | -| value_loss | 9.01e-09 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25657 | -| time_elapsed | 139548 | -| total_timesteps | 3284096 | -| train/ | | -| approx_kl | 0.566808 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 256560 | -| policy_gradient_loss | 0.0784 | -| std | 0.00628 | -| value_loss | 8.35e-09 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25658 | -| time_elapsed | 139557 | -| total_timesteps | 3284224 | -| train/ | | -| approx_kl | 0.0026354366 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.846 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 256570 | -| policy_gradient_loss | -0.00565 | -| std | 0.00628 | -| value_loss | 0.00304 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25659 | -| time_elapsed | 139563 | -| total_timesteps | 3284352 | -| train/ | | -| approx_kl | 0.025530681 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.411 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 256580 | -| policy_gradient_loss | 0.00941 | -| std | 0.00628 | -| value_loss | 9.62e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25660 | -| time_elapsed | 139568 | -| total_timesteps | 3284480 | -| train/ | | -| approx_kl | 0.006054976 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0063 | -| learning_rate | 0.0003 | -| loss | 0.000924 | -| n_updates | 256590 | -| policy_gradient_loss | 0.0116 | -| std | 0.00628 | -| value_loss | 2.98e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25661 | -| time_elapsed | 139573 | -| total_timesteps | 3284608 | -| train/ | | -| approx_kl | 0.079694554 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.519 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 256600 | -| policy_gradient_loss | 0.00918 | -| std | 0.00628 | -| value_loss | 1.48e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25662 | -| time_elapsed | 139578 | -| total_timesteps | 3284736 | -| train/ | | -| approx_kl | 0.04220217 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0701 | -| learning_rate | 0.0003 | -| loss | 0.00677 | -| n_updates | 256610 | -| policy_gradient_loss | 0.00494 | -| std | 0.00627 | -| value_loss | 1.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25663 | -| time_elapsed | 139584 | -| total_timesteps | 3284864 | -| train/ | | -| approx_kl | 0.006118374 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.00048 | -| n_updates | 256620 | -| policy_gradient_loss | 0.00504 | -| std | 0.00627 | -| value_loss | 6.32e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.872 | -| time/ | | -| fps | 23 | -| iterations | 25664 | -| time_elapsed | 139589 | -| total_timesteps | 3284992 | -| train/ | | -| approx_kl | 0.09267733 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0755 | -| learning_rate | 0.0003 | -| loss | 0.0677 | -| n_updates | 256630 | -| policy_gradient_loss | 0.0285 | -| std | 0.00627 | -| value_loss | 4.15e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25665 | -| time_elapsed | 139594 | -| total_timesteps | 3285120 | -| train/ | | -| approx_kl | 0.012010362 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0922 | -| learning_rate | 0.0003 | -| loss | 0.00339 | -| n_updates | 256640 | -| policy_gradient_loss | 0.0069 | -| std | 0.00628 | -| value_loss | 4.45e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25666 | -| time_elapsed | 139605 | -| total_timesteps | 3285248 | -| train/ | | -| approx_kl | 0.039550375 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.887 | -| learning_rate | 0.0003 | -| loss | -0.0317 | -| n_updates | 256650 | -| policy_gradient_loss | -0.0231 | -| std | 0.00627 | -| value_loss | 0.00246 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25667 | -| time_elapsed | 139611 | -| total_timesteps | 3285376 | -| train/ | | -| approx_kl | 0.07603079 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -8.15 | -| learning_rate | 0.0003 | -| loss | 0.00657 | -| n_updates | 256660 | -| policy_gradient_loss | 0.000655 | -| std | 0.00628 | -| value_loss | 4.54e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25668 | -| time_elapsed | 139615 | -| total_timesteps | 3285504 | -| train/ | | -| approx_kl | 0.0456151 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -1.51 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 256670 | -| policy_gradient_loss | 0.00264 | -| std | 0.00628 | -| value_loss | 2.28e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25669 | -| time_elapsed | 139620 | -| total_timesteps | 3285632 | -| train/ | | -| approx_kl | 0.059487633 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.449 | -| learning_rate | 0.0003 | -| loss | 0.0435 | -| n_updates | 256680 | -| policy_gradient_loss | 0.0198 | -| std | 0.00628 | -| value_loss | 5.44e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25670 | -| time_elapsed | 139626 | -| total_timesteps | 3285760 | -| train/ | | -| approx_kl | 0.009251911 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 256690 | -| policy_gradient_loss | 0.000242 | -| std | 0.00628 | -| value_loss | 2.26e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.877 | -| time/ | | -| fps | 23 | -| iterations | 25671 | -| time_elapsed | 139631 | -| total_timesteps | 3285888 | -| train/ | | -| approx_kl | 0.08003894 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 256700 | -| policy_gradient_loss | 0.00706 | -| std | 0.00628 | -| value_loss | 9.17e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25672 | -| time_elapsed | 139636 | -| total_timesteps | 3286016 | -| train/ | | -| approx_kl | 0.044695746 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 256710 | -| policy_gradient_loss | 0.0296 | -| std | 0.00628 | -| value_loss | 7.29e-11 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25673 | -| time_elapsed | 139647 | -| total_timesteps | 3286144 | -| train/ | | -| approx_kl | 0.218297 | -| clip_fraction | 0.554 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 256720 | -| policy_gradient_loss | 0.0527 | -| std | 0.00628 | -| value_loss | 1.7e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25674 | -| time_elapsed | 139652 | -| total_timesteps | 3286272 | -| train/ | | -| approx_kl | 0.07656716 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0379 | -| learning_rate | 0.0003 | -| loss | 0.014 | -| n_updates | 256730 | -| policy_gradient_loss | 0.0281 | -| std | 0.00628 | -| value_loss | 6.96e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25675 | -| time_elapsed | 139658 | -| total_timesteps | 3286400 | -| train/ | | -| approx_kl | 0.14784543 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 256740 | -| policy_gradient_loss | 0.0606 | -| std | 0.00628 | -| value_loss | 9.84e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25676 | -| time_elapsed | 139663 | -| total_timesteps | 3286528 | -| train/ | | -| approx_kl | 0.03239522 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.00863 | -| n_updates | 256750 | -| policy_gradient_loss | 0.0331 | -| std | 0.00628 | -| value_loss | 2.02e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25677 | -| time_elapsed | 139668 | -| total_timesteps | 3286656 | -| train/ | | -| approx_kl | 0.98078144 | -| clip_fraction | 0.759 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0352 | -| learning_rate | 0.0003 | -| loss | 0.387 | -| n_updates | 256760 | -| policy_gradient_loss | 0.164 | -| std | 0.00628 | -| value_loss | 1.07e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25678 | -| time_elapsed | 139674 | -| total_timesteps | 3286784 | -| train/ | | -| approx_kl | 0.010185275 | -| clip_fraction | 0.443 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0408 | -| learning_rate | 0.0003 | -| loss | -0.00412 | -| n_updates | 256770 | -| policy_gradient_loss | 0.0329 | -| std | 0.00628 | -| value_loss | 8.35e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.862 | -| time/ | | -| fps | 23 | -| iterations | 25679 | -| time_elapsed | 139681 | -| total_timesteps | 3286912 | -| train/ | | -| approx_kl | 0.29871437 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.158 | -| n_updates | 256780 | -| policy_gradient_loss | 0.139 | -| std | 0.00628 | -| value_loss | 5.01e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25680 | -| time_elapsed | 139686 | -| total_timesteps | 3287040 | -| train/ | | -| approx_kl | 0.058331896 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.121 | -| learning_rate | 0.0003 | -| loss | 0.0241 | -| n_updates | 256790 | -| policy_gradient_loss | 0.0306 | -| std | 0.00628 | -| value_loss | 2.48e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25681 | -| time_elapsed | 139697 | -| total_timesteps | 3287168 | -| train/ | | -| approx_kl | 0.0058038034 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | -0.0158 | -| n_updates | 256800 | -| policy_gradient_loss | 0.0155 | -| std | 0.00628 | -| value_loss | 0.00189 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25682 | -| time_elapsed | 139702 | -| total_timesteps | 3287296 | -| train/ | | -| approx_kl | 0.03902228 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.0583 | -| n_updates | 256810 | -| policy_gradient_loss | -0.00241 | -| std | 0.00628 | -| value_loss | 1.83e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25683 | -| time_elapsed | 139708 | -| total_timesteps | 3287424 | -| train/ | | -| approx_kl | 0.6397428 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00328 | -| learning_rate | 0.0003 | -| loss | 0.234 | -| n_updates | 256820 | -| policy_gradient_loss | 0.0727 | -| std | 0.00628 | -| value_loss | 4.86e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25684 | -| time_elapsed | 139714 | -| total_timesteps | 3287552 | -| train/ | | -| approx_kl | 0.0077711833 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.588 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 256830 | -| policy_gradient_loss | 0.00596 | -| std | 0.00628 | -| value_loss | 1.9e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25685 | -| time_elapsed | 139719 | -| total_timesteps | 3287680 | -| train/ | | -| approx_kl | 0.07719366 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0887 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 256840 | -| policy_gradient_loss | 0.00644 | -| std | 0.00628 | -| value_loss | 1.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25686 | -| time_elapsed | 139725 | -| total_timesteps | 3287808 | -| train/ | | -| approx_kl | 0.013818699 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.00463 | -| n_updates | 256850 | -| policy_gradient_loss | 0.0102 | -| std | 0.00627 | -| value_loss | 6.8e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 25687 | -| time_elapsed | 139729 | -| total_timesteps | 3287936 | -| train/ | | -| approx_kl | 0.00082188565 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0943 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 256860 | -| policy_gradient_loss | 0.0079 | -| std | 0.00627 | -| value_loss | 4.42e-08 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25688 | -| time_elapsed | 139734 | -| total_timesteps | 3288064 | -| train/ | | -| approx_kl | 0.006261038 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.000675 | -| n_updates | 256870 | -| policy_gradient_loss | 0.00735 | -| std | 0.00627 | -| value_loss | 1.83e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25689 | -| time_elapsed | 139741 | -| total_timesteps | 3288192 | -| train/ | | -| approx_kl | 0.1275186 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -2.11 | -| learning_rate | 0.0003 | -| loss | -0.012 | -| n_updates | 256880 | -| policy_gradient_loss | -0.0176 | -| std | 0.00627 | -| value_loss | 0.00283 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25690 | -| time_elapsed | 139748 | -| total_timesteps | 3288320 | -| train/ | | -| approx_kl | 0.02310222 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.373 | -| learning_rate | 0.0003 | -| loss | 0.00938 | -| n_updates | 256890 | -| policy_gradient_loss | 0.0803 | -| std | 0.00627 | -| value_loss | 7.36e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25691 | -| time_elapsed | 139752 | -| total_timesteps | 3288448 | -| train/ | | -| approx_kl | 0.0016711121 | -| clip_fraction | 0.532 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0435 | -| learning_rate | 0.0003 | -| loss | 0.00376 | -| n_updates | 256900 | -| policy_gradient_loss | 0.163 | -| std | 0.00627 | -| value_loss | 1.99e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25692 | -| time_elapsed | 139756 | -| total_timesteps | 3288576 | -| train/ | | -| approx_kl | 0.02293144 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0218 | -| learning_rate | 0.0003 | -| loss | 0.028 | -| n_updates | 256910 | -| policy_gradient_loss | 0.0576 | -| std | 0.00627 | -| value_loss | 1.76e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25693 | -| time_elapsed | 139761 | -| total_timesteps | 3288704 | -| train/ | | -| approx_kl | 0.119703285 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 256920 | -| policy_gradient_loss | 0.0205 | -| std | 0.00627 | -| value_loss | 9.72e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25694 | -| time_elapsed | 139766 | -| total_timesteps | 3288832 | -| train/ | | -| approx_kl | 0.006847568 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0554 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 256930 | -| policy_gradient_loss | 0.0354 | -| std | 0.00627 | -| value_loss | 4.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.869 | -| time/ | | -| fps | 23 | -| iterations | 25695 | -| time_elapsed | 139770 | -| total_timesteps | 3288960 | -| train/ | | -| approx_kl | 0.25194266 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.599 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 256940 | -| policy_gradient_loss | 0.0365 | -| std | 0.00627 | -| value_loss | 1.51e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25696 | -| time_elapsed | 139773 | -| total_timesteps | 3289088 | -| train/ | | -| approx_kl | 0.019745065 | -| clip_fraction | 0.14 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0752 | -| learning_rate | 0.0003 | -| loss | 0.000465 | -| n_updates | 256950 | -| policy_gradient_loss | -0.00162 | -| std | 0.00627 | -| value_loss | 8.85e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25697 | -| time_elapsed | 139781 | -| total_timesteps | 3289216 | -| train/ | | -| approx_kl | 0.28578472 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.998 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 256960 | -| policy_gradient_loss | 0.0276 | -| std | 0.00627 | -| value_loss | 9.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25698 | -| time_elapsed | 139785 | -| total_timesteps | 3289344 | -| train/ | | -| approx_kl | 0.116633095 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -24.2 | -| learning_rate | 0.0003 | -| loss | 0.0257 | -| n_updates | 256970 | -| policy_gradient_loss | 0.00504 | -| std | 0.00627 | -| value_loss | 5.42e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25699 | -| time_elapsed | 139789 | -| total_timesteps | 3289472 | -| train/ | | -| approx_kl | 0.016081087 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0912 | -| learning_rate | 0.0003 | -| loss | -0.0146 | -| n_updates | 256980 | -| policy_gradient_loss | 0.00234 | -| std | 0.00627 | -| value_loss | 1.62e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25700 | -| time_elapsed | 139793 | -| total_timesteps | 3289600 | -| train/ | | -| approx_kl | 0.0035331016 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | -0.00332 | -| n_updates | 256990 | -| policy_gradient_loss | 0.0111 | -| std | 0.00627 | -| value_loss | 1.02e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25701 | -| time_elapsed | 139797 | -| total_timesteps | 3289728 | -| train/ | | -| approx_kl | 0.0016965033 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -7.47e-05 | -| n_updates | 257000 | -| policy_gradient_loss | 0.0109 | -| std | 0.00627 | -| value_loss | 9.04e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25702 | -| time_elapsed | 139801 | -| total_timesteps | 3289856 | -| train/ | | -| approx_kl | 0.04250819 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 257010 | -| policy_gradient_loss | 0.0278 | -| std | 0.00626 | -| value_loss | 3.45e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25703 | -| time_elapsed | 139804 | -| total_timesteps | 3289984 | -| train/ | | -| approx_kl | 0.0009889388 | -| clip_fraction | 0.587 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0766 | -| learning_rate | 0.0003 | -| loss | -0.000954 | -| n_updates | 257020 | -| policy_gradient_loss | 0.113 | -| std | 0.00626 | -| value_loss | 5.47e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25704 | -| time_elapsed | 139809 | -| total_timesteps | 3290112 | -| train/ | | -| approx_kl | 0.026601585 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0761 | -| learning_rate | 0.0003 | -| loss | 0.0317 | -| n_updates | 257030 | -| policy_gradient_loss | 0.0435 | -| std | 0.00626 | -| value_loss | 6.2e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25705 | -| time_elapsed | 139819 | -| total_timesteps | 3290240 | -| train/ | | -| approx_kl | 0.028910508 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.325 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 257040 | -| policy_gradient_loss | -0.00795 | -| std | 0.00626 | -| value_loss | 0.0013 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25706 | -| time_elapsed | 139823 | -| total_timesteps | 3290368 | -| train/ | | -| approx_kl | 0.17297003 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.977 | -| learning_rate | 0.0003 | -| loss | 0.0931 | -| n_updates | 257050 | -| policy_gradient_loss | 0.0212 | -| std | 0.00626 | -| value_loss | 2.07e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25707 | -| time_elapsed | 139828 | -| total_timesteps | 3290496 | -| train/ | | -| approx_kl | 0.0003310116 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00389 | -| learning_rate | 0.0003 | -| loss | -5.85e-05 | -| n_updates | 257060 | -| policy_gradient_loss | 0.0309 | -| std | 0.00626 | -| value_loss | 2.2e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25708 | -| time_elapsed | 139833 | -| total_timesteps | 3290624 | -| train/ | | -| approx_kl | 0.045132257 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0462 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 257070 | -| policy_gradient_loss | 0.015 | -| std | 0.00628 | -| value_loss | 0.000544 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25709 | -| time_elapsed | 139838 | -| total_timesteps | 3290752 | -| train/ | | -| approx_kl | 0.025011044 | -| clip_fraction | 0.582 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 257080 | -| policy_gradient_loss | 0.0686 | -| std | 0.00628 | -| value_loss | 1.4e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.856 | -| time/ | | -| fps | 23 | -| iterations | 25710 | -| time_elapsed | 139843 | -| total_timesteps | 3290880 | -| train/ | | -| approx_kl | 0.07943903 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.0704 | -| n_updates | 257090 | -| policy_gradient_loss | 0.0368 | -| std | 0.00628 | -| value_loss | 3.72e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25711 | -| time_elapsed | 139848 | -| total_timesteps | 3291008 | -| train/ | | -| approx_kl | 0.68062353 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.216 | -| n_updates | 257100 | -| policy_gradient_loss | 0.141 | -| std | 0.00628 | -| value_loss | 2.8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25712 | -| time_elapsed | 139860 | -| total_timesteps | 3291136 | -| train/ | | -| approx_kl | 0.53699124 | -| clip_fraction | 0.717 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | 0.0691 | -| n_updates | 257110 | -| policy_gradient_loss | 0.0625 | -| std | 0.00628 | -| value_loss | 0.00217 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25713 | -| time_elapsed | 139865 | -| total_timesteps | 3291264 | -| train/ | | -| approx_kl | 0.022038277 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.223 | -| learning_rate | 0.0003 | -| loss | 0.00557 | -| n_updates | 257120 | -| policy_gradient_loss | 0.0642 | -| std | 0.00629 | -| value_loss | 5.67e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25714 | -| time_elapsed | 139870 | -| total_timesteps | 3291392 | -| train/ | | -| approx_kl | 0.008847108 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | -0.00226 | -| n_updates | 257130 | -| policy_gradient_loss | 0.0701 | -| std | 0.00629 | -| value_loss | 4.75e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25715 | -| time_elapsed | 139875 | -| total_timesteps | 3291520 | -| train/ | | -| approx_kl | 0.01328116 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0815 | -| learning_rate | 0.0003 | -| loss | -0.0177 | -| n_updates | 257140 | -| policy_gradient_loss | 0.0155 | -| std | 0.00629 | -| value_loss | 3.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25716 | -| time_elapsed | 139881 | -| total_timesteps | 3291648 | -| train/ | | -| approx_kl | 0.050824653 | -| clip_fraction | 0.493 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 257150 | -| policy_gradient_loss | 0.0562 | -| std | 0.00629 | -| value_loss | 1.89e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25717 | -| time_elapsed | 139886 | -| total_timesteps | 3291776 | -| train/ | | -| approx_kl | 0.0051423027 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | -0.00871 | -| n_updates | 257160 | -| policy_gradient_loss | 0.0877 | -| std | 0.00629 | -| value_loss | 1.52e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25718 | -| time_elapsed | 139891 | -| total_timesteps | 3291904 | -| train/ | | -| approx_kl | 0.15148462 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 257170 | -| policy_gradient_loss | 0.128 | -| std | 0.00629 | -| value_loss | 1.17e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25719 | -| time_elapsed | 139896 | -| total_timesteps | 3292032 | -| train/ | | -| approx_kl | 0.09570066 | -| clip_fraction | 0.451 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0939 | -| learning_rate | 0.0003 | -| loss | 0.049 | -| n_updates | 257180 | -| policy_gradient_loss | 0.0403 | -| std | 0.00629 | -| value_loss | 4.62e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25720 | -| time_elapsed | 139905 | -| total_timesteps | 3292160 | -| train/ | | -| approx_kl | 0.47084516 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 257190 | -| policy_gradient_loss | 0.0735 | -| std | 0.00629 | -| value_loss | 9.21e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25721 | -| time_elapsed | 139909 | -| total_timesteps | 3292288 | -| train/ | | -| approx_kl | 0.06363462 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.128 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 257200 | -| policy_gradient_loss | 0.0473 | -| std | 0.00629 | -| value_loss | 7.79e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25722 | -| time_elapsed | 139912 | -| total_timesteps | 3292416 | -| train/ | | -| approx_kl | 0.0029817503 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.161 | -| learning_rate | 0.0003 | -| loss | -0.00322 | -| n_updates | 257210 | -| policy_gradient_loss | 0.0922 | -| std | 0.00629 | -| value_loss | 6.9e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25723 | -| time_elapsed | 139917 | -| total_timesteps | 3292544 | -| train/ | | -| approx_kl | 0.03316603 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00635 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 257220 | -| policy_gradient_loss | 0.0612 | -| std | 0.00629 | -| value_loss | 2.6e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25724 | -| time_elapsed | 139921 | -| total_timesteps | 3292672 | -| train/ | | -| approx_kl | 0.36763117 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0404 | -| learning_rate | 0.0003 | -| loss | 0.184 | -| n_updates | 257230 | -| policy_gradient_loss | 0.174 | -| std | 0.00629 | -| value_loss | 1.07e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25725 | -| time_elapsed | 139926 | -| total_timesteps | 3292800 | -| train/ | | -| approx_kl | 0.21104456 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.08 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 257240 | -| policy_gradient_loss | 0.12 | -| std | 0.00629 | -| value_loss | 7.3e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25726 | -| time_elapsed | 139930 | -| total_timesteps | 3292928 | -| train/ | | -| approx_kl | 0.034986824 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 257250 | -| policy_gradient_loss | 0.0269 | -| std | 0.00629 | -| value_loss | 4.88e-09 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25727 | -| time_elapsed | 139935 | -| total_timesteps | 3293056 | -| train/ | | -| approx_kl | 0.7359783 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 257260 | -| policy_gradient_loss | 0.059 | -| std | 0.00629 | -| value_loss | 4.33e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25728 | -| time_elapsed | 139944 | -| total_timesteps | 3293184 | -| train/ | | -| approx_kl | 0.067044325 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.722 | -| learning_rate | 0.0003 | -| loss | 0.00405 | -| n_updates | 257270 | -| policy_gradient_loss | -0.00123 | -| std | 0.00629 | -| value_loss | 0.00786 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25729 | -| time_elapsed | 139948 | -| total_timesteps | 3293312 | -| train/ | | -| approx_kl | 0.42384785 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.225 | -| learning_rate | 0.0003 | -| loss | 0.225 | -| n_updates | 257280 | -| policy_gradient_loss | 0.0793 | -| std | 0.00629 | -| value_loss | 1.53e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25730 | -| time_elapsed | 139950 | -| total_timesteps | 3293440 | -| train/ | | -| approx_kl | 0.10670532 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0112 | -| learning_rate | 0.0003 | -| loss | 0.0598 | -| n_updates | 257290 | -| policy_gradient_loss | 0.0241 | -| std | 0.00629 | -| value_loss | 2.61e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25731 | -| time_elapsed | 139953 | -| total_timesteps | 3293568 | -| train/ | | -| approx_kl | 0.015372764 | -| clip_fraction | 0.208 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | -0.00379 | -| n_updates | 257300 | -| policy_gradient_loss | 0.00941 | -| std | 0.00629 | -| value_loss | 1.21e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25732 | -| time_elapsed | 139957 | -| total_timesteps | 3293696 | -| train/ | | -| approx_kl | 0.06893332 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | -0.0112 | -| n_updates | 257310 | -| policy_gradient_loss | -0.00947 | -| std | 0.00629 | -| value_loss | 1.06e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25733 | -| time_elapsed | 139961 | -| total_timesteps | 3293824 | -| train/ | | -| approx_kl | 0.0151550565 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.00554 | -| n_updates | 257320 | -| policy_gradient_loss | 0.0105 | -| std | 0.00629 | -| value_loss | 8.56e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25734 | -| time_elapsed | 139966 | -| total_timesteps | 3293952 | -| train/ | | -| approx_kl | 0.002787454 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 257330 | -| policy_gradient_loss | 0.00855 | -| std | 0.00629 | -| value_loss | 5.5e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25735 | -| time_elapsed | 139970 | -| total_timesteps | 3294080 | -| train/ | | -| approx_kl | 0.03115299 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.0255 | -| n_updates | 257340 | -| policy_gradient_loss | 0.0123 | -| std | 0.00631 | -| value_loss | 3.09e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25736 | -| time_elapsed | 139978 | -| total_timesteps | 3294208 | -| train/ | | -| approx_kl | 0.13428317 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.974 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 257350 | -| policy_gradient_loss | 0.0106 | -| std | 0.00632 | -| value_loss | 0.00353 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25737 | -| time_elapsed | 139982 | -| total_timesteps | 3294336 | -| train/ | | -| approx_kl | 0.17225799 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 257360 | -| policy_gradient_loss | 0.0357 | -| std | 0.00632 | -| value_loss | 7.37e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25738 | -| time_elapsed | 139987 | -| total_timesteps | 3294464 | -| train/ | | -| approx_kl | 0.040609445 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -3.41 | -| learning_rate | 0.0003 | -| loss | -0.00537 | -| n_updates | 257370 | -| policy_gradient_loss | 0.0138 | -| std | 0.00632 | -| value_loss | 1.97e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25739 | -| time_elapsed | 139991 | -| total_timesteps | 3294592 | -| train/ | | -| approx_kl | 0.15375903 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -82.5 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 257380 | -| policy_gradient_loss | 0.0168 | -| std | 0.00632 | -| value_loss | 7.4e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25740 | -| time_elapsed | 139996 | -| total_timesteps | 3294720 | -| train/ | | -| approx_kl | 0.18930858 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0565 | -| learning_rate | 0.0003 | -| loss | 0.0847 | -| n_updates | 257390 | -| policy_gradient_loss | 0.0321 | -| std | 0.00632 | -| value_loss | 4.65e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25741 | -| time_elapsed | 140001 | -| total_timesteps | 3294848 | -| train/ | | -| approx_kl | 0.03202185 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00853 | -| learning_rate | 0.0003 | -| loss | 0.0149 | -| n_updates | 257400 | -| policy_gradient_loss | 0.0382 | -| std | 0.00632 | -| value_loss | 2.16e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.851 | -| time/ | | -| fps | 23 | -| iterations | 25742 | -| time_elapsed | 140007 | -| total_timesteps | 3294976 | -| train/ | | -| approx_kl | 0.3163129 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 257410 | -| policy_gradient_loss | 0.153 | -| std | 0.00632 | -| value_loss | 2.03e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25743 | -| time_elapsed | 140013 | -| total_timesteps | 3295104 | -| train/ | | -| approx_kl | 0.29105565 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0233 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 257420 | -| policy_gradient_loss | 0.17 | -| std | 0.00632 | -| value_loss | 1.68e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25744 | -| time_elapsed | 140024 | -| total_timesteps | 3295232 | -| train/ | | -| approx_kl | 0.77565163 | -| clip_fraction | 0.686 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 257430 | -| policy_gradient_loss | 0.124 | -| std | 0.00632 | -| value_loss | 0.00224 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25745 | -| time_elapsed | 140028 | -| total_timesteps | 3295360 | -| train/ | | -| approx_kl | 0.3804334 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.245 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 257440 | -| policy_gradient_loss | 0.197 | -| std | 0.00632 | -| value_loss | 2.76e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25746 | -| time_elapsed | 140032 | -| total_timesteps | 3295488 | -| train/ | | -| approx_kl | 0.28929752 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0145 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 257450 | -| policy_gradient_loss | 0.154 | -| std | 0.00632 | -| value_loss | 7.19e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25747 | -| time_elapsed | 140036 | -| total_timesteps | 3295616 | -| train/ | | -| approx_kl | 0.041649777 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00577 | -| learning_rate | 0.0003 | -| loss | 0.0145 | -| n_updates | 257460 | -| policy_gradient_loss | 0.0293 | -| std | 0.00632 | -| value_loss | 4.3e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25748 | -| time_elapsed | 140041 | -| total_timesteps | 3295744 | -| train/ | | -| approx_kl | 0.21594015 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 257470 | -| policy_gradient_loss | 0.0188 | -| std | 0.00632 | -| value_loss | 3.31e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25749 | -| time_elapsed | 140046 | -| total_timesteps | 3295872 | -| train/ | | -| approx_kl | 0.021113573 | -| clip_fraction | 0.153 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0248 | -| learning_rate | 0.0003 | -| loss | 0.00197 | -| n_updates | 257480 | -| policy_gradient_loss | 0.000389 | -| std | 0.00632 | -| value_loss | 2.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25750 | -| time_elapsed | 140051 | -| total_timesteps | 3296000 | -| train/ | | -| approx_kl | 0.029184772 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | 0.0073 | -| n_updates | 257490 | -| policy_gradient_loss | 0.0356 | -| std | 0.00632 | -| value_loss | 1.47e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25751 | -| time_elapsed | 140056 | -| total_timesteps | 3296128 | -| train/ | | -| approx_kl | 0.12559882 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00419 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 257500 | -| policy_gradient_loss | 0.0147 | -| std | 0.00632 | -| value_loss | 9.34e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25752 | -| time_elapsed | 140069 | -| total_timesteps | 3296256 | -| train/ | | -| approx_kl | 0.09265258 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | 0.0193 | -| n_updates | 257510 | -| policy_gradient_loss | 0.00822 | -| std | 0.00632 | -| value_loss | 0.000182 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25753 | -| time_elapsed | 140075 | -| total_timesteps | 3296384 | -| train/ | | -| approx_kl | 0.032564532 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00143 | -| learning_rate | 0.0003 | -| loss | 0.00941 | -| n_updates | 257520 | -| policy_gradient_loss | 0.0376 | -| std | 0.00632 | -| value_loss | 1.81e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25754 | -| time_elapsed | 140080 | -| total_timesteps | 3296512 | -| train/ | | -| approx_kl | 0.37523904 | -| clip_fraction | 0.756 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0157 | -| learning_rate | 0.0003 | -| loss | 0.254 | -| n_updates | 257530 | -| policy_gradient_loss | 0.148 | -| std | 0.00632 | -| value_loss | 6.3e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25755 | -| time_elapsed | 140084 | -| total_timesteps | 3296640 | -| train/ | | -| approx_kl | 0.2267625 | -| clip_fraction | 0.746 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00726 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 257540 | -| policy_gradient_loss | 0.133 | -| std | 0.00632 | -| value_loss | 3.72e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25756 | -| time_elapsed | 140090 | -| total_timesteps | 3296768 | -| train/ | | -| approx_kl | 0.046160527 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0213 | -| learning_rate | 0.0003 | -| loss | 0.000192 | -| n_updates | 257550 | -| policy_gradient_loss | 0.0302 | -| std | 0.00632 | -| value_loss | 3.19e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25757 | -| time_elapsed | 140095 | -| total_timesteps | 3296896 | -| train/ | | -| approx_kl | 0.7431524 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0192 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 257560 | -| policy_gradient_loss | 0.0495 | -| std | 0.00632 | -| value_loss | 2.3e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25758 | -| time_elapsed | 140100 | -| total_timesteps | 3297024 | -| train/ | | -| approx_kl | 0.038361102 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | -0.00192 | -| n_updates | 257570 | -| policy_gradient_loss | 0.000871 | -| std | 0.00632 | -| value_loss | 1.64e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25759 | -| time_elapsed | 140110 | -| total_timesteps | 3297152 | -| train/ | | -| approx_kl | 0.041666657 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.72 | -| learning_rate | 0.0003 | -| loss | -0.0296 | -| n_updates | 257580 | -| policy_gradient_loss | -0.0214 | -| std | 0.00632 | -| value_loss | 0.000774 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25760 | -| time_elapsed | 140116 | -| total_timesteps | 3297280 | -| train/ | | -| approx_kl | 0.0036006016 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.25 | -| learning_rate | 0.0003 | -| loss | -0.000329 | -| n_updates | 257590 | -| policy_gradient_loss | 0.0331 | -| std | 0.00632 | -| value_loss | 1e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25761 | -| time_elapsed | 140122 | -| total_timesteps | 3297408 | -| train/ | | -| approx_kl | 0.0023645195 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -7.87 | -| learning_rate | 0.0003 | -| loss | -0.000509 | -| n_updates | 257600 | -| policy_gradient_loss | 0.00889 | -| std | 0.00632 | -| value_loss | 6.94e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25762 | -| time_elapsed | 140128 | -| total_timesteps | 3297536 | -| train/ | | -| approx_kl | 0.09333332 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00862 | -| learning_rate | 0.0003 | -| loss | 0.0862 | -| n_updates | 257610 | -| policy_gradient_loss | 0.0967 | -| std | 0.00632 | -| value_loss | 3.99e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25763 | -| time_elapsed | 140132 | -| total_timesteps | 3297664 | -| train/ | | -| approx_kl | 0.103116415 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0381 | -| n_updates | 257620 | -| policy_gradient_loss | 0.0118 | -| std | 0.00632 | -| value_loss | 4.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25764 | -| time_elapsed | 140136 | -| total_timesteps | 3297792 | -| train/ | | -| approx_kl | 0.010577738 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0116 | -| learning_rate | 0.0003 | -| loss | 0.0208 | -| n_updates | 257630 | -| policy_gradient_loss | 0.00268 | -| std | 0.00632 | -| value_loss | 1.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.845 | -| time/ | | -| fps | 23 | -| iterations | 25765 | -| time_elapsed | 140141 | -| total_timesteps | 3297920 | -| train/ | | -| approx_kl | 0.04561625 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0276 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 257640 | -| policy_gradient_loss | 0.0424 | -| std | 0.00632 | -| value_loss | 4.88e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25766 | -| time_elapsed | 140144 | -| total_timesteps | 3298048 | -| train/ | | -| approx_kl | 1.0033026 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.204 | -| n_updates | 257650 | -| policy_gradient_loss | 0.126 | -| std | 0.00632 | -| value_loss | 3.42e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25767 | -| time_elapsed | 140152 | -| total_timesteps | 3298176 | -| train/ | | -| approx_kl | 0.0017407741 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.771 | -| learning_rate | 0.0003 | -| loss | 0.00585 | -| n_updates | 257660 | -| policy_gradient_loss | -0.000762 | -| std | 0.00632 | -| value_loss | 0.00534 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25768 | -| time_elapsed | 140158 | -| total_timesteps | 3298304 | -| train/ | | -| approx_kl | 0.012513738 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.565 | -| learning_rate | 0.0003 | -| loss | 0.0189 | -| n_updates | 257670 | -| policy_gradient_loss | 0.0204 | -| std | 0.00632 | -| value_loss | 2.84e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25769 | -| time_elapsed | 140162 | -| total_timesteps | 3298432 | -| train/ | | -| approx_kl | 0.52192265 | -| clip_fraction | 0.692 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.0135 | -| learning_rate | 0.0003 | -| loss | 0.27 | -| n_updates | 257680 | -| policy_gradient_loss | 0.182 | -| std | 0.00632 | -| value_loss | 8.23e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25770 | -| time_elapsed | 140168 | -| total_timesteps | 3298560 | -| train/ | | -| approx_kl | 0.08157842 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.0393 | -| n_updates | 257690 | -| policy_gradient_loss | 0.0261 | -| std | 0.00632 | -| value_loss | 4.71e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25771 | -| time_elapsed | 140173 | -| total_timesteps | 3298688 | -| train/ | | -| approx_kl | 0.0038605635 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 257700 | -| policy_gradient_loss | 0.0282 | -| std | 0.00632 | -| value_loss | 3.75e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25772 | -| time_elapsed | 140178 | -| total_timesteps | 3298816 | -| train/ | | -| approx_kl | 0.69382423 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.231 | -| n_updates | 257710 | -| policy_gradient_loss | 0.0654 | -| std | 0.00632 | -| value_loss | 3.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.838 | -| time/ | | -| fps | 23 | -| iterations | 25773 | -| time_elapsed | 140182 | -| total_timesteps | 3298944 | -| train/ | | -| approx_kl | 0.010702003 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.0129 | -| n_updates | 257720 | -| policy_gradient_loss | 0.00798 | -| std | 0.00632 | -| value_loss | 2.21e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25774 | -| time_elapsed | 140186 | -| total_timesteps | 3299072 | -| train/ | | -| approx_kl | 0.06706757 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.00124 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 257730 | -| policy_gradient_loss | 0.00736 | -| std | 0.00632 | -| value_loss | 7.52e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25775 | -| time_elapsed | 140194 | -| total_timesteps | 3299200 | -| train/ | | -| approx_kl | 0.01982354 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.529 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 257740 | -| policy_gradient_loss | -0.00735 | -| std | 0.00632 | -| value_loss | 0.00113 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25776 | -| time_elapsed | 140199 | -| total_timesteps | 3299328 | -| train/ | | -| approx_kl | 0.06650029 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -8.59 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 257750 | -| policy_gradient_loss | 0.00621 | -| std | 0.00633 | -| value_loss | 6.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25777 | -| time_elapsed | 140205 | -| total_timesteps | 3299456 | -| train/ | | -| approx_kl | 0.008447964 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.688 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 257760 | -| policy_gradient_loss | 0.0061 | -| std | 0.00633 | -| value_loss | 5.75e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25778 | -| time_elapsed | 140209 | -| total_timesteps | 3299584 | -| train/ | | -| approx_kl | 0.002073063 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | 0.00991 | -| learning_rate | 0.0003 | -| loss | -0.00146 | -| n_updates | 257770 | -| policy_gradient_loss | 0.00903 | -| std | 0.00633 | -| value_loss | 2.18e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25779 | -| time_elapsed | 140213 | -| total_timesteps | 3299712 | -| train/ | | -| approx_kl | 0.11393159 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0584 | -| n_updates | 257780 | -| policy_gradient_loss | 0.0148 | -| std | 0.00633 | -| value_loss | 2.12e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25780 | -| time_elapsed | 140218 | -| total_timesteps | 3299840 | -| train/ | | -| approx_kl | 0.2762654 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.64 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 257790 | -| policy_gradient_loss | 0.0428 | -| std | 0.00631 | -| value_loss | 3.82e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25781 | -| time_elapsed | 140222 | -| total_timesteps | 3299968 | -| train/ | | -| approx_kl | 0.53782123 | -| clip_fraction | 0.478 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.59 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 257800 | -| policy_gradient_loss | 0.0521 | -| std | 0.00631 | -| value_loss | 1.64e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25782 | -| time_elapsed | 140227 | -| total_timesteps | 3300096 | -| train/ | | -| approx_kl | 0.00040325616 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.644 | -| learning_rate | 0.0003 | -| loss | -0.00673 | -| n_updates | 257810 | -| policy_gradient_loss | -0.00759 | -| std | 0.0063 | -| value_loss | 5.07e-10 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25783 | -| time_elapsed | 140240 | -| total_timesteps | 3300224 | -| train/ | | -| approx_kl | 0.09880344 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.981 | -| learning_rate | 0.0003 | -| loss | 0.00778 | -| n_updates | 257820 | -| policy_gradient_loss | -0.00169 | -| std | 0.0063 | -| value_loss | 0.000104 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25784 | -| time_elapsed | 140245 | -| total_timesteps | 3300352 | -| train/ | | -| approx_kl | 0.09428459 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 257830 | -| policy_gradient_loss | 0.00859 | -| std | 0.0063 | -| value_loss | 2.43e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25785 | -| time_elapsed | 140250 | -| total_timesteps | 3300480 | -| train/ | | -| approx_kl | 0.040874936 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0171 | -| learning_rate | 0.0003 | -| loss | 0.0312 | -| n_updates | 257840 | -| policy_gradient_loss | 0.0171 | -| std | 0.0063 | -| value_loss | 2.17e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25786 | -| time_elapsed | 140255 | -| total_timesteps | 3300608 | -| train/ | | -| approx_kl | 0.0064077084 | -| clip_fraction | 0.198 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | -0.00951 | -| n_updates | 257850 | -| policy_gradient_loss | 0.00498 | -| std | 0.00631 | -| value_loss | 9.85e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25787 | -| time_elapsed | 140259 | -| total_timesteps | 3300736 | -| train/ | | -| approx_kl | 0.074159734 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00986 | -| learning_rate | 0.0003 | -| loss | 0.0268 | -| n_updates | 257860 | -| policy_gradient_loss | 0.00933 | -| std | 0.00631 | -| value_loss | 1.51e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25788 | -| time_elapsed | 140263 | -| total_timesteps | 3300864 | -| train/ | | -| approx_kl | 0.051917933 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 257870 | -| policy_gradient_loss | 0.0161 | -| std | 0.00631 | -| value_loss | 7.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25789 | -| time_elapsed | 140267 | -| total_timesteps | 3300992 | -| train/ | | -| approx_kl | 0.00911646 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 257880 | -| policy_gradient_loss | 0.0092 | -| std | 0.0063 | -| value_loss | 4.96e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25790 | -| time_elapsed | 140273 | -| total_timesteps | 3301120 | -| train/ | | -| approx_kl | 0.07339679 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 257890 | -| policy_gradient_loss | 0.0137 | -| std | 0.0063 | -| value_loss | 3.65e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25791 | -| time_elapsed | 140286 | -| total_timesteps | 3301248 | -| train/ | | -| approx_kl | 0.012888735 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.769 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 257900 | -| policy_gradient_loss | -0.00376 | -| std | 0.0063 | -| value_loss | 0.00574 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25792 | -| time_elapsed | 140291 | -| total_timesteps | 3301376 | -| train/ | | -| approx_kl | 0.056352153 | -| clip_fraction | 0.655 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.203 | -| learning_rate | 0.0003 | -| loss | 0.0479 | -| n_updates | 257910 | -| policy_gradient_loss | 0.114 | -| std | 0.0063 | -| value_loss | 0.000102 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25793 | -| time_elapsed | 140295 | -| total_timesteps | 3301504 | -| train/ | | -| approx_kl | 0.012596307 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00106 | -| learning_rate | 0.0003 | -| loss | 0.00345 | -| n_updates | 257920 | -| policy_gradient_loss | 0.0234 | -| std | 0.0063 | -| value_loss | 1.47e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25794 | -| time_elapsed | 140301 | -| total_timesteps | 3301632 | -| train/ | | -| approx_kl | 0.67999876 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.21 | -| learning_rate | 0.0003 | -| loss | 0.234 | -| n_updates | 257930 | -| policy_gradient_loss | 0.0698 | -| std | 0.0063 | -| value_loss | 5.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25795 | -| time_elapsed | 140306 | -| total_timesteps | 3301760 | -| train/ | | -| approx_kl | 0.037990566 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.00656 | -| n_updates | 257940 | -| policy_gradient_loss | 0.00389 | -| std | 0.0063 | -| value_loss | 3.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25796 | -| time_elapsed | 140311 | -| total_timesteps | 3301888 | -| train/ | | -| approx_kl | 0.052461702 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00788 | -| learning_rate | 0.0003 | -| loss | 0.0326 | -| n_updates | 257950 | -| policy_gradient_loss | 0.0154 | -| std | 0.0063 | -| value_loss | 1.56e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25797 | -| time_elapsed | 140316 | -| total_timesteps | 3302016 | -| train/ | | -| approx_kl | 0.057338417 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | -0.0187 | -| n_updates | 257960 | -| policy_gradient_loss | -0.00853 | -| std | 0.0063 | -| value_loss | 1.18e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25798 | -| time_elapsed | 140329 | -| total_timesteps | 3302144 | -| train/ | | -| approx_kl | 0.004305274 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.0181 | -| n_updates | 257970 | -| policy_gradient_loss | -0.00464 | -| std | 0.0063 | -| value_loss | 0.000629 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25799 | -| time_elapsed | 140334 | -| total_timesteps | 3302272 | -| train/ | | -| approx_kl | 0.019036656 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00498 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 257980 | -| policy_gradient_loss | 0.00499 | -| std | 0.0063 | -| value_loss | 1.33e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25800 | -| time_elapsed | 140339 | -| total_timesteps | 3302400 | -| train/ | | -| approx_kl | 0.07943917 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0143 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 257990 | -| policy_gradient_loss | 0.0185 | -| std | 0.0063 | -| value_loss | 2.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25801 | -| time_elapsed | 140344 | -| total_timesteps | 3302528 | -| train/ | | -| approx_kl | 0.014359685 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.000567 | -| n_updates | 258000 | -| policy_gradient_loss | 0.00902 | -| std | 0.0063 | -| value_loss | 1.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25802 | -| time_elapsed | 140348 | -| total_timesteps | 3302656 | -| train/ | | -| approx_kl | 0.07560082 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 258010 | -| policy_gradient_loss | 0.0149 | -| std | 0.0063 | -| value_loss | 1e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25803 | -| time_elapsed | 140353 | -| total_timesteps | 3302784 | -| train/ | | -| approx_kl | 0.012569573 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.057 | -| learning_rate | 0.0003 | -| loss | 0.000137 | -| n_updates | 258020 | -| policy_gradient_loss | 0.00622 | -| std | 0.0063 | -| value_loss | 6.05e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25804 | -| time_elapsed | 140356 | -| total_timesteps | 3302912 | -| train/ | | -| approx_kl | 0.06976883 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 258030 | -| policy_gradient_loss | 0.00797 | -| std | 0.0063 | -| value_loss | 4.43e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25805 | -| time_elapsed | 140361 | -| total_timesteps | 3303040 | -| train/ | | -| approx_kl | 0.043633644 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0424 | -| learning_rate | 0.0003 | -| loss | 0.00231 | -| n_updates | 258040 | -| policy_gradient_loss | 0.0025 | -| std | 0.0063 | -| value_loss | 3.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25806 | -| time_elapsed | 140370 | -| total_timesteps | 3303168 | -| train/ | | -| approx_kl | 0.01195444 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.683 | -| learning_rate | 0.0003 | -| loss | 0.00488 | -| n_updates | 258050 | -| policy_gradient_loss | 0.00745 | -| std | 0.0063 | -| value_loss | 0.00898 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25807 | -| time_elapsed | 140376 | -| total_timesteps | 3303296 | -| train/ | | -| approx_kl | 0.0014292239 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.856 | -| learning_rate | 0.0003 | -| loss | 0.00576 | -| n_updates | 258060 | -| policy_gradient_loss | 0.00263 | -| std | 0.0063 | -| value_loss | 0.00016 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25808 | -| time_elapsed | 140381 | -| total_timesteps | 3303424 | -| train/ | | -| approx_kl | 0.0058151553 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.0161 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 258070 | -| policy_gradient_loss | 0.00583 | -| std | 0.0063 | -| value_loss | 2.33e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25809 | -| time_elapsed | 140385 | -| total_timesteps | 3303552 | -| train/ | | -| approx_kl | 0.049437862 | -| clip_fraction | 0.646 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0392 | -| learning_rate | 0.0003 | -| loss | 0.0556 | -| n_updates | 258080 | -| policy_gradient_loss | 0.187 | -| std | 0.0063 | -| value_loss | 1.51e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25810 | -| time_elapsed | 140390 | -| total_timesteps | 3303680 | -| train/ | | -| approx_kl | 0.12437806 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 258090 | -| policy_gradient_loss | 0.142 | -| std | 0.0063 | -| value_loss | 1.41e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25811 | -| time_elapsed | 140394 | -| total_timesteps | 3303808 | -| train/ | | -| approx_kl | 0.14173484 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 258100 | -| policy_gradient_loss | 0.141 | -| std | 0.0063 | -| value_loss | 1.26e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25812 | -| time_elapsed | 140398 | -| total_timesteps | 3303936 | -| train/ | | -| approx_kl | 0.025494698 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0216 | -| learning_rate | 0.0003 | -| loss | 0.00402 | -| n_updates | 258110 | -| policy_gradient_loss | 0.0275 | -| std | 0.0063 | -| value_loss | 8.85e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25813 | -| time_elapsed | 140403 | -| total_timesteps | 3304064 | -| train/ | | -| approx_kl | 0.6637919 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.23 | -| n_updates | 258120 | -| policy_gradient_loss | 0.0758 | -| std | 0.0063 | -| value_loss | 5.84e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25814 | -| time_elapsed | 140412 | -| total_timesteps | 3304192 | -| train/ | | -| approx_kl | 0.09029093 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.954 | -| learning_rate | 0.0003 | -| loss | 0.0581 | -| n_updates | 258130 | -| policy_gradient_loss | 0.00981 | -| std | 0.0063 | -| value_loss | 0.000251 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25815 | -| time_elapsed | 140417 | -| total_timesteps | 3304320 | -| train/ | | -| approx_kl | 0.10958831 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | 0.00603 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 258140 | -| policy_gradient_loss | 0.0343 | -| std | 0.0063 | -| value_loss | 3.46e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25816 | -| time_elapsed | 140422 | -| total_timesteps | 3304448 | -| train/ | | -| approx_kl | 0.090244435 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | 0.0607 | -| n_updates | 258150 | -| policy_gradient_loss | 0.012 | -| std | 0.00627 | -| value_loss | 4.83e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25817 | -| time_elapsed | 140426 | -| total_timesteps | 3304576 | -| train/ | | -| approx_kl | 0.011598138 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.0308 | -| learning_rate | 0.0003 | -| loss | -0.00662 | -| n_updates | 258160 | -| policy_gradient_loss | 0.0133 | -| std | 0.00626 | -| value_loss | 0.000132 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25818 | -| time_elapsed | 140431 | -| total_timesteps | 3304704 | -| train/ | | -| approx_kl | 0.04108656 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.65 | -| explained_variance | -0.00951 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 258170 | -| policy_gradient_loss | 0.0523 | -| std | 0.00626 | -| value_loss | 4.38e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25819 | -| time_elapsed | 140435 | -| total_timesteps | 3304832 | -| train/ | | -| approx_kl | 0.1816409 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0778 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 258180 | -| policy_gradient_loss | 0.0464 | -| std | 0.00625 | -| value_loss | 2.85e-05 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.844 | -| time/ | | -| fps | 23 | -| iterations | 25820 | -| time_elapsed | 140438 | -| total_timesteps | 3304960 | -| train/ | | -| approx_kl | 0.0043573636 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.581 | -| learning_rate | 0.0003 | -| loss | -0.00416 | -| n_updates | 258190 | -| policy_gradient_loss | 0.0139 | -| std | 0.00625 | -| value_loss | 8.7e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25821 | -| time_elapsed | 140441 | -| total_timesteps | 3305088 | -| train/ | | -| approx_kl | 9.4022136e-05 | -| clip_fraction | 0.223 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.000687 | -| learning_rate | 0.0003 | -| loss | 0.00256 | -| n_updates | 258200 | -| policy_gradient_loss | -0.000654 | -| std | 0.00625 | -| value_loss | 2.08e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25822 | -| time_elapsed | 140448 | -| total_timesteps | 3305216 | -| train/ | | -| approx_kl | 0.08239864 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.739 | -| learning_rate | 0.0003 | -| loss | 0.00917 | -| n_updates | 258210 | -| policy_gradient_loss | 0.0519 | -| std | 0.00625 | -| value_loss | 0.00614 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25823 | -| time_elapsed | 140453 | -| total_timesteps | 3305344 | -| train/ | | -| approx_kl | 0.0005265451 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.00246 | -| n_updates | 258220 | -| policy_gradient_loss | 0.0967 | -| std | 0.00625 | -| value_loss | 4.92e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25824 | -| time_elapsed | 140459 | -| total_timesteps | 3305472 | -| train/ | | -| approx_kl | 0.024609322 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0108 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 258230 | -| policy_gradient_loss | 0.0556 | -| std | 0.00625 | -| value_loss | 1.04e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25825 | -| time_elapsed | 140464 | -| total_timesteps | 3305600 | -| train/ | | -| approx_kl | 0.10216988 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00926 | -| learning_rate | 0.0003 | -| loss | 0.0631 | -| n_updates | 258240 | -| policy_gradient_loss | 0.0296 | -| std | 0.00625 | -| value_loss | 4.4e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25826 | -| time_elapsed | 140468 | -| total_timesteps | 3305728 | -| train/ | | -| approx_kl | 0.1636203 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0674 | -| learning_rate | 0.0003 | -| loss | 0.0705 | -| n_updates | 258250 | -| policy_gradient_loss | 0.0219 | -| std | 0.00626 | -| value_loss | 1.03e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25827 | -| time_elapsed | 140471 | -| total_timesteps | 3305856 | -| train/ | | -| approx_kl | 0.026933378 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.000663 | -| learning_rate | 0.0003 | -| loss | 0.00863 | -| n_updates | 258260 | -| policy_gradient_loss | 0.0311 | -| std | 0.00626 | -| value_loss | 3.25e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.839 | -| time/ | | -| fps | 23 | -| iterations | 25828 | -| time_elapsed | 140474 | -| total_timesteps | 3305984 | -| train/ | | -| approx_kl | 0.3204436 | -| clip_fraction | 0.735 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.213 | -| n_updates | 258270 | -| policy_gradient_loss | 0.161 | -| std | 0.00626 | -| value_loss | 2.94e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25829 | -| time_elapsed | 140477 | -| total_timesteps | 3306112 | -| train/ | | -| approx_kl | 0.059417985 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 258280 | -| policy_gradient_loss | 0.0262 | -| std | 0.00626 | -| value_loss | 2.36e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25830 | -| time_elapsed | 140488 | -| total_timesteps | 3306240 | -| train/ | | -| approx_kl | 0.0111101065 | -| clip_fraction | 0.122 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0269 | -| n_updates | 258290 | -| policy_gradient_loss | -0.0176 | -| std | 0.00626 | -| value_loss | 0.000178 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25831 | -| time_elapsed | 140494 | -| total_timesteps | 3306368 | -| train/ | | -| approx_kl | 0.038439367 | -| clip_fraction | 0.481 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0166 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 258300 | -| policy_gradient_loss | 0.0276 | -| std | 0.00625 | -| value_loss | 9.84e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25832 | -| time_elapsed | 140498 | -| total_timesteps | 3306496 | -| train/ | | -| approx_kl | 0.20880558 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00604 | -| learning_rate | 0.0003 | -| loss | 0.0912 | -| n_updates | 258310 | -| policy_gradient_loss | 0.0501 | -| std | 0.00625 | -| value_loss | 3.13e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25833 | -| time_elapsed | 140503 | -| total_timesteps | 3306624 | -| train/ | | -| approx_kl | 0.0044485824 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 258320 | -| policy_gradient_loss | 0.00277 | -| std | 0.00625 | -| value_loss | 2.49e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25834 | -| time_elapsed | 140508 | -| total_timesteps | 3306752 | -| train/ | | -| approx_kl | 0.10686579 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.0803 | -| n_updates | 258330 | -| policy_gradient_loss | 0.105 | -| std | 0.00625 | -| value_loss | 1.71e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.842 | -| time/ | | -| fps | 23 | -| iterations | 25835 | -| time_elapsed | 140512 | -| total_timesteps | 3306880 | -| train/ | | -| approx_kl | 0.059351742 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0334 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 258340 | -| policy_gradient_loss | 0.0343 | -| std | 0.00625 | -| value_loss | 5.66e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25836 | -| time_elapsed | 140515 | -| total_timesteps | 3307008 | -| train/ | | -| approx_kl | 0.00015906617 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.11 | -| learning_rate | 0.0003 | -| loss | -0.000727 | -| n_updates | 258350 | -| policy_gradient_loss | 0.0681 | -| std | 0.00624 | -| value_loss | 9.8e-07 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25837 | -| time_elapsed | 140526 | -| total_timesteps | 3307136 | -| train/ | | -| approx_kl | 0.0012976881 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.87 | -| learning_rate | 0.0003 | -| loss | -0.00286 | -| n_updates | 258360 | -| policy_gradient_loss | 0.0124 | -| std | 0.00624 | -| value_loss | 0.00235 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25838 | -| time_elapsed | 140532 | -| total_timesteps | 3307264 | -| train/ | | -| approx_kl | 0.08369003 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.443 | -| learning_rate | 0.0003 | -| loss | 0.0363 | -| n_updates | 258370 | -| policy_gradient_loss | 0.0204 | -| std | 0.00624 | -| value_loss | 7.16e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25839 | -| time_elapsed | 140537 | -| total_timesteps | 3307392 | -| train/ | | -| approx_kl | 6.900169e-06 | -| clip_fraction | 0.403 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0125 | -| learning_rate | 0.0003 | -| loss | -8.66e-05 | -| n_updates | 258380 | -| policy_gradient_loss | 0.0323 | -| std | 0.00624 | -| value_loss | 2.37e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25840 | -| time_elapsed | 140542 | -| total_timesteps | 3307520 | -| train/ | | -| approx_kl | 0.16293365 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | 0.0823 | -| n_updates | 258390 | -| policy_gradient_loss | 0.0218 | -| std | 0.00623 | -| value_loss | 8.49e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25841 | -| time_elapsed | 140546 | -| total_timesteps | 3307648 | -| train/ | | -| approx_kl | 0.025463816 | -| clip_fraction | 0.49 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | -0.00504 | -| n_updates | 258400 | -| policy_gradient_loss | 0.0285 | -| std | 0.00623 | -| value_loss | 7.03e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25842 | -| time_elapsed | 140551 | -| total_timesteps | 3307776 | -| train/ | | -| approx_kl | 0.34879854 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0388 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 258410 | -| policy_gradient_loss | 0.133 | -| std | 0.00623 | -| value_loss | 5.64e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.835 | -| time/ | | -| fps | 23 | -| iterations | 25843 | -| time_elapsed | 140556 | -| total_timesteps | 3307904 | -| train/ | | -| approx_kl | 0.19584669 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 258420 | -| policy_gradient_loss | 0.113 | -| std | 0.00624 | -| value_loss | 4.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25844 | -| time_elapsed | 140562 | -| total_timesteps | 3308032 | -| train/ | | -| approx_kl | 0.038371917 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0375 | -| learning_rate | 0.0003 | -| loss | 0.00245 | -| n_updates | 258430 | -| policy_gradient_loss | 0.0261 | -| std | 0.00624 | -| value_loss | 3.3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25845 | -| time_elapsed | 140571 | -| total_timesteps | 3308160 | -| train/ | | -| approx_kl | 0.09897286 | -| clip_fraction | 0.193 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.45 | -| learning_rate | 0.0003 | -| loss | -0.0274 | -| n_updates | 258440 | -| policy_gradient_loss | -0.0148 | -| std | 0.00624 | -| value_loss | 0.00316 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25846 | -| time_elapsed | 140576 | -| total_timesteps | 3308288 | -| train/ | | -| approx_kl | 0.016508132 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | 0.00343 | -| n_updates | 258450 | -| policy_gradient_loss | 0.0333 | -| std | 0.00624 | -| value_loss | 1.06e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25847 | -| time_elapsed | 140581 | -| total_timesteps | 3308416 | -| train/ | | -| approx_kl | 0.32534426 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.919 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 258460 | -| policy_gradient_loss | 0.162 | -| std | 0.00624 | -| value_loss | 4.22e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25848 | -| time_elapsed | 140586 | -| total_timesteps | 3308544 | -| train/ | | -| approx_kl | 0.1707839 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.37 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 258470 | -| policy_gradient_loss | 0.103 | -| std | 0.00624 | -| value_loss | 1.67e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25849 | -| time_elapsed | 140590 | -| total_timesteps | 3308672 | -| train/ | | -| approx_kl | 0.041911364 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.513 | -| learning_rate | 0.0003 | -| loss | 0.0269 | -| n_updates | 258480 | -| policy_gradient_loss | 0.0374 | -| std | 0.00624 | -| value_loss | 4.92e-10 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25850 | -| time_elapsed | 140595 | -| total_timesteps | 3308800 | -| train/ | | -| approx_kl | 0.5890905 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0597 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 258490 | -| policy_gradient_loss | 0.0611 | -| std | 0.00624 | -| value_loss | 1.21e-10 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.832 | -| time/ | | -| fps | 23 | -| iterations | 25851 | -| time_elapsed | 140600 | -| total_timesteps | 3308928 | -| train/ | | -| approx_kl | 0.05775198 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00164 | -| learning_rate | 0.0003 | -| loss | 0.0239 | -| n_updates | 258500 | -| policy_gradient_loss | 0.0125 | -| std | 0.00624 | -| value_loss | 1.7e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25852 | -| time_elapsed | 140605 | -| total_timesteps | 3309056 | -| train/ | | -| approx_kl | 0.011903444 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -6.08e-06 | -| learning_rate | 0.0003 | -| loss | -0.00727 | -| n_updates | 258510 | -| policy_gradient_loss | 0.00596 | -| std | 0.00624 | -| value_loss | 9.62e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25853 | -| time_elapsed | 140611 | -| total_timesteps | 3309184 | -| train/ | | -| approx_kl | 0.016013583 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.829 | -| learning_rate | 0.0003 | -| loss | -0.00782 | -| n_updates | 258520 | -| policy_gradient_loss | 0.00576 | -| std | 0.00624 | -| value_loss | 0.00333 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25854 | -| time_elapsed | 140617 | -| total_timesteps | 3309312 | -| train/ | | -| approx_kl | 0.21252598 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.96 | -| learning_rate | 0.0003 | -| loss | 0.0794 | -| n_updates | 258530 | -| policy_gradient_loss | 0.0536 | -| std | 0.00624 | -| value_loss | 1.74e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25855 | -| time_elapsed | 140622 | -| total_timesteps | 3309440 | -| train/ | | -| approx_kl | 0.20570172 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0136 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 258540 | -| policy_gradient_loss | 0.0468 | -| std | 0.00624 | -| value_loss | 2.52e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25856 | -| time_elapsed | 140626 | -| total_timesteps | 3309568 | -| train/ | | -| approx_kl | 0.060094263 | -| clip_fraction | 0.597 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | 0.0319 | -| n_updates | 258550 | -| policy_gradient_loss | 0.0742 | -| std | 0.00624 | -| value_loss | 2.27e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25857 | -| time_elapsed | 140631 | -| total_timesteps | 3309696 | -| train/ | | -| approx_kl | 0.11940617 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0688 | -| n_updates | 258560 | -| policy_gradient_loss | 0.037 | -| std | 0.00623 | -| value_loss | 1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25858 | -| time_elapsed | 140636 | -| total_timesteps | 3309824 | -| train/ | | -| approx_kl | 0.73251915 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.261 | -| n_updates | 258570 | -| policy_gradient_loss | 0.153 | -| std | 0.00623 | -| value_loss | 4.35e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.824 | -| time/ | | -| fps | 23 | -| iterations | 25859 | -| time_elapsed | 140641 | -| total_timesteps | 3309952 | -| train/ | | -| approx_kl | 0.10838369 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0717 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 258580 | -| policy_gradient_loss | 0.0303 | -| std | 0.00624 | -| value_loss | 2.85e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25860 | -| time_elapsed | 140646 | -| total_timesteps | 3310080 | -| train/ | | -| approx_kl | 0.15568033 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.0597 | -| n_updates | 258590 | -| policy_gradient_loss | 0.0208 | -| std | 0.00624 | -| value_loss | 2.13e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25861 | -| time_elapsed | 140654 | -| total_timesteps | 3310208 | -| train/ | | -| approx_kl | 0.0020385827 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.964 | -| learning_rate | 0.0003 | -| loss | -0.0256 | -| n_updates | 258600 | -| policy_gradient_loss | -0.00135 | -| std | 0.00624 | -| value_loss | 0.000404 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25862 | -| time_elapsed | 140660 | -| total_timesteps | 3310336 | -| train/ | | -| approx_kl | 0.0027676672 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00174 | -| learning_rate | 0.0003 | -| loss | -0.00243 | -| n_updates | 258610 | -| policy_gradient_loss | 0.035 | -| std | 0.00623 | -| value_loss | 2.64e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25863 | -| time_elapsed | 140665 | -| total_timesteps | 3310464 | -| train/ | | -| approx_kl | 0.6623951 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.0129 | -| learning_rate | 0.0003 | -| loss | 0.229 | -| n_updates | 258620 | -| policy_gradient_loss | 0.0825 | -| std | 0.00623 | -| value_loss | 3.03e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25864 | -| time_elapsed | 140670 | -| total_timesteps | 3310592 | -| train/ | | -| approx_kl | 0.0060670143 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0856 | -| learning_rate | 0.0003 | -| loss | -0.0152 | -| n_updates | 258630 | -| policy_gradient_loss | 0.00588 | -| std | 0.00623 | -| value_loss | 2.51e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25865 | -| time_elapsed | 140674 | -| total_timesteps | 3310720 | -| train/ | | -| approx_kl | 0.038995456 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 258640 | -| policy_gradient_loss | 0.147 | -| std | 0.00623 | -| value_loss | 1.4e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25866 | -| time_elapsed | 140680 | -| total_timesteps | 3310848 | -| train/ | | -| approx_kl | 0.013546024 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.000856 | -| n_updates | 258650 | -| policy_gradient_loss | 0.0326 | -| std | 0.00623 | -| value_loss | 4.46e-08 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.831 | -| time/ | | -| fps | 23 | -| iterations | 25867 | -| time_elapsed | 140685 | -| total_timesteps | 3310976 | -| train/ | | -| approx_kl | 3.0966476e-07 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -4.62e-05 | -| n_updates | 258660 | -| policy_gradient_loss | 0.0295 | -| std | 0.00623 | -| value_loss | 2.7e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25868 | -| time_elapsed | 140689 | -| total_timesteps | 3311104 | -| train/ | | -| approx_kl | 0.4993145 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | 0.177 | -| n_updates | 258670 | -| policy_gradient_loss | 0.0615 | -| std | 0.00623 | -| value_loss | 1.94e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25869 | -| time_elapsed | 140702 | -| total_timesteps | 3311232 | -| train/ | | -| approx_kl | 0.013308774 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.807 | -| learning_rate | 0.0003 | -| loss | -7.5e-06 | -| n_updates | 258680 | -| policy_gradient_loss | -0.00125 | -| std | 0.00623 | -| value_loss | 0.00457 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25870 | -| time_elapsed | 140707 | -| total_timesteps | 3311360 | -| train/ | | -| approx_kl | 0.0058524674 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.287 | -| learning_rate | 0.0003 | -| loss | 0.000922 | -| n_updates | 258690 | -| policy_gradient_loss | 0.00569 | -| std | 0.00623 | -| value_loss | 7.54e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25871 | -| time_elapsed | 140711 | -| total_timesteps | 3311488 | -| train/ | | -| approx_kl | 0.07126413 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | 0.039 | -| n_updates | 258700 | -| policy_gradient_loss | 0.0148 | -| std | 0.00623 | -| value_loss | 1.23e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25872 | -| time_elapsed | 140716 | -| total_timesteps | 3311616 | -| train/ | | -| approx_kl | 0.052542042 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -3.21 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 258710 | -| policy_gradient_loss | 0.000537 | -| std | 0.00623 | -| value_loss | 8.81e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25873 | -| time_elapsed | 140721 | -| total_timesteps | 3311744 | -| train/ | | -| approx_kl | 0.050022878 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.011 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 258720 | -| policy_gradient_loss | 0.0139 | -| std | 0.00622 | -| value_loss | 3.04e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.826 | -| time/ | | -| fps | 23 | -| iterations | 25874 | -| time_elapsed | 140725 | -| total_timesteps | 3311872 | -| train/ | | -| approx_kl | 0.05350228 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | 0.00528 | -| n_updates | 258730 | -| policy_gradient_loss | 0.00302 | -| std | 0.00622 | -| value_loss | 2.41e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25875 | -| time_elapsed | 140731 | -| total_timesteps | 3312000 | -| train/ | | -| approx_kl | 0.009106738 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 258740 | -| policy_gradient_loss | 0.00933 | -| std | 0.00622 | -| value_loss | 1.73e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25876 | -| time_elapsed | 140736 | -| total_timesteps | 3312128 | -| train/ | | -| approx_kl | 0.074079946 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00521 | -| learning_rate | 0.0003 | -| loss | 0.0457 | -| n_updates | 258750 | -| policy_gradient_loss | 0.0177 | -| std | 0.00622 | -| value_loss | 9.06e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25877 | -| time_elapsed | 140747 | -| total_timesteps | 3312256 | -| train/ | | -| approx_kl | 0.0068970565 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | 0.00347 | -| n_updates | 258760 | -| policy_gradient_loss | -0.000651 | -| std | 0.00622 | -| value_loss | 0.0036 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25878 | -| time_elapsed | 140751 | -| total_timesteps | 3312384 | -| train/ | | -| approx_kl | 0.0032277405 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.312 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 258770 | -| policy_gradient_loss | 0.00783 | -| std | 0.00622 | -| value_loss | 0.000112 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25879 | -| time_elapsed | 140755 | -| total_timesteps | 3312512 | -| train/ | | -| approx_kl | 3.5929494e-05 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | 0.000823 | -| n_updates | 258780 | -| policy_gradient_loss | 0.0284 | -| std | 0.00621 | -| value_loss | 0.000665 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25880 | -| time_elapsed | 140758 | -| total_timesteps | 3312640 | -| train/ | | -| approx_kl | 0.1978782 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0782 | -| learning_rate | 0.0003 | -| loss | 0.196 | -| n_updates | 258790 | -| policy_gradient_loss | 0.0707 | -| std | 0.00621 | -| value_loss | 1.53e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25881 | -| time_elapsed | 140762 | -| total_timesteps | 3312768 | -| train/ | | -| approx_kl | 0.044536356 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 258800 | -| policy_gradient_loss | 0.0439 | -| std | 0.00621 | -| value_loss | 1.09e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.837 | -| time/ | | -| fps | 23 | -| iterations | 25882 | -| time_elapsed | 140767 | -| total_timesteps | 3312896 | -| train/ | | -| approx_kl | 0.15181297 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 258810 | -| policy_gradient_loss | 0.0886 | -| std | 0.00621 | -| value_loss | 5.28e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25883 | -| time_elapsed | 140772 | -| total_timesteps | 3313024 | -| train/ | | -| approx_kl | 5.3189695e-05 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | 3.69e-05 | -| n_updates | 258820 | -| policy_gradient_loss | 0.0162 | -| std | 0.00621 | -| value_loss | 7.19e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25884 | -| time_elapsed | 140783 | -| total_timesteps | 3313152 | -| train/ | | -| approx_kl | 0.01944245 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.931 | -| learning_rate | 0.0003 | -| loss | 0.00123 | -| n_updates | 258830 | -| policy_gradient_loss | -0.000223 | -| std | 0.0062 | -| value_loss | 0.00121 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25885 | -| time_elapsed | 140789 | -| total_timesteps | 3313280 | -| train/ | | -| approx_kl | 0.10353589 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -14.2 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 258840 | -| policy_gradient_loss | -0.00421 | -| std | 0.0062 | -| value_loss | 0.000123 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25886 | -| time_elapsed | 140794 | -| total_timesteps | 3313408 | -| train/ | | -| approx_kl | 0.012415907 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.512 | -| learning_rate | 0.0003 | -| loss | 0.0004 | -| n_updates | 258850 | -| policy_gradient_loss | 0.006 | -| std | 0.0062 | -| value_loss | 3.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25887 | -| time_elapsed | 140798 | -| total_timesteps | 3313536 | -| train/ | | -| approx_kl | 0.084378116 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.358 | -| learning_rate | 0.0003 | -| loss | 0.0436 | -| n_updates | 258860 | -| policy_gradient_loss | 0.0171 | -| std | 0.0062 | -| value_loss | 5.18e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25888 | -| time_elapsed | 140804 | -| total_timesteps | 3313664 | -| train/ | | -| approx_kl | 0.0114598 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0732 | -| learning_rate | 0.0003 | -| loss | -0.00676 | -| n_updates | 258870 | -| policy_gradient_loss | 0.00552 | -| std | 0.0062 | -| value_loss | 3.57e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25889 | -| time_elapsed | 140808 | -| total_timesteps | 3313792 | -| train/ | | -| approx_kl | 0.0032913503 | -| clip_fraction | 0.211 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | -0.00693 | -| n_updates | 258880 | -| policy_gradient_loss | 0.0115 | -| std | 0.0062 | -| value_loss | 2.76e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.846 | -| time/ | | -| fps | 23 | -| iterations | 25890 | -| time_elapsed | 140812 | -| total_timesteps | 3313920 | -| train/ | | -| approx_kl | 0.09411607 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | 0.0384 | -| n_updates | 258890 | -| policy_gradient_loss | 0.0109 | -| std | 0.0062 | -| value_loss | 1.58e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25891 | -| time_elapsed | 140817 | -| total_timesteps | 3314048 | -| train/ | | -| approx_kl | 0.008799663 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0873 | -| learning_rate | 0.0003 | -| loss | 0.0243 | -| n_updates | 258900 | -| policy_gradient_loss | 0.00427 | -| std | 0.0062 | -| value_loss | 1.18e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25892 | -| time_elapsed | 140826 | -| total_timesteps | 3314176 | -| train/ | | -| approx_kl | 0.012993105 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.913 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 258910 | -| policy_gradient_loss | -0.00526 | -| std | 0.0062 | -| value_loss | 0.00158 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25893 | -| time_elapsed | 140831 | -| total_timesteps | 3314304 | -| train/ | | -| approx_kl | 0.5290758 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.517 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 258920 | -| policy_gradient_loss | 0.0573 | -| std | 0.0062 | -| value_loss | 1.87e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25894 | -| time_elapsed | 140835 | -| total_timesteps | 3314432 | -| train/ | | -| approx_kl | 0.008017421 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.00498 | -| learning_rate | 0.0003 | -| loss | -0.00415 | -| n_updates | 258930 | -| policy_gradient_loss | 0.00588 | -| std | 0.0062 | -| value_loss | 2.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25895 | -| time_elapsed | 140840 | -| total_timesteps | 3314560 | -| train/ | | -| approx_kl | 0.0023092972 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | -0.00156 | -| n_updates | 258940 | -| policy_gradient_loss | 0.00841 | -| std | 0.00619 | -| value_loss | 1.22e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25896 | -| time_elapsed | 140844 | -| total_timesteps | 3314688 | -| train/ | | -| approx_kl | 9.099953e-06 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0831 | -| learning_rate | 0.0003 | -| loss | -0.000159 | -| n_updates | 258950 | -| policy_gradient_loss | 0.0322 | -| std | 0.00619 | -| value_loss | 1.2e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25897 | -| time_elapsed | 140850 | -| total_timesteps | 3314816 | -| train/ | | -| approx_kl | 1.0594281 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.244 | -| n_updates | 258960 | -| policy_gradient_loss | 0.153 | -| std | 0.00621 | -| value_loss | 0.000251 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.848 | -| time/ | | -| fps | 23 | -| iterations | 25898 | -| time_elapsed | 140855 | -| total_timesteps | 3314944 | -| train/ | | -| approx_kl | 0.0028219284 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.985 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 258970 | -| policy_gradient_loss | 0.0255 | -| std | 0.00621 | -| value_loss | 2.32e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25899 | -| time_elapsed | 140860 | -| total_timesteps | 3315072 | -| train/ | | -| approx_kl | 0.85010755 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.538 | -| n_updates | 258980 | -| policy_gradient_loss | 0.122 | -| std | 0.00621 | -| value_loss | 1.66e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25900 | -| time_elapsed | 140868 | -| total_timesteps | 3315200 | -| train/ | | -| approx_kl | 0.008878471 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.789 | -| learning_rate | 0.0003 | -| loss | -0.00965 | -| n_updates | 258990 | -| policy_gradient_loss | 0.024 | -| std | 0.00621 | -| value_loss | 0.00673 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25901 | -| time_elapsed | 140872 | -| total_timesteps | 3315328 | -| train/ | | -| approx_kl | 0.16804451 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -2.04 | -| learning_rate | 0.0003 | -| loss | 0.118 | -| n_updates | 259000 | -| policy_gradient_loss | 0.0663 | -| std | 0.00621 | -| value_loss | 8.38e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25902 | -| time_elapsed | 140876 | -| total_timesteps | 3315456 | -| train/ | | -| approx_kl | 0.042784285 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.000394 | -| n_updates | 259010 | -| policy_gradient_loss | 0.0299 | -| std | 0.00621 | -| value_loss | 1.3e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25903 | -| time_elapsed | 140881 | -| total_timesteps | 3315584 | -| train/ | | -| approx_kl | 0.83827645 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.00177 | -| learning_rate | 0.0003 | -| loss | 0.277 | -| n_updates | 259020 | -| policy_gradient_loss | 0.189 | -| std | 0.00621 | -| value_loss | 6.16e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25904 | -| time_elapsed | 140886 | -| total_timesteps | 3315712 | -| train/ | | -| approx_kl | 0.009044178 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | -0.00227 | -| n_updates | 259030 | -| policy_gradient_loss | 0.0315 | -| std | 0.00621 | -| value_loss | 4.03e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25905 | -| time_elapsed | 140892 | -| total_timesteps | 3315840 | -| train/ | | -| approx_kl | 0.30024248 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 259040 | -| policy_gradient_loss | 0.143 | -| std | 0.00621 | -| value_loss | 3.39e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25906 | -| time_elapsed | 140896 | -| total_timesteps | 3315968 | -| train/ | | -| approx_kl | 0.03974916 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | 0.00594 | -| n_updates | 259050 | -| policy_gradient_loss | 0.0197 | -| std | 0.00621 | -| value_loss | 2.41e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25907 | -| time_elapsed | 140901 | -| total_timesteps | 3316096 | -| train/ | | -| approx_kl | 0.6726172 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.211 | -| n_updates | 259060 | -| policy_gradient_loss | 0.0651 | -| std | 0.00621 | -| value_loss | 1.83e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25908 | -| time_elapsed | 140911 | -| total_timesteps | 3316224 | -| train/ | | -| approx_kl | 0.023864131 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | 0.165 | -| learning_rate | 0.0003 | -| loss | -0.0273 | -| n_updates | 259070 | -| policy_gradient_loss | -0.0145 | -| std | 0.00621 | -| value_loss | 0.00232 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25909 | -| time_elapsed | 140915 | -| total_timesteps | 3316352 | -| train/ | | -| approx_kl | 0.015118482 | -| clip_fraction | 0.549 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.363 | -| learning_rate | 0.0003 | -| loss | -0.00733 | -| n_updates | 259080 | -| policy_gradient_loss | 0.0918 | -| std | 0.00621 | -| value_loss | 4.91e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25910 | -| time_elapsed | 140919 | -| total_timesteps | 3316480 | -| train/ | | -| approx_kl | 0.3483353 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.66 | -| explained_variance | -0.185 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 259090 | -| policy_gradient_loss | 0.0554 | -| std | 0.0062 | -| value_loss | 1.9e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25911 | -| time_elapsed | 140924 | -| total_timesteps | 3316608 | -| train/ | | -| approx_kl | 0.0016892646 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0182 | -| learning_rate | 0.0003 | -| loss | -0.00449 | -| n_updates | 259100 | -| policy_gradient_loss | 0.00751 | -| std | 0.00618 | -| value_loss | 2.11e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25912 | -| time_elapsed | 140929 | -| total_timesteps | 3316736 | -| train/ | | -| approx_kl | 5.6209974e-06 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.018 | -| learning_rate | 0.0003 | -| loss | -0.000288 | -| n_updates | 259110 | -| policy_gradient_loss | 0.0112 | -| std | 0.00618 | -| value_loss | 2.36e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25913 | -| time_elapsed | 140934 | -| total_timesteps | 3316864 | -| train/ | | -| approx_kl | 0.06892505 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0753 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 259120 | -| policy_gradient_loss | 0.0658 | -| std | 0.00618 | -| value_loss | 1.01e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 25914 | -| time_elapsed | 140938 | -| total_timesteps | 3316992 | -| train/ | | -| approx_kl | 0.26833346 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 259130 | -| policy_gradient_loss | 0.0285 | -| std | 0.00617 | -| value_loss | 4.47e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25915 | -| time_elapsed | 140942 | -| total_timesteps | 3317120 | -| train/ | | -| approx_kl | 0.06771754 | -| clip_fraction | 0.571 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00431 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 259140 | -| policy_gradient_loss | 0.1 | -| std | 0.00617 | -| value_loss | 5.98e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25916 | -| time_elapsed | 140956 | -| total_timesteps | 3317248 | -| train/ | | -| approx_kl | 0.0073759765 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.827 | -| learning_rate | 0.0003 | -| loss | -0.0172 | -| n_updates | 259150 | -| policy_gradient_loss | 0.00525 | -| std | 0.00617 | -| value_loss | 0.00425 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25917 | -| time_elapsed | 140961 | -| total_timesteps | 3317376 | -| train/ | | -| approx_kl | 0.6514285 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.518 | -| learning_rate | 0.0003 | -| loss | 0.287 | -| n_updates | 259160 | -| policy_gradient_loss | 0.167 | -| std | 0.00616 | -| value_loss | 0.0014 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25918 | -| time_elapsed | 140968 | -| total_timesteps | 3317504 | -| train/ | | -| approx_kl | 0.23646164 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.841 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 259170 | -| policy_gradient_loss | 0.133 | -| std | 0.00615 | -| value_loss | 0.00503 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25919 | -| time_elapsed | 140973 | -| total_timesteps | 3317632 | -| train/ | | -| approx_kl | 0.062154308 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0757 | -| learning_rate | 0.0003 | -| loss | 0.0392 | -| n_updates | 259180 | -| policy_gradient_loss | 0.0396 | -| std | 0.00615 | -| value_loss | 0.000836 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25920 | -| time_elapsed | 140976 | -| total_timesteps | 3317760 | -| train/ | | -| approx_kl | 0.83172804 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00495 | -| learning_rate | 0.0003 | -| loss | 0.183 | -| n_updates | 259190 | -| policy_gradient_loss | 0.0618 | -| std | 0.00615 | -| value_loss | 0.000353 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25921 | -| time_elapsed | 140981 | -| total_timesteps | 3317888 | -| train/ | | -| approx_kl | 0.050923984 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0407 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 259200 | -| policy_gradient_loss | -0.00522 | -| std | 0.00615 | -| value_loss | 0.000237 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25922 | -| time_elapsed | 140985 | -| total_timesteps | 3318016 | -| train/ | | -| approx_kl | 0.053041823 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0438 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 259210 | -| policy_gradient_loss | 0.0149 | -| std | 0.00615 | -| value_loss | 0.000168 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25923 | -| time_elapsed | 140996 | -| total_timesteps | 3318144 | -| train/ | | -| approx_kl | 0.101857334 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.924 | -| learning_rate | 0.0003 | -| loss | 0.00753 | -| n_updates | 259220 | -| policy_gradient_loss | -0.00895 | -| std | 0.00615 | -| value_loss | 0.00234 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25924 | -| time_elapsed | 140999 | -| total_timesteps | 3318272 | -| train/ | | -| approx_kl | 0.053852797 | -| clip_fraction | 0.46 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0569 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 259230 | -| policy_gradient_loss | 0.03 | -| std | 0.00615 | -| value_loss | 0.000199 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25925 | -| time_elapsed | 141004 | -| total_timesteps | 3318400 | -| train/ | | -| approx_kl | 0.9375278 | -| clip_fraction | 0.761 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.304 | -| n_updates | 259240 | -| policy_gradient_loss | 0.143 | -| std | 0.00615 | -| value_loss | 3.53e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25926 | -| time_elapsed | 141009 | -| total_timesteps | 3318528 | -| train/ | | -| approx_kl | 0.016399879 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 259250 | -| policy_gradient_loss | 0.0339 | -| std | 0.00615 | -| value_loss | 3.5e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25927 | -| time_elapsed | 141014 | -| total_timesteps | 3318656 | -| train/ | | -| approx_kl | 0.29633766 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0325 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 259260 | -| policy_gradient_loss | 0.167 | -| std | 0.00615 | -| value_loss | 2.74e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25928 | -| time_elapsed | 141019 | -| total_timesteps | 3318784 | -| train/ | | -| approx_kl | 0.20099257 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0336 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 259270 | -| policy_gradient_loss | 0.109 | -| std | 0.00615 | -| value_loss | 2.43e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.85 | -| time/ | | -| fps | 23 | -| iterations | 25929 | -| time_elapsed | 141024 | -| total_timesteps | 3318912 | -| train/ | | -| approx_kl | 0.24538939 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | 0.233 | -| n_updates | 259280 | -| policy_gradient_loss | 0.235 | -| std | 0.00615 | -| value_loss | 1.32e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25930 | -| time_elapsed | 141028 | -| total_timesteps | 3319040 | -| train/ | | -| approx_kl | 0.1570495 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | 0.0605 | -| n_updates | 259290 | -| policy_gradient_loss | 0.0719 | -| std | 0.00615 | -| value_loss | 9.68e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25931 | -| time_elapsed | 141038 | -| total_timesteps | 3319168 | -| train/ | | -| approx_kl | 0.13254556 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.779 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 259300 | -| policy_gradient_loss | 0.123 | -| std | 0.00615 | -| value_loss | 0.00531 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25932 | -| time_elapsed | 141044 | -| total_timesteps | 3319296 | -| train/ | | -| approx_kl | 0.039567057 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.00607 | -| n_updates | 259310 | -| policy_gradient_loss | 0.0344 | -| std | 0.00615 | -| value_loss | 6.97e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25933 | -| time_elapsed | 141049 | -| total_timesteps | 3319424 | -| train/ | | -| approx_kl | 0.5766672 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.989 | -| learning_rate | 0.0003 | -| loss | 0.0254 | -| n_updates | 259320 | -| policy_gradient_loss | 0.0159 | -| std | 0.00616 | -| value_loss | 1.41e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25934 | -| time_elapsed | 141054 | -| total_timesteps | 3319552 | -| train/ | | -| approx_kl | 0.009414608 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.396 | -| learning_rate | 0.0003 | -| loss | -0.00648 | -| n_updates | 259330 | -| policy_gradient_loss | 0.00327 | -| std | 0.00616 | -| value_loss | 2.5e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25935 | -| time_elapsed | 141058 | -| total_timesteps | 3319680 | -| train/ | | -| approx_kl | 0.0025687884 | -| clip_fraction | 0.215 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0684 | -| learning_rate | 0.0003 | -| loss | -0.000831 | -| n_updates | 259340 | -| policy_gradient_loss | 0.00415 | -| std | 0.00616 | -| value_loss | 2.62e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25936 | -| time_elapsed | 141063 | -| total_timesteps | 3319808 | -| train/ | | -| approx_kl | 4.920643e-06 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | 0.000256 | -| n_updates | 259350 | -| policy_gradient_loss | 0.0449 | -| std | 0.00616 | -| value_loss | 1.63e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.849 | -| time/ | | -| fps | 23 | -| iterations | 25937 | -| time_elapsed | 141067 | -| total_timesteps | 3319936 | -| train/ | | -| approx_kl | 0.7095699 | -| clip_fraction | 0.766 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.34 | -| n_updates | 259360 | -| policy_gradient_loss | 0.174 | -| std | 0.00617 | -| value_loss | 9.34e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25938 | -| time_elapsed | 141071 | -| total_timesteps | 3320064 | -| train/ | | -| approx_kl | 0.030946627 | -| clip_fraction | 0.154 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | -0.0163 | -| n_updates | 259370 | -| policy_gradient_loss | -0.0135 | -| std | 0.00617 | -| value_loss | 7.63e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25939 | -| time_elapsed | 141079 | -| total_timesteps | 3320192 | -| train/ | | -| approx_kl | 0.01602354 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -1 | -| learning_rate | 0.0003 | -| loss | -0.0223 | -| n_updates | 259380 | -| policy_gradient_loss | -0.00917 | -| std | 0.00617 | -| value_loss | 0.00321 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25940 | -| time_elapsed | 141083 | -| total_timesteps | 3320320 | -| train/ | | -| approx_kl | 0.12766522 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0247 | -| learning_rate | 0.0003 | -| loss | 0.075 | -| n_updates | 259390 | -| policy_gradient_loss | 0.0362 | -| std | 0.00617 | -| value_loss | 3.92e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25941 | -| time_elapsed | 141087 | -| total_timesteps | 3320448 | -| train/ | | -| approx_kl | 0.00031509856 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -97.2 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 259400 | -| policy_gradient_loss | 0.0179 | -| std | 0.00617 | -| value_loss | 2.54e-08 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25942 | -| time_elapsed | 141091 | -| total_timesteps | 3320576 | -| train/ | | -| approx_kl | 0.86649 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.86 | -| learning_rate | 0.0003 | -| loss | 0.29 | -| n_updates | 259410 | -| policy_gradient_loss | 0.0791 | -| std | 0.00617 | -| value_loss | 2.27e-09 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25943 | -| time_elapsed | 141096 | -| total_timesteps | 3320704 | -| train/ | | -| approx_kl | 0.043815922 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0215 | -| learning_rate | 0.0003 | -| loss | 0.0286 | -| n_updates | 259420 | -| policy_gradient_loss | 0.0145 | -| std | 0.00617 | -| value_loss | 6.26e-10 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25944 | -| time_elapsed | 141101 | -| total_timesteps | 3320832 | -| train/ | | -| approx_kl | 0.007979799 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0682 | -| learning_rate | 0.0003 | -| loss | 0.00114 | -| n_updates | 259430 | -| policy_gradient_loss | 0.00815 | -| std | 0.00617 | -| value_loss | 7.5e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.853 | -| time/ | | -| fps | 23 | -| iterations | 25945 | -| time_elapsed | 141104 | -| total_timesteps | 3320960 | -| train/ | | -| approx_kl | 0.07945603 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | 0.0489 | -| n_updates | 259440 | -| policy_gradient_loss | 0.0199 | -| std | 0.00616 | -| value_loss | 1.22e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25946 | -| time_elapsed | 141109 | -| total_timesteps | 3321088 | -| train/ | | -| approx_kl | 0.01549596 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0665 | -| learning_rate | 0.0003 | -| loss | 0.00241 | -| n_updates | 259450 | -| policy_gradient_loss | 0.0101 | -| std | 0.00616 | -| value_loss | 1.66e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25947 | -| time_elapsed | 141119 | -| total_timesteps | 3321216 | -| train/ | | -| approx_kl | 0.048763573 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.994 | -| learning_rate | 0.0003 | -| loss | -0.000809 | -| n_updates | 259460 | -| policy_gradient_loss | -0.00293 | -| std | 0.00615 | -| value_loss | 7.15e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25948 | -| time_elapsed | 141124 | -| total_timesteps | 3321344 | -| train/ | | -| approx_kl | 0.045720596 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.481 | -| learning_rate | 0.0003 | -| loss | -0.00475 | -| n_updates | 259470 | -| policy_gradient_loss | 0.00107 | -| std | 0.00615 | -| value_loss | 1.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25949 | -| time_elapsed | 141127 | -| total_timesteps | 3321472 | -| train/ | | -| approx_kl | 0.061827138 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 259480 | -| policy_gradient_loss | 0.0104 | -| std | 0.00615 | -| value_loss | 2.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25950 | -| time_elapsed | 141131 | -| total_timesteps | 3321600 | -| train/ | | -| approx_kl | 0.055499718 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00112 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 259490 | -| policy_gradient_loss | 0.00839 | -| std | 0.00615 | -| value_loss | 1.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25951 | -| time_elapsed | 141136 | -| total_timesteps | 3321728 | -| train/ | | -| approx_kl | 0.04259275 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 259500 | -| policy_gradient_loss | 0.0112 | -| std | 0.00615 | -| value_loss | 8.79e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25952 | -| time_elapsed | 141141 | -| total_timesteps | 3321856 | -| train/ | | -| approx_kl | 0.050756082 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.00507 | -| n_updates | 259510 | -| policy_gradient_loss | 0.00248 | -| std | 0.00615 | -| value_loss | 6.77e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25953 | -| time_elapsed | 141146 | -| total_timesteps | 3321984 | -| train/ | | -| approx_kl | 0.058205757 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | 0.0301 | -| n_updates | 259520 | -| policy_gradient_loss | 0.0145 | -| std | 0.00615 | -| value_loss | 5.6e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25954 | -| time_elapsed | 141149 | -| total_timesteps | 3322112 | -| train/ | | -| approx_kl | 0.009104548 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | -0.0118 | -| n_updates | 259530 | -| policy_gradient_loss | 0.00547 | -| std | 0.00615 | -| value_loss | 4.57e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25955 | -| time_elapsed | 141161 | -| total_timesteps | 3322240 | -| train/ | | -| approx_kl | 0.31971058 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.426 | -| learning_rate | 0.0003 | -| loss | 0.17 | -| n_updates | 259540 | -| policy_gradient_loss | 0.0344 | -| std | 0.00615 | -| value_loss | 0.00821 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25956 | -| time_elapsed | 141167 | -| total_timesteps | 3322368 | -| train/ | | -| approx_kl | 2.3591332e-05 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.341 | -| learning_rate | 0.0003 | -| loss | -0.000292 | -| n_updates | 259550 | -| policy_gradient_loss | 0.0369 | -| std | 0.00615 | -| value_loss | 5e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25957 | -| time_elapsed | 141171 | -| total_timesteps | 3322496 | -| train/ | | -| approx_kl | 0.88695383 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0363 | -| learning_rate | 0.0003 | -| loss | 0.327 | -| n_updates | 259560 | -| policy_gradient_loss | 0.0995 | -| std | 0.00615 | -| value_loss | 8.57e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25958 | -| time_elapsed | 141175 | -| total_timesteps | 3322624 | -| train/ | | -| approx_kl | 0.012107016 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00347 | -| n_updates | 259570 | -| policy_gradient_loss | 0.0063 | -| std | 0.00614 | -| value_loss | 3.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25959 | -| time_elapsed | 141179 | -| total_timesteps | 3322752 | -| train/ | | -| approx_kl | 0.07820914 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0641 | -| learning_rate | 0.0003 | -| loss | 0.0245 | -| n_updates | 259580 | -| policy_gradient_loss | 0.0083 | -| std | 0.00614 | -| value_loss | 2.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.841 | -| time/ | | -| fps | 23 | -| iterations | 25960 | -| time_elapsed | 141184 | -| total_timesteps | 3322880 | -| train/ | | -| approx_kl | 0.011424389 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.00151 | -| n_updates | 259590 | -| policy_gradient_loss | 0.00731 | -| std | 0.00614 | -| value_loss | 1.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25961 | -| time_elapsed | 141189 | -| total_timesteps | 3323008 | -| train/ | | -| approx_kl | 0.08256019 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0703 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 259600 | -| policy_gradient_loss | 0.0125 | -| std | 0.00614 | -| value_loss | 1.41e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25962 | -| time_elapsed | 141200 | -| total_timesteps | 3323136 | -| train/ | | -| approx_kl | 0.058074944 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.655 | -| learning_rate | 0.0003 | -| loss | -0.0225 | -| n_updates | 259610 | -| policy_gradient_loss | -0.0151 | -| std | 0.00614 | -| value_loss | 0.00122 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25963 | -| time_elapsed | 141205 | -| total_timesteps | 3323264 | -| train/ | | -| approx_kl | 0.02375304 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.353 | -| learning_rate | 0.0003 | -| loss | 0.016 | -| n_updates | 259620 | -| policy_gradient_loss | 0.0139 | -| std | 0.00613 | -| value_loss | 9.95e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25964 | -| time_elapsed | 141209 | -| total_timesteps | 3323392 | -| train/ | | -| approx_kl | 0.0035763732 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | -0.000993 | -| n_updates | 259630 | -| policy_gradient_loss | 0.00917 | -| std | 0.00613 | -| value_loss | 1.32e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25965 | -| time_elapsed | 141214 | -| total_timesteps | 3323520 | -| train/ | | -| approx_kl | 0.082173556 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | 0.0154 | -| n_updates | 259640 | -| policy_gradient_loss | 0.00169 | -| std | 0.00613 | -| value_loss | 1.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25966 | -| time_elapsed | 141220 | -| total_timesteps | 3323648 | -| train/ | | -| approx_kl | 0.054761194 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | 0.00227 | -| n_updates | 259650 | -| policy_gradient_loss | 0.00394 | -| std | 0.00613 | -| value_loss | 1.37e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25967 | -| time_elapsed | 141224 | -| total_timesteps | 3323776 | -| train/ | | -| approx_kl | 0.06377717 | -| clip_fraction | 0.292 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 259660 | -| policy_gradient_loss | 0.00639 | -| std | 0.00613 | -| value_loss | 1.19e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.84 | -| time/ | | -| fps | 23 | -| iterations | 25968 | -| time_elapsed | 141228 | -| total_timesteps | 3323904 | -| train/ | | -| approx_kl | 0.047858607 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.0335 | -| n_updates | 259670 | -| policy_gradient_loss | 0.0164 | -| std | 0.00614 | -| value_loss | 6.02e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25969 | -| time_elapsed | 141232 | -| total_timesteps | 3324032 | -| train/ | | -| approx_kl | 0.008637249 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | -0.000571 | -| n_updates | 259680 | -| policy_gradient_loss | 0.00614 | -| std | 0.00614 | -| value_loss | 8.68e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25970 | -| time_elapsed | 141241 | -| total_timesteps | 3324160 | -| train/ | | -| approx_kl | 0.0063056042 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | -0.0057 | -| n_updates | 259690 | -| policy_gradient_loss | 0.00199 | -| std | 0.00614 | -| value_loss | 0.00484 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25971 | -| time_elapsed | 141246 | -| total_timesteps | 3324288 | -| train/ | | -| approx_kl | 0.016090853 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.00155 | -| n_updates | 259700 | -| policy_gradient_loss | 0.00625 | -| std | 0.00614 | -| value_loss | 4.98e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25972 | -| time_elapsed | 141251 | -| total_timesteps | 3324416 | -| train/ | | -| approx_kl | 0.050859556 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.00445 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 259710 | -| policy_gradient_loss | 0.00303 | -| std | 0.00614 | -| value_loss | 7.37e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25973 | -| time_elapsed | 141256 | -| total_timesteps | 3324544 | -| train/ | | -| approx_kl | 0.010213828 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0142 | -| learning_rate | 0.0003 | -| loss | 0.00373 | -| n_updates | 259720 | -| policy_gradient_loss | 0.00875 | -| std | 0.00614 | -| value_loss | 2.99e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25974 | -| time_elapsed | 141261 | -| total_timesteps | 3324672 | -| train/ | | -| approx_kl | 0.066013396 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | 0.0155 | -| n_updates | 259730 | -| policy_gradient_loss | 0.0044 | -| std | 0.00614 | -| value_loss | 1.55e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25975 | -| time_elapsed | 141267 | -| total_timesteps | 3324800 | -| train/ | | -| approx_kl | 0.034730352 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | 0.00971 | -| n_updates | 259740 | -| policy_gradient_loss | 0.00561 | -| std | 0.00614 | -| value_loss | 1.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.843 | -| time/ | | -| fps | 23 | -| iterations | 25976 | -| time_elapsed | 141273 | -| total_timesteps | 3324928 | -| train/ | | -| approx_kl | 0.062100284 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | 0.0248 | -| n_updates | 259750 | -| policy_gradient_loss | 0.0114 | -| std | 0.00614 | -| value_loss | 9.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25977 | -| time_elapsed | 141278 | -| total_timesteps | 3325056 | -| train/ | | -| approx_kl | 0.044127956 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.043 | -| learning_rate | 0.0003 | -| loss | 0.00378 | -| n_updates | 259760 | -| policy_gradient_loss | 0.00199 | -| std | 0.00614 | -| value_loss | 7.85e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25978 | -| time_elapsed | 141286 | -| total_timesteps | 3325184 | -| train/ | | -| approx_kl | 0.007265664 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.962 | -| learning_rate | 0.0003 | -| loss | -0.00775 | -| n_updates | 259770 | -| policy_gradient_loss | 0.00318 | -| std | 0.00614 | -| value_loss | 0.000507 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25979 | -| time_elapsed | 141291 | -| total_timesteps | 3325312 | -| train/ | | -| approx_kl | 0.36294004 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.189 | -| n_updates | 259780 | -| policy_gradient_loss | 0.0661 | -| std | 0.00614 | -| value_loss | 3.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25980 | -| time_elapsed | 141295 | -| total_timesteps | 3325440 | -| train/ | | -| approx_kl | 0.09410875 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0019 | -| learning_rate | 0.0003 | -| loss | 0.0676 | -| n_updates | 259790 | -| policy_gradient_loss | 0.028 | -| std | 0.00613 | -| value_loss | 1.17e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25981 | -| time_elapsed | 141301 | -| total_timesteps | 3325568 | -| train/ | | -| approx_kl | 0.013179742 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | 0.00234 | -| n_updates | 259800 | -| policy_gradient_loss | 0.0102 | -| std | 0.00613 | -| value_loss | 7.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25982 | -| time_elapsed | 141305 | -| total_timesteps | 3325696 | -| train/ | | -| approx_kl | 0.003656404 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0543 | -| learning_rate | 0.0003 | -| loss | -0.00188 | -| n_updates | 259810 | -| policy_gradient_loss | 0.0118 | -| std | 0.00613 | -| value_loss | 5.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25983 | -| time_elapsed | 141310 | -| total_timesteps | 3325824 | -| train/ | | -| approx_kl | 0.08560493 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0555 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 259820 | -| policy_gradient_loss | 0.0073 | -| std | 0.00613 | -| value_loss | 4.21e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.855 | -| time/ | | -| fps | 23 | -| iterations | 25984 | -| time_elapsed | 141316 | -| total_timesteps | 3325952 | -| train/ | | -| approx_kl | 0.011838273 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0587 | -| learning_rate | 0.0003 | -| loss | 0.00818 | -| n_updates | 259830 | -| policy_gradient_loss | 0.0108 | -| std | 0.00613 | -| value_loss | 2.56e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25985 | -| time_elapsed | 141322 | -| total_timesteps | 3326080 | -| train/ | | -| approx_kl | 0.0031161397 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0682 | -| learning_rate | 0.0003 | -| loss | -0.00743 | -| n_updates | 259840 | -| policy_gradient_loss | 0.00783 | -| std | 0.00613 | -| value_loss | 2.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25986 | -| time_elapsed | 141332 | -| total_timesteps | 3326208 | -| train/ | | -| approx_kl | 0.020864677 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.751 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 259850 | -| policy_gradient_loss | -0.00762 | -| std | 0.00613 | -| value_loss | 0.00445 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25987 | -| time_elapsed | 141338 | -| total_timesteps | 3326336 | -| train/ | | -| approx_kl | 0.04561757 | -| clip_fraction | 0.631 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.401 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 259860 | -| policy_gradient_loss | 0.128 | -| std | 0.00613 | -| value_loss | 7.3e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25988 | -| time_elapsed | 141342 | -| total_timesteps | 3326464 | -| train/ | | -| approx_kl | 0.013596185 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | -0.00351 | -| n_updates | 259870 | -| policy_gradient_loss | 0.0323 | -| std | 0.00613 | -| value_loss | 1.64e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25989 | -| time_elapsed | 141348 | -| total_timesteps | 3326592 | -| train/ | | -| approx_kl | 0.21340328 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00564 | -| learning_rate | 0.0003 | -| loss | 0.0873 | -| n_updates | 259880 | -| policy_gradient_loss | 0.0233 | -| std | 0.00613 | -| value_loss | 8.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25990 | -| time_elapsed | 141353 | -| total_timesteps | 3326720 | -| train/ | | -| approx_kl | 0.021824155 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | -0.00631 | -| n_updates | 259890 | -| policy_gradient_loss | 0.0264 | -| std | 0.00613 | -| value_loss | 6.95e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25991 | -| time_elapsed | 141357 | -| total_timesteps | 3326848 | -| train/ | | -| approx_kl | 0.2433882 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0242 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 259900 | -| policy_gradient_loss | 0.114 | -| std | 0.00613 | -| value_loss | 3.84e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 25992 | -| time_elapsed | 141362 | -| total_timesteps | 3326976 | -| train/ | | -| approx_kl | 0.19863346 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0522 | -| learning_rate | 0.0003 | -| loss | 0.15 | -| n_updates | 259910 | -| policy_gradient_loss | 0.122 | -| std | 0.00614 | -| value_loss | 3.59e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25993 | -| time_elapsed | 141367 | -| total_timesteps | 3327104 | -| train/ | | -| approx_kl | 0.16327816 | -| clip_fraction | 0.694 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0358 | -| learning_rate | 0.0003 | -| loss | 0.091 | -| n_updates | 259920 | -| policy_gradient_loss | 0.118 | -| std | 0.00614 | -| value_loss | 1.95e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25994 | -| time_elapsed | 141376 | -| total_timesteps | 3327232 | -| train/ | | -| approx_kl | 0.009151092 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.832 | -| learning_rate | 0.0003 | -| loss | 0.0089 | -| n_updates | 259930 | -| policy_gradient_loss | 0.0166 | -| std | 0.00614 | -| value_loss | 0.00415 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25995 | -| time_elapsed | 141381 | -| total_timesteps | 3327360 | -| train/ | | -| approx_kl | 0.18241368 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.00775 | -| learning_rate | 0.0003 | -| loss | 0.105 | -| n_updates | 259940 | -| policy_gradient_loss | 0.0277 | -| std | 0.00613 | -| value_loss | 1.25e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25996 | -| time_elapsed | 141386 | -| total_timesteps | 3327488 | -| train/ | | -| approx_kl | 0.015109178 | -| clip_fraction | 0.112 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00391 | -| learning_rate | 0.0003 | -| loss | 0.00876 | -| n_updates | 259950 | -| policy_gradient_loss | 0.0036 | -| std | 0.00613 | -| value_loss | 2.63e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25997 | -| time_elapsed | 141391 | -| total_timesteps | 3327616 | -| train/ | | -| approx_kl | 0.03331632 | -| clip_fraction | 0.465 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.00362 | -| n_updates | 259960 | -| policy_gradient_loss | 0.0309 | -| std | 0.00613 | -| value_loss | 2.1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25998 | -| time_elapsed | 141396 | -| total_timesteps | 3327744 | -| train/ | | -| approx_kl | 0.11068165 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0428 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 259970 | -| policy_gradient_loss | 0.0186 | -| std | 0.00613 | -| value_loss | 1.78e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.86 | -| time/ | | -| fps | 23 | -| iterations | 25999 | -| time_elapsed | 141401 | -| total_timesteps | 3327872 | -| train/ | | -| approx_kl | 0.15037003 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0384 | -| learning_rate | 0.0003 | -| loss | 0.0744 | -| n_updates | 259980 | -| policy_gradient_loss | 0.0237 | -| std | 0.00613 | -| value_loss | 1.3e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26000 | -| time_elapsed | 141406 | -| total_timesteps | 3328000 | -| train/ | | -| approx_kl | 0.033312988 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 259990 | -| policy_gradient_loss | 0.0287 | -| std | 0.00613 | -| value_loss | 7.98e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26001 | -| time_elapsed | 141411 | -| total_timesteps | 3328128 | -| train/ | | -| approx_kl | 0.26726732 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0062 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 260000 | -| policy_gradient_loss | 0.113 | -| std | 0.00613 | -| value_loss | 4.14e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26002 | -| time_elapsed | 141422 | -| total_timesteps | 3328256 | -| train/ | | -| approx_kl | 0.019720338 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 260010 | -| policy_gradient_loss | 0.00879 | -| std | 0.00613 | -| value_loss | 0.000513 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26003 | -| time_elapsed | 141427 | -| total_timesteps | 3328384 | -| train/ | | -| approx_kl | 0.14138313 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | 0.0869 | -| n_updates | 260020 | -| policy_gradient_loss | 0.0553 | -| std | 0.00613 | -| value_loss | 3.67e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26004 | -| time_elapsed | 141432 | -| total_timesteps | 3328512 | -| train/ | | -| approx_kl | 0.042193927 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.00759 | -| n_updates | 260030 | -| policy_gradient_loss | 0.0316 | -| std | 0.00613 | -| value_loss | 1.11e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26005 | -| time_elapsed | 141437 | -| total_timesteps | 3328640 | -| train/ | | -| approx_kl | 0.86327463 | -| clip_fraction | 0.747 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 260040 | -| policy_gradient_loss | 0.18 | -| std | 0.00613 | -| value_loss | 5.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26006 | -| time_elapsed | 141446 | -| total_timesteps | 3328768 | -| train/ | | -| approx_kl | 0.008338271 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 260050 | -| policy_gradient_loss | 0.0263 | -| std | 0.00613 | -| value_loss | 5.55e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.865 | -| time/ | | -| fps | 23 | -| iterations | 26007 | -| time_elapsed | 141452 | -| total_timesteps | 3328896 | -| train/ | | -| approx_kl | 0.29881242 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | 0.191 | -| n_updates | 260060 | -| policy_gradient_loss | 0.15 | -| std | 0.00613 | -| value_loss | 4.43e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26008 | -| time_elapsed | 141456 | -| total_timesteps | 3329024 | -| train/ | | -| approx_kl | 0.2394953 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 260070 | -| policy_gradient_loss | 0.166 | -| std | 0.00613 | -| value_loss | 3e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26009 | -| time_elapsed | 141470 | -| total_timesteps | 3329152 | -| train/ | | -| approx_kl | 0.09940192 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.0762 | -| n_updates | 260080 | -| policy_gradient_loss | 0.0904 | -| std | 0.00613 | -| value_loss | 0.000553 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26010 | -| time_elapsed | 141475 | -| total_timesteps | 3329280 | -| train/ | | -| approx_kl | 0.2070486 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0258 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 260090 | -| policy_gradient_loss | 0.195 | -| std | 0.00613 | -| value_loss | 1.08e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26011 | -| time_elapsed | 141481 | -| total_timesteps | 3329408 | -| train/ | | -| approx_kl | 0.030020477 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 260100 | -| policy_gradient_loss | 0.0271 | -| std | 0.00614 | -| value_loss | 7.36e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26012 | -| time_elapsed | 141487 | -| total_timesteps | 3329536 | -| train/ | | -| approx_kl | 0.00061767595 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.67 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | 0.00675 | -| n_updates | 260110 | -| policy_gradient_loss | 0.0319 | -| std | 0.00614 | -| value_loss | 4.52e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26013 | -| time_elapsed | 141492 | -| total_timesteps | 3329664 | -| train/ | | -| approx_kl | 0.069750324 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 260120 | -| policy_gradient_loss | 0.00833 | -| std | 0.00611 | -| value_loss | 3.29e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26014 | -| time_elapsed | 141496 | -| total_timesteps | 3329792 | -| train/ | | -| approx_kl | 0.02409807 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -2.05 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 260130 | -| policy_gradient_loss | 0.00955 | -| std | 0.0061 | -| value_loss | 2.53e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.857 | -| time/ | | -| fps | 23 | -| iterations | 26015 | -| time_elapsed | 141501 | -| total_timesteps | 3329920 | -| train/ | | -| approx_kl | 0.071643256 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0162 | -| learning_rate | 0.0003 | -| loss | 0.0378 | -| n_updates | 260140 | -| policy_gradient_loss | 0.0146 | -| std | 0.00609 | -| value_loss | 9.57e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26016 | -| time_elapsed | 141505 | -| total_timesteps | 3330048 | -| train/ | | -| approx_kl | 0.05087606 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0045 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 260150 | -| policy_gradient_loss | 0.0185 | -| std | 0.00609 | -| value_loss | 4.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26017 | -| time_elapsed | 141514 | -| total_timesteps | 3330176 | -| train/ | | -| approx_kl | 0.016130928 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 260160 | -| policy_gradient_loss | -0.0131 | -| std | 0.00609 | -| value_loss | 0.00275 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26018 | -| time_elapsed | 141520 | -| total_timesteps | 3330304 | -| train/ | | -| approx_kl | 0.030799605 | -| clip_fraction | 0.163 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.99 | -| learning_rate | 0.0003 | -| loss | 0.00146 | -| n_updates | 260170 | -| policy_gradient_loss | -0.00351 | -| std | 0.00608 | -| value_loss | 9.86e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26019 | -| time_elapsed | 141525 | -| total_timesteps | 3330432 | -| train/ | | -| approx_kl | 0.020454682 | -| clip_fraction | 0.447 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.000411 | -| n_updates | 260180 | -| policy_gradient_loss | 0.0304 | -| std | 0.00608 | -| value_loss | 5.91e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26020 | -| time_elapsed | 141531 | -| total_timesteps | 3330560 | -| train/ | | -| approx_kl | 0.34488064 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | 0.156 | -| n_updates | 260190 | -| policy_gradient_loss | 0.143 | -| std | 0.00608 | -| value_loss | 4.66e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26021 | -| time_elapsed | 141535 | -| total_timesteps | 3330688 | -| train/ | | -| approx_kl | 0.2386322 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.151 | -| n_updates | 260200 | -| policy_gradient_loss | 0.158 | -| std | 0.00608 | -| value_loss | 8.2e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26022 | -| time_elapsed | 141539 | -| total_timesteps | 3330816 | -| train/ | | -| approx_kl | 0.20658956 | -| clip_fraction | 0.751 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.52 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 260210 | -| policy_gradient_loss | 0.124 | -| std | 0.00608 | -| value_loss | 1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.863 | -| time/ | | -| fps | 23 | -| iterations | 26023 | -| time_elapsed | 141544 | -| total_timesteps | 3330944 | -| train/ | | -| approx_kl | 0.16177411 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.16 | -| learning_rate | 0.0003 | -| loss | 0.139 | -| n_updates | 260220 | -| policy_gradient_loss | 0.116 | -| std | 0.00608 | -| value_loss | 5.85e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26024 | -| time_elapsed | 141549 | -| total_timesteps | 3331072 | -| train/ | | -| approx_kl | 0.1726503 | -| clip_fraction | 0.721 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 260230 | -| policy_gradient_loss | 0.175 | -| std | 0.00608 | -| value_loss | 5.03e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26025 | -| time_elapsed | 141559 | -| total_timesteps | 3331200 | -| train/ | | -| approx_kl | 0.29308948 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -3.91 | -| learning_rate | 0.0003 | -| loss | 0.0427 | -| n_updates | 260240 | -| policy_gradient_loss | 0.0509 | -| std | 0.00608 | -| value_loss | 0.00437 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26026 | -| time_elapsed | 141565 | -| total_timesteps | 3331328 | -| train/ | | -| approx_kl | 0.13004196 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -40.5 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 260250 | -| policy_gradient_loss | 0.0115 | -| std | 0.00609 | -| value_loss | 2.07e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26027 | -| time_elapsed | 141570 | -| total_timesteps | 3331456 | -| train/ | | -| approx_kl | 0.0087869745 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | 0.0237 | -| n_updates | 260260 | -| policy_gradient_loss | 0.00747 | -| std | 0.00609 | -| value_loss | 6.24e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26028 | -| time_elapsed | 141574 | -| total_timesteps | 3331584 | -| train/ | | -| approx_kl | 0.07103402 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.274 | -| learning_rate | 0.0003 | -| loss | 0.0444 | -| n_updates | 260270 | -| policy_gradient_loss | 0.0331 | -| std | 0.00609 | -| value_loss | 3.79e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26029 | -| time_elapsed | 141578 | -| total_timesteps | 3331712 | -| train/ | | -| approx_kl | 0.006164173 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.00334 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 260280 | -| policy_gradient_loss | 0.0377 | -| std | 0.00609 | -| value_loss | 3.38e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26030 | -| time_elapsed | 141583 | -| total_timesteps | 3331840 | -| train/ | | -| approx_kl | 0.011331489 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.476 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 260290 | -| policy_gradient_loss | -0.000268 | -| std | 0.00608 | -| value_loss | 1.71e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.871 | -| time/ | | -| fps | 23 | -| iterations | 26031 | -| time_elapsed | 141588 | -| total_timesteps | 3331968 | -| train/ | | -| approx_kl | 0.0013438459 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.677 | -| learning_rate | 0.0003 | -| loss | -0.00693 | -| n_updates | 260300 | -| policy_gradient_loss | 0.0104 | -| std | 0.00608 | -| value_loss | 1.28e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26032 | -| time_elapsed | 141592 | -| total_timesteps | 3332096 | -| train/ | | -| approx_kl | 9.9172816e-05 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.102 | -| learning_rate | 0.0003 | -| loss | 0.000301 | -| n_updates | 260310 | -| policy_gradient_loss | 0.0164 | -| std | 0.00607 | -| value_loss | 7.22e-09 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26033 | -| time_elapsed | 141603 | -| total_timesteps | 3332224 | -| train/ | | -| approx_kl | 0.029070213 | -| clip_fraction | 0.205 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -1.61 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 260320 | -| policy_gradient_loss | -0.00301 | -| std | 0.00607 | -| value_loss | 0.00342 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26034 | -| time_elapsed | 141607 | -| total_timesteps | 3332352 | -| train/ | | -| approx_kl | 0.061873063 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.601 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 260330 | -| policy_gradient_loss | 0.012 | -| std | 0.00607 | -| value_loss | 6.7e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26035 | -| time_elapsed | 141611 | -| total_timesteps | 3332480 | -| train/ | | -| approx_kl | 0.0395997 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.00484 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 260340 | -| policy_gradient_loss | -0.00491 | -| std | 0.00607 | -| value_loss | 5.05e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26036 | -| time_elapsed | 141615 | -| total_timesteps | 3332608 | -| train/ | | -| approx_kl | 0.008601495 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0664 | -| learning_rate | 0.0003 | -| loss | -0.0101 | -| n_updates | 260350 | -| policy_gradient_loss | 0.004 | -| std | 0.00607 | -| value_loss | 4.54e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26037 | -| time_elapsed | 141619 | -| total_timesteps | 3332736 | -| train/ | | -| approx_kl | 0.0034697265 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0576 | -| learning_rate | 0.0003 | -| loss | -0.00943 | -| n_updates | 260360 | -| policy_gradient_loss | 0.0104 | -| std | 0.00608 | -| value_loss | 2.14e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26038 | -| time_elapsed | 141624 | -| total_timesteps | 3332864 | -| train/ | | -| approx_kl | 2.3106113e-06 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0908 | -| learning_rate | 0.0003 | -| loss | 0.000188 | -| n_updates | 260370 | -| policy_gradient_loss | 0.0516 | -| std | 0.00608 | -| value_loss | 2.08e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.866 | -| time/ | | -| fps | 23 | -| iterations | 26039 | -| time_elapsed | 141628 | -| total_timesteps | 3332992 | -| train/ | | -| approx_kl | 1.1385146 | -| clip_fraction | 0.768 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.235 | -| n_updates | 260380 | -| policy_gradient_loss | 0.13 | -| std | 0.00608 | -| value_loss | 1.17e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26040 | -| time_elapsed | 141634 | -| total_timesteps | 3333120 | -| train/ | | -| approx_kl | 0.02997074 | -| clip_fraction | 0.166 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0807 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 260390 | -| policy_gradient_loss | 0.00473 | -| std | 0.00608 | -| value_loss | 7.59e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26041 | -| time_elapsed | 141644 | -| total_timesteps | 3333248 | -| train/ | | -| approx_kl | 0.050960783 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.76 | -| learning_rate | 0.0003 | -| loss | 0.0179 | -| n_updates | 260400 | -| policy_gradient_loss | 0.0243 | -| std | 0.00608 | -| value_loss | 0.00644 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26042 | -| time_elapsed | 141648 | -| total_timesteps | 3333376 | -| train/ | | -| approx_kl | 0.778015 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.511 | -| learning_rate | 0.0003 | -| loss | 0.23 | -| n_updates | 260410 | -| policy_gradient_loss | 0.0714 | -| std | 0.00607 | -| value_loss | 0.000245 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26043 | -| time_elapsed | 141652 | -| total_timesteps | 3333504 | -| train/ | | -| approx_kl | 0.06534706 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | 0.0121 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 260420 | -| policy_gradient_loss | 0.0107 | -| std | 0.00607 | -| value_loss | 6.11e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26044 | -| time_elapsed | 141657 | -| total_timesteps | 3333632 | -| train/ | | -| approx_kl | 0.011122362 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0135 | -| learning_rate | 0.0003 | -| loss | -0.00882 | -| n_updates | 260430 | -| policy_gradient_loss | 0.00913 | -| std | 0.00608 | -| value_loss | 3.95e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26045 | -| time_elapsed | 141661 | -| total_timesteps | 3333760 | -| train/ | | -| approx_kl | 0.0010375502 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.00601 | -| n_updates | 260440 | -| policy_gradient_loss | 0.00267 | -| std | 0.00608 | -| value_loss | 2.87e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.867 | -| time/ | | -| fps | 23 | -| iterations | 26046 | -| time_elapsed | 141664 | -| total_timesteps | 3333888 | -| train/ | | -| approx_kl | 0.06896726 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.68 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | 0.0394 | -| n_updates | 260450 | -| policy_gradient_loss | 0.0177 | -| std | 0.00607 | -| value_loss | 1.46e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26047 | -| time_elapsed | 141668 | -| total_timesteps | 3334016 | -| train/ | | -| approx_kl | 0.059185185 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.0161 | -| n_updates | 260460 | -| policy_gradient_loss | 0.00814 | -| std | 0.00607 | -| value_loss | 1.79e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26048 | -| time_elapsed | 141677 | -| total_timesteps | 3334144 | -| train/ | | -| approx_kl | 0.031462047 | -| clip_fraction | 0.228 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 260470 | -| policy_gradient_loss | -0.00763 | -| std | 0.00607 | -| value_loss | 0.000334 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26049 | -| time_elapsed | 141681 | -| total_timesteps | 3334272 | -| train/ | | -| approx_kl | 0.085618354 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 260480 | -| policy_gradient_loss | 0.0206 | -| std | 0.00607 | -| value_loss | 0.015 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26050 | -| time_elapsed | 141686 | -| total_timesteps | 3334400 | -| train/ | | -| approx_kl | 0.04789704 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0697 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 260490 | -| policy_gradient_loss | 0.0104 | -| std | 0.00607 | -| value_loss | 0.000406 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26051 | -| time_elapsed | 141690 | -| total_timesteps | 3334528 | -| train/ | | -| approx_kl | 0.053617172 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0148 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 260500 | -| policy_gradient_loss | -0.00705 | -| std | 0.00607 | -| value_loss | 9.03e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26052 | -| time_elapsed | 141695 | -| total_timesteps | 3334656 | -| train/ | | -| approx_kl | 0.045760073 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0181 | -| learning_rate | 0.0003 | -| loss | -0.00437 | -| n_updates | 260510 | -| policy_gradient_loss | -0.00205 | -| std | 0.00607 | -| value_loss | 6.24e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26053 | -| time_elapsed | 141699 | -| total_timesteps | 3334784 | -| train/ | | -| approx_kl | 0.011480963 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.00267 | -| n_updates | 260520 | -| policy_gradient_loss | 0.0103 | -| std | 0.00607 | -| value_loss | 2.72e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.88 | -| time/ | | -| fps | 23 | -| iterations | 26054 | -| time_elapsed | 141704 | -| total_timesteps | 3334912 | -| train/ | | -| approx_kl | 0.0023679966 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0997 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 260530 | -| policy_gradient_loss | 0.00896 | -| std | 0.00607 | -| value_loss | 2.21e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26055 | -| time_elapsed | 141709 | -| total_timesteps | 3335040 | -| train/ | | -| approx_kl | 0.05252779 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0618 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 260540 | -| policy_gradient_loss | 0.146 | -| std | 0.00607 | -| value_loss | 1.22e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26056 | -| time_elapsed | 141719 | -| total_timesteps | 3335168 | -| train/ | | -| approx_kl | 0.09934059 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.141 | -| learning_rate | 0.0003 | -| loss | 0.000131 | -| n_updates | 260550 | -| policy_gradient_loss | 0.0214 | -| std | 0.00607 | -| value_loss | 0.00237 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26057 | -| time_elapsed | 141726 | -| total_timesteps | 3335296 | -| train/ | | -| approx_kl | 0.17433995 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.118 | -| learning_rate | 0.0003 | -| loss | 0.0733 | -| n_updates | 260560 | -| policy_gradient_loss | 0.0527 | -| std | 0.00607 | -| value_loss | 1.12e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26058 | -| time_elapsed | 141731 | -| total_timesteps | 3335424 | -| train/ | | -| approx_kl | 0.027505234 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0834 | -| learning_rate | 0.0003 | -| loss | 0.00716 | -| n_updates | 260570 | -| policy_gradient_loss | 0.00929 | -| std | 0.00607 | -| value_loss | 3.95e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26059 | -| time_elapsed | 141737 | -| total_timesteps | 3335552 | -| train/ | | -| approx_kl | 0.02977337 | -| clip_fraction | 0.637 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0863 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 260580 | -| policy_gradient_loss | 0.0827 | -| std | 0.00606 | -| value_loss | 2.12e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26060 | -| time_elapsed | 141741 | -| total_timesteps | 3335680 | -| train/ | | -| approx_kl | 0.018214487 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | 0.00471 | -| n_updates | 260590 | -| policy_gradient_loss | 0.0328 | -| std | 0.00607 | -| value_loss | 1.34e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26061 | -| time_elapsed | 141745 | -| total_timesteps | 3335808 | -| train/ | | -| approx_kl | 0.17278203 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | 0.0744 | -| n_updates | 260600 | -| policy_gradient_loss | 0.0317 | -| std | 0.00607 | -| value_loss | 3.34e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.886 | -| time/ | | -| fps | 23 | -| iterations | 26062 | -| time_elapsed | 141749 | -| total_timesteps | 3335936 | -| train/ | | -| approx_kl | 0.054295417 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 260610 | -| policy_gradient_loss | 0.0571 | -| std | 0.00607 | -| value_loss | 8.21e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26063 | -| time_elapsed | 141754 | -| total_timesteps | 3336064 | -| train/ | | -| approx_kl | 0.0021409052 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0952 | -| learning_rate | 0.0003 | -| loss | -0.000678 | -| n_updates | 260620 | -| policy_gradient_loss | 0.0685 | -| std | 0.00607 | -| value_loss | 5.3e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26064 | -| time_elapsed | 141766 | -| total_timesteps | 3336192 | -| train/ | | -| approx_kl | 1.0951651 | -| clip_fraction | 0.773 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.664 | -| learning_rate | 0.0003 | -| loss | 0.422 | -| n_updates | 260630 | -| policy_gradient_loss | 0.309 | -| std | 0.00607 | -| value_loss | 0.0132 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26065 | -| time_elapsed | 141771 | -| total_timesteps | 3336320 | -| train/ | | -| approx_kl | 0.024313437 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.389 | -| learning_rate | 0.0003 | -| loss | -0.00478 | -| n_updates | 260640 | -| policy_gradient_loss | 0.0987 | -| std | 0.00607 | -| value_loss | 0.000326 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26066 | -| time_elapsed | 141776 | -| total_timesteps | 3336448 | -| train/ | | -| approx_kl | 0.30988288 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.000293 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 260650 | -| policy_gradient_loss | 0.0461 | -| std | 0.00607 | -| value_loss | 8.94e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26067 | -| time_elapsed | 141782 | -| total_timesteps | 3336576 | -| train/ | | -| approx_kl | 0.0731999 | -| clip_fraction | 0.601 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00105 | -| learning_rate | 0.0003 | -| loss | 0.0478 | -| n_updates | 260660 | -| policy_gradient_loss | 0.0799 | -| std | 0.00607 | -| value_loss | 4.15e-05 | ---------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26068 | -| time_elapsed | 141788 | -| total_timesteps | 3336704 | -| train/ | | -| approx_kl | 3.6674086e-05 | -| clip_fraction | 0.531 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | 0.000921 | -| n_updates | 260670 | -| policy_gradient_loss | 0.0882 | -| std | 0.00607 | -| value_loss | 3.48e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26069 | -| time_elapsed | 141792 | -| total_timesteps | 3336832 | -| train/ | | -| approx_kl | 0.046607815 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0419 | -| learning_rate | 0.0003 | -| loss | 0.0393 | -| n_updates | 260680 | -| policy_gradient_loss | 0.048 | -| std | 0.00604 | -| value_loss | 0.00453 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.876 | -| time/ | | -| fps | 23 | -| iterations | 26070 | -| time_elapsed | 141796 | -| total_timesteps | 3336960 | -| train/ | | -| approx_kl | 0.36299777 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | 0.25 | -| n_updates | 260690 | -| policy_gradient_loss | 0.132 | -| std | 0.00603 | -| value_loss | 0.000367 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26071 | -| time_elapsed | 141800 | -| total_timesteps | 3337088 | -| train/ | | -| approx_kl | 0.24522565 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0155 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 260700 | -| policy_gradient_loss | 0.118 | -| std | 0.00603 | -| value_loss | 0.000131 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26072 | -| time_elapsed | 141809 | -| total_timesteps | 3337216 | -| train/ | | -| approx_kl | 0.06942011 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.883 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 260710 | -| policy_gradient_loss | 0.0361 | -| std | 0.00603 | -| value_loss | 0.00315 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26073 | -| time_elapsed | 141814 | -| total_timesteps | 3337344 | -| train/ | | -| approx_kl | 0.34314987 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -42.4 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 260720 | -| policy_gradient_loss | 0.0597 | -| std | 0.00603 | -| value_loss | 0.000113 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26074 | -| time_elapsed | 141819 | -| total_timesteps | 3337472 | -| train/ | | -| approx_kl | 0.1779832 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.47 | -| learning_rate | 0.0003 | -| loss | 0.0951 | -| n_updates | 260730 | -| policy_gradient_loss | 0.104 | -| std | 0.00603 | -| value_loss | 4.43e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26075 | -| time_elapsed | 141823 | -| total_timesteps | 3337600 | -| train/ | | -| approx_kl | 0.048706897 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00927 | -| learning_rate | 0.0003 | -| loss | 0.00869 | -| n_updates | 260740 | -| policy_gradient_loss | 0.0341 | -| std | 0.00603 | -| value_loss | 2.25e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26076 | -| time_elapsed | 141828 | -| total_timesteps | 3337728 | -| train/ | | -| approx_kl | 0.024985928 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.0172 | -| n_updates | 260750 | -| policy_gradient_loss | 0.0279 | -| std | 0.006 | -| value_loss | 0.000138 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26077 | -| time_elapsed | 141833 | -| total_timesteps | 3337856 | -| train/ | | -| approx_kl | 0.00019046292 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.71 | -| learning_rate | 0.0003 | -| loss | 0.000316 | -| n_updates | 260760 | -| policy_gradient_loss | 0.0168 | -| std | 0.00599 | -| value_loss | 3.79e-06 | -------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.891 | -| time/ | | -| fps | 23 | -| iterations | 26078 | -| time_elapsed | 141837 | -| total_timesteps | 3337984 | -| train/ | | -| approx_kl | 0.610812 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00608 | -| learning_rate | 0.0003 | -| loss | 0.236 | -| n_updates | 260770 | -| policy_gradient_loss | 0.0776 | -| std | 0.00599 | -| value_loss | 5.59e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26079 | -| time_elapsed | 141841 | -| total_timesteps | 3338112 | -| train/ | | -| approx_kl | 0.056846827 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.144 | -| learning_rate | 0.0003 | -| loss | 0.0298 | -| n_updates | 260780 | -| policy_gradient_loss | 0.0137 | -| std | 0.00599 | -| value_loss | 4.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26080 | -| time_elapsed | 141850 | -| total_timesteps | 3338240 | -| train/ | | -| approx_kl | 0.06588542 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.885 | -| learning_rate | 0.0003 | -| loss | -0.00741 | -| n_updates | 260790 | -| policy_gradient_loss | -0.00669 | -| std | 0.00599 | -| value_loss | 0.00245 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26081 | -| time_elapsed | 141853 | -| total_timesteps | 3338368 | -| train/ | | -| approx_kl | 0.012735202 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -8.24 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 260800 | -| policy_gradient_loss | 0.00319 | -| std | 0.00599 | -| value_loss | 9.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26082 | -| time_elapsed | 141858 | -| total_timesteps | 3338496 | -| train/ | | -| approx_kl | 0.003207196 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.177 | -| learning_rate | 0.0003 | -| loss | -0.00217 | -| n_updates | 260810 | -| policy_gradient_loss | 0.0103 | -| std | 0.00599 | -| value_loss | 6.25e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26083 | -| time_elapsed | 141863 | -| total_timesteps | 3338624 | -| train/ | | -| approx_kl | 1.2053177e-05 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0241 | -| learning_rate | 0.0003 | -| loss | 0.000195 | -| n_updates | 260820 | -| policy_gradient_loss | 0.0385 | -| std | 0.00599 | -| value_loss | 2.86e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26084 | -| time_elapsed | 141868 | -| total_timesteps | 3338752 | -| train/ | | -| approx_kl | 0.89489096 | -| clip_fraction | 0.776 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | 0.211 | -| n_updates | 260830 | -| policy_gradient_loss | 0.188 | -| std | 0.00599 | -| value_loss | 1.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.901 | -| time/ | | -| fps | 23 | -| iterations | 26085 | -| time_elapsed | 141872 | -| total_timesteps | 3338880 | -| train/ | | -| approx_kl | 0.012501159 | -| clip_fraction | 0.428 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 260840 | -| policy_gradient_loss | 0.0206 | -| std | 0.00599 | -| value_loss | 2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26086 | -| time_elapsed | 141876 | -| total_timesteps | 3339008 | -| train/ | | -| approx_kl | 0.12425294 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.04 | -| n_updates | 260850 | -| policy_gradient_loss | 0.0258 | -| std | 0.00599 | -| value_loss | 1.64e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26087 | -| time_elapsed | 141886 | -| total_timesteps | 3339136 | -| train/ | | -| approx_kl | 0.0099888295 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.868 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 260860 | -| policy_gradient_loss | 0.0109 | -| std | 0.00599 | -| value_loss | 0.00299 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26088 | -| time_elapsed | 141891 | -| total_timesteps | 3339264 | -| train/ | | -| approx_kl | 0.12696508 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.261 | -| learning_rate | 0.0003 | -| loss | 0.0546 | -| n_updates | 260870 | -| policy_gradient_loss | 0.0179 | -| std | 0.00599 | -| value_loss | 0.000374 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26089 | -| time_elapsed | 141894 | -| total_timesteps | 3339392 | -| train/ | | -| approx_kl | 1.2457371e-05 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.195 | -| learning_rate | 0.0003 | -| loss | 0.000888 | -| n_updates | 260880 | -| policy_gradient_loss | 0.0165 | -| std | 0.00599 | -| value_loss | 1.04e-05 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26090 | -| time_elapsed | 141898 | -| total_timesteps | 3339520 | -| train/ | | -| approx_kl | 0.0003844113 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00579 | -| learning_rate | 0.0003 | -| loss | -0.0067 | -| n_updates | 260890 | -| policy_gradient_loss | 0.00961 | -| std | 0.00599 | -| value_loss | 3e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26091 | -| time_elapsed | 141903 | -| total_timesteps | 3339648 | -| train/ | | -| approx_kl | 0.016748725 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.00757 | -| n_updates | 260900 | -| policy_gradient_loss | 0.0198 | -| std | 0.00599 | -| value_loss | 1.85e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26092 | -| time_elapsed | 141908 | -| total_timesteps | 3339776 | -| train/ | | -| approx_kl | 0.022789009 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 260910 | -| policy_gradient_loss | 0.0363 | -| std | 0.00599 | -| value_loss | 1.29e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26093 | -| time_elapsed | 141912 | -| total_timesteps | 3339904 | -| train/ | | -| approx_kl | 0.113789655 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.263 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 260920 | -| policy_gradient_loss | 0.0292 | -| std | 0.00599 | -| value_loss | 4.14e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26094 | -| time_elapsed | 141917 | -| total_timesteps | 3340032 | -| train/ | | -| approx_kl | 0.14377634 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.131 | -| learning_rate | 0.0003 | -| loss | 0.0611 | -| n_updates | 260930 | -| policy_gradient_loss | 0.0213 | -| std | 0.00599 | -| value_loss | 3.02e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26095 | -| time_elapsed | 141927 | -| total_timesteps | 3340160 | -| train/ | | -| approx_kl | 0.004518285 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.944 | -| learning_rate | 0.0003 | -| loss | -0.000486 | -| n_updates | 260940 | -| policy_gradient_loss | 0.0168 | -| std | 0.00599 | -| value_loss | 0.000898 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26096 | -| time_elapsed | 141932 | -| total_timesteps | 3340288 | -| train/ | | -| approx_kl | 0.3384032 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 260950 | -| policy_gradient_loss | 0.146 | -| std | 0.00599 | -| value_loss | 2.85e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26097 | -| time_elapsed | 141936 | -| total_timesteps | 3340416 | -| train/ | | -| approx_kl | 0.056870416 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0153 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 260960 | -| policy_gradient_loss | 0.025 | -| std | 0.00599 | -| value_loss | 6.33e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26098 | -| time_elapsed | 141941 | -| total_timesteps | 3340544 | -| train/ | | -| approx_kl | 0.14084259 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.256 | -| learning_rate | 0.0003 | -| loss | 0.0497 | -| n_updates | 260970 | -| policy_gradient_loss | 0.0182 | -| std | 0.00599 | -| value_loss | 2.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26099 | -| time_elapsed | 141946 | -| total_timesteps | 3340672 | -| train/ | | -| approx_kl | 0.016023284 | -| clip_fraction | 0.102 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0994 | -| learning_rate | 0.0003 | -| loss | -0.00356 | -| n_updates | 260980 | -| policy_gradient_loss | -0.00211 | -| std | 0.00599 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26100 | -| time_elapsed | 141950 | -| total_timesteps | 3340800 | -| train/ | | -| approx_kl | 0.031866048 | -| clip_fraction | 0.455 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0706 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 260990 | -| policy_gradient_loss | 0.0386 | -| std | 0.00599 | -| value_loss | 1.15e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.908 | -| time/ | | -| fps | 23 | -| iterations | 26101 | -| time_elapsed | 141955 | -| total_timesteps | 3340928 | -| train/ | | -| approx_kl | 0.31343096 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0531 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 261000 | -| policy_gradient_loss | 0.142 | -| std | 0.006 | -| value_loss | 6.63e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26102 | -| time_elapsed | 141958 | -| total_timesteps | 3341056 | -| train/ | | -| approx_kl | 0.20620939 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0842 | -| learning_rate | 0.0003 | -| loss | 0.136 | -| n_updates | 261010 | -| policy_gradient_loss | 0.128 | -| std | 0.006 | -| value_loss | 6.62e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26103 | -| time_elapsed | 141966 | -| total_timesteps | 3341184 | -| train/ | | -| approx_kl | 0.008331286 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | -0.00821 | -| n_updates | 261020 | -| policy_gradient_loss | 0.00531 | -| std | 0.006 | -| value_loss | 0.000486 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26104 | -| time_elapsed | 141970 | -| total_timesteps | 3341312 | -| train/ | | -| approx_kl | 0.12593362 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0276 | -| n_updates | 261030 | -| policy_gradient_loss | 0.0255 | -| std | 0.006 | -| value_loss | 3.4e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26105 | -| time_elapsed | 141975 | -| total_timesteps | 3341440 | -| train/ | | -| approx_kl | 0.44268435 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.000962 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 261040 | -| policy_gradient_loss | 0.226 | -| std | 0.006 | -| value_loss | 8.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26106 | -| time_elapsed | 141980 | -| total_timesteps | 3341568 | -| train/ | | -| approx_kl | 0.049022995 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00417 | -| learning_rate | 0.0003 | -| loss | 0.0318 | -| n_updates | 261050 | -| policy_gradient_loss | 0.0227 | -| std | 0.00599 | -| value_loss | 3.04e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26107 | -| time_elapsed | 141986 | -| total_timesteps | 3341696 | -| train/ | | -| approx_kl | 0.16879776 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.0777 | -| n_updates | 261060 | -| policy_gradient_loss | 0.0231 | -| std | 0.00599 | -| value_loss | 2e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26108 | -| time_elapsed | 141990 | -| total_timesteps | 3341824 | -| train/ | | -| approx_kl | 0.030640356 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 261070 | -| policy_gradient_loss | 0.0406 | -| std | 0.00599 | -| value_loss | 1.77e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.905 | -| time/ | | -| fps | 23 | -| iterations | 26109 | -| time_elapsed | 141995 | -| total_timesteps | 3341952 | -| train/ | | -| approx_kl | 0.12175899 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.0696 | -| n_updates | 261080 | -| policy_gradient_loss | 0.0345 | -| std | 0.00599 | -| value_loss | 1.42e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26110 | -| time_elapsed | 141999 | -| total_timesteps | 3342080 | -| train/ | | -| approx_kl | 0.0068356474 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0457 | -| learning_rate | 0.0003 | -| loss | 0.0069 | -| n_updates | 261090 | -| policy_gradient_loss | 0.0109 | -| std | 0.00599 | -| value_loss | 9.11e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26111 | -| time_elapsed | 142009 | -| total_timesteps | 3342208 | -| train/ | | -| approx_kl | 0.06853873 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.838 | -| learning_rate | 0.0003 | -| loss | 0.00375 | -| n_updates | 261100 | -| policy_gradient_loss | 0.00671 | -| std | 0.00599 | -| value_loss | 0.00175 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26112 | -| time_elapsed | 142015 | -| total_timesteps | 3342336 | -| train/ | | -| approx_kl | 0.23783718 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.0853 | -| n_updates | 261110 | -| policy_gradient_loss | 0.0239 | -| std | 0.00599 | -| value_loss | 1.13e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26113 | -| time_elapsed | 142020 | -| total_timesteps | 3342464 | -| train/ | | -| approx_kl | 0.01881434 | -| clip_fraction | 0.139 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00803 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 261120 | -| policy_gradient_loss | -0.000657 | -| std | 0.00599 | -| value_loss | 2.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26114 | -| time_elapsed | 142025 | -| total_timesteps | 3342592 | -| train/ | | -| approx_kl | 0.012923373 | -| clip_fraction | 0.105 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0274 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 261130 | -| policy_gradient_loss | -0.00638 | -| std | 0.00599 | -| value_loss | 1.07e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26115 | -| time_elapsed | 142029 | -| total_timesteps | 3342720 | -| train/ | | -| approx_kl | 0.030692087 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0689 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 261140 | -| policy_gradient_loss | 0.04 | -| std | 0.00599 | -| value_loss | 7.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26116 | -| time_elapsed | 142034 | -| total_timesteps | 3342848 | -| train/ | | -| approx_kl | 0.16463003 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0593 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 261150 | -| policy_gradient_loss | 0.0263 | -| std | 0.00599 | -| value_loss | 7.53e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.907 | -| time/ | | -| fps | 23 | -| iterations | 26117 | -| time_elapsed | 142039 | -| total_timesteps | 3342976 | -| train/ | | -| approx_kl | 0.00018746918 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0321 | -| learning_rate | 0.0003 | -| loss | -0.00234 | -| n_updates | 261160 | -| policy_gradient_loss | 0.0249 | -| std | 0.00599 | -| value_loss | 6.48e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26118 | -| time_elapsed | 142045 | -| total_timesteps | 3343104 | -| train/ | | -| approx_kl | 0.00084326137 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0319 | -| learning_rate | 0.0003 | -| loss | 0.000113 | -| n_updates | 261170 | -| policy_gradient_loss | 0.0377 | -| std | 0.00599 | -| value_loss | 1.91e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26119 | -| time_elapsed | 142055 | -| total_timesteps | 3343232 | -| train/ | | -| approx_kl | 0.032680858 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.966 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 261180 | -| policy_gradient_loss | -0.0102 | -| std | 0.00599 | -| value_loss | 0.000243 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26120 | -| time_elapsed | 142060 | -| total_timesteps | 3343360 | -| train/ | | -| approx_kl | 0.04432816 | -| clip_fraction | 0.424 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0823 | -| learning_rate | 0.0003 | -| loss | 0.000645 | -| n_updates | 261190 | -| policy_gradient_loss | 0.0303 | -| std | 0.00599 | -| value_loss | 2.26e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26121 | -| time_elapsed | 142065 | -| total_timesteps | 3343488 | -| train/ | | -| approx_kl | 1.1141416 | -| clip_fraction | 0.763 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | 0.455 | -| n_updates | 261200 | -| policy_gradient_loss | 0.195 | -| std | 0.00599 | -| value_loss | 6.62e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26122 | -| time_elapsed | 142069 | -| total_timesteps | 3343616 | -| train/ | | -| approx_kl | 0.006575453 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0692 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 261210 | -| policy_gradient_loss | 0.0204 | -| std | 0.00599 | -| value_loss | 3.37e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26123 | -| time_elapsed | 142074 | -| total_timesteps | 3343744 | -| train/ | | -| approx_kl | 0.0039213127 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | 0.0196 | -| n_updates | 261220 | -| policy_gradient_loss | 0.00786 | -| std | 0.00599 | -| value_loss | 2.96e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.91 | -| time/ | | -| fps | 23 | -| iterations | 26124 | -| time_elapsed | 142079 | -| total_timesteps | 3343872 | -| train/ | | -| approx_kl | 0.07065076 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | 0.0337 | -| n_updates | 261230 | -| policy_gradient_loss | 0.0301 | -| std | 0.00599 | -| value_loss | 1.69e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26125 | -| time_elapsed | 142083 | -| total_timesteps | 3344000 | -| train/ | | -| approx_kl | 0.00044646487 | -| clip_fraction | 0.365 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0679 | -| learning_rate | 0.0003 | -| loss | 0.000971 | -| n_updates | 261240 | -| policy_gradient_loss | 0.0287 | -| std | 0.00599 | -| value_loss | 1.32e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26126 | -| time_elapsed | 142085 | -| total_timesteps | 3344128 | -| train/ | | -| approx_kl | 0.00019834517 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00621 | -| learning_rate | 0.0003 | -| loss | 0.00257 | -| n_updates | 261250 | -| policy_gradient_loss | 0.0353 | -| std | 0.00599 | -| value_loss | 7.83e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26127 | -| time_elapsed | 142097 | -| total_timesteps | 3344256 | -| train/ | | -| approx_kl | 0.03415219 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.968 | -| learning_rate | 0.0003 | -| loss | -0.0182 | -| n_updates | 261260 | -| policy_gradient_loss | -0.00696 | -| std | 0.00599 | -| value_loss | 0.000471 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26128 | -| time_elapsed | 142102 | -| total_timesteps | 3344384 | -| train/ | | -| approx_kl | 0.5959442 | -| clip_fraction | 0.509 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.204 | -| n_updates | 261270 | -| policy_gradient_loss | 0.0684 | -| std | 0.006 | -| value_loss | 3.79e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26129 | -| time_elapsed | 142106 | -| total_timesteps | 3344512 | -| train/ | | -| approx_kl | 0.010635205 | -| clip_fraction | 0.219 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | 0.000414 | -| n_updates | 261280 | -| policy_gradient_loss | 0.00899 | -| std | 0.00599 | -| value_loss | 7.97e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26130 | -| time_elapsed | 142110 | -| total_timesteps | 3344640 | -| train/ | | -| approx_kl | 0.07653656 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0282 | -| learning_rate | 0.0003 | -| loss | 0.0035 | -| n_updates | 261290 | -| policy_gradient_loss | -0.0035 | -| std | 0.00599 | -| value_loss | 5.65e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26131 | -| time_elapsed | 142115 | -| total_timesteps | 3344768 | -| train/ | | -| approx_kl | 0.052479304 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 0.0315 | -| n_updates | 261300 | -| policy_gradient_loss | 0.0161 | -| std | 0.006 | -| value_loss | 3.12e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.911 | -| time/ | | -| fps | 23 | -| iterations | 26132 | -| time_elapsed | 142119 | -| total_timesteps | 3344896 | -| train/ | | -| approx_kl | 0.008725178 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0959 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 261310 | -| policy_gradient_loss | 0.00567 | -| std | 0.006 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26133 | -| time_elapsed | 142123 | -| total_timesteps | 3345024 | -| train/ | | -| approx_kl | 0.0024061673 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | -0.00672 | -| n_updates | 261320 | -| policy_gradient_loss | 0.0102 | -| std | 0.006 | -| value_loss | 2.26e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26134 | -| time_elapsed | 142134 | -| total_timesteps | 3345152 | -| train/ | | -| approx_kl | 0.052992977 | -| clip_fraction | 0.62 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.959 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 261330 | -| policy_gradient_loss | 0.0809 | -| std | 0.006 | -| value_loss | 0.000605 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26135 | -| time_elapsed | 142139 | -| total_timesteps | 3345280 | -| train/ | | -| approx_kl | 0.21817823 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0221 | -| learning_rate | 0.0003 | -| loss | 0.115 | -| n_updates | 261340 | -| policy_gradient_loss | 0.137 | -| std | 0.00602 | -| value_loss | 2.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26136 | -| time_elapsed | 142144 | -| total_timesteps | 3345408 | -| train/ | | -| approx_kl | 0.033201694 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0226 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 261350 | -| policy_gradient_loss | 0.0225 | -| std | 0.00602 | -| value_loss | 6.22e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26137 | -| time_elapsed | 142149 | -| total_timesteps | 3345536 | -| train/ | | -| approx_kl | 0.669989 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.165 | -| n_updates | 261360 | -| policy_gradient_loss | 0.0645 | -| std | 0.00603 | -| value_loss | 4.11e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26138 | -| time_elapsed | 142154 | -| total_timesteps | 3345664 | -| train/ | | -| approx_kl | 0.045583323 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0376 | -| learning_rate | 0.0003 | -| loss | 0.0331 | -| n_updates | 261370 | -| policy_gradient_loss | 0.017 | -| std | 0.00603 | -| value_loss | 2.09e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26139 | -| time_elapsed | 142158 | -| total_timesteps | 3345792 | -| train/ | | -| approx_kl | 0.056603394 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 261380 | -| policy_gradient_loss | 0.00965 | -| std | 0.00603 | -| value_loss | 1.56e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.906 | -| time/ | | -| fps | 23 | -| iterations | 26140 | -| time_elapsed | 142162 | -| total_timesteps | 3345920 | -| train/ | | -| approx_kl | 0.01013284 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0574 | -| learning_rate | 0.0003 | -| loss | -0.0189 | -| n_updates | 261390 | -| policy_gradient_loss | 0.00259 | -| std | 0.00603 | -| value_loss | 1.27e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26141 | -| time_elapsed | 142167 | -| total_timesteps | 3346048 | -| train/ | | -| approx_kl | 0.00040295208 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | -2.33e-05 | -| n_updates | 261400 | -| policy_gradient_loss | 0.0408 | -| std | 0.00603 | -| value_loss | 1.45e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26142 | -| time_elapsed | 142178 | -| total_timesteps | 3346176 | -| train/ | | -| approx_kl | 0.7071111 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | 0.249 | -| n_updates | 261410 | -| policy_gradient_loss | 0.14 | -| std | 0.00604 | -| value_loss | 0.00296 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26143 | -| time_elapsed | 142183 | -| total_timesteps | 3346304 | -| train/ | | -| approx_kl | 0.024866411 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.329 | -| learning_rate | 0.0003 | -| loss | 0.00511 | -| n_updates | 261420 | -| policy_gradient_loss | 0.000695 | -| std | 0.00604 | -| value_loss | 9.16e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26144 | -| time_elapsed | 142187 | -| total_timesteps | 3346432 | -| train/ | | -| approx_kl | 0.025979493 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 261430 | -| policy_gradient_loss | 0.0342 | -| std | 0.00605 | -| value_loss | 2.45e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26145 | -| time_elapsed | 142190 | -| total_timesteps | 3346560 | -| train/ | | -| approx_kl | 0.32957423 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | 0.185 | -| n_updates | 261440 | -| policy_gradient_loss | 0.163 | -| std | 0.00605 | -| value_loss | 2.15e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26146 | -| time_elapsed | 142195 | -| total_timesteps | 3346688 | -| train/ | | -| approx_kl | 0.33523005 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0278 | -| learning_rate | 0.0003 | -| loss | 0.204 | -| n_updates | 261450 | -| policy_gradient_loss | 0.166 | -| std | 0.00603 | -| value_loss | 0.00392 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26147 | -| time_elapsed | 142201 | -| total_timesteps | 3346816 | -| train/ | | -| approx_kl | 0.050089914 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.36 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 261460 | -| policy_gradient_loss | 0.0215 | -| std | 0.00603 | -| value_loss | 0.000599 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.903 | -| time/ | | -| fps | 23 | -| iterations | 26148 | -| time_elapsed | 142205 | -| total_timesteps | 3346944 | -| train/ | | -| approx_kl | 0.00073224027 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0116 | -| learning_rate | 0.0003 | -| loss | 0.000443 | -| n_updates | 261470 | -| policy_gradient_loss | 0.0307 | -| std | 0.00603 | -| value_loss | 9.66e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26149 | -| time_elapsed | 142211 | -| total_timesteps | 3347072 | -| train/ | | -| approx_kl | 0.8535478 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0441 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 261480 | -| policy_gradient_loss | 0.0629 | -| std | 0.00603 | -| value_loss | 4.34e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26150 | -| time_elapsed | 142218 | -| total_timesteps | 3347200 | -| train/ | | -| approx_kl | 0.029763602 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.354 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 261490 | -| policy_gradient_loss | 0.018 | -| std | 0.00603 | -| value_loss | 0.0653 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26151 | -| time_elapsed | 142223 | -| total_timesteps | 3347328 | -| train/ | | -| approx_kl | 0.21191777 | -| clip_fraction | 0.45 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.073 | -| n_updates | 261500 | -| policy_gradient_loss | 0.0441 | -| std | 0.00603 | -| value_loss | 0.00462 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26152 | -| time_elapsed | 142230 | -| total_timesteps | 3347456 | -| train/ | | -| approx_kl | 0.42507243 | -| clip_fraction | 0.689 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 261510 | -| policy_gradient_loss | 0.147 | -| std | 0.00603 | -| value_loss | 0.00112 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26153 | -| time_elapsed | 142235 | -| total_timesteps | 3347584 | -| train/ | | -| approx_kl | 0.20536286 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00189 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 261520 | -| policy_gradient_loss | 0.117 | -| std | 0.00603 | -| value_loss | 0.00073 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26154 | -| time_elapsed | 142239 | -| total_timesteps | 3347712 | -| train/ | | -| approx_kl | 0.1699211 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 261530 | -| policy_gradient_loss | 0.163 | -| std | 0.00603 | -| value_loss | 0.000535 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26155 | -| time_elapsed | 142244 | -| total_timesteps | 3347840 | -| train/ | | -| approx_kl | 0.030161452 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0302 | -| learning_rate | 0.0003 | -| loss | 0.0182 | -| n_updates | 261540 | -| policy_gradient_loss | 0.0317 | -| std | 0.00603 | -| value_loss | 0.000463 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.913 | -| time/ | | -| fps | 23 | -| iterations | 26156 | -| time_elapsed | 142248 | -| total_timesteps | 3347968 | -| train/ | | -| approx_kl | 0.6593127 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.031 | -| learning_rate | 0.0003 | -| loss | 0.147 | -| n_updates | 261550 | -| policy_gradient_loss | 0.0562 | -| std | 0.00603 | -| value_loss | 0.000414 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26157 | -| time_elapsed | 142253 | -| total_timesteps | 3348096 | -| train/ | | -| approx_kl | 0.07051855 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 261560 | -| policy_gradient_loss | 0.0166 | -| std | 0.00603 | -| value_loss | 0.000362 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26158 | -| time_elapsed | 142265 | -| total_timesteps | 3348224 | -| train/ | | -| approx_kl | 0.016235813 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.724 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 261570 | -| policy_gradient_loss | -0.0043 | -| std | 0.00603 | -| value_loss | 0.00847 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26159 | -| time_elapsed | 142270 | -| total_timesteps | 3348352 | -| train/ | | -| approx_kl | 0.05588968 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 261580 | -| policy_gradient_loss | 0.00489 | -| std | 0.00603 | -| value_loss | 0.000204 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26160 | -| time_elapsed | 142275 | -| total_timesteps | 3348480 | -| train/ | | -| approx_kl | 0.042928692 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0471 | -| learning_rate | 0.0003 | -| loss | 0.0233 | -| n_updates | 261590 | -| policy_gradient_loss | 0.0129 | -| std | 0.00604 | -| value_loss | 0.000129 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26161 | -| time_elapsed | 142280 | -| total_timesteps | 3348608 | -| train/ | | -| approx_kl | 0.095326774 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0859 | -| learning_rate | 0.0003 | -| loss | 0.0224 | -| n_updates | 261600 | -| policy_gradient_loss | 0.00801 | -| std | 0.00604 | -| value_loss | 9.94e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26162 | -| time_elapsed | 142284 | -| total_timesteps | 3348736 | -| train/ | | -| approx_kl | 0.079333946 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | 0.0327 | -| n_updates | 261610 | -| policy_gradient_loss | 0.0163 | -| std | 0.00604 | -| value_loss | 0.000104 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26163 | -| time_elapsed | 142288 | -| total_timesteps | 3348864 | -| train/ | | -| approx_kl | 0.012923661 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0288 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 261620 | -| policy_gradient_loss | 0.00742 | -| std | 0.00604 | -| value_loss | 9.26e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.929 | -| time/ | | -| fps | 23 | -| iterations | 26164 | -| time_elapsed | 142294 | -| total_timesteps | 3348992 | -| train/ | | -| approx_kl | 0.11131738 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0264 | -| learning_rate | 0.0003 | -| loss | 0.0333 | -| n_updates | 261630 | -| policy_gradient_loss | 0.0104 | -| std | 0.00604 | -| value_loss | 7.98e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26165 | -| time_elapsed | 142299 | -| total_timesteps | 3349120 | -| train/ | | -| approx_kl | 0.06771973 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | -0.00531 | -| n_updates | 261640 | -| policy_gradient_loss | -0.00129 | -| std | 0.00604 | -| value_loss | 7.15e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26166 | -| time_elapsed | 142312 | -| total_timesteps | 3349248 | -| train/ | | -| approx_kl | 0.04467735 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 261650 | -| policy_gradient_loss | -0.0145 | -| std | 0.00604 | -| value_loss | 0.000926 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26167 | -| time_elapsed | 142315 | -| total_timesteps | 3349376 | -| train/ | | -| approx_kl | 0.1096447 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.167 | -| learning_rate | 0.0003 | -| loss | 0.0948 | -| n_updates | 261660 | -| policy_gradient_loss | 0.13 | -| std | 0.00604 | -| value_loss | 2.22e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26168 | -| time_elapsed | 142321 | -| total_timesteps | 3349504 | -| train/ | | -| approx_kl | 0.022762239 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | 0.012 | -| n_updates | 261670 | -| policy_gradient_loss | 0.029 | -| std | 0.00604 | -| value_loss | 8.87e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26169 | -| time_elapsed | 142326 | -| total_timesteps | 3349632 | -| train/ | | -| approx_kl | 0.2122068 | -| clip_fraction | 0.378 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0898 | -| n_updates | 261680 | -| policy_gradient_loss | 0.0244 | -| std | 0.00604 | -| value_loss | 5.24e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26170 | -| time_elapsed | 142331 | -| total_timesteps | 3349760 | -| train/ | | -| approx_kl | 0.018263733 | -| clip_fraction | 0.16 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0724 | -| learning_rate | 0.0003 | -| loss | 0.0057 | -| n_updates | 261690 | -| policy_gradient_loss | 0.00158 | -| std | 0.00604 | -| value_loss | 4.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26171 | -| time_elapsed | 142336 | -| total_timesteps | 3349888 | -| train/ | | -| approx_kl | 0.016844977 | -| clip_fraction | 0.134 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.000763 | -| n_updates | 261700 | -| policy_gradient_loss | -0.000333 | -| std | 0.00604 | -| value_loss | 3.26e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26172 | -| time_elapsed | 142340 | -| total_timesteps | 3350016 | -| train/ | | -| approx_kl | 0.030395657 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | 0.00226 | -| n_updates | 261710 | -| policy_gradient_loss | 0.0311 | -| std | 0.00604 | -| value_loss | 2.85e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26173 | -| time_elapsed | 142352 | -| total_timesteps | 3350144 | -| train/ | | -| approx_kl | 0.45247746 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.816 | -| learning_rate | 0.0003 | -| loss | 0.056 | -| n_updates | 261720 | -| policy_gradient_loss | 0.0347 | -| std | 0.00604 | -| value_loss | 0.000868 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26174 | -| time_elapsed | 142357 | -| total_timesteps | 3350272 | -| train/ | | -| approx_kl | 0.08912976 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.729 | -| learning_rate | 0.0003 | -| loss | 0.0308 | -| n_updates | 261730 | -| policy_gradient_loss | 0.0241 | -| std | 0.00604 | -| value_loss | 1.64e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26175 | -| time_elapsed | 142363 | -| total_timesteps | 3350400 | -| train/ | | -| approx_kl | 0.55617464 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.606 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 261740 | -| policy_gradient_loss | 0.038 | -| std | 0.00604 | -| value_loss | 1.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26176 | -| time_elapsed | 142369 | -| total_timesteps | 3350528 | -| train/ | | -| approx_kl | 0.07992217 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00915 | -| learning_rate | 0.0003 | -| loss | 0.0272 | -| n_updates | 261750 | -| policy_gradient_loss | 0.00818 | -| std | 0.00604 | -| value_loss | 1.15e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26177 | -| time_elapsed | 142374 | -| total_timesteps | 3350656 | -| train/ | | -| approx_kl | 0.011502925 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0175 | -| learning_rate | 0.0003 | -| loss | 0.00325 | -| n_updates | 261760 | -| policy_gradient_loss | 0.00793 | -| std | 0.00604 | -| value_loss | 1.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26178 | -| time_elapsed | 142379 | -| total_timesteps | 3350784 | -| train/ | | -| approx_kl | 0.07603036 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.124 | -| learning_rate | 0.0003 | -| loss | 0.0466 | -| n_updates | 261770 | -| policy_gradient_loss | 0.0192 | -| std | 0.00604 | -| value_loss | 1.2e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26179 | -| time_elapsed | 142383 | -| total_timesteps | 3350912 | -| train/ | | -| approx_kl | 0.0087521 | -| clip_fraction | 0.179 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0725 | -| learning_rate | 0.0003 | -| loss | -0.00928 | -| n_updates | 261780 | -| policy_gradient_loss | 0.00246 | -| std | 0.00604 | -| value_loss | 1.02e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26180 | -| time_elapsed | 142387 | -| total_timesteps | 3351040 | -| train/ | | -| approx_kl | 0.08604061 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.0548 | -| n_updates | 261790 | -| policy_gradient_loss | 0.0251 | -| std | 0.00605 | -| value_loss | 5.64e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26181 | -| time_elapsed | 142398 | -| total_timesteps | 3351168 | -| train/ | | -| approx_kl | 0.06498551 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.742 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 261800 | -| policy_gradient_loss | 0.00504 | -| std | 0.00605 | -| value_loss | 0.00105 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26182 | -| time_elapsed | 142403 | -| total_timesteps | 3351296 | -| train/ | | -| approx_kl | 0.058219284 | -| clip_fraction | 0.63 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.362 | -| learning_rate | 0.0003 | -| loss | 0.0007 | -| n_updates | 261810 | -| policy_gradient_loss | 0.0792 | -| std | 0.00605 | -| value_loss | 2.22e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26183 | -| time_elapsed | 142408 | -| total_timesteps | 3351424 | -| train/ | | -| approx_kl | 0.016659766 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -10.1 | -| learning_rate | 0.0003 | -| loss | -0.0145 | -| n_updates | 261820 | -| policy_gradient_loss | -0.000694 | -| std | 0.00605 | -| value_loss | 2.09e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26184 | -| time_elapsed | 142413 | -| total_timesteps | 3351552 | -| train/ | | -| approx_kl | 0.20064056 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.0522 | -| n_updates | 261830 | -| policy_gradient_loss | 0.00933 | -| std | 0.00605 | -| value_loss | 2.15e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26185 | -| time_elapsed | 142416 | -| total_timesteps | 3351680 | -| train/ | | -| approx_kl | 0.0050933775 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.0077 | -| n_updates | 261840 | -| policy_gradient_loss | 0.0194 | -| std | 0.00605 | -| value_loss | 8.91e-10 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26186 | -| time_elapsed | 142420 | -| total_timesteps | 3351808 | -| train/ | | -| approx_kl | 0.002127008 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.00362 | -| n_updates | 261850 | -| policy_gradient_loss | 0.0241 | -| std | 0.00605 | -| value_loss | 5.62e-10 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26187 | -| time_elapsed | 142424 | -| total_timesteps | 3351936 | -| train/ | | -| approx_kl | 0.09293869 | -| clip_fraction | 0.467 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.032 | -| n_updates | 261860 | -| policy_gradient_loss | 0.0292 | -| std | 0.00605 | -| value_loss | 4.33e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26188 | -| time_elapsed | 142428 | -| total_timesteps | 3352064 | -| train/ | | -| approx_kl | 0.14197785 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 261870 | -| policy_gradient_loss | 0.013 | -| std | 0.00605 | -| value_loss | 3.75e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26189 | -| time_elapsed | 142437 | -| total_timesteps | 3352192 | -| train/ | | -| approx_kl | 0.059331007 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.788 | -| learning_rate | 0.0003 | -| loss | 0.0451 | -| n_updates | 261880 | -| policy_gradient_loss | 0.00372 | -| std | 0.00605 | -| value_loss | 0.00702 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26190 | -| time_elapsed | 142442 | -| total_timesteps | 3352320 | -| train/ | | -| approx_kl | 0.18116201 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.53 | -| learning_rate | 0.0003 | -| loss | 0.0799 | -| n_updates | 261890 | -| policy_gradient_loss | 0.0553 | -| std | 0.00605 | -| value_loss | 3.79e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26191 | -| time_elapsed | 142446 | -| total_timesteps | 3352448 | -| train/ | | -| approx_kl | 0.14070483 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 261900 | -| policy_gradient_loss | 0.0335 | -| std | 0.00605 | -| value_loss | 6.49e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26192 | -| time_elapsed | 142450 | -| total_timesteps | 3352576 | -| train/ | | -| approx_kl | 0.035227396 | -| clip_fraction | 0.406 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0451 | -| learning_rate | 0.0003 | -| loss | -0.00442 | -| n_updates | 261910 | -| policy_gradient_loss | 0.0245 | -| std | 0.00605 | -| value_loss | 2e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26193 | -| time_elapsed | 142454 | -| total_timesteps | 3352704 | -| train/ | | -| approx_kl | 0.006839931 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0964 | -| learning_rate | 0.0003 | -| loss | -0.00806 | -| n_updates | 261920 | -| policy_gradient_loss | 0.0216 | -| std | 0.00605 | -| value_loss | 2.1e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26194 | -| time_elapsed | 142459 | -| total_timesteps | 3352832 | -| train/ | | -| approx_kl | 0.1742122 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 261930 | -| policy_gradient_loss | 0.0204 | -| std | 0.00605 | -| value_loss | 1.1e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.928 | -| time/ | | -| fps | 23 | -| iterations | 26195 | -| time_elapsed | 142465 | -| total_timesteps | 3352960 | -| train/ | | -| approx_kl | 0.007261811 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0114 | -| n_updates | 261940 | -| policy_gradient_loss | 0.019 | -| std | 0.00605 | -| value_loss | 8.79e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26196 | -| time_elapsed | 142471 | -| total_timesteps | 3353088 | -| train/ | | -| approx_kl | 0.026339116 | -| clip_fraction | 0.183 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0671 | -| learning_rate | 0.0003 | -| loss | 0.00599 | -| n_updates | 261950 | -| policy_gradient_loss | 0.00085 | -| std | 0.00605 | -| value_loss | 6.25e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26197 | -| time_elapsed | 142481 | -| total_timesteps | 3353216 | -| train/ | | -| approx_kl | 0.0047679436 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | -0.0116 | -| n_updates | 261960 | -| policy_gradient_loss | 0.00465 | -| std | 0.00605 | -| value_loss | 0.0042 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26198 | -| time_elapsed | 142486 | -| total_timesteps | 3353344 | -| train/ | | -| approx_kl | 0.14678767 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.00981 | -| n_updates | 261970 | -| policy_gradient_loss | 0.0364 | -| std | 0.00605 | -| value_loss | 1.78e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26199 | -| time_elapsed | 142492 | -| total_timesteps | 3353472 | -| train/ | | -| approx_kl | 0.2517579 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0115 | -| learning_rate | 0.0003 | -| loss | 0.076 | -| n_updates | 261980 | -| policy_gradient_loss | 0.0426 | -| std | 0.00605 | -| value_loss | 3.3e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26200 | -| time_elapsed | 142496 | -| total_timesteps | 3353600 | -| train/ | | -| approx_kl | 0.060100317 | -| clip_fraction | 0.608 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0399 | -| n_updates | 261990 | -| policy_gradient_loss | 0.0918 | -| std | 0.00605 | -| value_loss | 1.77e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26201 | -| time_elapsed | 142501 | -| total_timesteps | 3353728 | -| train/ | | -| approx_kl | 0.0002974975 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0536 | -| learning_rate | 0.0003 | -| loss | 0.0027 | -| n_updates | 262000 | -| policy_gradient_loss | 0.119 | -| std | 0.00605 | -| value_loss | 1.53e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26202 | -| time_elapsed | 142506 | -| total_timesteps | 3353856 | -| train/ | | -| approx_kl | 0.032670602 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0861 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 262010 | -| policy_gradient_loss | 0.0519 | -| std | 0.00605 | -| value_loss | 6.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.941 | -| time/ | | -| fps | 23 | -| iterations | 26203 | -| time_elapsed | 142513 | -| total_timesteps | 3353984 | -| train/ | | -| approx_kl | 0.14736702 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0954 | -| learning_rate | 0.0003 | -| loss | 0.072 | -| n_updates | 262020 | -| policy_gradient_loss | 0.0381 | -| std | 0.00605 | -| value_loss | 6.74e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26204 | -| time_elapsed | 142517 | -| total_timesteps | 3354112 | -| train/ | | -| approx_kl | 0.00021361001 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | -0.00231 | -| n_updates | 262030 | -| policy_gradient_loss | 0.0331 | -| std | 0.00605 | -| value_loss | 6.23e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26205 | -| time_elapsed | 142528 | -| total_timesteps | 3354240 | -| train/ | | -| approx_kl | 0.024313744 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 262040 | -| policy_gradient_loss | 0.00291 | -| std | 0.00605 | -| value_loss | 0.000586 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26206 | -| time_elapsed | 142533 | -| total_timesteps | 3354368 | -| train/ | | -| approx_kl | 0.011072689 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.281 | -| learning_rate | 0.0003 | -| loss | -0.0123 | -| n_updates | 262050 | -| policy_gradient_loss | 0.0094 | -| std | 0.00605 | -| value_loss | 1.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26207 | -| time_elapsed | 142537 | -| total_timesteps | 3354496 | -| train/ | | -| approx_kl | 0.11474812 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | 0.0599 | -| n_updates | 262060 | -| policy_gradient_loss | 0.0496 | -| std | 0.00605 | -| value_loss | 9.87e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26208 | -| time_elapsed | 142541 | -| total_timesteps | 3354624 | -| train/ | | -| approx_kl | 0.0010338076 | -| clip_fraction | 0.0922 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | -0.000334 | -| n_updates | 262070 | -| policy_gradient_loss | 0.00284 | -| std | 0.00604 | -| value_loss | 4.74e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26209 | -| time_elapsed | 142546 | -| total_timesteps | 3354752 | -| train/ | | -| approx_kl | 0.09162252 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0657 | -| learning_rate | 0.0003 | -| loss | 0.0423 | -| n_updates | 262080 | -| policy_gradient_loss | 0.0168 | -| std | 0.00603 | -| value_loss | 4.26e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.942 | -| time/ | | -| fps | 23 | -| iterations | 26210 | -| time_elapsed | 142551 | -| total_timesteps | 3354880 | -| train/ | | -| approx_kl | 0.005860958 | -| clip_fraction | 0.0602 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0165 | -| learning_rate | 0.0003 | -| loss | -0.00121 | -| n_updates | 262090 | -| policy_gradient_loss | -0.000346 | -| std | 0.00603 | -| value_loss | 5.57e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26211 | -| time_elapsed | 142555 | -| total_timesteps | 3355008 | -| train/ | | -| approx_kl | 0.5302769 | -| clip_fraction | 0.687 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.2 | -| n_updates | 262100 | -| policy_gradient_loss | 0.154 | -| std | 0.00603 | -| value_loss | 6.02e-08 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26212 | -| time_elapsed | 142565 | -| total_timesteps | 3355136 | -| train/ | | -| approx_kl | 0.2348422 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.916 | -| learning_rate | 0.0003 | -| loss | 0.026 | -| n_updates | 262110 | -| policy_gradient_loss | 0.027 | -| std | 0.00603 | -| value_loss | 0.000474 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26213 | -| time_elapsed | 142569 | -| total_timesteps | 3355264 | -| train/ | | -| approx_kl | 0.09651142 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.942 | -| learning_rate | 0.0003 | -| loss | 0.0166 | -| n_updates | 262120 | -| policy_gradient_loss | 0.0142 | -| std | 0.00603 | -| value_loss | 2.73e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26214 | -| time_elapsed | 142574 | -| total_timesteps | 3355392 | -| train/ | | -| approx_kl | 0.0012223013 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | -0.00849 | -| n_updates | 262130 | -| policy_gradient_loss | 0.0248 | -| std | 0.00603 | -| value_loss | 1.06e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26215 | -| time_elapsed | 142578 | -| total_timesteps | 3355520 | -| train/ | | -| approx_kl | 0.000764966 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0033 | -| learning_rate | 0.0003 | -| loss | 0.00235 | -| n_updates | 262140 | -| policy_gradient_loss | 0.0294 | -| std | 0.00603 | -| value_loss | 3.31e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26216 | -| time_elapsed | 142583 | -| total_timesteps | 3355648 | -| train/ | | -| approx_kl | 0.50551933 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 262150 | -| policy_gradient_loss | 0.0698 | -| std | 0.00603 | -| value_loss | 2.97e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26217 | -| time_elapsed | 142588 | -| total_timesteps | 3355776 | -| train/ | | -| approx_kl | 0.078551196 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.0423 | -| n_updates | 262160 | -| policy_gradient_loss | 0.0187 | -| std | 0.00603 | -| value_loss | 2.6e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.938 | -| time/ | | -| fps | 23 | -| iterations | 26218 | -| time_elapsed | 142591 | -| total_timesteps | 3355904 | -| train/ | | -| approx_kl | 0.01348554 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | 0.00809 | -| n_updates | 262170 | -| policy_gradient_loss | 0.0193 | -| std | 0.00603 | -| value_loss | 2.02e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26219 | -| time_elapsed | 142595 | -| total_timesteps | 3356032 | -| train/ | | -| approx_kl | 0.0031506484 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.00298 | -| n_updates | 262180 | -| policy_gradient_loss | 0.0105 | -| std | 0.00603 | -| value_loss | 1.64e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26220 | -| time_elapsed | 142603 | -| total_timesteps | 3356160 | -| train/ | | -| approx_kl | 0.124967285 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00706 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 262190 | -| policy_gradient_loss | 0.0278 | -| std | 0.00603 | -| value_loss | 0.00229 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26221 | -| time_elapsed | 142608 | -| total_timesteps | 3356288 | -| train/ | | -| approx_kl | 0.038532026 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.14 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 262200 | -| policy_gradient_loss | 0.025 | -| std | 0.00603 | -| value_loss | 1.23e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26222 | -| time_elapsed | 142612 | -| total_timesteps | 3356416 | -| train/ | | -| approx_kl | 0.63770056 | -| clip_fraction | 0.548 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0116 | -| learning_rate | 0.0003 | -| loss | 0.263 | -| n_updates | 262210 | -| policy_gradient_loss | 0.0974 | -| std | 0.00603 | -| value_loss | 2.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26223 | -| time_elapsed | 142617 | -| total_timesteps | 3356544 | -| train/ | | -| approx_kl | 0.009581342 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0195 | -| learning_rate | 0.0003 | -| loss | -0.00331 | -| n_updates | 262220 | -| policy_gradient_loss | 0.00979 | -| std | 0.00603 | -| value_loss | 1.73e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26224 | -| time_elapsed | 142621 | -| total_timesteps | 3356672 | -| train/ | | -| approx_kl | 0.07925548 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0283 | -| learning_rate | 0.0003 | -| loss | -0.00923 | -| n_updates | 262230 | -| policy_gradient_loss | 0.0125 | -| std | 0.00603 | -| value_loss | 1.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26225 | -| time_elapsed | 142625 | -| total_timesteps | 3356800 | -| train/ | | -| approx_kl | 0.16092893 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 262240 | -| policy_gradient_loss | 0.0865 | -| std | 0.00603 | -| value_loss | 8.84e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.933 | -| time/ | | -| fps | 23 | -| iterations | 26226 | -| time_elapsed | 142630 | -| total_timesteps | 3356928 | -| train/ | | -| approx_kl | 0.23457737 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0443 | -| learning_rate | 0.0003 | -| loss | 0.235 | -| n_updates | 262250 | -| policy_gradient_loss | 0.0495 | -| std | 0.00603 | -| value_loss | 8.03e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26227 | -| time_elapsed | 142635 | -| total_timesteps | 3357056 | -| train/ | | -| approx_kl | 0.06652565 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | -0.0353 | -| n_updates | 262260 | -| policy_gradient_loss | -0.0183 | -| std | 0.00603 | -| value_loss | 5.2e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26228 | -| time_elapsed | 142645 | -| total_timesteps | 3357184 | -| train/ | | -| approx_kl | 0.03733002 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.859 | -| learning_rate | 0.0003 | -| loss | -0.000106 | -| n_updates | 262270 | -| policy_gradient_loss | -0.00296 | -| std | 0.00603 | -| value_loss | 0.00332 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26229 | -| time_elapsed | 142649 | -| total_timesteps | 3357312 | -| train/ | | -| approx_kl | 0.005517909 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.787 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 262280 | -| policy_gradient_loss | 0.0188 | -| std | 0.00603 | -| value_loss | 3.41e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26230 | -| time_elapsed | 142655 | -| total_timesteps | 3357440 | -| train/ | | -| approx_kl | 7.983763e-06 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | -0.000567 | -| n_updates | 262290 | -| policy_gradient_loss | 0.0312 | -| std | 0.00602 | -| value_loss | 4.6e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26231 | -| time_elapsed | 142660 | -| total_timesteps | 3357568 | -| train/ | | -| approx_kl | 0.012681768 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0389 | -| learning_rate | 0.0003 | -| loss | 0.00783 | -| n_updates | 262300 | -| policy_gradient_loss | 0.0277 | -| std | 0.00603 | -| value_loss | 6.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26232 | -| time_elapsed | 142664 | -| total_timesteps | 3357696 | -| train/ | | -| approx_kl | 0.021976175 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.641 | -| learning_rate | 0.0003 | -| loss | -0.00114 | -| n_updates | 262310 | -| policy_gradient_loss | 0.0268 | -| std | 0.00603 | -| value_loss | 6.18e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26233 | -| time_elapsed | 142668 | -| total_timesteps | 3357824 | -| train/ | | -| approx_kl | 0.3040886 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 262320 | -| policy_gradient_loss | 0.145 | -| std | 0.00604 | -| value_loss | 3.69e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.925 | -| time/ | | -| fps | 23 | -| iterations | 26234 | -| time_elapsed | 142672 | -| total_timesteps | 3357952 | -| train/ | | -| approx_kl | 0.047270585 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0547 | -| learning_rate | 0.0003 | -| loss | 0.0232 | -| n_updates | 262330 | -| policy_gradient_loss | 0.0247 | -| std | 0.00604 | -| value_loss | 2.72e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26235 | -| time_elapsed | 142678 | -| total_timesteps | 3358080 | -| train/ | | -| approx_kl | 0.59458816 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.166 | -| n_updates | 262340 | -| policy_gradient_loss | 0.058 | -| std | 0.00604 | -| value_loss | 2.35e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26236 | -| time_elapsed | 142690 | -| total_timesteps | 3358208 | -| train/ | | -| approx_kl | 0.1086331 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.759 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 262350 | -| policy_gradient_loss | 0.0375 | -| std | 0.00604 | -| value_loss | 0.00629 | ---------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26237 | -| time_elapsed | 142694 | -| total_timesteps | 3358336 | -| train/ | | -| approx_kl | 1.317783 | -| clip_fraction | 0.752 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.369 | -| learning_rate | 0.0003 | -| loss | 0.479 | -| n_updates | 262360 | -| policy_gradient_loss | 0.31 | -| std | 0.00603 | -| value_loss | 0.000273 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26238 | -| time_elapsed | 142698 | -| total_timesteps | 3358464 | -| train/ | | -| approx_kl | 0.08191378 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | 0.0962 | -| n_updates | 262370 | -| policy_gradient_loss | 0.00518 | -| std | 0.00603 | -| value_loss | 7.91e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26239 | -| time_elapsed | 142704 | -| total_timesteps | 3358592 | -| train/ | | -| approx_kl | 0.21779297 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0538 | -| learning_rate | 0.0003 | -| loss | 0.0793 | -| n_updates | 262380 | -| policy_gradient_loss | 0.0193 | -| std | 0.00603 | -| value_loss | 0.000109 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26240 | -| time_elapsed | 142709 | -| total_timesteps | 3358720 | -| train/ | | -| approx_kl | 0.021478798 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.73 | -| learning_rate | 0.0003 | -| loss | -0.00683 | -| n_updates | 262390 | -| policy_gradient_loss | 0.0155 | -| std | 0.00603 | -| value_loss | 5.82e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26241 | -| time_elapsed | 142715 | -| total_timesteps | 3358848 | -| train/ | | -| approx_kl | 0.38621905 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.366 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 262400 | -| policy_gradient_loss | 0.171 | -| std | 0.00603 | -| value_loss | 1.16e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.937 | -| time/ | | -| fps | 23 | -| iterations | 26242 | -| time_elapsed | 142720 | -| total_timesteps | 3358976 | -| train/ | | -| approx_kl | 0.05701575 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.081 | -| learning_rate | 0.0003 | -| loss | 0.00302 | -| n_updates | 262410 | -| policy_gradient_loss | 0.0247 | -| std | 0.00603 | -| value_loss | 1.15e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26243 | -| time_elapsed | 142725 | -| total_timesteps | 3359104 | -| train/ | | -| approx_kl | 0.8826845 | -| clip_fraction | 0.535 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 262420 | -| policy_gradient_loss | 0.0744 | -| std | 0.00603 | -| value_loss | 9.57e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26244 | -| time_elapsed | 142734 | -| total_timesteps | 3359232 | -| train/ | | -| approx_kl | 0.025897756 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.932 | -| learning_rate | 0.0003 | -| loss | -0.000325 | -| n_updates | 262430 | -| policy_gradient_loss | 0.000665 | -| std | 0.00603 | -| value_loss | 0.00118 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26245 | -| time_elapsed | 142737 | -| total_timesteps | 3359360 | -| train/ | | -| approx_kl | 0.021645296 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0128 | -| learning_rate | 0.0003 | -| loss | 0.000217 | -| n_updates | 262440 | -| policy_gradient_loss | 0.00597 | -| std | 0.00603 | -| value_loss | 2.87e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26246 | -| time_elapsed | 142740 | -| total_timesteps | 3359488 | -| train/ | | -| approx_kl | 0.08847938 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.00992 | -| learning_rate | 0.0003 | -| loss | 0.0546 | -| n_updates | 262450 | -| policy_gradient_loss | 0.0227 | -| std | 0.00603 | -| value_loss | 8.03e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26247 | -| time_elapsed | 142745 | -| total_timesteps | 3359616 | -| train/ | | -| approx_kl | 0.013768562 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0646 | -| learning_rate | 0.0003 | -| loss | -0.0232 | -| n_updates | 262460 | -| policy_gradient_loss | 0.00287 | -| std | 0.00602 | -| value_loss | 5.29e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26248 | -| time_elapsed | 142748 | -| total_timesteps | 3359744 | -| train/ | | -| approx_kl | 0.06263563 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0572 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 262470 | -| policy_gradient_loss | 0.0123 | -| std | 0.00602 | -| value_loss | 4.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.946 | -| time/ | | -| fps | 23 | -| iterations | 26249 | -| time_elapsed | 142753 | -| total_timesteps | 3359872 | -| train/ | | -| approx_kl | 0.009532431 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0528 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 262480 | -| policy_gradient_loss | 0.00203 | -| std | 0.00602 | -| value_loss | 3.42e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26250 | -| time_elapsed | 142758 | -| total_timesteps | 3360000 | -| train/ | | -| approx_kl | 4.52511e-05 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0477 | -| learning_rate | 0.0003 | -| loss | 3.8e-05 | -| n_updates | 262490 | -| policy_gradient_loss | 0.0353 | -| std | 0.00602 | -| value_loss | 1.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26251 | -| time_elapsed | 142762 | -| total_timesteps | 3360128 | -| train/ | | -| approx_kl | 0.24105357 | -| clip_fraction | 0.557 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0093 | -| learning_rate | 0.0003 | -| loss | 0.0923 | -| n_updates | 262500 | -| policy_gradient_loss | 0.0389 | -| std | 0.00602 | -| value_loss | 1.15e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26252 | -| time_elapsed | 142772 | -| total_timesteps | 3360256 | -| train/ | | -| approx_kl | 0.05375893 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.762 | -| learning_rate | 0.0003 | -| loss | -0.00992 | -| n_updates | 262510 | -| policy_gradient_loss | 0.00102 | -| std | 0.00602 | -| value_loss | 0.00171 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26253 | -| time_elapsed | 142777 | -| total_timesteps | 3360384 | -| train/ | | -| approx_kl | 0.0030265334 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.269 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 262520 | -| policy_gradient_loss | 0.0046 | -| std | 0.00602 | -| value_loss | 2.08e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26254 | -| time_elapsed | 142781 | -| total_timesteps | 3360512 | -| train/ | | -| approx_kl | 0.004504348 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0137 | -| learning_rate | 0.0003 | -| loss | -0.00268 | -| n_updates | 262530 | -| policy_gradient_loss | 0.00799 | -| std | 0.00602 | -| value_loss | 3.49e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26255 | -| time_elapsed | 142785 | -| total_timesteps | 3360640 | -| train/ | | -| approx_kl | 0.042234253 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0364 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 262540 | -| policy_gradient_loss | 0.148 | -| std | 0.00603 | -| value_loss | 2.57e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26256 | -| time_elapsed | 142790 | -| total_timesteps | 3360768 | -| train/ | | -| approx_kl | 0.119069375 | -| clip_fraction | 0.688 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | 0.0961 | -| n_updates | 262550 | -| policy_gradient_loss | 0.137 | -| std | 0.00603 | -| value_loss | 2.35e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.955 | -| time/ | | -| fps | 23 | -| iterations | 26257 | -| time_elapsed | 142794 | -| total_timesteps | 3360896 | -| train/ | | -| approx_kl | 0.1446541 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 262560 | -| policy_gradient_loss | 0.155 | -| std | 0.00603 | -| value_loss | 2.12e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26258 | -| time_elapsed | 142798 | -| total_timesteps | 3361024 | -| train/ | | -| approx_kl | 0.035503093 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0246 | -| learning_rate | 0.0003 | -| loss | 0.0212 | -| n_updates | 262570 | -| policy_gradient_loss | 0.0342 | -| std | 0.00603 | -| value_loss | 1.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26259 | -| time_elapsed | 142807 | -| total_timesteps | 3361152 | -| train/ | | -| approx_kl | 0.030120151 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.608 | -| learning_rate | 0.0003 | -| loss | -0.0137 | -| n_updates | 262580 | -| policy_gradient_loss | -0.00404 | -| std | 0.00603 | -| value_loss | 0.00152 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26260 | -| time_elapsed | 142811 | -| total_timesteps | 3361280 | -| train/ | | -| approx_kl | 0.018654417 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.114 | -| learning_rate | 0.0003 | -| loss | -0.0108 | -| n_updates | 262590 | -| policy_gradient_loss | 0.027 | -| std | 0.00603 | -| value_loss | 1.06e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26261 | -| time_elapsed | 142815 | -| total_timesteps | 3361408 | -| train/ | | -| approx_kl | 0.1609295 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 262600 | -| policy_gradient_loss | 0.0489 | -| std | 0.00603 | -| value_loss | 9.77e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26262 | -| time_elapsed | 142820 | -| total_timesteps | 3361536 | -| train/ | | -| approx_kl | 0.26901865 | -| clip_fraction | 0.392 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.026 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 262610 | -| policy_gradient_loss | 0.0374 | -| std | 0.00603 | -| value_loss | 5.4e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26263 | -| time_elapsed | 142825 | -| total_timesteps | 3361664 | -| train/ | | -| approx_kl | 0.6008353 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0963 | -| learning_rate | 0.0003 | -| loss | 0.172 | -| n_updates | 262620 | -| policy_gradient_loss | 0.0565 | -| std | 0.00603 | -| value_loss | 2.94e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26264 | -| time_elapsed | 142829 | -| total_timesteps | 3361792 | -| train/ | | -| approx_kl | 0.012690283 | -| clip_fraction | 0.24 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0755 | -| learning_rate | 0.0003 | -| loss | -0.0254 | -| n_updates | 262630 | -| policy_gradient_loss | 0.00129 | -| std | 0.00603 | -| value_loss | 2.86e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.957 | -| time/ | | -| fps | 23 | -| iterations | 26265 | -| time_elapsed | 142834 | -| total_timesteps | 3361920 | -| train/ | | -| approx_kl | 0.002602172 | -| clip_fraction | 0.192 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 262640 | -| policy_gradient_loss | 0.00745 | -| std | 0.00603 | -| value_loss | 1.7e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26266 | -| time_elapsed | 142839 | -| total_timesteps | 3362048 | -| train/ | | -| approx_kl | 0.04622717 | -| clip_fraction | 0.652 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0673 | -| learning_rate | 0.0003 | -| loss | 0.0514 | -| n_updates | 262650 | -| policy_gradient_loss | 0.102 | -| std | 0.00603 | -| value_loss | 1.5e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26267 | -| time_elapsed | 142848 | -| total_timesteps | 3362176 | -| train/ | | -| approx_kl | 0.016757816 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.239 | -| learning_rate | 0.0003 | -| loss | 0.00885 | -| n_updates | 262660 | -| policy_gradient_loss | 0.0239 | -| std | 0.00603 | -| value_loss | 0.00256 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26268 | -| time_elapsed | 142852 | -| total_timesteps | 3362304 | -| train/ | | -| approx_kl | 0.0014795982 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.846 | -| learning_rate | 0.0003 | -| loss | 0.00039 | -| n_updates | 262670 | -| policy_gradient_loss | 0.0364 | -| std | 0.00603 | -| value_loss | 4.85e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26269 | -| time_elapsed | 142857 | -| total_timesteps | 3362432 | -| train/ | | -| approx_kl | 0.00019252067 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -6.56 | -| learning_rate | 0.0003 | -| loss | -0.000409 | -| n_updates | 262680 | -| policy_gradient_loss | 0.027 | -| std | 0.00602 | -| value_loss | 1.88e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26270 | -| time_elapsed | 142862 | -| total_timesteps | 3362560 | -| train/ | | -| approx_kl | 0.25008318 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 0.068 | -| n_updates | 262690 | -| policy_gradient_loss | 0.0176 | -| std | 0.00601 | -| value_loss | 4.46e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26271 | -| time_elapsed | 142867 | -| total_timesteps | 3362688 | -| train/ | | -| approx_kl | 0.02342846 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.61 | -| learning_rate | 0.0003 | -| loss | -0.00241 | -| n_updates | 262700 | -| policy_gradient_loss | -0.00296 | -| std | 0.00601 | -| value_loss | 2e-10 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26272 | -| time_elapsed | 142871 | -| total_timesteps | 3362816 | -| train/ | | -| approx_kl | 0.018135693 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.506 | -| learning_rate | 0.0003 | -| loss | -0.00342 | -| n_updates | 262710 | -| policy_gradient_loss | -0.00255 | -| std | 0.00601 | -| value_loss | 1.79e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.959 | -| time/ | | -| fps | 23 | -| iterations | 26273 | -| time_elapsed | 142875 | -| total_timesteps | 3362944 | -| train/ | | -| approx_kl | 0.015136847 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | -0.000411 | -| n_updates | 262720 | -| policy_gradient_loss | -0.000422 | -| std | 0.00601 | -| value_loss | 1.29e-11 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26274 | -| time_elapsed | 142880 | -| total_timesteps | 3363072 | -| train/ | | -| approx_kl | 0.034380607 | -| clip_fraction | 0.476 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0607 | -| learning_rate | 0.0003 | -| loss | 0.0216 | -| n_updates | 262730 | -| policy_gradient_loss | 0.0447 | -| std | 0.00601 | -| value_loss | 1.03e-11 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26275 | -| time_elapsed | 142889 | -| total_timesteps | 3363200 | -| train/ | | -| approx_kl | 0.24286568 | -| clip_fraction | 0.69 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.935 | -| learning_rate | 0.0003 | -| loss | 0.0852 | -| n_updates | 262740 | -| policy_gradient_loss | 0.0716 | -| std | 0.00601 | -| value_loss | 0.0011 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26276 | -| time_elapsed | 142894 | -| total_timesteps | 3363328 | -| train/ | | -| approx_kl | 0.06365837 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.511 | -| learning_rate | 0.0003 | -| loss | -0.000832 | -| n_updates | 262750 | -| policy_gradient_loss | 0.0242 | -| std | 0.00601 | -| value_loss | 3.14e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26277 | -| time_elapsed | 142900 | -| total_timesteps | 3363456 | -| train/ | | -| approx_kl | 0.7408083 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0107 | -| learning_rate | 0.0003 | -| loss | 0.199 | -| n_updates | 262760 | -| policy_gradient_loss | 0.0689 | -| std | 0.00601 | -| value_loss | 8.86e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26278 | -| time_elapsed | 142904 | -| total_timesteps | 3363584 | -| train/ | | -| approx_kl | 0.012789197 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.000286 | -| learning_rate | 0.0003 | -| loss | 0.004 | -| n_updates | 262770 | -| policy_gradient_loss | 0.00745 | -| std | 0.00601 | -| value_loss | 3.58e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26279 | -| time_elapsed | 142909 | -| total_timesteps | 3363712 | -| train/ | | -| approx_kl | 0.07387501 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.237 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 262780 | -| policy_gradient_loss | 0.0194 | -| std | 0.00601 | -| value_loss | 1.41e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26280 | -| time_elapsed | 142912 | -| total_timesteps | 3363840 | -| train/ | | -| approx_kl | 0.044788253 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0685 | -| learning_rate | 0.0003 | -| loss | 0.00352 | -| n_updates | 262790 | -| policy_gradient_loss | 0.00302 | -| std | 0.00601 | -| value_loss | 1.14e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.956 | -| time/ | | -| fps | 23 | -| iterations | 26281 | -| time_elapsed | 142916 | -| total_timesteps | 3363968 | -| train/ | | -| approx_kl | 0.010358289 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0461 | -| learning_rate | 0.0003 | -| loss | 0.00131 | -| n_updates | 262800 | -| policy_gradient_loss | 0.0105 | -| std | 0.00601 | -| value_loss | 7.62e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26282 | -| time_elapsed | 142919 | -| total_timesteps | 3364096 | -| train/ | | -| approx_kl | 0.07618946 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 262810 | -| policy_gradient_loss | 0.0172 | -| std | 0.00601 | -| value_loss | 5.63e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26283 | -| time_elapsed | 142930 | -| total_timesteps | 3364224 | -| train/ | | -| approx_kl | 0.017688738 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | -0.0089 | -| n_updates | 262820 | -| policy_gradient_loss | 0.00468 | -| std | 0.00601 | -| value_loss | 0.000978 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26284 | -| time_elapsed | 142934 | -| total_timesteps | 3364352 | -| train/ | | -| approx_kl | 0.08591597 | -| clip_fraction | 0.3 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.193 | -| learning_rate | 0.0003 | -| loss | 0.0436 | -| n_updates | 262830 | -| policy_gradient_loss | 0.0174 | -| std | 0.00601 | -| value_loss | 8.85e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26285 | -| time_elapsed | 142939 | -| total_timesteps | 3364480 | -| train/ | | -| approx_kl | 0.011563628 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0021 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 262840 | -| policy_gradient_loss | 0.00412 | -| std | 0.00601 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26286 | -| time_elapsed | 142944 | -| total_timesteps | 3364608 | -| train/ | | -| approx_kl | 0.0008958713 | -| clip_fraction | 0.263 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.00635 | -| n_updates | 262850 | -| policy_gradient_loss | 0.00516 | -| std | 0.00601 | -| value_loss | 1.05e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26287 | -| time_elapsed | 142949 | -| total_timesteps | 3364736 | -| train/ | | -| approx_kl | 3.380701e-06 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0357 | -| learning_rate | 0.0003 | -| loss | 0.000642 | -| n_updates | 262860 | -| policy_gradient_loss | -0.00796 | -| std | 0.00601 | -| value_loss | 7.75e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26288 | -| time_elapsed | 142954 | -| total_timesteps | 3364864 | -| train/ | | -| approx_kl | 0.06890737 | -| clip_fraction | 0.294 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0468 | -| learning_rate | 0.0003 | -| loss | 0.0505 | -| n_updates | 262870 | -| policy_gradient_loss | 0.0239 | -| std | 0.00601 | -| value_loss | 4.26e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.965 | -| time/ | | -| fps | 23 | -| iterations | 26289 | -| time_elapsed | 142958 | -| total_timesteps | 3364992 | -| train/ | | -| approx_kl | 0.0094509125 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.087 | -| learning_rate | 0.0003 | -| loss | -0.00184 | -| n_updates | 262880 | -| policy_gradient_loss | 0.00715 | -| std | 0.00602 | -| value_loss | 2.98e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26290 | -| time_elapsed | 142965 | -| total_timesteps | 3365120 | -| train/ | | -| approx_kl | 0.002539603 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0644 | -| learning_rate | 0.0003 | -| loss | -0.00152 | -| n_updates | 262890 | -| policy_gradient_loss | 0.0103 | -| std | 0.00602 | -| value_loss | 2.07e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26291 | -| time_elapsed | 142978 | -| total_timesteps | 3365248 | -| train/ | | -| approx_kl | 0.057581466 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.63 | -| learning_rate | 0.0003 | -| loss | -0.0226 | -| n_updates | 262900 | -| policy_gradient_loss | -0.0141 | -| std | 0.00601 | -| value_loss | 0.00132 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26292 | -| time_elapsed | 142983 | -| total_timesteps | 3365376 | -| train/ | | -| approx_kl | 0.049130417 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -52.3 | -| learning_rate | 0.0003 | -| loss | 0.000298 | -| n_updates | 262910 | -| policy_gradient_loss | 0.0119 | -| std | 0.00601 | -| value_loss | 5.02e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26293 | -| time_elapsed | 142987 | -| total_timesteps | 3365504 | -| train/ | | -| approx_kl | 0.99703705 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.377 | -| learning_rate | 0.0003 | -| loss | 0.416 | -| n_updates | 262920 | -| policy_gradient_loss | 0.158 | -| std | 0.00601 | -| value_loss | 1.03e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26294 | -| time_elapsed | 142992 | -| total_timesteps | 3365632 | -| train/ | | -| approx_kl | 0.010125538 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.00033 | -| n_updates | 262930 | -| policy_gradient_loss | 0.0422 | -| std | 0.00602 | -| value_loss | 8.68e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26295 | -| time_elapsed | 142997 | -| total_timesteps | 3365760 | -| train/ | | -| approx_kl | 0.10189657 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.041 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 262940 | -| policy_gradient_loss | 0.0151 | -| std | 0.00602 | -| value_loss | 7.87e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.971 | -| time/ | | -| fps | 23 | -| iterations | 26296 | -| time_elapsed | 143002 | -| total_timesteps | 3365888 | -| train/ | | -| approx_kl | 3.5766046e-05 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0349 | -| learning_rate | 0.0003 | -| loss | -0.00043 | -| n_updates | 262950 | -| policy_gradient_loss | 0.0498 | -| std | 0.00602 | -| value_loss | 6.01e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26297 | -| time_elapsed | 143005 | -| total_timesteps | 3366016 | -| train/ | | -| approx_kl | 0.6505759 | -| clip_fraction | 0.521 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.197 | -| n_updates | 262960 | -| policy_gradient_loss | 0.062 | -| std | 0.00602 | -| value_loss | 3.43e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26298 | -| time_elapsed | 143017 | -| total_timesteps | 3366144 | -| train/ | | -| approx_kl | 0.025036678 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.82 | -| learning_rate | 0.0003 | -| loss | 0.00333 | -| n_updates | 262970 | -| policy_gradient_loss | 0.00425 | -| std | 0.00602 | -| value_loss | 0.00319 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26299 | -| time_elapsed | 143022 | -| total_timesteps | 3366272 | -| train/ | | -| approx_kl | 0.0064992593 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0124 | -| learning_rate | 0.0003 | -| loss | -0.00772 | -| n_updates | 262980 | -| policy_gradient_loss | 0.00666 | -| std | 0.00602 | -| value_loss | 0.00485 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26300 | -| time_elapsed | 143027 | -| total_timesteps | 3366400 | -| train/ | | -| approx_kl | 0.0015516249 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0688 | -| learning_rate | 0.0003 | -| loss | 0.0064 | -| n_updates | 262990 | -| policy_gradient_loss | 0.00447 | -| std | 0.00602 | -| value_loss | 7.74e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26301 | -| time_elapsed | 143030 | -| total_timesteps | 3366528 | -| train/ | | -| approx_kl | 0.06698108 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0144 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 263000 | -| policy_gradient_loss | 0.0128 | -| std | 0.00602 | -| value_loss | 1.5e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26302 | -| time_elapsed | 143034 | -| total_timesteps | 3366656 | -| train/ | | -| approx_kl | 0.010115126 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0406 | -| learning_rate | 0.0003 | -| loss | -0.000452 | -| n_updates | 263010 | -| policy_gradient_loss | 0.00684 | -| std | 0.00601 | -| value_loss | 8.12e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26303 | -| time_elapsed | 143040 | -| total_timesteps | 3366784 | -| train/ | | -| approx_kl | 0.003007248 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0649 | -| learning_rate | 0.0003 | -| loss | -0.000863 | -| n_updates | 263020 | -| policy_gradient_loss | 0.00984 | -| std | 0.00601 | -| value_loss | 4.44e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.966 | -| time/ | | -| fps | 23 | -| iterations | 26304 | -| time_elapsed | 143045 | -| total_timesteps | 3366912 | -| train/ | | -| approx_kl | 2.7809292e-06 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0848 | -| learning_rate | 0.0003 | -| loss | 0.000181 | -| n_updates | 263030 | -| policy_gradient_loss | 0.0272 | -| std | 0.00601 | -| value_loss | 4.43e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26305 | -| time_elapsed | 143050 | -| total_timesteps | 3367040 | -| train/ | | -| approx_kl | 0.22953318 | -| clip_fraction | 0.533 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0776 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 263040 | -| policy_gradient_loss | 0.0652 | -| std | 0.00601 | -| value_loss | 2.1e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26306 | -| time_elapsed | 143059 | -| total_timesteps | 3367168 | -| train/ | | -| approx_kl | 0.20586488 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.905 | -| learning_rate | 0.0003 | -| loss | -0.00786 | -| n_updates | 263050 | -| policy_gradient_loss | -0.00814 | -| std | 0.00601 | -| value_loss | 0.000513 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26307 | -| time_elapsed | 143065 | -| total_timesteps | 3367296 | -| train/ | | -| approx_kl | 0.03559897 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.46 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 263060 | -| policy_gradient_loss | 0.0337 | -| std | 0.00601 | -| value_loss | 5.33e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26308 | -| time_elapsed | 143070 | -| total_timesteps | 3367424 | -| train/ | | -| approx_kl | 0.03456209 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -6.78 | -| learning_rate | 0.0003 | -| loss | 0.00147 | -| n_updates | 263070 | -| policy_gradient_loss | 0.0111 | -| std | 0.00601 | -| value_loss | 3.77e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26309 | -| time_elapsed | 143075 | -| total_timesteps | 3367552 | -| train/ | | -| approx_kl | 0.0040048338 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.157 | -| learning_rate | 0.0003 | -| loss | -0.00116 | -| n_updates | 263080 | -| policy_gradient_loss | 0.00993 | -| std | 0.00602 | -| value_loss | 1.02e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26310 | -| time_elapsed | 143079 | -| total_timesteps | 3367680 | -| train/ | | -| approx_kl | 0.012345962 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0793 | -| learning_rate | 0.0003 | -| loss | -0.00586 | -| n_updates | 263090 | -| policy_gradient_loss | 0.0175 | -| std | 0.00603 | -| value_loss | 2.91e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26311 | -| time_elapsed | 143085 | -| total_timesteps | 3367808 | -| train/ | | -| approx_kl | 0.21176775 | -| clip_fraction | 0.401 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0076 | -| learning_rate | 0.0003 | -| loss | 0.122 | -| n_updates | 263100 | -| policy_gradient_loss | 0.0502 | -| std | 0.00604 | -| value_loss | 7.85e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26312 | -| time_elapsed | 143089 | -| total_timesteps | 3367936 | -| train/ | | -| approx_kl | 0.13294749 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.165 | -| learning_rate | 0.0003 | -| loss | 0.05 | -| n_updates | 263110 | -| policy_gradient_loss | 0.0143 | -| std | 0.00604 | -| value_loss | 4.12e-09 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26313 | -| time_elapsed | 143093 | -| total_timesteps | 3368064 | -| train/ | | -| approx_kl | 0.0021910318 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0563 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 263120 | -| policy_gradient_loss | 0.0154 | -| std | 0.00604 | -| value_loss | 2.49e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26314 | -| time_elapsed | 143101 | -| total_timesteps | 3368192 | -| train/ | | -| approx_kl | 0.59062046 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.296 | -| learning_rate | 0.0003 | -| loss | 0.348 | -| n_updates | 263130 | -| policy_gradient_loss | 0.211 | -| std | 0.00604 | -| value_loss | 0.0148 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26315 | -| time_elapsed | 143106 | -| total_timesteps | 3368320 | -| train/ | | -| approx_kl | 0.08815586 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.6 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 263140 | -| policy_gradient_loss | 0.0306 | -| std | 0.00604 | -| value_loss | 0.000104 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26316 | -| time_elapsed | 143113 | -| total_timesteps | 3368448 | -| train/ | | -| approx_kl | 0.682119 | -| clip_fraction | 0.565 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00243 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 263150 | -| policy_gradient_loss | 0.065 | -| std | 0.00604 | -| value_loss | 2.87e-05 | --------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26317 | -| time_elapsed | 143117 | -| total_timesteps | 3368576 | -| train/ | | -| approx_kl | 0.0149955265 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00153 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 263160 | -| policy_gradient_loss | 0.0061 | -| std | 0.00604 | -| value_loss | 1.07e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26318 | -| time_elapsed | 143122 | -| total_timesteps | 3368704 | -| train/ | | -| approx_kl | 0.0038330671 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0473 | -| learning_rate | 0.0003 | -| loss | -0.00636 | -| n_updates | 263170 | -| policy_gradient_loss | 0.0107 | -| std | 0.00604 | -| value_loss | 8.4e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26319 | -| time_elapsed | 143127 | -| total_timesteps | 3368832 | -| train/ | | -| approx_kl | 0.09348347 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0453 | -| learning_rate | 0.0003 | -| loss | 0.0434 | -| n_updates | 263180 | -| policy_gradient_loss | 0.0111 | -| std | 0.00604 | -| value_loss | 6.03e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.973 | -| time/ | | -| fps | 23 | -| iterations | 26320 | -| time_elapsed | 143131 | -| total_timesteps | 3368960 | -| train/ | | -| approx_kl | 0.00812185 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.00817 | -| n_updates | 263190 | -| policy_gradient_loss | 0.0146 | -| std | 0.00604 | -| value_loss | 2.59e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26321 | -| time_elapsed | 143137 | -| total_timesteps | 3369088 | -| train/ | | -| approx_kl | 0.0067029083 | -| clip_fraction | 0.157 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.106 | -| learning_rate | 0.0003 | -| loss | 0.00285 | -| n_updates | 263200 | -| policy_gradient_loss | 0.00628 | -| std | 0.00602 | -| value_loss | 1.47e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26322 | -| time_elapsed | 143145 | -| total_timesteps | 3369216 | -| train/ | | -| approx_kl | 0.0576183 | -| clip_fraction | 0.457 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.801 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 263210 | -| policy_gradient_loss | 0.0112 | -| std | 0.00599 | -| value_loss | 0.000838 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26323 | -| time_elapsed | 143150 | -| total_timesteps | 3369344 | -| train/ | | -| approx_kl | 0.18167076 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.115 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 263220 | -| policy_gradient_loss | 0.0907 | -| std | 0.00599 | -| value_loss | 2.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26324 | -| time_elapsed | 143155 | -| total_timesteps | 3369472 | -| train/ | | -| approx_kl | 0.051854953 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 263230 | -| policy_gradient_loss | 0.0327 | -| std | 0.00599 | -| value_loss | 3.55e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26325 | -| time_elapsed | 143160 | -| total_timesteps | 3369600 | -| train/ | | -| approx_kl | 1.1236745 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0738 | -| learning_rate | 0.0003 | -| loss | 0.377 | -| n_updates | 263240 | -| policy_gradient_loss | 0.149 | -| std | 0.00599 | -| value_loss | 2.59e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26326 | -| time_elapsed | 143165 | -| total_timesteps | 3369728 | -| train/ | | -| approx_kl | 0.009965591 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0504 | -| learning_rate | 0.0003 | -| loss | -0.0021 | -| n_updates | 263250 | -| policy_gradient_loss | 0.0376 | -| std | 0.00599 | -| value_loss | 2.01e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26327 | -| time_elapsed | 143169 | -| total_timesteps | 3369856 | -| train/ | | -| approx_kl | 0.11611386 | -| clip_fraction | 0.332 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0456 | -| n_updates | 263260 | -| policy_gradient_loss | 0.0266 | -| std | 0.00599 | -| value_loss | 1.51e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.976 | -| time/ | | -| fps | 23 | -| iterations | 26328 | -| time_elapsed | 143174 | -| total_timesteps | 3369984 | -| train/ | | -| approx_kl | 4.7891866e-05 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0494 | -| learning_rate | 0.0003 | -| loss | -0.000704 | -| n_updates | 263270 | -| policy_gradient_loss | 0.0382 | -| std | 0.00599 | -| value_loss | 1.21e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26329 | -| time_elapsed | 143179 | -| total_timesteps | 3370112 | -| train/ | | -| approx_kl | 0.16550203 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0379 | -| learning_rate | 0.0003 | -| loss | 0.0673 | -| n_updates | 263280 | -| policy_gradient_loss | 0.0195 | -| std | 0.00599 | -| value_loss | 6.95e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26330 | -| time_elapsed | 143192 | -| total_timesteps | 3370240 | -| train/ | | -| approx_kl | 0.009125315 | -| clip_fraction | 0.182 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.815 | -| learning_rate | 0.0003 | -| loss | -0.00909 | -| n_updates | 263290 | -| policy_gradient_loss | -0.00653 | -| std | 0.00598 | -| value_loss | 0.005 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26331 | -| time_elapsed | 143197 | -| total_timesteps | 3370368 | -| train/ | | -| approx_kl | 0.019919785 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.37 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 263300 | -| policy_gradient_loss | 0.0267 | -| std | 0.00598 | -| value_loss | 1.46e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26332 | -| time_elapsed | 143201 | -| total_timesteps | 3370496 | -| train/ | | -| approx_kl | 0.048110697 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00862 | -| learning_rate | 0.0003 | -| loss | 0.0415 | -| n_updates | 263310 | -| policy_gradient_loss | 0.00797 | -| std | 0.00598 | -| value_loss | 4.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26333 | -| time_elapsed | 143206 | -| total_timesteps | 3370624 | -| train/ | | -| approx_kl | 0.09238382 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0455 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 263320 | -| policy_gradient_loss | 0.0367 | -| std | 0.00598 | -| value_loss | 2.08e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26334 | -| time_elapsed | 143211 | -| total_timesteps | 3370752 | -| train/ | | -| approx_kl | 0.018712614 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | -0.0412 | -| n_updates | 263330 | -| policy_gradient_loss | -0.00741 | -| std | 0.00598 | -| value_loss | 1.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26335 | -| time_elapsed | 143216 | -| total_timesteps | 3370880 | -| train/ | | -| approx_kl | 0.023385098 | -| clip_fraction | 0.344 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.068 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 263340 | -| policy_gradient_loss | 0.032 | -| std | 0.00598 | -| value_loss | 8.73e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26336 | -| time_elapsed | 143220 | -| total_timesteps | 3371008 | -| train/ | | -| approx_kl | 0.5228834 | -| clip_fraction | 0.695 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.173 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 263350 | -| policy_gradient_loss | 0.128 | -| std | 0.00598 | -| value_loss | 4.25e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26337 | -| time_elapsed | 143230 | -| total_timesteps | 3371136 | -| train/ | | -| approx_kl | 0.4589459 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.967 | -| learning_rate | 0.0003 | -| loss | 0.0191 | -| n_updates | 263360 | -| policy_gradient_loss | 0.0283 | -| std | 0.00598 | -| value_loss | 0.000242 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26338 | -| time_elapsed | 143234 | -| total_timesteps | 3371264 | -| train/ | | -| approx_kl | 0.73905396 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.976 | -| learning_rate | 0.0003 | -| loss | 0.27 | -| n_updates | 263370 | -| policy_gradient_loss | 0.172 | -| std | 0.00598 | -| value_loss | 1.8e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26339 | -| time_elapsed | 143239 | -| total_timesteps | 3371392 | -| train/ | | -| approx_kl | 0.3203298 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -28.9 | -| learning_rate | 0.0003 | -| loss | 0.299 | -| n_updates | 263380 | -| policy_gradient_loss | 0.177 | -| std | 0.00598 | -| value_loss | 5.09e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26340 | -| time_elapsed | 143243 | -| total_timesteps | 3371520 | -| train/ | | -| approx_kl | 0.18050998 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -7.9 | -| learning_rate | 0.0003 | -| loss | 0.0853 | -| n_updates | 263390 | -| policy_gradient_loss | 0.0678 | -| std | 0.00598 | -| value_loss | 3.55e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26341 | -| time_elapsed | 143248 | -| total_timesteps | 3371648 | -| train/ | | -| approx_kl | 0.18168736 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0286 | -| learning_rate | 0.0003 | -| loss | 0.117 | -| n_updates | 263400 | -| policy_gradient_loss | 0.165 | -| std | 0.00598 | -| value_loss | 3.27e-10 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26342 | -| time_elapsed | 143253 | -| total_timesteps | 3371776 | -| train/ | | -| approx_kl | 0.03788119 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.0165 | -| n_updates | 263410 | -| policy_gradient_loss | 0.0403 | -| std | 0.00598 | -| value_loss | 2.81e-10 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.985 | -| time/ | | -| fps | 23 | -| iterations | 26343 | -| time_elapsed | 143259 | -| total_timesteps | 3371904 | -| train/ | | -| approx_kl | 0.0005747187 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.00344 | -| n_updates | 263420 | -| policy_gradient_loss | 0.0459 | -| std | 0.00598 | -| value_loss | 1.73e-10 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26344 | -| time_elapsed | 143264 | -| total_timesteps | 3372032 | -| train/ | | -| approx_kl | 0.00135649 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0806 | -| learning_rate | 0.0003 | -| loss | -0.000994 | -| n_updates | 263430 | -| policy_gradient_loss | 0.0463 | -| std | 0.00598 | -| value_loss | 9.38e-11 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26345 | -| time_elapsed | 143275 | -| total_timesteps | 3372160 | -| train/ | | -| approx_kl | 0.045608032 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.769 | -| learning_rate | 0.0003 | -| loss | 0.000229 | -| n_updates | 263440 | -| policy_gradient_loss | -0.00305 | -| std | 0.00597 | -| value_loss | 0.00809 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26346 | -| time_elapsed | 143280 | -| total_timesteps | 3372288 | -| train/ | | -| approx_kl | 0.008341361 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.615 | -| learning_rate | 0.0003 | -| loss | -0.00124 | -| n_updates | 263450 | -| policy_gradient_loss | 0.00572 | -| std | 0.00597 | -| value_loss | 0.000126 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26347 | -| time_elapsed | 143286 | -| total_timesteps | 3372416 | -| train/ | | -| approx_kl | 0.10058978 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.0521 | -| n_updates | 263460 | -| policy_gradient_loss | 0.0192 | -| std | 0.00597 | -| value_loss | 1.25e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26348 | -| time_elapsed | 143289 | -| total_timesteps | 3372544 | -| train/ | | -| approx_kl | 0.017169466 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | -0.036 | -| n_updates | 263470 | -| policy_gradient_loss | -0.000787 | -| std | 0.00597 | -| value_loss | 1.14e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26349 | -| time_elapsed | 143294 | -| total_timesteps | 3372672 | -| train/ | | -| approx_kl | 0.10126903 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0617 | -| learning_rate | 0.0003 | -| loss | 0.0356 | -| n_updates | 263480 | -| policy_gradient_loss | 0.0115 | -| std | 0.00597 | -| value_loss | 7.08e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26350 | -| time_elapsed | 143300 | -| total_timesteps | 3372800 | -| train/ | | -| approx_kl | 0.3196962 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0618 | -| learning_rate | 0.0003 | -| loss | 0.193 | -| n_updates | 263490 | -| policy_gradient_loss | 0.0439 | -| std | 0.00597 | -| value_loss | 5.38e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.978 | -| time/ | | -| fps | 23 | -| iterations | 26351 | -| time_elapsed | 143306 | -| total_timesteps | 3372928 | -| train/ | | -| approx_kl | 0.0014505112 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.000758 | -| n_updates | 263500 | -| policy_gradient_loss | 0.0411 | -| std | 0.00597 | -| value_loss | 3.77e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26352 | -| time_elapsed | 143310 | -| total_timesteps | 3373056 | -| train/ | | -| approx_kl | 0.45376801 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.246 | -| learning_rate | 0.0003 | -| loss | 0.108 | -| n_updates | 263510 | -| policy_gradient_loss | 0.0365 | -| std | 0.00597 | -| value_loss | 1.72e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26353 | -| time_elapsed | 143317 | -| total_timesteps | 3373184 | -| train/ | | -| approx_kl | 0.0018715528 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.44 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 263520 | -| policy_gradient_loss | 0.0021 | -| std | 0.00597 | -| value_loss | 0.00519 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26354 | -| time_elapsed | 143322 | -| total_timesteps | 3373312 | -| train/ | | -| approx_kl | 0.023546888 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00849 | -| n_updates | 263530 | -| policy_gradient_loss | 0.00261 | -| std | 0.00597 | -| value_loss | 6.94e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26355 | -| time_elapsed | 143327 | -| total_timesteps | 3373440 | -| train/ | | -| approx_kl | 0.08789314 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.45 | -| learning_rate | 0.0003 | -| loss | 0.03 | -| n_updates | 263540 | -| policy_gradient_loss | 0.0127 | -| std | 0.00597 | -| value_loss | 1.63e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26356 | -| time_elapsed | 143332 | -| total_timesteps | 3373568 | -| train/ | | -| approx_kl | 0.05580241 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.393 | -| learning_rate | 0.0003 | -| loss | 0.0278 | -| n_updates | 263550 | -| policy_gradient_loss | 0.0131 | -| std | 0.00598 | -| value_loss | 9.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26357 | -| time_elapsed | 143337 | -| total_timesteps | 3373696 | -| train/ | | -| approx_kl | 0.012857217 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0198 | -| learning_rate | 0.0003 | -| loss | -0.00869 | -| n_updates | 263560 | -| policy_gradient_loss | 0.00635 | -| std | 0.00598 | -| value_loss | 6.2e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26358 | -| time_elapsed | 143342 | -| total_timesteps | 3373824 | -| train/ | | -| approx_kl | 0.001042047 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0158 | -| learning_rate | 0.0003 | -| loss | 0.00459 | -| n_updates | 263570 | -| policy_gradient_loss | 0.00661 | -| std | 0.00598 | -| value_loss | 1.4e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.988 | -| time/ | | -| fps | 23 | -| iterations | 26359 | -| time_elapsed | 143346 | -| total_timesteps | 3373952 | -| train/ | | -| approx_kl | 0.07403425 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0333 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 263580 | -| policy_gradient_loss | 0.0116 | -| std | 0.00599 | -| value_loss | 6.46e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26360 | -| time_elapsed | 143350 | -| total_timesteps | 3374080 | -| train/ | | -| approx_kl | 0.011151176 | -| clip_fraction | 0.232 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | -0.00201 | -| n_updates | 263590 | -| policy_gradient_loss | 0.00709 | -| std | 0.00599 | -| value_loss | 4.41e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26361 | -| time_elapsed | 143360 | -| total_timesteps | 3374208 | -| train/ | | -| approx_kl | 0.016123781 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | -0.00978 | -| n_updates | 263600 | -| policy_gradient_loss | 0.0118 | -| std | 0.00599 | -| value_loss | 0.00179 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26362 | -| time_elapsed | 143365 | -| total_timesteps | 3374336 | -| train/ | | -| approx_kl | 1.1389225 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.04 | -| learning_rate | 0.0003 | -| loss | 0.239 | -| n_updates | 263610 | -| policy_gradient_loss | 0.146 | -| std | 0.00599 | -| value_loss | 9.24e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26363 | -| time_elapsed | 143370 | -| total_timesteps | 3374464 | -| train/ | | -| approx_kl | 0.0036708838 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.00732 | -| n_updates | 263620 | -| policy_gradient_loss | 0.0267 | -| std | 0.006 | -| value_loss | 8.33e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26364 | -| time_elapsed | 143375 | -| total_timesteps | 3374592 | -| train/ | | -| approx_kl | 0.22831956 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0217 | -| learning_rate | 0.0003 | -| loss | 0.0984 | -| n_updates | 263630 | -| policy_gradient_loss | 0.035 | -| std | 0.006 | -| value_loss | 5.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26365 | -| time_elapsed | 143380 | -| total_timesteps | 3374720 | -| train/ | | -| approx_kl | 0.016711934 | -| clip_fraction | 0.116 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0511 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 263640 | -| policy_gradient_loss | 0.000274 | -| std | 0.006 | -| value_loss | 3.1e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26366 | -| time_elapsed | 143385 | -| total_timesteps | 3374848 | -| train/ | | -| approx_kl | 0.02061719 | -| clip_fraction | 0.152 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | -0.0249 | -| n_updates | 263650 | -| policy_gradient_loss | -0.0128 | -| std | 0.006 | -| value_loss | 2.36e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.975 | -| time/ | | -| fps | 23 | -| iterations | 26367 | -| time_elapsed | 143389 | -| total_timesteps | 3374976 | -| train/ | | -| approx_kl | 0.015253382 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | -0.00435 | -| n_updates | 263660 | -| policy_gradient_loss | -0.00224 | -| std | 0.006 | -| value_loss | 1.72e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26368 | -| time_elapsed | 143394 | -| total_timesteps | 3375104 | -| train/ | | -| approx_kl | 0.017193045 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.058 | -| learning_rate | 0.0003 | -| loss | -0.00883 | -| n_updates | 263670 | -| policy_gradient_loss | -0.00447 | -| std | 0.006 | -| value_loss | 1.27e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26369 | -| time_elapsed | 143405 | -| total_timesteps | 3375232 | -| train/ | | -| approx_kl | 0.16492158 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.805 | -| learning_rate | 0.0003 | -| loss | 0.0366 | -| n_updates | 263680 | -| policy_gradient_loss | 0.0265 | -| std | 0.006 | -| value_loss | 0.00102 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26370 | -| time_elapsed | 143409 | -| total_timesteps | 3375360 | -| train/ | | -| approx_kl | 0.055182632 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.182 | -| learning_rate | 0.0003 | -| loss | 0.059 | -| n_updates | 263690 | -| policy_gradient_loss | 0.0221 | -| std | 0.00598 | -| value_loss | 0.000734 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26371 | -| time_elapsed | 143414 | -| total_timesteps | 3375488 | -| train/ | | -| approx_kl | 0.057231486 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.76 | -| learning_rate | 0.0003 | -| loss | 0.0393 | -| n_updates | 263700 | -| policy_gradient_loss | 0.0479 | -| std | 0.00597 | -| value_loss | 0.000353 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26372 | -| time_elapsed | 143419 | -| total_timesteps | 3375616 | -| train/ | | -| approx_kl | 0.38420618 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0139 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 263710 | -| policy_gradient_loss | 0.135 | -| std | 0.00597 | -| value_loss | 3.7e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26373 | -| time_elapsed | 143424 | -| total_timesteps | 3375744 | -| train/ | | -| approx_kl | 0.06258304 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0403 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 263720 | -| policy_gradient_loss | 0.0288 | -| std | 0.00597 | -| value_loss | 3.39e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.981 | -| time/ | | -| fps | 23 | -| iterations | 26374 | -| time_elapsed | 143427 | -| total_timesteps | 3375872 | -| train/ | | -| approx_kl | 0.83723974 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 263730 | -| policy_gradient_loss | 0.0634 | -| std | 0.00597 | -| value_loss | 2.83e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26375 | -| time_elapsed | 143432 | -| total_timesteps | 3376000 | -| train/ | | -| approx_kl | 0.052113008 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0306 | -| learning_rate | 0.0003 | -| loss | -0.00529 | -| n_updates | 263740 | -| policy_gradient_loss | -0.000867 | -| std | 0.00597 | -| value_loss | 2.13e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26376 | -| time_elapsed | 143435 | -| total_timesteps | 3376128 | -| train/ | | -| approx_kl | 0.09047824 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00466 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 263750 | -| policy_gradient_loss | 0.0174 | -| std | 0.00597 | -| value_loss | 0.000109 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26377 | -| time_elapsed | 143447 | -| total_timesteps | 3376256 | -| train/ | | -| approx_kl | 0.013769116 | -| clip_fraction | 0.22 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | -0.0126 | -| n_updates | 263760 | -| policy_gradient_loss | 0.00964 | -| std | 0.00597 | -| value_loss | 0.000965 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26378 | -| time_elapsed | 143452 | -| total_timesteps | 3376384 | -| train/ | | -| approx_kl | 0.13181382 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.247 | -| learning_rate | 0.0003 | -| loss | 0.0275 | -| n_updates | 263770 | -| policy_gradient_loss | 0.0465 | -| std | 0.00597 | -| value_loss | 3.3e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26379 | -| time_elapsed | 143457 | -| total_timesteps | 3376512 | -| train/ | | -| approx_kl | 0.13989525 | -| clip_fraction | 0.368 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | 0.0951 | -| n_updates | 263780 | -| policy_gradient_loss | 0.0425 | -| std | 0.00596 | -| value_loss | 8.1e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26380 | -| time_elapsed | 143462 | -| total_timesteps | 3376640 | -| train/ | | -| approx_kl | 0.1735119 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 263790 | -| policy_gradient_loss | 0.0125 | -| std | 0.00596 | -| value_loss | 3.14e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26381 | -| time_elapsed | 143466 | -| total_timesteps | 3376768 | -| train/ | | -| approx_kl | 0.07714682 | -| clip_fraction | 0.529 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.472 | -| learning_rate | 0.0003 | -| loss | 0.0285 | -| n_updates | 263800 | -| policy_gradient_loss | 0.0421 | -| std | 0.00596 | -| value_loss | 7.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.974 | -| time/ | | -| fps | 23 | -| iterations | 26382 | -| time_elapsed | 143471 | -| total_timesteps | 3376896 | -| train/ | | -| approx_kl | 0.16060849 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.328 | -| learning_rate | 0.0003 | -| loss | 0.0636 | -| n_updates | 263810 | -| policy_gradient_loss | 0.0287 | -| std | 0.00596 | -| value_loss | 1.25e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26383 | -| time_elapsed | 143476 | -| total_timesteps | 3377024 | -| train/ | | -| approx_kl | 0.17776449 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.0559 | -| n_updates | 263820 | -| policy_gradient_loss | 0.0191 | -| std | 0.00596 | -| value_loss | 1.12e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26384 | -| time_elapsed | 143489 | -| total_timesteps | 3377152 | -| train/ | | -| approx_kl | 0.5227119 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.66 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 263830 | -| policy_gradient_loss | 0.00605 | -| std | 0.00596 | -| value_loss | 0.0157 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26385 | -| time_elapsed | 143495 | -| total_timesteps | 3377280 | -| train/ | | -| approx_kl | 0.1766225 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00626 | -| learning_rate | 0.0003 | -| loss | 0.0984 | -| n_updates | 263840 | -| policy_gradient_loss | 0.0334 | -| std | 0.00596 | -| value_loss | 0.000479 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26386 | -| time_elapsed | 143499 | -| total_timesteps | 3377408 | -| train/ | | -| approx_kl | 0.036420666 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.069 | -| learning_rate | 0.0003 | -| loss | 0.0264 | -| n_updates | 263850 | -| policy_gradient_loss | 0.0503 | -| std | 0.00596 | -| value_loss | 5.62e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26387 | -| time_elapsed | 143503 | -| total_timesteps | 3377536 | -| train/ | | -| approx_kl | 0.57288194 | -| clip_fraction | 0.711 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00815 | -| learning_rate | 0.0003 | -| loss | 0.207 | -| n_updates | 263860 | -| policy_gradient_loss | 0.146 | -| std | 0.00598 | -| value_loss | 0.00576 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26388 | -| time_elapsed | 143507 | -| total_timesteps | 3377664 | -| train/ | | -| approx_kl | 0.117753595 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.8 | -| learning_rate | 0.0003 | -| loss | 0.0143 | -| n_updates | 263870 | -| policy_gradient_loss | 0.0225 | -| std | 0.00598 | -| value_loss | 0.00052 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26389 | -| time_elapsed | 143512 | -| total_timesteps | 3377792 | -| train/ | | -| approx_kl | 0.19045076 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0145 | -| learning_rate | 0.0003 | -| loss | 0.0623 | -| n_updates | 263880 | -| policy_gradient_loss | 0.0194 | -| std | 0.00599 | -| value_loss | 0.000161 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.977 | -| time/ | | -| fps | 23 | -| iterations | 26390 | -| time_elapsed | 143518 | -| total_timesteps | 3377920 | -| train/ | | -| approx_kl | 0.03596318 | -| clip_fraction | 0.486 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.0274 | -| n_updates | 263890 | -| policy_gradient_loss | 0.0566 | -| std | 0.00599 | -| value_loss | 7.97e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26391 | -| time_elapsed | 143523 | -| total_timesteps | 3378048 | -| train/ | | -| approx_kl | 0.3670889 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 263900 | -| policy_gradient_loss | 0.101 | -| std | 0.00599 | -| value_loss | 7.69e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26392 | -| time_elapsed | 143532 | -| total_timesteps | 3378176 | -| train/ | | -| approx_kl | 0.022335887 | -| clip_fraction | 0.429 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.909 | -| learning_rate | 0.0003 | -| loss | -0.0132 | -| n_updates | 263910 | -| policy_gradient_loss | 0.0129 | -| std | 0.00599 | -| value_loss | 0.000715 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26393 | -| time_elapsed | 143538 | -| total_timesteps | 3378304 | -| train/ | | -| approx_kl | 0.8306016 | -| clip_fraction | 0.795 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0945 | -| learning_rate | 0.0003 | -| loss | 0.411 | -| n_updates | 263920 | -| policy_gradient_loss | 0.225 | -| std | 0.00599 | -| value_loss | 2.35e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26394 | -| time_elapsed | 143543 | -| total_timesteps | 3378432 | -| train/ | | -| approx_kl | 0.083801426 | -| clip_fraction | 0.197 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0819 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 263930 | -| policy_gradient_loss | 0.0127 | -| std | 0.00599 | -| value_loss | 2.05e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26395 | -| time_elapsed | 143550 | -| total_timesteps | 3378560 | -| train/ | | -| approx_kl | 0.77829623 | -| clip_fraction | 0.574 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0573 | -| learning_rate | 0.0003 | -| loss | 0.218 | -| n_updates | 263940 | -| policy_gradient_loss | 0.0773 | -| std | 0.00599 | -| value_loss | 1.58e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26396 | -| time_elapsed | 143554 | -| total_timesteps | 3378688 | -| train/ | | -| approx_kl | 0.06803902 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0426 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 263950 | -| policy_gradient_loss | 0.00838 | -| std | 0.00599 | -| value_loss | 1.21e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26397 | -| time_elapsed | 143560 | -| total_timesteps | 3378816 | -| train/ | | -| approx_kl | 0.06337352 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0545 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 263960 | -| policy_gradient_loss | 0.0126 | -| std | 0.00599 | -| value_loss | 8.68e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.987 | -| time/ | | -| fps | 23 | -| iterations | 26398 | -| time_elapsed | 143566 | -| total_timesteps | 3378944 | -| train/ | | -| approx_kl | 0.05724067 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0485 | -| learning_rate | 0.0003 | -| loss | 0.0294 | -| n_updates | 263970 | -| policy_gradient_loss | 0.014 | -| std | 0.00599 | -| value_loss | 6.54e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26399 | -| time_elapsed | 143570 | -| total_timesteps | 3379072 | -| train/ | | -| approx_kl | 0.0110959215 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0542 | -| learning_rate | 0.0003 | -| loss | -0.00922 | -| n_updates | 263980 | -| policy_gradient_loss | 0.00651 | -| std | 0.006 | -| value_loss | 5.04e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26400 | -| time_elapsed | 143579 | -| total_timesteps | 3379200 | -| train/ | | -| approx_kl | 0.019820556 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.79 | -| learning_rate | 0.0003 | -| loss | 0.00313 | -| n_updates | 263990 | -| policy_gradient_loss | -0.002 | -| std | 0.006 | -| value_loss | 0.00523 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26401 | -| time_elapsed | 143584 | -| total_timesteps | 3379328 | -| train/ | | -| approx_kl | 0.00038461527 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -4.82 | -| learning_rate | 0.0003 | -| loss | -0.00383 | -| n_updates | 264000 | -| policy_gradient_loss | -0.00641 | -| std | 0.006 | -| value_loss | 1.96e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26402 | -| time_elapsed | 143589 | -| total_timesteps | 3379456 | -| train/ | | -| approx_kl | 0.011035429 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -18.9 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 264010 | -| policy_gradient_loss | 0.00512 | -| std | 0.006 | -| value_loss | 5.66e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26403 | -| time_elapsed | 143594 | -| total_timesteps | 3379584 | -| train/ | | -| approx_kl | 0.08640565 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.023 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 264020 | -| policy_gradient_loss | 0.025 | -| std | 0.00599 | -| value_loss | 1.13e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26404 | -| time_elapsed | 143599 | -| total_timesteps | 3379712 | -| train/ | | -| approx_kl | 0.017127687 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0625 | -| learning_rate | 0.0003 | -| loss | 0.00272 | -| n_updates | 264030 | -| policy_gradient_loss | 0.0118 | -| std | 0.00599 | -| value_loss | 7.49e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26405 | -| time_elapsed | 143603 | -| total_timesteps | 3379840 | -| train/ | | -| approx_kl | 0.0009674551 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | 0.00313 | -| n_updates | 264040 | -| policy_gradient_loss | 0.00735 | -| std | 0.00599 | -| value_loss | 6.5e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.99 | -| time/ | | -| fps | 23 | -| iterations | 26406 | -| time_elapsed | 143607 | -| total_timesteps | 3379968 | -| train/ | | -| approx_kl | 0.008392636 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | -0.00668 | -| n_updates | 264050 | -| policy_gradient_loss | 0.0101 | -| std | 0.006 | -| value_loss | 3.86e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26407 | -| time_elapsed | 143612 | -| total_timesteps | 3380096 | -| train/ | | -| approx_kl | 0.0015593707 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0586 | -| learning_rate | 0.0003 | -| loss | 0.00559 | -| n_updates | 264060 | -| policy_gradient_loss | 0.00709 | -| std | 0.00599 | -| value_loss | 3.49e-09 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26408 | -| time_elapsed | 143624 | -| total_timesteps | 3380224 | -| train/ | | -| approx_kl | 0.04107132 | -| clip_fraction | 0.346 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.902 | -| learning_rate | 0.0003 | -| loss | 0.0303 | -| n_updates | 264070 | -| policy_gradient_loss | 0.0243 | -| std | 0.00599 | -| value_loss | 0.0017 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26409 | -| time_elapsed | 143630 | -| total_timesteps | 3380352 | -| train/ | | -| approx_kl | 0.20711008 | -| clip_fraction | 0.719 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.499 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 264080 | -| policy_gradient_loss | 0.168 | -| std | 0.00599 | -| value_loss | 6.61e-05 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26410 | -| time_elapsed | 143634 | -| total_timesteps | 3380480 | -| train/ | | -| approx_kl | 0.171245 | -| clip_fraction | 0.702 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00112 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 264090 | -| policy_gradient_loss | 0.151 | -| std | 0.00599 | -| value_loss | 2.24e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26411 | -| time_elapsed | 143638 | -| total_timesteps | 3380608 | -| train/ | | -| approx_kl | 0.19003361 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00397 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 264100 | -| policy_gradient_loss | 0.166 | -| std | 0.00599 | -| value_loss | 1.44e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26412 | -| time_elapsed | 143643 | -| total_timesteps | 3380736 | -| train/ | | -| approx_kl | 0.031195614 | -| clip_fraction | 0.441 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0154 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 264110 | -| policy_gradient_loss | 0.0312 | -| std | 0.00599 | -| value_loss | 1.19e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26413 | -| time_elapsed | 143648 | -| total_timesteps | 3380864 | -| train/ | | -| approx_kl | 0.9335472 | -| clip_fraction | 0.581 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 264120 | -| policy_gradient_loss | 0.0767 | -| std | 0.00599 | -| value_loss | 9.44e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.993 | -| time/ | | -| fps | 23 | -| iterations | 26414 | -| time_elapsed | 143654 | -| total_timesteps | 3380992 | -| train/ | | -| approx_kl | 0.06822946 | -| clip_fraction | 0.296 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0268 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 264130 | -| policy_gradient_loss | 0.02 | -| std | 0.006 | -| value_loss | 6.41e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26415 | -| time_elapsed | 143659 | -| total_timesteps | 3381120 | -| train/ | | -| approx_kl | 0.016368575 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | 0.00927 | -| n_updates | 264140 | -| policy_gradient_loss | 0.011 | -| std | 0.00599 | -| value_loss | 5.47e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26416 | -| time_elapsed | 143671 | -| total_timesteps | 3381248 | -| train/ | | -| approx_kl | 0.09089409 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -3.23 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 264150 | -| policy_gradient_loss | -0.00624 | -| std | 0.00599 | -| value_loss | 0.0042 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26417 | -| time_elapsed | 143676 | -| total_timesteps | 3381376 | -| train/ | | -| approx_kl | 0.061887003 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | 0.00629 | -| n_updates | 264160 | -| policy_gradient_loss | 0.00304 | -| std | 0.00599 | -| value_loss | 3.58e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26418 | -| time_elapsed | 143681 | -| total_timesteps | 3381504 | -| train/ | | -| approx_kl | 0.014227152 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -2.03 | -| learning_rate | 0.0003 | -| loss | 0.00476 | -| n_updates | 264170 | -| policy_gradient_loss | 0.00617 | -| std | 0.006 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26419 | -| time_elapsed | 143685 | -| total_timesteps | 3381632 | -| train/ | | -| approx_kl | 0.0033179163 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -5.66 | -| learning_rate | 0.0003 | -| loss | -0.00749 | -| n_updates | 264180 | -| policy_gradient_loss | 0.0176 | -| std | 0.006 | -| value_loss | 7.95e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26420 | -| time_elapsed | 143690 | -| total_timesteps | 3381760 | -| train/ | | -| approx_kl | 0.0016223011 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0464 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 264190 | -| policy_gradient_loss | 0.0134 | -| std | 0.006 | -| value_loss | 3.38e-09 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.998 | -| time/ | | -| fps | 23 | -| iterations | 26421 | -| time_elapsed | 143694 | -| total_timesteps | 3381888 | -| train/ | | -| approx_kl | 2.4978071e-06 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0372 | -| learning_rate | 0.0003 | -| loss | -0.000222 | -| n_updates | 264200 | -| policy_gradient_loss | 0.055 | -| std | 0.006 | -| value_loss | 2.68e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26422 | -| time_elapsed | 143699 | -| total_timesteps | 3382016 | -| train/ | | -| approx_kl | 0.22134393 | -| clip_fraction | 0.512 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0356 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 264210 | -| policy_gradient_loss | 0.0607 | -| std | 0.006 | -| value_loss | 1.82e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26423 | -| time_elapsed | 143711 | -| total_timesteps | 3382144 | -| train/ | | -| approx_kl | 0.015786514 | -| clip_fraction | 0.254 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.951 | -| learning_rate | 0.0003 | -| loss | 0.0113 | -| n_updates | 264220 | -| policy_gradient_loss | 0.00835 | -| std | 0.006 | -| value_loss | 0.00306 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26424 | -| time_elapsed | 143716 | -| total_timesteps | 3382272 | -| train/ | | -| approx_kl | 0.008028329 | -| clip_fraction | 0.356 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.2 | -| learning_rate | 0.0003 | -| loss | -0.0111 | -| n_updates | 264230 | -| policy_gradient_loss | 0.0037 | -| std | 0.006 | -| value_loss | 1.13e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26425 | -| time_elapsed | 143722 | -| total_timesteps | 3382400 | -| train/ | | -| approx_kl | 2.0303763e-05 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.000549 | -| n_updates | 264240 | -| policy_gradient_loss | 0.0186 | -| std | 0.006 | -| value_loss | 2.86e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26426 | -| time_elapsed | 143728 | -| total_timesteps | 3382528 | -| train/ | | -| approx_kl | 0.24034572 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0141 | -| learning_rate | 0.0003 | -| loss | 0.184 | -| n_updates | 264250 | -| policy_gradient_loss | 0.0502 | -| std | 0.006 | -| value_loss | 1.9e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26427 | -| time_elapsed | 143732 | -| total_timesteps | 3382656 | -| train/ | | -| approx_kl | 0.00081658363 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0446 | -| learning_rate | 0.0003 | -| loss | 0.000505 | -| n_updates | 264260 | -| policy_gradient_loss | 0.0291 | -| std | 0.006 | -| value_loss | 9.04e-08 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26428 | -| time_elapsed | 143736 | -| total_timesteps | 3382784 | -| train/ | | -| approx_kl | 0.00041890098 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0784 | -| learning_rate | 0.0003 | -| loss | 0.00112 | -| n_updates | 264270 | -| policy_gradient_loss | 0.0475 | -| std | 0.006 | -| value_loss | 8.84e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.995 | -| time/ | | -| fps | 23 | -| iterations | 26429 | -| time_elapsed | 143742 | -| total_timesteps | 3382912 | -| train/ | | -| approx_kl | 0.23125277 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0385 | -| learning_rate | 0.0003 | -| loss | 0.0592 | -| n_updates | 264280 | -| policy_gradient_loss | 0.0148 | -| std | 0.006 | -| value_loss | 7.58e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26430 | -| time_elapsed | 143746 | -| total_timesteps | 3383040 | -| train/ | | -| approx_kl | 0.026640646 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.00442 | -| n_updates | 264290 | -| policy_gradient_loss | -0.000368 | -| std | 0.006 | -| value_loss | 5.83e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26431 | -| time_elapsed | 143757 | -| total_timesteps | 3383168 | -| train/ | | -| approx_kl | 0.29168907 | -| clip_fraction | 0.552 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.807 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 264300 | -| policy_gradient_loss | 0.00807 | -| std | 0.006 | -| value_loss | 0.00565 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26432 | -| time_elapsed | 143762 | -| total_timesteps | 3383296 | -| train/ | | -| approx_kl | 0.11179211 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.38 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 264310 | -| policy_gradient_loss | 0.0157 | -| std | 0.006 | -| value_loss | 8.79e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26433 | -| time_elapsed | 143766 | -| total_timesteps | 3383424 | -| train/ | | -| approx_kl | 0.063518465 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0631 | -| learning_rate | 0.0003 | -| loss | 0.0354 | -| n_updates | 264320 | -| policy_gradient_loss | 0.0185 | -| std | 0.006 | -| value_loss | 9.08e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26434 | -| time_elapsed | 143770 | -| total_timesteps | 3383552 | -| train/ | | -| approx_kl | 0.072544284 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 264330 | -| policy_gradient_loss | 0.0149 | -| std | 0.00599 | -| value_loss | 4.41e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26435 | -| time_elapsed | 143773 | -| total_timesteps | 3383680 | -| train/ | | -| approx_kl | 0.011433109 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0534 | -| learning_rate | 0.0003 | -| loss | 0.000377 | -| n_updates | 264340 | -| policy_gradient_loss | 0.0117 | -| std | 0.006 | -| value_loss | 3.16e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26436 | -| time_elapsed | 143778 | -| total_timesteps | 3383808 | -| train/ | | -| approx_kl | 0.07392813 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | -0.00126 | -| n_updates | 264350 | -| policy_gradient_loss | -0.00569 | -| std | 0.006 | -| value_loss | 2.97e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 0.997 | -| time/ | | -| fps | 23 | -| iterations | 26437 | -| time_elapsed | 143783 | -| total_timesteps | 3383936 | -| train/ | | -| approx_kl | 0.01371946 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0359 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 264360 | -| policy_gradient_loss | 0.00633 | -| std | 0.006 | -| value_loss | 2.16e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26438 | -| time_elapsed | 143786 | -| total_timesteps | 3384064 | -| train/ | | -| approx_kl | 0.0036378056 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0447 | -| learning_rate | 0.0003 | -| loss | -0.00154 | -| n_updates | 264370 | -| policy_gradient_loss | 0.0116 | -| std | 0.006 | -| value_loss | 1.27e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26439 | -| time_elapsed | 143794 | -| total_timesteps | 3384192 | -| train/ | | -| approx_kl | 0.3182313 | -| clip_fraction | 0.748 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0277 | -| learning_rate | 0.0003 | -| loss | 0.202 | -| n_updates | 264380 | -| policy_gradient_loss | 0.206 | -| std | 0.006 | -| value_loss | 0.0307 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26440 | -| time_elapsed | 143799 | -| total_timesteps | 3384320 | -| train/ | | -| approx_kl | 0.24166207 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.649 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 264390 | -| policy_gradient_loss | 0.149 | -| std | 0.006 | -| value_loss | 0.000187 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26441 | -| time_elapsed | 143805 | -| total_timesteps | 3384448 | -| train/ | | -| approx_kl | 0.184917 | -| clip_fraction | 0.707 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0103 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 264400 | -| policy_gradient_loss | 0.153 | -| std | 0.006 | -| value_loss | 6.31e-05 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26442 | -| time_elapsed | 143811 | -| total_timesteps | 3384576 | -| train/ | | -| approx_kl | 0.040071525 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 6.92e-05 | -| learning_rate | 0.0003 | -| loss | 0.0217 | -| n_updates | 264410 | -| policy_gradient_loss | 0.0336 | -| std | 0.006 | -| value_loss | 3.07e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26443 | -| time_elapsed | 143816 | -| total_timesteps | 3384704 | -| train/ | | -| approx_kl | 0.24773292 | -| clip_fraction | 0.377 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.0391 | -| n_updates | 264420 | -| policy_gradient_loss | 0.0172 | -| std | 0.006 | -| value_loss | 2.53e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26444 | -| time_elapsed | 143821 | -| total_timesteps | 3384832 | -| train/ | | -| approx_kl | 0.022430822 | -| clip_fraction | 0.149 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.036 | -| learning_rate | 0.0003 | -| loss | 0.0123 | -| n_updates | 264430 | -| policy_gradient_loss | 0.00511 | -| std | 0.006 | -| value_loss | 1.39e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26445 | -| time_elapsed | 143825 | -| total_timesteps | 3384960 | -| train/ | | -| approx_kl | 0.019260608 | -| clip_fraction | 0.181 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0851 | -| learning_rate | 0.0003 | -| loss | 0.00276 | -| n_updates | 264440 | -| policy_gradient_loss | 0.00114 | -| std | 0.006 | -| value_loss | 9.45e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26446 | -| time_elapsed | 143831 | -| total_timesteps | 3385088 | -| train/ | | -| approx_kl | 0.014952574 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0665 | -| learning_rate | 0.0003 | -| loss | -0.000583 | -| n_updates | 264450 | -| policy_gradient_loss | -0.000251 | -| std | 0.006 | -| value_loss | 7.33e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26447 | -| time_elapsed | 143841 | -| total_timesteps | 3385216 | -| train/ | | -| approx_kl | 0.07529463 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.993 | -| learning_rate | 0.0003 | -| loss | -0.00636 | -| n_updates | 264460 | -| policy_gradient_loss | 0.016 | -| std | 0.006 | -| value_loss | 6.51e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26448 | -| time_elapsed | 143846 | -| total_timesteps | 3385344 | -| train/ | | -| approx_kl | 0.0915679 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.0704 | -| n_updates | 264470 | -| policy_gradient_loss | 0.014 | -| std | 0.00599 | -| value_loss | 4.06e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26449 | -| time_elapsed | 143851 | -| total_timesteps | 3385472 | -| train/ | | -| approx_kl | 0.07488516 | -| clip_fraction | 0.369 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.176 | -| learning_rate | 0.0003 | -| loss | 0.0591 | -| n_updates | 264480 | -| policy_gradient_loss | 0.0312 | -| std | 0.00599 | -| value_loss | 1.66e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26450 | -| time_elapsed | 143855 | -| total_timesteps | 3385600 | -| train/ | | -| approx_kl | 0.10656863 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.0639 | -| n_updates | 264490 | -| policy_gradient_loss | 0.0184 | -| std | 0.00599 | -| value_loss | 1.01e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26451 | -| time_elapsed | 143861 | -| total_timesteps | 3385728 | -| train/ | | -| approx_kl | 0.05337982 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0978 | -| learning_rate | 0.0003 | -| loss | 0.0146 | -| n_updates | 264500 | -| policy_gradient_loss | 0.037 | -| std | 0.00599 | -| value_loss | 8.13e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26452 | -| time_elapsed | 143865 | -| total_timesteps | 3385856 | -| train/ | | -| approx_kl | 0.30833322 | -| clip_fraction | 0.743 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0493 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 264510 | -| policy_gradient_loss | 0.139 | -| std | 0.00599 | -| value_loss | 5.51e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1 | -| time/ | | -| fps | 23 | -| iterations | 26453 | -| time_elapsed | 143868 | -| total_timesteps | 3385984 | -| train/ | | -| approx_kl | 0.2608118 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 264520 | -| policy_gradient_loss | 0.156 | -| std | 0.00599 | -| value_loss | 4.68e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26454 | -| time_elapsed | 143872 | -| total_timesteps | 3386112 | -| train/ | | -| approx_kl | 0.040948633 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0436 | -| learning_rate | 0.0003 | -| loss | 0.0305 | -| n_updates | 264530 | -| policy_gradient_loss | 0.0351 | -| std | 0.00599 | -| value_loss | 2.77e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26455 | -| time_elapsed | 143884 | -| total_timesteps | 3386240 | -| train/ | | -| approx_kl | 0.5729197 | -| clip_fraction | 0.511 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.878 | -| learning_rate | 0.0003 | -| loss | 0.1 | -| n_updates | 264540 | -| policy_gradient_loss | 0.0388 | -| std | 0.00599 | -| value_loss | 0.00203 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26456 | -| time_elapsed | 143888 | -| total_timesteps | 3386368 | -| train/ | | -| approx_kl | 0.011075057 | -| clip_fraction | 0.256 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.00696 | -| n_updates | 264550 | -| policy_gradient_loss | 0.0133 | -| std | 0.00599 | -| value_loss | 1.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26457 | -| time_elapsed | 143892 | -| total_timesteps | 3386496 | -| train/ | | -| approx_kl | 0.08720101 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.183 | -| learning_rate | 0.0003 | -| loss | 0.0365 | -| n_updates | 264560 | -| policy_gradient_loss | 0.014 | -| std | 0.00599 | -| value_loss | 5.94e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26458 | -| time_elapsed | 143897 | -| total_timesteps | 3386624 | -| train/ | | -| approx_kl | 0.015152365 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0713 | -| learning_rate | 0.0003 | -| loss | -0.000173 | -| n_updates | 264570 | -| policy_gradient_loss | 0.00761 | -| std | 0.00599 | -| value_loss | 4.11e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26459 | -| time_elapsed | 143901 | -| total_timesteps | 3386752 | -| train/ | | -| approx_kl | 0.003653062 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0674 | -| learning_rate | 0.0003 | -| loss | -0.00117 | -| n_updates | 264580 | -| policy_gradient_loss | 0.0118 | -| std | 0.00598 | -| value_loss | 2.6e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26460 | -| time_elapsed | 143907 | -| total_timesteps | 3386880 | -| train/ | | -| approx_kl | 0.052051924 | -| clip_fraction | 0.662 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0726 | -| learning_rate | 0.0003 | -| loss | 0.0542 | -| n_updates | 264590 | -| policy_gradient_loss | 0.142 | -| std | 0.00598 | -| value_loss | 2.65e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26461 | -| time_elapsed | 143911 | -| total_timesteps | 3387008 | -| train/ | | -| approx_kl | 0.012330752 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0346 | -| learning_rate | 0.0003 | -| loss | -0.00295 | -| n_updates | 264600 | -| policy_gradient_loss | 0.0283 | -| std | 0.00598 | -| value_loss | 2.06e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26462 | -| time_elapsed | 143924 | -| total_timesteps | 3387136 | -| train/ | | -| approx_kl | 0.051563814 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.926 | -| learning_rate | 0.0003 | -| loss | -0.0274 | -| n_updates | 264610 | -| policy_gradient_loss | -0.0193 | -| std | 0.00598 | -| value_loss | 0.000415 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26463 | -| time_elapsed | 143929 | -| total_timesteps | 3387264 | -| train/ | | -| approx_kl | 0.17334361 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.309 | -| learning_rate | 0.0003 | -| loss | 0.0258 | -| n_updates | 264620 | -| policy_gradient_loss | 0.00303 | -| std | 0.00598 | -| value_loss | 0.000305 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26464 | -| time_elapsed | 143935 | -| total_timesteps | 3387392 | -| train/ | | -| approx_kl | 0.028512312 | -| clip_fraction | 0.621 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0272 | -| learning_rate | 0.0003 | -| loss | 0.00558 | -| n_updates | 264630 | -| policy_gradient_loss | 0.0768 | -| std | 0.00598 | -| value_loss | 5.01e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26465 | -| time_elapsed | 143940 | -| total_timesteps | 3387520 | -| train/ | | -| approx_kl | 0.07796799 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00964 | -| learning_rate | 0.0003 | -| loss | 0.059 | -| n_updates | 264640 | -| policy_gradient_loss | 0.0295 | -| std | 0.00598 | -| value_loss | 6.21e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26466 | -| time_elapsed | 143945 | -| total_timesteps | 3387648 | -| train/ | | -| approx_kl | 0.09281984 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0311 | -| learning_rate | 0.0003 | -| loss | 0.054 | -| n_updates | 264650 | -| policy_gradient_loss | 0.0793 | -| std | 0.00598 | -| value_loss | 2.87e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26467 | -| time_elapsed | 143949 | -| total_timesteps | 3387776 | -| train/ | | -| approx_kl | 0.001964355 | -| clip_fraction | 0.577 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0761 | -| learning_rate | 0.0003 | -| loss | -0.00358 | -| n_updates | 264660 | -| policy_gradient_loss | 0.136 | -| std | 0.00598 | -| value_loss | 1.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26468 | -| time_elapsed | 143953 | -| total_timesteps | 3387904 | -| train/ | | -| approx_kl | 0.11844678 | -| clip_fraction | 0.681 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0639 | -| learning_rate | 0.0003 | -| loss | 0.0974 | -| n_updates | 264670 | -| policy_gradient_loss | 0.216 | -| std | 0.00598 | -| value_loss | 1.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26469 | -| time_elapsed | 143958 | -| total_timesteps | 3388032 | -| train/ | | -| approx_kl | 0.08255501 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0506 | -| learning_rate | 0.0003 | -| loss | 0.0328 | -| n_updates | 264680 | -| policy_gradient_loss | 0.0301 | -| std | 0.00598 | -| value_loss | 1.07e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26470 | -| time_elapsed | 143968 | -| total_timesteps | 3388160 | -| train/ | | -| approx_kl | 0.0019399775 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.903 | -| learning_rate | 0.0003 | -| loss | -0.0127 | -| n_updates | 264690 | -| policy_gradient_loss | 0.0233 | -| std | 0.00598 | -| value_loss | 0.00114 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26471 | -| time_elapsed | 143973 | -| total_timesteps | 3388288 | -| train/ | | -| approx_kl | 0.0996124 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.14 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 264700 | -| policy_gradient_loss | 0.03 | -| std | 0.00598 | -| value_loss | 1.61e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26472 | -| time_elapsed | 143977 | -| total_timesteps | 3388416 | -| train/ | | -| approx_kl | 0.46706152 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0133 | -| learning_rate | 0.0003 | -| loss | 0.212 | -| n_updates | 264710 | -| policy_gradient_loss | 0.193 | -| std | 0.00597 | -| value_loss | 5.86e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26473 | -| time_elapsed | 143982 | -| total_timesteps | 3388544 | -| train/ | | -| approx_kl | 0.2760541 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.841 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 264720 | -| policy_gradient_loss | 0.11 | -| std | 0.00597 | -| value_loss | 4.9e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26474 | -| time_elapsed | 143985 | -| total_timesteps | 3388672 | -| train/ | | -| approx_kl | 0.18752176 | -| clip_fraction | 0.723 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 264730 | -| policy_gradient_loss | 0.136 | -| std | 0.00597 | -| value_loss | 1.37e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26475 | -| time_elapsed | 143991 | -| total_timesteps | 3388800 | -| train/ | | -| approx_kl | 0.20786662 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0778 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 264740 | -| policy_gradient_loss | 0.147 | -| std | 0.00597 | -| value_loss | 1.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26476 | -| time_elapsed | 143995 | -| total_timesteps | 3388928 | -| train/ | | -| approx_kl | 0.17768838 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 264750 | -| policy_gradient_loss | 0.134 | -| std | 0.00597 | -| value_loss | 1.14e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26477 | -| time_elapsed | 144000 | -| total_timesteps | 3389056 | -| train/ | | -| approx_kl | 0.1817793 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 264760 | -| policy_gradient_loss | 0.154 | -| std | 0.00597 | -| value_loss | 8.96e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26478 | -| time_elapsed | 144010 | -| total_timesteps | 3389184 | -| train/ | | -| approx_kl | 0.007176677 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.854 | -| learning_rate | 0.0003 | -| loss | -0.00292 | -| n_updates | 264770 | -| policy_gradient_loss | 0.00643 | -| std | 0.00597 | -| value_loss | 0.00344 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26479 | -| time_elapsed | 144014 | -| total_timesteps | 3389312 | -| train/ | | -| approx_kl | 0.0075904513 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.156 | -| learning_rate | 0.0003 | -| loss | -0.0169 | -| n_updates | 264780 | -| policy_gradient_loss | 0.024 | -| std | 0.00597 | -| value_loss | 1.05e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26480 | -| time_elapsed | 144018 | -| total_timesteps | 3389440 | -| train/ | | -| approx_kl | 0.16423579 | -| clip_fraction | 0.342 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0084 | -| learning_rate | 0.0003 | -| loss | 0.0873 | -| n_updates | 264790 | -| policy_gradient_loss | 0.0236 | -| std | 0.00597 | -| value_loss | 1.97e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26481 | -| time_elapsed | 144023 | -| total_timesteps | 3389568 | -| train/ | | -| approx_kl | 0.02736879 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0125 | -| learning_rate | 0.0003 | -| loss | -0.00462 | -| n_updates | 264800 | -| policy_gradient_loss | 0.0257 | -| std | 0.00597 | -| value_loss | 1.29e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26482 | -| time_elapsed | 144028 | -| total_timesteps | 3389696 | -| train/ | | -| approx_kl | 0.19535065 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 264810 | -| policy_gradient_loss | 0.066 | -| std | 0.00598 | -| value_loss | 4.46e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26483 | -| time_elapsed | 144032 | -| total_timesteps | 3389824 | -| train/ | | -| approx_kl | 0.07828598 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.169 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 264820 | -| policy_gradient_loss | 0.0188 | -| std | 0.00599 | -| value_loss | 0.000285 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.01 | -| time/ | | -| fps | 23 | -| iterations | 26484 | -| time_elapsed | 144038 | -| total_timesteps | 3389952 | -| train/ | | -| approx_kl | 0.008737212 | -| clip_fraction | 0.0805 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00922 | -| learning_rate | 0.0003 | -| loss | -0.00104 | -| n_updates | 264830 | -| policy_gradient_loss | 0.000447 | -| std | 0.006 | -| value_loss | 2.88e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26485 | -| time_elapsed | 144044 | -| total_timesteps | 3390080 | -| train/ | | -| approx_kl | 0.011079041 | -| clip_fraction | 0.0734 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.00182 | -| n_updates | 264840 | -| policy_gradient_loss | 0.00118 | -| std | 0.006 | -| value_loss | 1.27e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26486 | -| time_elapsed | 144052 | -| total_timesteps | 3390208 | -| train/ | | -| approx_kl | 0.0635003 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.89 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 264850 | -| policy_gradient_loss | 0.000537 | -| std | 0.006 | -| value_loss | 0.00201 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26487 | -| time_elapsed | 144057 | -| total_timesteps | 3390336 | -| train/ | | -| approx_kl | 0.6960697 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0142 | -| learning_rate | 0.0003 | -| loss | 0.322 | -| n_updates | 264860 | -| policy_gradient_loss | 0.215 | -| std | 0.006 | -| value_loss | 3.53e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26488 | -| time_elapsed | 144062 | -| total_timesteps | 3390464 | -| train/ | | -| approx_kl | 0.28903866 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00535 | -| learning_rate | 0.0003 | -| loss | 0.234 | -| n_updates | 264870 | -| policy_gradient_loss | 0.156 | -| std | 0.006 | -| value_loss | 2.37e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26489 | -| time_elapsed | 144068 | -| total_timesteps | 3390592 | -| train/ | | -| approx_kl | 0.04362133 | -| clip_fraction | 0.381 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0113 | -| learning_rate | 0.0003 | -| loss | 0.00942 | -| n_updates | 264880 | -| policy_gradient_loss | 0.022 | -| std | 0.006 | -| value_loss | 1.48e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26490 | -| time_elapsed | 144074 | -| total_timesteps | 3390720 | -| train/ | | -| approx_kl | 0.59815675 | -| clip_fraction | 0.488 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0341 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 264890 | -| policy_gradient_loss | 0.0558 | -| std | 0.006 | -| value_loss | 1.15e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26491 | -| time_elapsed | 144079 | -| total_timesteps | 3390848 | -| train/ | | -| approx_kl | 0.043578163 | -| clip_fraction | 0.229 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 264900 | -| policy_gradient_loss | 0.0155 | -| std | 0.00599 | -| value_loss | 7.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.02 | -| time/ | | -| fps | 23 | -| iterations | 26492 | -| time_elapsed | 144085 | -| total_timesteps | 3390976 | -| train/ | | -| approx_kl | 0.067768045 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0305 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 264910 | -| policy_gradient_loss | 0.00908 | -| std | 0.00599 | -| value_loss | 4.46e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26493 | -| time_elapsed | 144090 | -| total_timesteps | 3391104 | -| train/ | | -| approx_kl | 0.0108418465 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0177 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 264920 | -| policy_gradient_loss | 0.00324 | -| std | 0.00599 | -| value_loss | 1.37e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26494 | -| time_elapsed | 144100 | -| total_timesteps | 3391232 | -| train/ | | -| approx_kl | 0.011989326 | -| clip_fraction | 0.324 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.945 | -| learning_rate | 0.0003 | -| loss | -0.00801 | -| n_updates | 264930 | -| policy_gradient_loss | 0.0175 | -| std | 0.00599 | -| value_loss | 0.000808 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26495 | -| time_elapsed | 144105 | -| total_timesteps | 3391360 | -| train/ | | -| approx_kl | 0.02361343 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.0326 | -| n_updates | 264940 | -| policy_gradient_loss | 0.031 | -| std | 0.00599 | -| value_loss | 1.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26496 | -| time_elapsed | 144110 | -| total_timesteps | 3391488 | -| train/ | | -| approx_kl | 0.081206165 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0128 | -| learning_rate | 0.0003 | -| loss | 0.0331 | -| n_updates | 264950 | -| policy_gradient_loss | 0.0198 | -| std | 0.00599 | -| value_loss | 7.8e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26497 | -| time_elapsed | 144114 | -| total_timesteps | 3391616 | -| train/ | | -| approx_kl | 0.035308864 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.348 | -| learning_rate | 0.0003 | -| loss | -0.00751 | -| n_updates | 264960 | -| policy_gradient_loss | 0.0143 | -| std | 0.006 | -| value_loss | 5.85e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26498 | -| time_elapsed | 144118 | -| total_timesteps | 3391744 | -| train/ | | -| approx_kl | 0.29830024 | -| clip_fraction | 0.696 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.553 | -| learning_rate | 0.0003 | -| loss | 0.199 | -| n_updates | 264970 | -| policy_gradient_loss | 0.109 | -| std | 0.00601 | -| value_loss | 5.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26499 | -| time_elapsed | 144121 | -| total_timesteps | 3391872 | -| train/ | | -| approx_kl | 0.20074612 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0977 | -| learning_rate | 0.0003 | -| loss | 0.111 | -| n_updates | 264980 | -| policy_gradient_loss | 0.134 | -| std | 0.00601 | -| value_loss | 2.97e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26500 | -| time_elapsed | 144124 | -| total_timesteps | 3392000 | -| train/ | | -| approx_kl | 0.038173623 | -| clip_fraction | 0.376 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.11 | -| learning_rate | 0.0003 | -| loss | 0.00908 | -| n_updates | 264990 | -| policy_gradient_loss | 0.0248 | -| std | 0.00601 | -| value_loss | 2.39e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26501 | -| time_elapsed | 144128 | -| total_timesteps | 3392128 | -| train/ | | -| approx_kl | 0.17254539 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00649 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 265000 | -| policy_gradient_loss | 0.0114 | -| std | 0.00601 | -| value_loss | 1.42e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26502 | -| time_elapsed | 144139 | -| total_timesteps | 3392256 | -| train/ | | -| approx_kl | 0.004141246 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.923 | -| learning_rate | 0.0003 | -| loss | -0.0203 | -| n_updates | 265010 | -| policy_gradient_loss | 0.00541 | -| std | 0.00601 | -| value_loss | 0.000477 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26503 | -| time_elapsed | 144143 | -| total_timesteps | 3392384 | -| train/ | | -| approx_kl | 0.19053136 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0755 | -| n_updates | 265020 | -| policy_gradient_loss | 0.021 | -| std | 0.00601 | -| value_loss | 2.26e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26504 | -| time_elapsed | 144147 | -| total_timesteps | 3392512 | -| train/ | | -| approx_kl | 0.02363071 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.018 | -| learning_rate | 0.0003 | -| loss | 0.00446 | -| n_updates | 265030 | -| policy_gradient_loss | 0.0337 | -| std | 0.00602 | -| value_loss | 5.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26505 | -| time_elapsed | 144151 | -| total_timesteps | 3392640 | -| train/ | | -| approx_kl | 0.31032714 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0231 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 265040 | -| policy_gradient_loss | 0.119 | -| std | 0.00602 | -| value_loss | 4.23e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26506 | -| time_elapsed | 144155 | -| total_timesteps | 3392768 | -| train/ | | -| approx_kl | 0.19412898 | -| clip_fraction | 0.701 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 265050 | -| policy_gradient_loss | 0.122 | -| std | 0.00602 | -| value_loss | 3.09e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26507 | -| time_elapsed | 144158 | -| total_timesteps | 3392896 | -| train/ | | -| approx_kl | 0.036257625 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | -0.0113 | -| n_updates | 265060 | -| policy_gradient_loss | 0.0221 | -| std | 0.00602 | -| value_loss | 2.69e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26508 | -| time_elapsed | 144162 | -| total_timesteps | 3393024 | -| train/ | | -| approx_kl | 0.53116924 | -| clip_fraction | 0.484 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0326 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 265070 | -| policy_gradient_loss | 0.0506 | -| std | 0.00602 | -| value_loss | 1.65e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26509 | -| time_elapsed | 144172 | -| total_timesteps | 3393152 | -| train/ | | -| approx_kl | 0.06635016 | -| clip_fraction | 0.187 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.784 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 265080 | -| policy_gradient_loss | 0.00154 | -| std | 0.00602 | -| value_loss | 0.00629 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26510 | -| time_elapsed | 144177 | -| total_timesteps | 3393280 | -| train/ | | -| approx_kl | 0.0075647766 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.238 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 265090 | -| policy_gradient_loss | 0.00485 | -| std | 0.00602 | -| value_loss | 8.3e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26511 | -| time_elapsed | 144182 | -| total_timesteps | 3393408 | -| train/ | | -| approx_kl | 0.06406334 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0156 | -| learning_rate | 0.0003 | -| loss | 0.0489 | -| n_updates | 265100 | -| policy_gradient_loss | 0.0213 | -| std | 0.00601 | -| value_loss | 4.49e-05 | ----------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26512 | -| time_elapsed | 144185 | -| total_timesteps | 3393536 | -| train/ | | -| approx_kl | 0.000105266925 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -22.5 | -| learning_rate | 0.0003 | -| loss | -0.0014 | -| n_updates | 265110 | -| policy_gradient_loss | -0.00335 | -| std | 0.006 | -| value_loss | 0.00155 | --------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26513 | -| time_elapsed | 144189 | -| total_timesteps | 3393664 | -| train/ | | -| approx_kl | 0.071604155 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.396 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 265120 | -| policy_gradient_loss | 0.0196 | -| std | 0.006 | -| value_loss | 0.000278 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26514 | -| time_elapsed | 144194 | -| total_timesteps | 3393792 | -| train/ | | -| approx_kl | 0.051209103 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -12.2 | -| learning_rate | 0.0003 | -| loss | -0.000604 | -| n_updates | 265130 | -| policy_gradient_loss | -0.000167 | -| std | 0.006 | -| value_loss | 4.6e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26515 | -| time_elapsed | 144198 | -| total_timesteps | 3393920 | -| train/ | | -| approx_kl | 0.011316184 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0143 | -| learning_rate | 0.0003 | -| loss | -0.00848 | -| n_updates | 265140 | -| policy_gradient_loss | 0.00874 | -| std | 0.006 | -| value_loss | 8.44e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26516 | -| time_elapsed | 144203 | -| total_timesteps | 3394048 | -| train/ | | -| approx_kl | 0.099295005 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 265150 | -| policy_gradient_loss | 0.00594 | -| std | 0.006 | -| value_loss | 6.63e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26517 | -| time_elapsed | 144213 | -| total_timesteps | 3394176 | -| train/ | | -| approx_kl | 0.0027364227 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.744 | -| learning_rate | 0.0003 | -| loss | -0.008 | -| n_updates | 265160 | -| policy_gradient_loss | -0.000448 | -| std | 0.006 | -| value_loss | 0.00997 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26518 | -| time_elapsed | 144218 | -| total_timesteps | 3394304 | -| train/ | | -| approx_kl | 0.0050345184 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -3.18 | -| learning_rate | 0.0003 | -| loss | -0.00375 | -| n_updates | 265170 | -| policy_gradient_loss | 0.0154 | -| std | 0.006 | -| value_loss | 1.57e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26519 | -| time_elapsed | 144221 | -| total_timesteps | 3394432 | -| train/ | | -| approx_kl | 0.22547962 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.261 | -| learning_rate | 0.0003 | -| loss | 0.163 | -| n_updates | 265180 | -| policy_gradient_loss | 0.0263 | -| std | 0.006 | -| value_loss | 5.47e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26520 | -| time_elapsed | 144227 | -| total_timesteps | 3394560 | -| train/ | | -| approx_kl | 0.18232346 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -15.1 | -| learning_rate | 0.0003 | -| loss | 0.033 | -| n_updates | 265190 | -| policy_gradient_loss | 0.0133 | -| std | 0.006 | -| value_loss | 2.19e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26521 | -| time_elapsed | 144231 | -| total_timesteps | 3394688 | -| train/ | | -| approx_kl | 0.02950324 | -| clip_fraction | 0.485 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0296 | -| learning_rate | 0.0003 | -| loss | 0.00469 | -| n_updates | 265200 | -| policy_gradient_loss | 0.0337 | -| std | 0.006 | -| value_loss | 3.05e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26522 | -| time_elapsed | 144236 | -| total_timesteps | 3394816 | -| train/ | | -| approx_kl | 0.4082663 | -| clip_fraction | 0.682 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00803 | -| learning_rate | 0.0003 | -| loss | 0.24 | -| n_updates | 265210 | -| policy_gradient_loss | 0.198 | -| std | 0.00599 | -| value_loss | 2.28e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.03 | -| time/ | | -| fps | 23 | -| iterations | 26523 | -| time_elapsed | 144241 | -| total_timesteps | 3394944 | -| train/ | | -| approx_kl | 0.23164904 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0187 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 265220 | -| policy_gradient_loss | 0.128 | -| std | 0.00599 | -| value_loss | 1.94e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26524 | -| time_elapsed | 144245 | -| total_timesteps | 3395072 | -| train/ | | -| approx_kl | 0.050263964 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.024 | -| learning_rate | 0.0003 | -| loss | 0.0364 | -| n_updates | 265230 | -| policy_gradient_loss | 0.0376 | -| std | 0.006 | -| value_loss | 1.28e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26525 | -| time_elapsed | 144254 | -| total_timesteps | 3395200 | -| train/ | | -| approx_kl | 0.022591373 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.00848 | -| n_updates | 265240 | -| policy_gradient_loss | -0.00592 | -| std | 0.006 | -| value_loss | 0.000371 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26526 | -| time_elapsed | 144259 | -| total_timesteps | 3395328 | -| train/ | | -| approx_kl | 0.022719838 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.324 | -| learning_rate | 0.0003 | -| loss | 0.00801 | -| n_updates | 265250 | -| policy_gradient_loss | 0.0121 | -| std | 0.006 | -| value_loss | 2.35e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26527 | -| time_elapsed | 144264 | -| total_timesteps | 3395456 | -| train/ | | -| approx_kl | 0.07530367 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00522 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 265260 | -| policy_gradient_loss | 0.0176 | -| std | 0.006 | -| value_loss | 3.96e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26528 | -| time_elapsed | 144268 | -| total_timesteps | 3395584 | -| train/ | | -| approx_kl | 0.20791778 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0491 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 265270 | -| policy_gradient_loss | 0.0672 | -| std | 0.00602 | -| value_loss | 7.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26529 | -| time_elapsed | 144273 | -| total_timesteps | 3395712 | -| train/ | | -| approx_kl | 0.21624576 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.0105 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 265280 | -| policy_gradient_loss | 0.0416 | -| std | 0.00603 | -| value_loss | 8.63e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26530 | -| time_elapsed | 144278 | -| total_timesteps | 3395840 | -| train/ | | -| approx_kl | 0.0014612549 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0115 | -| learning_rate | 0.0003 | -| loss | 0.0017 | -| n_updates | 265290 | -| policy_gradient_loss | 0.0449 | -| std | 0.00603 | -| value_loss | 1.56e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26531 | -| time_elapsed | 144282 | -| total_timesteps | 3395968 | -| train/ | | -| approx_kl | 0.20854148 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0803 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 265300 | -| policy_gradient_loss | 0.0298 | -| std | 0.00603 | -| value_loss | 1.29e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26532 | -| time_elapsed | 144287 | -| total_timesteps | 3396096 | -| train/ | | -| approx_kl | 0.019846661 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0729 | -| learning_rate | 0.0003 | -| loss | 0.00803 | -| n_updates | 265310 | -| policy_gradient_loss | 0.00288 | -| std | 0.00603 | -| value_loss | 9.03e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26533 | -| time_elapsed | 144296 | -| total_timesteps | 3396224 | -| train/ | | -| approx_kl | 0.013897952 | -| clip_fraction | 0.373 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 265320 | -| policy_gradient_loss | 0.0047 | -| std | 0.00603 | -| value_loss | 0.000299 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26534 | -| time_elapsed | 144301 | -| total_timesteps | 3396352 | -| train/ | | -| approx_kl | 0.24578102 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0347 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 265330 | -| policy_gradient_loss | 0.0288 | -| std | 0.00603 | -| value_loss | 3.14e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26535 | -| time_elapsed | 144305 | -| total_timesteps | 3396480 | -| train/ | | -| approx_kl | 0.01744924 | -| clip_fraction | 0.132 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.000562 | -| learning_rate | 0.0003 | -| loss | -0.00225 | -| n_updates | 265340 | -| policy_gradient_loss | -0.00229 | -| std | 0.00603 | -| value_loss | 7.31e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26536 | -| time_elapsed | 144309 | -| total_timesteps | 3396608 | -| train/ | | -| approx_kl | 0.02708171 | -| clip_fraction | 0.46 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 265350 | -| policy_gradient_loss | 0.0467 | -| std | 0.00603 | -| value_loss | 6.56e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26537 | -| time_elapsed | 144316 | -| total_timesteps | 3396736 | -| train/ | | -| approx_kl | 0.30680436 | -| clip_fraction | 0.713 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.462 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 265360 | -| policy_gradient_loss | 0.111 | -| std | 0.00603 | -| value_loss | 9.6e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26538 | -| time_elapsed | 144321 | -| total_timesteps | 3396864 | -| train/ | | -| approx_kl | 0.19324005 | -| clip_fraction | 0.676 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 265370 | -| policy_gradient_loss | 0.136 | -| std | 0.00603 | -| value_loss | 7.93e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26539 | -| time_elapsed | 144326 | -| total_timesteps | 3396992 | -| train/ | | -| approx_kl | 0.041633226 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0469 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 265380 | -| policy_gradient_loss | 0.0263 | -| std | 0.00603 | -| value_loss | 7.82e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26540 | -| time_elapsed | 144331 | -| total_timesteps | 3397120 | -| train/ | | -| approx_kl | 0.000998674 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0301 | -| learning_rate | 0.0003 | -| loss | 0.000919 | -| n_updates | 265390 | -| policy_gradient_loss | 0.0386 | -| std | 0.00602 | -| value_loss | 4.36e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26541 | -| time_elapsed | 144343 | -| total_timesteps | 3397248 | -| train/ | | -| approx_kl | 0.02590783 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.33 | -| learning_rate | 0.0003 | -| loss | -0.0197 | -| n_updates | 265400 | -| policy_gradient_loss | -0.0185 | -| std | 0.00602 | -| value_loss | 0.00359 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26542 | -| time_elapsed | 144349 | -| total_timesteps | 3397376 | -| train/ | | -| approx_kl | 0.0031433757 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.3 | -| learning_rate | 0.0003 | -| loss | -0.00133 | -| n_updates | 265410 | -| policy_gradient_loss | 0.00447 | -| std | 0.00602 | -| value_loss | 3.77e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26543 | -| time_elapsed | 144353 | -| total_timesteps | 3397504 | -| train/ | | -| approx_kl | 0.05342794 | -| clip_fraction | 0.67 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.00134 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 265420 | -| policy_gradient_loss | 0.113 | -| std | 0.00603 | -| value_loss | 1.64e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26544 | -| time_elapsed | 144357 | -| total_timesteps | 3397632 | -| train/ | | -| approx_kl | 0.1308625 | -| clip_fraction | 0.715 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -1.48 | -| learning_rate | 0.0003 | -| loss | 0.0792 | -| n_updates | 265430 | -| policy_gradient_loss | 0.0925 | -| std | 0.00604 | -| value_loss | 9.63e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26545 | -| time_elapsed | 144361 | -| total_timesteps | 3397760 | -| train/ | | -| approx_kl | 0.028217118 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.377 | -| learning_rate | 0.0003 | -| loss | 0.00158 | -| n_updates | 265440 | -| policy_gradient_loss | 0.0297 | -| std | 0.00604 | -| value_loss | 1.54e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26546 | -| time_elapsed | 144364 | -| total_timesteps | 3397888 | -| train/ | | -| approx_kl | 0.20658176 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.0822 | -| n_updates | 265450 | -| policy_gradient_loss | 0.0211 | -| std | 0.00604 | -| value_loss | 1.02e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26547 | -| time_elapsed | 144368 | -| total_timesteps | 3398016 | -| train/ | | -| approx_kl | 0.022483535 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0822 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 265460 | -| policy_gradient_loss | 0.00412 | -| std | 0.00604 | -| value_loss | 6.5e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26548 | -| time_elapsed | 144380 | -| total_timesteps | 3398144 | -| train/ | | -| approx_kl | 0.07541574 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | -0.00474 | -| n_updates | 265470 | -| policy_gradient_loss | 0.012 | -| std | 0.00604 | -| value_loss | 0.000437 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26549 | -| time_elapsed | 144384 | -| total_timesteps | 3398272 | -| train/ | | -| approx_kl | 0.00047667138 | -| clip_fraction | 0.0555 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | 0.216 | -| learning_rate | 0.0003 | -| loss | -0.000123 | -| n_updates | 265480 | -| policy_gradient_loss | 0.00099 | -| std | 0.00603 | -| value_loss | 9.73e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26550 | -| time_elapsed | 144387 | -| total_timesteps | 3398400 | -| train/ | | -| approx_kl | 0.046626143 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.36 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 265490 | -| policy_gradient_loss | 0.0417 | -| std | 0.00602 | -| value_loss | 9.36e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26551 | -| time_elapsed | 144391 | -| total_timesteps | 3398528 | -| train/ | | -| approx_kl | 0.121717975 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.69 | -| explained_variance | -0.0498 | -| learning_rate | 0.0003 | -| loss | 0.0554 | -| n_updates | 265500 | -| policy_gradient_loss | 0.0279 | -| std | 0.00601 | -| value_loss | 4.59e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26552 | -| time_elapsed | 144398 | -| total_timesteps | 3398656 | -| train/ | | -| approx_kl | 0.14596647 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.0743 | -| n_updates | 265510 | -| policy_gradient_loss | 0.0242 | -| std | 0.00601 | -| value_loss | 2.18e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26553 | -| time_elapsed | 144402 | -| total_timesteps | 3398784 | -| train/ | | -| approx_kl | 0.03142757 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0838 | -| learning_rate | 0.0003 | -| loss | 0.0141 | -| n_updates | 265520 | -| policy_gradient_loss | 0.0378 | -| std | 0.00601 | -| value_loss | 1.45e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26554 | -| time_elapsed | 144408 | -| total_timesteps | 3398912 | -| train/ | | -| approx_kl | 3.8738362e-06 | -| clip_fraction | 0.0609 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0668 | -| learning_rate | 0.0003 | -| loss | 0.000109 | -| n_updates | 265530 | -| policy_gradient_loss | 0.0012 | -| std | 0.00601 | -| value_loss | 1.09e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26555 | -| time_elapsed | 144411 | -| total_timesteps | 3399040 | -| train/ | | -| approx_kl | 0.2149018 | -| clip_fraction | 0.201 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.0798 | -| n_updates | 265540 | -| policy_gradient_loss | 0.0124 | -| std | 0.006 | -| value_loss | 5.46e-09 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26556 | -| time_elapsed | 144420 | -| total_timesteps | 3399168 | -| train/ | | -| approx_kl | 0.3416497 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.00762 | -| n_updates | 265550 | -| policy_gradient_loss | 0.000547 | -| std | 0.00599 | -| value_loss | 0.000304 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26557 | -| time_elapsed | 144426 | -| total_timesteps | 3399296 | -| train/ | | -| approx_kl | 0.06469005 | -| clip_fraction | 0.573 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.84 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 265560 | -| policy_gradient_loss | 0.0521 | -| std | 0.00599 | -| value_loss | 1.32e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26558 | -| time_elapsed | 144430 | -| total_timesteps | 3399424 | -| train/ | | -| approx_kl | 0.34849524 | -| clip_fraction | 0.48 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00987 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 265570 | -| policy_gradient_loss | 0.0577 | -| std | 0.00599 | -| value_loss | 3.97e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26559 | -| time_elapsed | 144435 | -| total_timesteps | 3399552 | -| train/ | | -| approx_kl | 0.0012306073 | -| clip_fraction | 0.242 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00309 | -| learning_rate | 0.0003 | -| loss | -0.0054 | -| n_updates | 265580 | -| policy_gradient_loss | 0.0116 | -| std | 0.00599 | -| value_loss | 2.61e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26560 | -| time_elapsed | 144440 | -| total_timesteps | 3399680 | -| train/ | | -| approx_kl | 0.098193765 | -| clip_fraction | 0.593 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 265590 | -| policy_gradient_loss | 0.0906 | -| std | 0.00599 | -| value_loss | 1.95e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26561 | -| time_elapsed | 144446 | -| total_timesteps | 3399808 | -| train/ | | -| approx_kl | 1.9017607e-05 | -| clip_fraction | 0.58 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.000209 | -| n_updates | 265600 | -| policy_gradient_loss | 0.1 | -| std | 0.00599 | -| value_loss | 1.43e-07 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26562 | -| time_elapsed | 144450 | -| total_timesteps | 3399936 | -| train/ | | -| approx_kl | 0.028256817 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.039 | -| learning_rate | 0.0003 | -| loss | 0.0511 | -| n_updates | 265610 | -| policy_gradient_loss | 0.0691 | -| std | 0.00599 | -| value_loss | 1.2e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26563 | -| time_elapsed | 144455 | -| total_timesteps | 3400064 | -| train/ | | -| approx_kl | 0.31343782 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 265620 | -| policy_gradient_loss | 0.149 | -| std | 0.00599 | -| value_loss | 1e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26564 | -| time_elapsed | 144464 | -| total_timesteps | 3400192 | -| train/ | | -| approx_kl | 0.301786 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.593 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 265630 | -| policy_gradient_loss | 0.157 | -| std | 0.00599 | -| value_loss | 0.00699 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26565 | -| time_elapsed | 144469 | -| total_timesteps | 3400320 | -| train/ | | -| approx_kl | 0.19315398 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.897 | -| learning_rate | 0.0003 | -| loss | 0.114 | -| n_updates | 265640 | -| policy_gradient_loss | 0.119 | -| std | 0.00599 | -| value_loss | 5.05e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26566 | -| time_elapsed | 144474 | -| total_timesteps | 3400448 | -| train/ | | -| approx_kl | 0.18034786 | -| clip_fraction | 0.706 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00658 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 265650 | -| policy_gradient_loss | 0.137 | -| std | 0.00599 | -| value_loss | 1.76e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26567 | -| time_elapsed | 144478 | -| total_timesteps | 3400576 | -| train/ | | -| approx_kl | 0.2203904 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.000904 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 265660 | -| policy_gradient_loss | 0.192 | -| std | 0.00599 | -| value_loss | 7.55e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26568 | -| time_elapsed | 144483 | -| total_timesteps | 3400704 | -| train/ | | -| approx_kl | 0.034923516 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.251 | -| learning_rate | 0.0003 | -| loss | 0.00404 | -| n_updates | 265670 | -| policy_gradient_loss | 0.0305 | -| std | 0.00599 | -| value_loss | 2.64e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26569 | -| time_elapsed | 144487 | -| total_timesteps | 3400832 | -| train/ | | -| approx_kl | 0.5597124 | -| clip_fraction | 0.523 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 265680 | -| policy_gradient_loss | 0.0567 | -| std | 0.00598 | -| value_loss | 2.38e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26570 | -| time_elapsed | 144491 | -| total_timesteps | 3400960 | -| train/ | | -| approx_kl | 0.050853264 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 265690 | -| policy_gradient_loss | 0.0127 | -| std | 0.00598 | -| value_loss | 1.71e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26571 | -| time_elapsed | 144495 | -| total_timesteps | 3401088 | -| train/ | | -| approx_kl | 0.05364789 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0574 | -| learning_rate | 0.0003 | -| loss | 0.0136 | -| n_updates | 265700 | -| policy_gradient_loss | 0.00674 | -| std | 0.00598 | -| value_loss | 1.26e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26572 | -| time_elapsed | 144506 | -| total_timesteps | 3401216 | -| train/ | | -| approx_kl | 0.01246288 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.884 | -| learning_rate | 0.0003 | -| loss | 0.00211 | -| n_updates | 265710 | -| policy_gradient_loss | 0.00572 | -| std | 0.00598 | -| value_loss | 0.00146 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26573 | -| time_elapsed | 144513 | -| total_timesteps | 3401344 | -| train/ | | -| approx_kl | 0.0028927606 | -| clip_fraction | 0.19 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0383 | -| learning_rate | 0.0003 | -| loss | -0.000605 | -| n_updates | 265720 | -| policy_gradient_loss | 0.00671 | -| std | 0.00598 | -| value_loss | 7.96e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26574 | -| time_elapsed | 144518 | -| total_timesteps | 3401472 | -| train/ | | -| approx_kl | 0.0002466282 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00881 | -| learning_rate | 0.0003 | -| loss | 2.87e-05 | -| n_updates | 265730 | -| policy_gradient_loss | 0.0322 | -| std | 0.00599 | -| value_loss | 7.54e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26575 | -| time_elapsed | 144523 | -| total_timesteps | 3401600 | -| train/ | | -| approx_kl | 0.3551174 | -| clip_fraction | 0.584 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.306 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 265740 | -| policy_gradient_loss | 0.0833 | -| std | 0.00599 | -| value_loss | 2.48e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26576 | -| time_elapsed | 144527 | -| total_timesteps | 3401728 | -| train/ | | -| approx_kl | 0.08269706 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00181 | -| learning_rate | 0.0003 | -| loss | 0.027 | -| n_updates | 265750 | -| policy_gradient_loss | 0.00729 | -| std | 0.00599 | -| value_loss | 4.64e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26577 | -| time_elapsed | 144532 | -| total_timesteps | 3401856 | -| train/ | | -| approx_kl | 0.044983134 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0232 | -| learning_rate | 0.0003 | -| loss | 0.00773 | -| n_updates | 265760 | -| policy_gradient_loss | 0.00694 | -| std | 0.00599 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26578 | -| time_elapsed | 144536 | -| total_timesteps | 3401984 | -| train/ | | -| approx_kl | 0.007881651 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0635 | -| learning_rate | 0.0003 | -| loss | 0.000626 | -| n_updates | 265770 | -| policy_gradient_loss | 0.00976 | -| std | 0.00599 | -| value_loss | 1.35e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26579 | -| time_elapsed | 144540 | -| total_timesteps | 3402112 | -| train/ | | -| approx_kl | 0.0910663 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.196 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 265780 | -| policy_gradient_loss | 0.0134 | -| std | 0.00599 | -| value_loss | 7.76e-07 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26580 | -| time_elapsed | 144552 | -| total_timesteps | 3402240 | -| train/ | | -| approx_kl | 0.0024325717 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.763 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 265790 | -| policy_gradient_loss | -0.000392 | -| std | 0.00599 | -| value_loss | 0.00813 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26581 | -| time_elapsed | 144557 | -| total_timesteps | 3402368 | -| train/ | | -| approx_kl | 0.06720174 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.0557 | -| n_updates | 265800 | -| policy_gradient_loss | 0.0256 | -| std | 0.00599 | -| value_loss | 0.000148 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26582 | -| time_elapsed | 144562 | -| total_timesteps | 3402496 | -| train/ | | -| approx_kl | 0.05782312 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00643 | -| learning_rate | 0.0003 | -| loss | 0.0386 | -| n_updates | 265810 | -| policy_gradient_loss | 0.0194 | -| std | 0.00599 | -| value_loss | 9.78e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26583 | -| time_elapsed | 144567 | -| total_timesteps | 3402624 | -| train/ | | -| approx_kl | 0.008269545 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0906 | -| learning_rate | 0.0003 | -| loss | -0.00339 | -| n_updates | 265820 | -| policy_gradient_loss | 0.00903 | -| std | 0.00599 | -| value_loss | 8.27e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26584 | -| time_elapsed | 144571 | -| total_timesteps | 3402752 | -| train/ | | -| approx_kl | 0.024756897 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0645 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 265830 | -| policy_gradient_loss | 0.0196 | -| std | 0.00599 | -| value_loss | 5.35e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26585 | -| time_elapsed | 144576 | -| total_timesteps | 3402880 | -| train/ | | -| approx_kl | 0.054508056 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0899 | -| learning_rate | 0.0003 | -| loss | 0.00658 | -| n_updates | 265840 | -| policy_gradient_loss | 0.0403 | -| std | 0.00599 | -| value_loss | 4.3e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26586 | -| time_elapsed | 144580 | -| total_timesteps | 3403008 | -| train/ | | -| approx_kl | 0.1496192 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | 0.112 | -| n_updates | 265850 | -| policy_gradient_loss | 0.0566 | -| std | 0.00599 | -| value_loss | 3.62e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26587 | -| time_elapsed | 144590 | -| total_timesteps | 3403136 | -| train/ | | -| approx_kl | 0.06064821 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.989 | -| learning_rate | 0.0003 | -| loss | 0.00396 | -| n_updates | 265860 | -| policy_gradient_loss | 0.0124 | -| std | 0.00599 | -| value_loss | 0.000109 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26588 | -| time_elapsed | 144595 | -| total_timesteps | 3403264 | -| train/ | | -| approx_kl | 0.73264986 | -| clip_fraction | 0.756 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | 0.178 | -| n_updates | 265870 | -| policy_gradient_loss | 0.136 | -| std | 0.00599 | -| value_loss | 1.03e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26589 | -| time_elapsed | 144600 | -| total_timesteps | 3403392 | -| train/ | | -| approx_kl | 0.0044196197 | -| clip_fraction | 0.47 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.15 | -| learning_rate | 0.0003 | -| loss | -0.000731 | -| n_updates | 265880 | -| policy_gradient_loss | 0.0404 | -| std | 0.00597 | -| value_loss | 3e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26590 | -| time_elapsed | 144602 | -| total_timesteps | 3403520 | -| train/ | | -| approx_kl | 0.21708967 | -| clip_fraction | 0.671 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -23.6 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 265890 | -| policy_gradient_loss | 0.107 | -| std | 0.00597 | -| value_loss | 1.28e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26591 | -| time_elapsed | 144607 | -| total_timesteps | 3403648 | -| train/ | | -| approx_kl | 0.047550943 | -| clip_fraction | 0.345 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0054 | -| learning_rate | 0.0003 | -| loss | 0.0289 | -| n_updates | 265900 | -| policy_gradient_loss | 0.0269 | -| std | 0.00597 | -| value_loss | 1.59e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26592 | -| time_elapsed | 144613 | -| total_timesteps | 3403776 | -| train/ | | -| approx_kl | 0.0016809837 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0967 | -| learning_rate | 0.0003 | -| loss | 0.000247 | -| n_updates | 265910 | -| policy_gradient_loss | 0.03 | -| std | 0.00597 | -| value_loss | 1.75e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26593 | -| time_elapsed | 144618 | -| total_timesteps | 3403904 | -| train/ | | -| approx_kl | 0.22261207 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.0908 | -| n_updates | 265920 | -| policy_gradient_loss | 0.0235 | -| std | 0.00597 | -| value_loss | 1.24e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26594 | -| time_elapsed | 144623 | -| total_timesteps | 3404032 | -| train/ | | -| approx_kl | 0.016561314 | -| clip_fraction | 0.439 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0129 | -| learning_rate | 0.0003 | -| loss | 0.00516 | -| n_updates | 265930 | -| policy_gradient_loss | 0.031 | -| std | 0.00598 | -| value_loss | 1.17e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26595 | -| time_elapsed | 144632 | -| total_timesteps | 3404160 | -| train/ | | -| approx_kl | 0.13875635 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.728 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 265940 | -| policy_gradient_loss | 0.0237 | -| std | 0.00598 | -| value_loss | 0.00967 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26596 | -| time_elapsed | 144636 | -| total_timesteps | 3404288 | -| train/ | | -| approx_kl | 1.3311517 | -| clip_fraction | 0.725 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.987 | -| learning_rate | 0.0003 | -| loss | 0.322 | -| n_updates | 265950 | -| policy_gradient_loss | 0.199 | -| std | 0.00597 | -| value_loss | 0.000257 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26597 | -| time_elapsed | 144641 | -| total_timesteps | 3404416 | -| train/ | | -| approx_kl | 0.001430545 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0169 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 265960 | -| policy_gradient_loss | 0.0323 | -| std | 0.00597 | -| value_loss | 3.65e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26598 | -| time_elapsed | 144646 | -| total_timesteps | 3404544 | -| train/ | | -| approx_kl | 0.8838558 | -| clip_fraction | 0.53 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0584 | -| learning_rate | 0.0003 | -| loss | 0.269 | -| n_updates | 265970 | -| policy_gradient_loss | 0.0789 | -| std | 0.00597 | -| value_loss | 3.38e-05 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26599 | -| time_elapsed | 144650 | -| total_timesteps | 3404672 | -| train/ | | -| approx_kl | 0.0155147 | -| clip_fraction | 0.282 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0456 | -| learning_rate | 0.0003 | -| loss | -0.00663 | -| n_updates | 265980 | -| policy_gradient_loss | 0.0109 | -| std | 0.00597 | -| value_loss | 2.66e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26600 | -| time_elapsed | 144655 | -| total_timesteps | 3404800 | -| train/ | | -| approx_kl | 0.016846173 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0423 | -| learning_rate | 0.0003 | -| loss | 0.0117 | -| n_updates | 265990 | -| policy_gradient_loss | 0.0144 | -| std | 0.00595 | -| value_loss | 0.000405 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26601 | -| time_elapsed | 144660 | -| total_timesteps | 3404928 | -| train/ | | -| approx_kl | 0.009630635 | -| clip_fraction | 0.213 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0871 | -| learning_rate | 0.0003 | -| loss | 0.0024 | -| n_updates | 266000 | -| policy_gradient_loss | 0.0112 | -| std | 0.00594 | -| value_loss | 0.000124 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26602 | -| time_elapsed | 144665 | -| total_timesteps | 3405056 | -| train/ | | -| approx_kl | 0.00082275784 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.000337 | -| n_updates | 266010 | -| policy_gradient_loss | 0.0129 | -| std | 0.00593 | -| value_loss | 0.000388 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26603 | -| time_elapsed | 144676 | -| total_timesteps | 3405184 | -| train/ | | -| approx_kl | 0.122334845 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.95 | -| learning_rate | 0.0003 | -| loss | 0.0432 | -| n_updates | 266020 | -| policy_gradient_loss | 0.0325 | -| std | 0.00593 | -| value_loss | 0.00453 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26604 | -| time_elapsed | 144681 | -| total_timesteps | 3405312 | -| train/ | | -| approx_kl | 0.11281643 | -| clip_fraction | 0.329 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.079 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 266030 | -| policy_gradient_loss | 0.0361 | -| std | 0.00593 | -| value_loss | 1.13e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26605 | -| time_elapsed | 144685 | -| total_timesteps | 3405440 | -| train/ | | -| approx_kl | 5.267095e-06 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0747 | -| learning_rate | 0.0003 | -| loss | -0.000219 | -| n_updates | 266040 | -| policy_gradient_loss | 0.0317 | -| std | 0.00593 | -| value_loss | 1.33e-06 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26606 | -| time_elapsed | 144689 | -| total_timesteps | 3405568 | -| train/ | | -| approx_kl | 0.792022 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.282 | -| learning_rate | 0.0003 | -| loss | 0.285 | -| n_updates | 266050 | -| policy_gradient_loss | 0.0816 | -| std | 0.00593 | -| value_loss | 3.05e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26607 | -| time_elapsed | 144693 | -| total_timesteps | 3405696 | -| train/ | | -| approx_kl | 0.039483942 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0184 | -| learning_rate | 0.0003 | -| loss | 0.0256 | -| n_updates | 266060 | -| policy_gradient_loss | 0.0131 | -| std | 0.00593 | -| value_loss | 4.39e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26608 | -| time_elapsed | 144697 | -| total_timesteps | 3405824 | -| train/ | | -| approx_kl | 0.008237587 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00469 | -| n_updates | 266070 | -| policy_gradient_loss | 0.0105 | -| std | 0.00592 | -| value_loss | 4.84e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26609 | -| time_elapsed | 144702 | -| total_timesteps | 3405952 | -| train/ | | -| approx_kl | 0.07123897 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0285 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 266080 | -| policy_gradient_loss | 0.00557 | -| std | 0.00592 | -| value_loss | 3.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26610 | -| time_elapsed | 144707 | -| total_timesteps | 3406080 | -| train/ | | -| approx_kl | 0.052790567 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0351 | -| learning_rate | 0.0003 | -| loss | 0.0259 | -| n_updates | 266090 | -| policy_gradient_loss | 0.0141 | -| std | 0.00592 | -| value_loss | 2.67e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26611 | -| time_elapsed | 144715 | -| total_timesteps | 3406208 | -| train/ | | -| approx_kl | 0.09166475 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.479 | -| learning_rate | 0.0003 | -| loss | -0.021 | -| n_updates | 266100 | -| policy_gradient_loss | -0.0147 | -| std | 0.00592 | -| value_loss | 0.00305 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26612 | -| time_elapsed | 144720 | -| total_timesteps | 3406336 | -| train/ | | -| approx_kl | 0.14803526 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.129 | -| learning_rate | 0.0003 | -| loss | 0.0577 | -| n_updates | 266110 | -| policy_gradient_loss | 0.0266 | -| std | 0.00592 | -| value_loss | 1.69e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26613 | -| time_elapsed | 144724 | -| total_timesteps | 3406464 | -| train/ | | -| approx_kl | 0.00043198233 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.56 | -| learning_rate | 0.0003 | -| loss | -0.00337 | -| n_updates | 266120 | -| policy_gradient_loss | 0.0358 | -| std | 0.00591 | -| value_loss | 7.52e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26614 | -| time_elapsed | 144728 | -| total_timesteps | 3406592 | -| train/ | | -| approx_kl | 0.7447601 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00787 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 266130 | -| policy_gradient_loss | 0.0551 | -| std | 0.00591 | -| value_loss | 5.04e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26615 | -| time_elapsed | 144732 | -| total_timesteps | 3406720 | -| train/ | | -| approx_kl | 0.014318457 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.000262 | -| n_updates | 266140 | -| policy_gradient_loss | 0.0081 | -| std | 0.00591 | -| value_loss | 3.35e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26616 | -| time_elapsed | 144736 | -| total_timesteps | 3406848 | -| train/ | | -| approx_kl | 0.0029566884 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | -0.00374 | -| n_updates | 266150 | -| policy_gradient_loss | 0.0141 | -| std | 0.00591 | -| value_loss | 2.55e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26617 | -| time_elapsed | 144741 | -| total_timesteps | 3406976 | -| train/ | | -| approx_kl | 0.05043838 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | 0.0488 | -| n_updates | 266160 | -| policy_gradient_loss | 0.106 | -| std | 0.00591 | -| value_loss | 1.96e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26618 | -| time_elapsed | 144746 | -| total_timesteps | 3407104 | -| train/ | | -| approx_kl | 0.014817689 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0445 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 266170 | -| policy_gradient_loss | 0.0391 | -| std | 0.00591 | -| value_loss | 1.73e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26619 | -| time_elapsed | 144756 | -| total_timesteps | 3407232 | -| train/ | | -| approx_kl | 0.02147012 | -| clip_fraction | 0.44 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.9 | -| learning_rate | 0.0003 | -| loss | -0.0221 | -| n_updates | 266180 | -| policy_gradient_loss | 0.0168 | -| std | 0.00591 | -| value_loss | 0.00192 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26620 | -| time_elapsed | 144761 | -| total_timesteps | 3407360 | -| train/ | | -| approx_kl | 0.17324272 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.736 | -| learning_rate | 0.0003 | -| loss | 0.0694 | -| n_updates | 266190 | -| policy_gradient_loss | 0.0187 | -| std | 0.00591 | -| value_loss | 3.81e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26621 | -| time_elapsed | 144765 | -| total_timesteps | 3407488 | -| train/ | | -| approx_kl | 0.018888399 | -| clip_fraction | 0.123 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0588 | -| learning_rate | 0.0003 | -| loss | 0.00328 | -| n_updates | 266200 | -| policy_gradient_loss | 0.000532 | -| std | 0.00592 | -| value_loss | 5.28e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26622 | -| time_elapsed | 144768 | -| total_timesteps | 3407616 | -| train/ | | -| approx_kl | 0.030056287 | -| clip_fraction | 0.446 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0122 | -| learning_rate | 0.0003 | -| loss | 0.02 | -| n_updates | 266210 | -| policy_gradient_loss | 0.0406 | -| std | 0.00592 | -| value_loss | 2.77e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26623 | -| time_elapsed | 144772 | -| total_timesteps | 3407744 | -| train/ | | -| approx_kl | 0.39024758 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 266220 | -| policy_gradient_loss | 0.167 | -| std | 0.00592 | -| value_loss | 8.16e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26624 | -| time_elapsed | 144776 | -| total_timesteps | 3407872 | -| train/ | | -| approx_kl | 0.18686849 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.154 | -| n_updates | 266230 | -| policy_gradient_loss | 0.119 | -| std | 0.00592 | -| value_loss | 7.3e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26625 | -| time_elapsed | 144781 | -| total_timesteps | 3408000 | -| train/ | | -| approx_kl | 0.046422306 | -| clip_fraction | 0.409 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0524 | -| learning_rate | 0.0003 | -| loss | 0.0273 | -| n_updates | 266240 | -| policy_gradient_loss | 0.0389 | -| std | 0.00592 | -| value_loss | 6.33e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26626 | -| time_elapsed | 144787 | -| total_timesteps | 3408128 | -| train/ | | -| approx_kl | 0.6566147 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00489 | -| learning_rate | 0.0003 | -| loss | 0.167 | -| n_updates | 266250 | -| policy_gradient_loss | 0.0549 | -| std | 0.00593 | -| value_loss | 3.47e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26627 | -| time_elapsed | 144796 | -| total_timesteps | 3408256 | -| train/ | | -| approx_kl | 0.019171458 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.718 | -| learning_rate | 0.0003 | -| loss | 0.0111 | -| n_updates | 266260 | -| policy_gradient_loss | 0.00849 | -| std | 0.00593 | -| value_loss | 0.0071 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26628 | -| time_elapsed | 144801 | -| total_timesteps | 3408384 | -| train/ | | -| approx_kl | 0.08653071 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.294 | -| learning_rate | 0.0003 | -| loss | 0.0433 | -| n_updates | 266270 | -| policy_gradient_loss | 0.0176 | -| std | 0.00592 | -| value_loss | 9.67e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26629 | -| time_elapsed | 144805 | -| total_timesteps | 3408512 | -| train/ | | -| approx_kl | 0.043496836 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.0085 | -| learning_rate | 0.0003 | -| loss | -0.00445 | -| n_updates | 266280 | -| policy_gradient_loss | -0.00104 | -| std | 0.00592 | -| value_loss | 1.57e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26630 | -| time_elapsed | 144810 | -| total_timesteps | 3408640 | -| train/ | | -| approx_kl | 0.009281054 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0303 | -| learning_rate | 0.0003 | -| loss | -0.024 | -| n_updates | 266290 | -| policy_gradient_loss | 0.00499 | -| std | 0.00592 | -| value_loss | 1.19e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26631 | -| time_elapsed | 144814 | -| total_timesteps | 3408768 | -| train/ | | -| approx_kl | 0.04369489 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0399 | -| learning_rate | 0.0003 | -| loss | 0.0314 | -| n_updates | 266300 | -| policy_gradient_loss | 0.111 | -| std | 0.00593 | -| value_loss | 7.59e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26632 | -| time_elapsed | 144817 | -| total_timesteps | 3408896 | -| train/ | | -| approx_kl | 0.1083526 | -| clip_fraction | 0.667 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0546 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 266310 | -| policy_gradient_loss | 0.119 | -| std | 0.00593 | -| value_loss | 7.07e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26633 | -| time_elapsed | 144820 | -| total_timesteps | 3409024 | -| train/ | | -| approx_kl | 0.02430651 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 266320 | -| policy_gradient_loss | 0.0302 | -| std | 0.00593 | -| value_loss | 6.59e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26634 | -| time_elapsed | 144831 | -| total_timesteps | 3409152 | -| train/ | | -| approx_kl | 0.2477412 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.893 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 266330 | -| policy_gradient_loss | 0.0069 | -| std | 0.00593 | -| value_loss | 0.0023 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26635 | -| time_elapsed | 144836 | -| total_timesteps | 3409280 | -| train/ | | -| approx_kl | 0.007366377 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00652 | -| learning_rate | 0.0003 | -| loss | -0.0121 | -| n_updates | 266340 | -| policy_gradient_loss | 0.0322 | -| std | 0.00593 | -| value_loss | 9.59e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26636 | -| time_elapsed | 144841 | -| total_timesteps | 3409408 | -| train/ | | -| approx_kl | 0.0037430278 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.00581 | -| learning_rate | 0.0003 | -| loss | -0.00263 | -| n_updates | 266350 | -| policy_gradient_loss | 0.0294 | -| std | 0.00593 | -| value_loss | 3.53e-06 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26637 | -| time_elapsed | 144845 | -| total_timesteps | 3409536 | -| train/ | | -| approx_kl | 0.4149929 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0789 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 266360 | -| policy_gradient_loss | 0.0554 | -| std | 0.00594 | -| value_loss | 1.91e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26638 | -| time_elapsed | 144850 | -| total_timesteps | 3409664 | -| train/ | | -| approx_kl | 0.0057959813 | -| clip_fraction | 0.202 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.105 | -| learning_rate | 0.0003 | -| loss | -0.00138 | -| n_updates | 266370 | -| policy_gradient_loss | 0.00641 | -| std | 0.00594 | -| value_loss | 1.4e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26639 | -| time_elapsed | 144855 | -| total_timesteps | 3409792 | -| train/ | | -| approx_kl | 0.114788085 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0838 | -| learning_rate | 0.0003 | -| loss | 0.0745 | -| n_updates | 266380 | -| policy_gradient_loss | 0.0307 | -| std | 0.00594 | -| value_loss | 1.03e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26640 | -| time_elapsed | 144859 | -| total_timesteps | 3409920 | -| train/ | | -| approx_kl | 0.013925666 | -| clip_fraction | 0.217 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0872 | -| learning_rate | 0.0003 | -| loss | -0.0263 | -| n_updates | 266390 | -| policy_gradient_loss | 0.000678 | -| std | 0.00594 | -| value_loss | 7.9e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26641 | -| time_elapsed | 144864 | -| total_timesteps | 3410048 | -| train/ | | -| approx_kl | 0.037544683 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0579 | -| learning_rate | 0.0003 | -| loss | 0.0446 | -| n_updates | 266400 | -| policy_gradient_loss | 0.125 | -| std | 0.00594 | -| value_loss | 6.69e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26642 | -| time_elapsed | 144874 | -| total_timesteps | 3410176 | -| train/ | | -| approx_kl | 0.014416242 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.0102 | -| n_updates | 266410 | -| policy_gradient_loss | 0.0256 | -| std | 0.00594 | -| value_loss | 0.000122 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26643 | -| time_elapsed | 144878 | -| total_timesteps | 3410304 | -| train/ | | -| approx_kl | 0.1597121 | -| clip_fraction | 0.352 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00541 | -| learning_rate | 0.0003 | -| loss | 0.0701 | -| n_updates | 266420 | -| policy_gradient_loss | 0.0192 | -| std | 0.00594 | -| value_loss | 1.02e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26644 | -| time_elapsed | 144882 | -| total_timesteps | 3410432 | -| train/ | | -| approx_kl | 0.014304119 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0123 | -| learning_rate | 0.0003 | -| loss | -0.0053 | -| n_updates | 266430 | -| policy_gradient_loss | -0.00313 | -| std | 0.00594 | -| value_loss | 4.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26645 | -| time_elapsed | 144888 | -| total_timesteps | 3410560 | -| train/ | | -| approx_kl | 0.03142072 | -| clip_fraction | 0.487 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0567 | -| learning_rate | 0.0003 | -| loss | -0.0207 | -| n_updates | 266440 | -| policy_gradient_loss | 0.0171 | -| std | 0.00594 | -| value_loss | 3.72e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26646 | -| time_elapsed | 144892 | -| total_timesteps | 3410688 | -| train/ | | -| approx_kl | 0.14611992 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | 0.0443 | -| n_updates | 266450 | -| policy_gradient_loss | 0.0275 | -| std | 0.00594 | -| value_loss | 3.43e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26647 | -| time_elapsed | 144896 | -| total_timesteps | 3410816 | -| train/ | | -| approx_kl | 0.02659002 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 266460 | -| policy_gradient_loss | -0.0133 | -| std | 0.00594 | -| value_loss | 2.73e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26648 | -| time_elapsed | 144900 | -| total_timesteps | 3410944 | -| train/ | | -| approx_kl | 0.24762878 | -| clip_fraction | 0.33 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0714 | -| n_updates | 266470 | -| policy_gradient_loss | 0.0144 | -| std | 0.00594 | -| value_loss | 1.86e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26649 | -| time_elapsed | 144906 | -| total_timesteps | 3411072 | -| train/ | | -| approx_kl | 0.01826919 | -| clip_fraction | 0.437 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0529 | -| learning_rate | 0.0003 | -| loss | 0.00434 | -| n_updates | 266480 | -| policy_gradient_loss | 0.0357 | -| std | 0.00594 | -| value_loss | 1.42e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26650 | -| time_elapsed | 144913 | -| total_timesteps | 3411200 | -| train/ | | -| approx_kl | 0.31657583 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.941 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 266490 | -| policy_gradient_loss | 0.0912 | -| std | 0.00594 | -| value_loss | 0.00109 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26651 | -| time_elapsed | 144917 | -| total_timesteps | 3411328 | -| train/ | | -| approx_kl | 0.1519652 | -| clip_fraction | 0.325 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0254 | -| learning_rate | 0.0003 | -| loss | 0.0825 | -| n_updates | 266500 | -| policy_gradient_loss | 0.036 | -| std | 0.00594 | -| value_loss | 1.23e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26652 | -| time_elapsed | 144922 | -| total_timesteps | 3411456 | -| train/ | | -| approx_kl | 0.008242616 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.00529 | -| learning_rate | 0.0003 | -| loss | 0.0137 | -| n_updates | 266510 | -| policy_gradient_loss | 0.0104 | -| std | 0.00594 | -| value_loss | 1.83e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26653 | -| time_elapsed | 144926 | -| total_timesteps | 3411584 | -| train/ | | -| approx_kl | 0.0893206 | -| clip_fraction | 0.386 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | 0.00856 | -| n_updates | 266520 | -| policy_gradient_loss | 0.0266 | -| std | 0.00594 | -| value_loss | 1.69e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26654 | -| time_elapsed | 144930 | -| total_timesteps | 3411712 | -| train/ | | -| approx_kl | 0.16129713 | -| clip_fraction | 0.331 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | 0.08 | -| n_updates | 266530 | -| policy_gradient_loss | 0.026 | -| std | 0.00594 | -| value_loss | 1.12e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26655 | -| time_elapsed | 144933 | -| total_timesteps | 3411840 | -| train/ | | -| approx_kl | 0.01891245 | -| clip_fraction | 0.173 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0715 | -| learning_rate | 0.0003 | -| loss | 0.007 | -| n_updates | 266540 | -| policy_gradient_loss | 0.00318 | -| std | 0.00594 | -| value_loss | 7.45e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26656 | -| time_elapsed | 144937 | -| total_timesteps | 3411968 | -| train/ | | -| approx_kl | 0.014563533 | -| clip_fraction | 0.13 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0884 | -| learning_rate | 0.0003 | -| loss | 0.0064 | -| n_updates | 266550 | -| policy_gradient_loss | 0.00307 | -| std | 0.00595 | -| value_loss | 4.7e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26657 | -| time_elapsed | 144942 | -| total_timesteps | 3412096 | -| train/ | | -| approx_kl | 0.015087657 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.00196 | -| n_updates | 266560 | -| policy_gradient_loss | 0.000931 | -| std | 0.00595 | -| value_loss | 3.69e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26658 | -| time_elapsed | 144951 | -| total_timesteps | 3412224 | -| train/ | | -| approx_kl | 0.02988941 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.953 | -| learning_rate | 0.0003 | -| loss | -0.00608 | -| n_updates | 266570 | -| policy_gradient_loss | 0.0156 | -| std | 0.00595 | -| value_loss | 0.000885 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26659 | -| time_elapsed | 144955 | -| total_timesteps | 3412352 | -| train/ | | -| approx_kl | 0.4640411 | -| clip_fraction | 0.709 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | 0.214 | -| n_updates | 266580 | -| policy_gradient_loss | 0.136 | -| std | 0.00595 | -| value_loss | 8.72e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26660 | -| time_elapsed | 144959 | -| total_timesteps | 3412480 | -| train/ | | -| approx_kl | 0.26954812 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0127 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 266590 | -| policy_gradient_loss | 0.154 | -| std | 0.00595 | -| value_loss | 1.7e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26661 | -| time_elapsed | 144965 | -| total_timesteps | 3412608 | -| train/ | | -| approx_kl | 0.046362177 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00715 | -| learning_rate | 0.0003 | -| loss | 0.0267 | -| n_updates | 266600 | -| policy_gradient_loss | 0.029 | -| std | 0.00595 | -| value_loss | 8.81e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26662 | -| time_elapsed | 144969 | -| total_timesteps | 3412736 | -| train/ | | -| approx_kl | 0.0012673372 | -| clip_fraction | 0.388 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0486 | -| learning_rate | 0.0003 | -| loss | 0.000289 | -| n_updates | 266610 | -| policy_gradient_loss | 0.0312 | -| std | 0.00596 | -| value_loss | 4.6e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26663 | -| time_elapsed | 144975 | -| total_timesteps | 3412864 | -| train/ | | -| approx_kl | 0.6699495 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.143 | -| learning_rate | 0.0003 | -| loss | 0.233 | -| n_updates | 266620 | -| policy_gradient_loss | 0.0678 | -| std | 0.00596 | -| value_loss | 7.95e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26664 | -| time_elapsed | 144978 | -| total_timesteps | 3412992 | -| train/ | | -| approx_kl | 0.014524331 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.016 | -| learning_rate | 0.0003 | -| loss | -0.00278 | -| n_updates | 266630 | -| policy_gradient_loss | 0.0116 | -| std | 0.00596 | -| value_loss | 3.11e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26665 | -| time_elapsed | 144982 | -| total_timesteps | 3413120 | -| train/ | | -| approx_kl | 0.08339009 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0559 | -| learning_rate | 0.0003 | -| loss | 0.0503 | -| n_updates | 266640 | -| policy_gradient_loss | 0.0209 | -| std | 0.00596 | -| value_loss | 1.99e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26666 | -| time_elapsed | 144995 | -| total_timesteps | 3413248 | -| train/ | | -| approx_kl | 0.04890165 | -| clip_fraction | 0.336 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.936 | -| learning_rate | 0.0003 | -| loss | -0.0297 | -| n_updates | 266650 | -| policy_gradient_loss | -0.0197 | -| std | 0.00596 | -| value_loss | 0.000436 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26667 | -| time_elapsed | 145000 | -| total_timesteps | 3413376 | -| train/ | | -| approx_kl | 0.097982764 | -| clip_fraction | 0.691 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.00821 | -| learning_rate | 0.0003 | -| loss | 0.102 | -| n_updates | 266660 | -| policy_gradient_loss | 0.103 | -| std | 0.00596 | -| value_loss | 2.17e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26668 | -| time_elapsed | 145004 | -| total_timesteps | 3413504 | -| train/ | | -| approx_kl | 0.119806364 | -| clip_fraction | 0.679 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0181 | -| learning_rate | 0.0003 | -| loss | 0.13 | -| n_updates | 266670 | -| policy_gradient_loss | 0.102 | -| std | 0.00596 | -| value_loss | 7.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26669 | -| time_elapsed | 145008 | -| total_timesteps | 3413632 | -| train/ | | -| approx_kl | 0.14079104 | -| clip_fraction | 0.7 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00688 | -| learning_rate | 0.0003 | -| loss | 0.0846 | -| n_updates | 266680 | -| policy_gradient_loss | 0.133 | -| std | 0.00597 | -| value_loss | 2.97e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26670 | -| time_elapsed | 145012 | -| total_timesteps | 3413760 | -| train/ | | -| approx_kl | 0.12474051 | -| clip_fraction | 0.684 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0691 | -| learning_rate | 0.0003 | -| loss | 0.138 | -| n_updates | 266690 | -| policy_gradient_loss | 0.127 | -| std | 0.00597 | -| value_loss | 3.11e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26671 | -| time_elapsed | 145016 | -| total_timesteps | 3413888 | -| train/ | | -| approx_kl | 0.033104338 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00909 | -| n_updates | 266700 | -| policy_gradient_loss | 0.0344 | -| std | 0.00597 | -| value_loss | 2.65e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26672 | -| time_elapsed | 145020 | -| total_timesteps | 3414016 | -| train/ | | -| approx_kl | 0.5681969 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0338 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 266710 | -| policy_gradient_loss | 0.0524 | -| std | 0.00597 | -| value_loss | 2.16e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26673 | -| time_elapsed | 145030 | -| total_timesteps | 3414144 | -| train/ | | -| approx_kl | 0.009595177 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.835 | -| learning_rate | 0.0003 | -| loss | -0.00921 | -| n_updates | 266720 | -| policy_gradient_loss | -0.00377 | -| std | 0.00597 | -| value_loss | 0.00494 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26674 | -| time_elapsed | 145035 | -| total_timesteps | 3414272 | -| train/ | | -| approx_kl | 0.11724339 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.018 | -| learning_rate | 0.0003 | -| loss | 0.000947 | -| n_updates | 266730 | -| policy_gradient_loss | 0.000764 | -| std | 0.00597 | -| value_loss | 0.000785 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26675 | -| time_elapsed | 145039 | -| total_timesteps | 3414400 | -| train/ | | -| approx_kl | 0.3202954 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.00971 | -| learning_rate | 0.0003 | -| loss | 0.252 | -| n_updates | 266740 | -| policy_gradient_loss | 0.0474 | -| std | 0.00596 | -| value_loss | 9.89e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26676 | -| time_elapsed | 145045 | -| total_timesteps | 3414528 | -| train/ | | -| approx_kl | 0.006670741 | -| clip_fraction | 0.136 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0224 | -| learning_rate | 0.0003 | -| loss | -0.00252 | -| n_updates | 266750 | -| policy_gradient_loss | 0.000308 | -| std | 0.00595 | -| value_loss | 0.000416 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26677 | -| time_elapsed | 145048 | -| total_timesteps | 3414656 | -| train/ | | -| approx_kl | 0.1184033 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -2.77 | -| learning_rate | 0.0003 | -| loss | 0.0468 | -| n_updates | 266760 | -| policy_gradient_loss | 0.0107 | -| std | 0.00594 | -| value_loss | 3.42e-06 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26678 | -| time_elapsed | 145052 | -| total_timesteps | 3414784 | -| train/ | | -| approx_kl | 0.0037929518 | -| clip_fraction | 0.05 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | -0.00159 | -| n_updates | 266770 | -| policy_gradient_loss | 0.00077 | -| std | 0.00594 | -| value_loss | 1.42e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26679 | -| time_elapsed | 145058 | -| total_timesteps | 3414912 | -| train/ | | -| approx_kl | 0.047434565 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.113 | -| learning_rate | 0.0003 | -| loss | 0.00601 | -| n_updates | 266780 | -| policy_gradient_loss | 0.0279 | -| std | 0.00594 | -| value_loss | 2.39e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26680 | -| time_elapsed | 145062 | -| total_timesteps | 3415040 | -| train/ | | -| approx_kl | 0.3681851 | -| clip_fraction | 0.75 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0043 | -| learning_rate | 0.0003 | -| loss | 0.287 | -| n_updates | 266790 | -| policy_gradient_loss | 0.195 | -| std | 0.00595 | -| value_loss | 1.51e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26681 | -| time_elapsed | 145070 | -| total_timesteps | 3415168 | -| train/ | | -| approx_kl | 0.05496225 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | 0.586 | -| learning_rate | 0.0003 | -| loss | 0.0283 | -| n_updates | 266800 | -| policy_gradient_loss | 0.0128 | -| std | 0.00595 | -| value_loss | 0.0236 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26682 | -| time_elapsed | 145074 | -| total_timesteps | 3415296 | -| train/ | | -| approx_kl | 0.00032183388 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -1.31 | -| learning_rate | 0.0003 | -| loss | -0.00261 | -| n_updates | 266810 | -| policy_gradient_loss | 0.00349 | -| std | 0.00595 | -| value_loss | 0.000391 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26683 | -| time_elapsed | 145077 | -| total_timesteps | 3415424 | -| train/ | | -| approx_kl | 0.054139137 | -| clip_fraction | 0.459 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0168 | -| learning_rate | 0.0003 | -| loss | 0.00846 | -| n_updates | 266820 | -| policy_gradient_loss | 0.0479 | -| std | 0.00595 | -| value_loss | 6.23e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26684 | -| time_elapsed | 145083 | -| total_timesteps | 3415552 | -| train/ | | -| approx_kl | 0.16143277 | -| clip_fraction | 0.514 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0184 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 266830 | -| policy_gradient_loss | 0.0695 | -| std | 0.00595 | -| value_loss | 2.65e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26685 | -| time_elapsed | 145087 | -| total_timesteps | 3415680 | -| train/ | | -| approx_kl | 0.00021703122 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.0998 | -| learning_rate | 0.0003 | -| loss | 0.00044 | -| n_updates | 266840 | -| policy_gradient_loss | 0.0168 | -| std | 0.00596 | -| value_loss | 6.61e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26686 | -| time_elapsed | 145092 | -| total_timesteps | 3415808 | -| train/ | | -| approx_kl | 0.2497249 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -1.12 | -| learning_rate | 0.0003 | -| loss | 0.179 | -| n_updates | 266850 | -| policy_gradient_loss | 0.0434 | -| std | 0.00597 | -| value_loss | 1.2e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26687 | -| time_elapsed | 145098 | -| total_timesteps | 3415936 | -| train/ | | -| approx_kl | 0.58750975 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.524 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 266860 | -| policy_gradient_loss | 0.0575 | -| std | 0.00597 | -| value_loss | 1.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26688 | -| time_elapsed | 145102 | -| total_timesteps | 3416064 | -| train/ | | -| approx_kl | 0.051593877 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | -0.0022 | -| n_updates | 266870 | -| policy_gradient_loss | 0.000356 | -| std | 0.00597 | -| value_loss | 1.33e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26689 | -| time_elapsed | 145110 | -| total_timesteps | 3416192 | -| train/ | | -| approx_kl | 0.025271887 | -| clip_fraction | 0.246 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.629 | -| learning_rate | 0.0003 | -| loss | 0.00607 | -| n_updates | 266880 | -| policy_gradient_loss | 0.00996 | -| std | 0.00597 | -| value_loss | 0.0066 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26690 | -| time_elapsed | 145115 | -| total_timesteps | 3416320 | -| train/ | | -| approx_kl | 0.10163754 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.322 | -| learning_rate | 0.0003 | -| loss | 0.0445 | -| n_updates | 266890 | -| policy_gradient_loss | 0.0174 | -| std | 0.00597 | -| value_loss | 0.000128 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26691 | -| time_elapsed | 145118 | -| total_timesteps | 3416448 | -| train/ | | -| approx_kl | 0.014405383 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.017 | -| learning_rate | 0.0003 | -| loss | -0.00805 | -| n_updates | 266900 | -| policy_gradient_loss | 0.00726 | -| std | 0.00597 | -| value_loss | 1.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26692 | -| time_elapsed | 145123 | -| total_timesteps | 3416576 | -| train/ | | -| approx_kl | 0.080850974 | -| clip_fraction | 0.313 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0474 | -| n_updates | 266910 | -| policy_gradient_loss | 0.0191 | -| std | 0.00597 | -| value_loss | 1.04e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26693 | -| time_elapsed | 145127 | -| total_timesteps | 3416704 | -| train/ | | -| approx_kl | 0.047332898 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0721 | -| learning_rate | 0.0003 | -| loss | 0.0343 | -| n_updates | 266920 | -| policy_gradient_loss | 0.0175 | -| std | 0.00596 | -| value_loss | 5.95e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26694 | -| time_elapsed | 145131 | -| total_timesteps | 3416832 | -| train/ | | -| approx_kl | 0.008759918 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.126 | -| learning_rate | 0.0003 | -| loss | -0.00394 | -| n_updates | 266930 | -| policy_gradient_loss | 0.0052 | -| std | 0.00596 | -| value_loss | 4.16e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26695 | -| time_elapsed | 145135 | -| total_timesteps | 3416960 | -| train/ | | -| approx_kl | 0.092619814 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0892 | -| learning_rate | 0.0003 | -| loss | 0.0502 | -| n_updates | 266940 | -| policy_gradient_loss | 0.0201 | -| std | 0.00596 | -| value_loss | 3.1e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26696 | -| time_elapsed | 145139 | -| total_timesteps | 3417088 | -| train/ | | -| approx_kl | 0.00060629286 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.0739 | -| learning_rate | 0.0003 | -| loss | -0.00486 | -| n_updates | 266950 | -| policy_gradient_loss | -0.00055 | -| std | 0.00596 | -| value_loss | 2.22e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26697 | -| time_elapsed | 145149 | -| total_timesteps | 3417216 | -| train/ | | -| approx_kl | 0.0046276287 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.872 | -| learning_rate | 0.0003 | -| loss | -0.00515 | -| n_updates | 266960 | -| policy_gradient_loss | 0.00546 | -| std | 0.00596 | -| value_loss | 0.00417 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26698 | -| time_elapsed | 145154 | -| total_timesteps | 3417344 | -| train/ | | -| approx_kl | 0.021922946 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | -0.906 | -| learning_rate | 0.0003 | -| loss | 0.0115 | -| n_updates | 266970 | -| policy_gradient_loss | 0.0135 | -| std | 0.00596 | -| value_loss | 0.000162 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26699 | -| time_elapsed | 145160 | -| total_timesteps | 3417472 | -| train/ | | -| approx_kl | 0.0008235518 | -| clip_fraction | 0.206 | -| clip_range | 0.2 | -| entropy_loss | 3.7 | -| explained_variance | 0.0122 | -| learning_rate | 0.0003 | -| loss | -0.000518 | -| n_updates | 266980 | -| policy_gradient_loss | 0.018 | -| std | 0.00594 | -| value_loss | 2.22e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26700 | -| time_elapsed | 145164 | -| total_timesteps | 3417600 | -| train/ | | -| approx_kl | 0.0036631646 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.71 | -| explained_variance | -0.402 | -| learning_rate | 0.0003 | -| loss | 0.00295 | -| n_updates | 266990 | -| policy_gradient_loss | 0.0433 | -| std | 0.00589 | -| value_loss | 0.00326 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26701 | -| time_elapsed | 145169 | -| total_timesteps | 3417728 | -| train/ | | -| approx_kl | 0.80320525 | -| clip_fraction | 0.77 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.74 | -| learning_rate | 0.0003 | -| loss | 0.222 | -| n_updates | 267000 | -| policy_gradient_loss | 0.17 | -| std | 0.00587 | -| value_loss | 5.7e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26702 | -| time_elapsed | 145173 | -| total_timesteps | 3417856 | -| train/ | | -| approx_kl | 0.016656315 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.35 | -| learning_rate | 0.0003 | -| loss | -0.0027 | -| n_updates | 267010 | -| policy_gradient_loss | 0.0307 | -| std | 0.00587 | -| value_loss | 1.2e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26703 | -| time_elapsed | 145177 | -| total_timesteps | 3417984 | -| train/ | | -| approx_kl | 0.31997874 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0753 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 267020 | -| policy_gradient_loss | 0.121 | -| std | 0.00587 | -| value_loss | 9.9e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26704 | -| time_elapsed | 145181 | -| total_timesteps | 3418112 | -| train/ | | -| approx_kl | 0.0504004 | -| clip_fraction | 0.353 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0532 | -| learning_rate | 0.0003 | -| loss | 0.0139 | -| n_updates | 267030 | -| policy_gradient_loss | 0.0187 | -| std | 0.00587 | -| value_loss | 8.43e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26705 | -| time_elapsed | 145192 | -| total_timesteps | 3418240 | -| train/ | | -| approx_kl | 0.16177987 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.787 | -| learning_rate | 0.0003 | -| loss | 0.0252 | -| n_updates | 267040 | -| policy_gradient_loss | 0.022 | -| std | 0.00587 | -| value_loss | 0.00893 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26706 | -| time_elapsed | 145198 | -| total_timesteps | 3418368 | -| train/ | | -| approx_kl | 0.24474739 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -10.4 | -| learning_rate | 0.0003 | -| loss | 0.0989 | -| n_updates | 267050 | -| policy_gradient_loss | 0.0184 | -| std | 0.00587 | -| value_loss | 4.6e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26707 | -| time_elapsed | 145203 | -| total_timesteps | 3418496 | -| train/ | | -| approx_kl | 0.0016281302 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.92 | -| learning_rate | 0.0003 | -| loss | 0.00101 | -| n_updates | 267060 | -| policy_gradient_loss | 0.024 | -| std | 0.00587 | -| value_loss | 8.65e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26708 | -| time_elapsed | 145207 | -| total_timesteps | 3418624 | -| train/ | | -| approx_kl | 0.7911657 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0335 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 267070 | -| policy_gradient_loss | 0.0857 | -| std | 0.00587 | -| value_loss | 2.7e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26709 | -| time_elapsed | 145212 | -| total_timesteps | 3418752 | -| train/ | | -| approx_kl | 0.053811964 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0695 | -| learning_rate | 0.0003 | -| loss | 0.0152 | -| n_updates | 267080 | -| policy_gradient_loss | 0.00674 | -| std | 0.00587 | -| value_loss | 2.62e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26710 | -| time_elapsed | 145218 | -| total_timesteps | 3418880 | -| train/ | | -| approx_kl | 0.057566866 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | -0.015 | -| n_updates | 267090 | -| policy_gradient_loss | -0.00673 | -| std | 0.00587 | -| value_loss | 2.2e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26711 | -| time_elapsed | 145222 | -| total_timesteps | 3419008 | -| train/ | | -| approx_kl | 0.0721174 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.038 | -| learning_rate | 0.0003 | -| loss | 0.037 | -| n_updates | 267100 | -| policy_gradient_loss | 0.0178 | -| std | 0.00587 | -| value_loss | 1.53e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26712 | -| time_elapsed | 145234 | -| total_timesteps | 3419136 | -| train/ | | -| approx_kl | 0.015463032 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 267110 | -| policy_gradient_loss | -0.00791 | -| std | 0.00587 | -| value_loss | 0.000412 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26713 | -| time_elapsed | 145239 | -| total_timesteps | 3419264 | -| train/ | | -| approx_kl | 0.013037387 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.16 | -| learning_rate | 0.0003 | -| loss | -0.00189 | -| n_updates | 267120 | -| policy_gradient_loss | 0.0056 | -| std | 0.00587 | -| value_loss | 0.00195 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26714 | -| time_elapsed | 145245 | -| total_timesteps | 3419392 | -| train/ | | -| approx_kl | 0.026534688 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.44 | -| learning_rate | 0.0003 | -| loss | 0.00977 | -| n_updates | 267130 | -| policy_gradient_loss | 0.00802 | -| std | 0.00588 | -| value_loss | 6.43e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26715 | -| time_elapsed | 145249 | -| total_timesteps | 3419520 | -| train/ | | -| approx_kl | 0.076061204 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00596 | -| learning_rate | 0.0003 | -| loss | 0.0407 | -| n_updates | 267140 | -| policy_gradient_loss | 0.0165 | -| std | 0.00588 | -| value_loss | 6.24e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26716 | -| time_elapsed | 145253 | -| total_timesteps | 3419648 | -| train/ | | -| approx_kl | 0.051788375 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0605 | -| learning_rate | 0.0003 | -| loss | 0.0142 | -| n_updates | 267150 | -| policy_gradient_loss | 0.00771 | -| std | 0.00588 | -| value_loss | 5.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26717 | -| time_elapsed | 145256 | -| total_timesteps | 3419776 | -| train/ | | -| approx_kl | 0.000171524 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0526 | -| learning_rate | 0.0003 | -| loss | -0.00105 | -| n_updates | 267160 | -| policy_gradient_loss | 0.0121 | -| std | 0.00586 | -| value_loss | 0.000123 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26718 | -| time_elapsed | 145261 | -| total_timesteps | 3419904 | -| train/ | | -| approx_kl | 0.07789244 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -13.4 | -| learning_rate | 0.0003 | -| loss | -0.00425 | -| n_updates | 267170 | -| policy_gradient_loss | -0.00493 | -| std | 0.00585 | -| value_loss | 0.000171 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26719 | -| time_elapsed | 145266 | -| total_timesteps | 3420032 | -| train/ | | -| approx_kl | 0.24559176 | -| clip_fraction | 0.349 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.381 | -| learning_rate | 0.0003 | -| loss | 0.0769 | -| n_updates | 267180 | -| policy_gradient_loss | 0.0194 | -| std | 0.00585 | -| value_loss | 2.72e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26720 | -| time_elapsed | 145276 | -| total_timesteps | 3420160 | -| train/ | | -| approx_kl | 0.027053656 | -| clip_fraction | 0.171 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.658 | -| learning_rate | 0.0003 | -| loss | 0.0108 | -| n_updates | 267190 | -| policy_gradient_loss | -0.00134 | -| std | 0.00585 | -| value_loss | 0.00847 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26721 | -| time_elapsed | 145280 | -| total_timesteps | 3420288 | -| train/ | | -| approx_kl | 0.024401601 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00574 | -| learning_rate | 0.0003 | -| loss | 0.0138 | -| n_updates | 267200 | -| policy_gradient_loss | 0.0452 | -| std | 0.00585 | -| value_loss | 0.0045 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26722 | -| time_elapsed | 145285 | -| total_timesteps | 3420416 | -| train/ | | -| approx_kl | 0.17461923 | -| clip_fraction | 0.34 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0459 | -| learning_rate | 0.0003 | -| loss | 0.101 | -| n_updates | 267210 | -| policy_gradient_loss | 0.051 | -| std | 0.00585 | -| value_loss | 9.96e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26723 | -| time_elapsed | 145290 | -| total_timesteps | 3420544 | -| train/ | | -| approx_kl | 1.0694843e-05 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0168 | -| learning_rate | 0.0003 | -| loss | -0.000381 | -| n_updates | 267220 | -| policy_gradient_loss | 0.0388 | -| std | 0.00585 | -| value_loss | 4.54e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26724 | -| time_elapsed | 145295 | -| total_timesteps | 3420672 | -| train/ | | -| approx_kl | 0.88712436 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0139 | -| learning_rate | 0.0003 | -| loss | 0.29 | -| n_updates | 267230 | -| policy_gradient_loss | 0.0786 | -| std | 0.00585 | -| value_loss | 3.3e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26725 | -| time_elapsed | 145299 | -| total_timesteps | 3420800 | -| train/ | | -| approx_kl | 0.011603127 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.028 | -| learning_rate | 0.0003 | -| loss | -0.000713 | -| n_updates | 267240 | -| policy_gradient_loss | 0.0127 | -| std | 0.00584 | -| value_loss | 2.5e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26726 | -| time_elapsed | 145305 | -| total_timesteps | 3420928 | -| train/ | | -| approx_kl | 0.007744998 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | 0.00658 | -| n_updates | 267250 | -| policy_gradient_loss | 0.0155 | -| std | 0.00585 | -| value_loss | 1.94e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26727 | -| time_elapsed | 145309 | -| total_timesteps | 3421056 | -| train/ | | -| approx_kl | 0.06463313 | -| clip_fraction | 0.436 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0467 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 267260 | -| policy_gradient_loss | 0.0372 | -| std | 0.00585 | -| value_loss | 1.52e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26728 | -| time_elapsed | 145317 | -| total_timesteps | 3421184 | -| train/ | | -| approx_kl | 0.47390246 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.972 | -| learning_rate | 0.0003 | -| loss | 0.0581 | -| n_updates | 267270 | -| policy_gradient_loss | 0.0144 | -| std | 0.00585 | -| value_loss | 0.00391 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26729 | -| time_elapsed | 145322 | -| total_timesteps | 3421312 | -| train/ | | -| approx_kl | 0.014231076 | -| clip_fraction | 0.269 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -7.89 | -| learning_rate | 0.0003 | -| loss | -0.0128 | -| n_updates | 267280 | -| policy_gradient_loss | -0.000477 | -| std | 0.00585 | -| value_loss | 0.00169 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26730 | -| time_elapsed | 145325 | -| total_timesteps | 3421440 | -| train/ | | -| approx_kl | 0.22562695 | -| clip_fraction | 0.407 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.642 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 267290 | -| policy_gradient_loss | 0.0581 | -| std | 0.00586 | -| value_loss | 0.00546 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26731 | -| time_elapsed | 145331 | -| total_timesteps | 3421568 | -| train/ | | -| approx_kl | 0.35649443 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0709 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 267300 | -| policy_gradient_loss | 0.0491 | -| std | 0.00586 | -| value_loss | 0.00125 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26732 | -| time_elapsed | 145335 | -| total_timesteps | 3421696 | -| train/ | | -| approx_kl | 0.21807651 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00418 | -| learning_rate | 0.0003 | -| loss | 0.0672 | -| n_updates | 267310 | -| policy_gradient_loss | 0.0107 | -| std | 0.00586 | -| value_loss | 0.000793 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26733 | -| time_elapsed | 145340 | -| total_timesteps | 3421824 | -| train/ | | -| approx_kl | 0.2119245 | -| clip_fraction | 0.188 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0205 | -| learning_rate | 0.0003 | -| loss | 0.109 | -| n_updates | 267320 | -| policy_gradient_loss | 0.0193 | -| std | 0.00586 | -| value_loss | 0.000486 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26734 | -| time_elapsed | 145346 | -| total_timesteps | 3421952 | -| train/ | | -| approx_kl | 0.048064236 | -| clip_fraction | 0.466 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0774 | -| learning_rate | 0.0003 | -| loss | 0.003 | -| n_updates | 267330 | -| policy_gradient_loss | 0.036 | -| std | 0.00586 | -| value_loss | 0.00031 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26735 | -| time_elapsed | 145350 | -| total_timesteps | 3422080 | -| train/ | | -| approx_kl | 0.005996497 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0629 | -| learning_rate | 0.0003 | -| loss | -0.00807 | -| n_updates | 267340 | -| policy_gradient_loss | 0.0233 | -| std | 0.00586 | -| value_loss | 0.000321 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26736 | -| time_elapsed | 145360 | -| total_timesteps | 3422208 | -| train/ | | -| approx_kl | 0.015595527 | -| clip_fraction | 0.101 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.862 | -| learning_rate | 0.0003 | -| loss | -0.00939 | -| n_updates | 267350 | -| policy_gradient_loss | -0.00532 | -| std | 0.00586 | -| value_loss | 0.00164 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26737 | -| time_elapsed | 145365 | -| total_timesteps | 3422336 | -| train/ | | -| approx_kl | 0.03252823 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.112 | -| learning_rate | 0.0003 | -| loss | 0.0213 | -| n_updates | 267360 | -| policy_gradient_loss | 0.039 | -| std | 0.00587 | -| value_loss | 0.000103 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26738 | -| time_elapsed | 145370 | -| total_timesteps | 3422464 | -| train/ | | -| approx_kl | 0.4835752 | -| clip_fraction | 0.752 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0958 | -| learning_rate | 0.0003 | -| loss | 0.231 | -| n_updates | 267370 | -| policy_gradient_loss | 0.177 | -| std | 0.00587 | -| value_loss | 0.000117 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26739 | -| time_elapsed | 145375 | -| total_timesteps | 3422592 | -| train/ | | -| approx_kl | 0.05904275 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0382 | -| n_updates | 267380 | -| policy_gradient_loss | 0.0272 | -| std | 0.00586 | -| value_loss | 0.000249 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26740 | -| time_elapsed | 145379 | -| total_timesteps | 3422720 | -| train/ | | -| approx_kl | 0.88524294 | -| clip_fraction | 0.517 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 267390 | -| policy_gradient_loss | 0.0444 | -| std | 0.00586 | -| value_loss | 2.11e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26741 | -| time_elapsed | 145383 | -| total_timesteps | 3422848 | -| train/ | | -| approx_kl | 0.015665822 | -| clip_fraction | 0.249 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | -0.0122 | -| n_updates | 267400 | -| policy_gradient_loss | 0.00673 | -| std | 0.00586 | -| value_loss | 9.95e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26742 | -| time_elapsed | 145387 | -| total_timesteps | 3422976 | -| train/ | | -| approx_kl | 0.0043101315 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0704 | -| learning_rate | 0.0003 | -| loss | -0.01 | -| n_updates | 267410 | -| policy_gradient_loss | 0.0112 | -| std | 0.00586 | -| value_loss | 1.04e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26743 | -| time_elapsed | 145390 | -| total_timesteps | 3423104 | -| train/ | | -| approx_kl | 0.10527124 | -| clip_fraction | 0.283 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0339 | -| learning_rate | 0.0003 | -| loss | 0.0593 | -| n_updates | 267420 | -| policy_gradient_loss | 0.015 | -| std | 0.00586 | -| value_loss | 8.2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26744 | -| time_elapsed | 145400 | -| total_timesteps | 3423232 | -| train/ | | -| approx_kl | 0.003028696 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.879 | -| learning_rate | 0.0003 | -| loss | -0.00696 | -| n_updates | 267430 | -| policy_gradient_loss | 0.0455 | -| std | 0.00585 | -| value_loss | 0.0019 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26745 | -| time_elapsed | 145404 | -| total_timesteps | 3423360 | -| train/ | | -| approx_kl | 0.0007208772 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | 0.00149 | -| n_updates | 267440 | -| policy_gradient_loss | 0.0412 | -| std | 0.00585 | -| value_loss | 0.000757 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26746 | -| time_elapsed | 145407 | -| total_timesteps | 3423488 | -| train/ | | -| approx_kl | 0.00044963835 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.012 | -| learning_rate | 0.0003 | -| loss | -0.00119 | -| n_updates | 267450 | -| policy_gradient_loss | 0.031 | -| std | 0.00585 | -| value_loss | 0.000157 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26747 | -| time_elapsed | 145410 | -| total_timesteps | 3423616 | -| train/ | | -| approx_kl | 0.008845207 | -| clip_fraction | 0.389 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.02 | -| n_updates | 267460 | -| policy_gradient_loss | 0.0295 | -| std | 0.00585 | -| value_loss | 8.29e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26748 | -| time_elapsed | 145414 | -| total_timesteps | 3423744 | -| train/ | | -| approx_kl | 0.007614648 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0643 | -| learning_rate | 0.0003 | -| loss | -0.00601 | -| n_updates | 267470 | -| policy_gradient_loss | 0.0367 | -| std | 0.00585 | -| value_loss | 6.6e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26749 | -| time_elapsed | 145417 | -| total_timesteps | 3423872 | -| train/ | | -| approx_kl | 0.23977211 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0513 | -| learning_rate | 0.0003 | -| loss | 0.135 | -| n_updates | 267480 | -| policy_gradient_loss | 0.0707 | -| std | 0.00584 | -| value_loss | 4.98e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26750 | -| time_elapsed | 145420 | -| total_timesteps | 3424000 | -| train/ | | -| approx_kl | 0.046786536 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0591 | -| learning_rate | 0.0003 | -| loss | -0.00257 | -| n_updates | 267490 | -| policy_gradient_loss | 0.0253 | -| std | 0.00584 | -| value_loss | 4.58e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26751 | -| time_elapsed | 145424 | -| total_timesteps | 3424128 | -| train/ | | -| approx_kl | 0.1569432 | -| clip_fraction | 0.507 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00497 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 267500 | -| policy_gradient_loss | 0.0555 | -| std | 0.00584 | -| value_loss | 0.000253 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26752 | -| time_elapsed | 145433 | -| total_timesteps | 3424256 | -| train/ | | -| approx_kl | 0.040423334 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.776 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 267510 | -| policy_gradient_loss | 0.00912 | -| std | 0.00584 | -| value_loss | 0.00744 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26753 | -| time_elapsed | 145437 | -| total_timesteps | 3424384 | -| train/ | | -| approx_kl | 0.12408837 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0174 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 267520 | -| policy_gradient_loss | -0.000761 | -| std | 0.00584 | -| value_loss | 0.000135 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26754 | -| time_elapsed | 145439 | -| total_timesteps | 3424512 | -| train/ | | -| approx_kl | 0.015556637 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0154 | -| learning_rate | 0.0003 | -| loss | 0.00455 | -| n_updates | 267530 | -| policy_gradient_loss | 0.013 | -| std | 0.00584 | -| value_loss | 7.58e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26755 | -| time_elapsed | 145442 | -| total_timesteps | 3424640 | -| train/ | | -| approx_kl | 0.003408723 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00755 | -| learning_rate | 0.0003 | -| loss | -0.000794 | -| n_updates | 267540 | -| policy_gradient_loss | 0.00903 | -| std | 0.00584 | -| value_loss | 4.21e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26756 | -| time_elapsed | 145444 | -| total_timesteps | 3424768 | -| train/ | | -| approx_kl | 0.0005663256 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0454 | -| learning_rate | 0.0003 | -| loss | -0.000781 | -| n_updates | 267550 | -| policy_gradient_loss | 0.0187 | -| std | 0.00584 | -| value_loss | 2.82e-05 | ------------------------------------------- --------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26757 | -| time_elapsed | 145448 | -| total_timesteps | 3424896 | -| train/ | | -| approx_kl | 0.000100643374 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | -0.000201 | -| n_updates | 267560 | -| policy_gradient_loss | 0.0517 | -| std | 0.00584 | -| value_loss | 2.39e-05 | --------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26758 | -| time_elapsed | 145452 | -| total_timesteps | 3425024 | -| train/ | | -| approx_kl | 0.21387723 | -| clip_fraction | 0.564 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0476 | -| learning_rate | 0.0003 | -| loss | 0.144 | -| n_updates | 267570 | -| policy_gradient_loss | 0.0773 | -| std | 0.00584 | -| value_loss | 2.35e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26759 | -| time_elapsed | 145464 | -| total_timesteps | 3425152 | -| train/ | | -| approx_kl | 0.05581363 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.63 | -| learning_rate | 0.0003 | -| loss | -0.0217 | -| n_updates | 267580 | -| policy_gradient_loss | -0.0128 | -| std | 0.00584 | -| value_loss | 0.00429 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26760 | -| time_elapsed | 145468 | -| total_timesteps | 3425280 | -| train/ | | -| approx_kl | 0.089867674 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0406 | -| learning_rate | 0.0003 | -| loss | 0.0669 | -| n_updates | 267590 | -| policy_gradient_loss | 0.016 | -| std | 0.00584 | -| value_loss | 0.000276 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26761 | -| time_elapsed | 145474 | -| total_timesteps | 3425408 | -| train/ | | -| approx_kl | 0.012912777 | -| clip_fraction | 0.317 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | 0.00115 | -| n_updates | 267600 | -| policy_gradient_loss | 0.0289 | -| std | 0.00584 | -| value_loss | 1.01e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26762 | -| time_elapsed | 145479 | -| total_timesteps | 3425536 | -| train/ | | -| approx_kl | 0.20357245 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0166 | -| learning_rate | 0.0003 | -| loss | 0.0376 | -| n_updates | 267610 | -| policy_gradient_loss | 0.00722 | -| std | 0.00584 | -| value_loss | 6.29e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26763 | -| time_elapsed | 145484 | -| total_timesteps | 3425664 | -| train/ | | -| approx_kl | 0.07993417 | -| clip_fraction | 0.503 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.029 | -| learning_rate | 0.0003 | -| loss | 0.0409 | -| n_updates | 267620 | -| policy_gradient_loss | 0.047 | -| std | 0.00584 | -| value_loss | 5.66e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26764 | -| time_elapsed | 145489 | -| total_timesteps | 3425792 | -| train/ | | -| approx_kl | 0.33614588 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0255 | -| learning_rate | 0.0003 | -| loss | 0.202 | -| n_updates | 267630 | -| policy_gradient_loss | 0.14 | -| std | 0.00584 | -| value_loss | 4.91e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26765 | -| time_elapsed | 145493 | -| total_timesteps | 3425920 | -| train/ | | -| approx_kl | 0.27594113 | -| clip_fraction | 0.737 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0243 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 267640 | -| policy_gradient_loss | 0.199 | -| std | 0.00584 | -| value_loss | 4.8e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26766 | -| time_elapsed | 145498 | -| total_timesteps | 3426048 | -| train/ | | -| approx_kl | 0.042575102 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.00766 | -| n_updates | 267650 | -| policy_gradient_loss | 0.0274 | -| std | 0.00584 | -| value_loss | 4.37e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26767 | -| time_elapsed | 145507 | -| total_timesteps | 3426176 | -| train/ | | -| approx_kl | 0.3948656 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.79 | -| learning_rate | 0.0003 | -| loss | 0.0362 | -| n_updates | 267660 | -| policy_gradient_loss | 0.0151 | -| std | 0.00584 | -| value_loss | 0.00677 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26768 | -| time_elapsed | 145511 | -| total_timesteps | 3426304 | -| train/ | | -| approx_kl | 0.047090545 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00913 | -| learning_rate | 0.0003 | -| loss | 0.015 | -| n_updates | 267670 | -| policy_gradient_loss | 0.067 | -| std | 0.00584 | -| value_loss | 2.41e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26769 | -| time_elapsed | 145516 | -| total_timesteps | 3426432 | -| train/ | | -| approx_kl | 0.0055968678 | -| clip_fraction | 0.564 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0157 | -| learning_rate | 0.0003 | -| loss | -0.00649 | -| n_updates | 267680 | -| policy_gradient_loss | 0.0851 | -| std | 0.00584 | -| value_loss | 1.31e-05 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26770 | -| time_elapsed | 145521 | -| total_timesteps | 3426560 | -| train/ | | -| approx_kl | 3.2500186 | -| clip_fraction | 0.852 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00818 | -| learning_rate | 0.0003 | -| loss | 0.214 | -| n_updates | 267690 | -| policy_gradient_loss | 0.197 | -| std | 0.00586 | -| value_loss | 0.000148 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26771 | -| time_elapsed | 145524 | -| total_timesteps | 3426688 | -| train/ | | -| approx_kl | 0.044318203 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -44.5 | -| learning_rate | 0.0003 | -| loss | -0.00983 | -| n_updates | 267700 | -| policy_gradient_loss | 0.0133 | -| std | 0.00588 | -| value_loss | 1.68e-05 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26772 | -| time_elapsed | 145528 | -| total_timesteps | 3426816 | -| train/ | | -| approx_kl | 0.298633 | -| clip_fraction | 0.399 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 267710 | -| policy_gradient_loss | 0.0422 | -| std | 0.00588 | -| value_loss | 1.29e-06 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26773 | -| time_elapsed | 145532 | -| total_timesteps | 3426944 | -| train/ | | -| approx_kl | 0.01854151 | -| clip_fraction | 0.127 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0177 | -| learning_rate | 0.0003 | -| loss | 0.00199 | -| n_updates | 267720 | -| policy_gradient_loss | 0.000228 | -| std | 0.00588 | -| value_loss | 7.01e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26774 | -| time_elapsed | 145538 | -| total_timesteps | 3427072 | -| train/ | | -| approx_kl | 0.0139935985 | -| clip_fraction | 0.126 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | -0.00875 | -| n_updates | 267730 | -| policy_gradient_loss | -0.0047 | -| std | 0.00588 | -| value_loss | 5.45e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26775 | -| time_elapsed | 145546 | -| total_timesteps | 3427200 | -| train/ | | -| approx_kl | 0.043357603 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.839 | -| learning_rate | 0.0003 | -| loss | 0.00326 | -| n_updates | 267740 | -| policy_gradient_loss | 0.0155 | -| std | 0.00588 | -| value_loss | 0.00453 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26776 | -| time_elapsed | 145550 | -| total_timesteps | 3427328 | -| train/ | | -| approx_kl | 0.16505949 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0796 | -| learning_rate | 0.0003 | -| loss | 0.0836 | -| n_updates | 267750 | -| policy_gradient_loss | 0.0378 | -| std | 0.00588 | -| value_loss | 5.71e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26777 | -| time_elapsed | 145554 | -| total_timesteps | 3427456 | -| train/ | | -| approx_kl | 0.0007815296 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | -0.00183 | -| n_updates | 267760 | -| policy_gradient_loss | 0.0401 | -| std | 0.00588 | -| value_loss | 2.37e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26778 | -| time_elapsed | 145558 | -| total_timesteps | 3427584 | -| train/ | | -| approx_kl | 0.16458915 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00457 | -| learning_rate | 0.0003 | -| loss | 0.0879 | -| n_updates | 267770 | -| policy_gradient_loss | 0.0248 | -| std | 0.00588 | -| value_loss | 1.36e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26779 | -| time_elapsed | 145560 | -| total_timesteps | 3427712 | -| train/ | | -| approx_kl | 0.031842392 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 267780 | -| policy_gradient_loss | 0.0404 | -| std | 0.00588 | -| value_loss | 1.08e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26780 | -| time_elapsed | 145564 | -| total_timesteps | 3427840 | -| train/ | | -| approx_kl | 0.11133174 | -| clip_fraction | 0.318 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0345 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 267790 | -| policy_gradient_loss | 0.0222 | -| std | 0.00588 | -| value_loss | 9.77e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26781 | -| time_elapsed | 145569 | -| total_timesteps | 3427968 | -| train/ | | -| approx_kl | 0.00023816433 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0312 | -| learning_rate | 0.0003 | -| loss | -0.000427 | -| n_updates | 267800 | -| policy_gradient_loss | 0.046 | -| std | 0.00588 | -| value_loss | 7.24e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26782 | -| time_elapsed | 145574 | -| total_timesteps | 3428096 | -| train/ | | -| approx_kl | 0.58127624 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0369 | -| learning_rate | 0.0003 | -| loss | 0.203 | -| n_updates | 267810 | -| policy_gradient_loss | 0.0643 | -| std | 0.00588 | -| value_loss | 1.34e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26783 | -| time_elapsed | 145585 | -| total_timesteps | 3428224 | -| train/ | | -| approx_kl | 0.04733055 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.0167 | -| n_updates | 267820 | -| policy_gradient_loss | 0.0109 | -| std | 0.00588 | -| value_loss | 0.000257 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26784 | -| time_elapsed | 145590 | -| total_timesteps | 3428352 | -| train/ | | -| approx_kl | 0.10343303 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.166 | -| learning_rate | 0.0003 | -| loss | 0.0307 | -| n_updates | 267830 | -| policy_gradient_loss | 0.011 | -| std | 0.00588 | -| value_loss | 3.67e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26785 | -| time_elapsed | 145596 | -| total_timesteps | 3428480 | -| train/ | | -| approx_kl | 0.01631708 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0085 | -| learning_rate | 0.0003 | -| loss | -0.0032 | -| n_updates | 267840 | -| policy_gradient_loss | 0.00966 | -| std | 0.00588 | -| value_loss | 2.37e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26786 | -| time_elapsed | 145602 | -| total_timesteps | 3428608 | -| train/ | | -| approx_kl | 0.0029642098 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0132 | -| learning_rate | 0.0003 | -| loss | -0.00231 | -| n_updates | 267850 | -| policy_gradient_loss | 0.00826 | -| std | 0.00588 | -| value_loss | 1.61e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26787 | -| time_elapsed | 145606 | -| total_timesteps | 3428736 | -| train/ | | -| approx_kl | 0.044945046 | -| clip_fraction | 0.64 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.0497 | -| n_updates | 267860 | -| policy_gradient_loss | 0.119 | -| std | 0.00588 | -| value_loss | 1.1e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26788 | -| time_elapsed | 145611 | -| total_timesteps | 3428864 | -| train/ | | -| approx_kl | 0.124141574 | -| clip_fraction | 0.685 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.044 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 267870 | -| policy_gradient_loss | 0.118 | -| std | 0.00588 | -| value_loss | 1.12e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26789 | -| time_elapsed | 145615 | -| total_timesteps | 3428992 | -| train/ | | -| approx_kl | 0.13145818 | -| clip_fraction | 0.728 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0266 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 267880 | -| policy_gradient_loss | 0.125 | -| std | 0.00588 | -| value_loss | 1.06e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26790 | -| time_elapsed | 145620 | -| total_timesteps | 3429120 | -| train/ | | -| approx_kl | 0.027242457 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.0127 | -| n_updates | 267890 | -| policy_gradient_loss | 0.0273 | -| std | 0.00588 | -| value_loss | 8.71e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26791 | -| time_elapsed | 145631 | -| total_timesteps | 3429248 | -| train/ | | -| approx_kl | 0.0077384 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.814 | -| learning_rate | 0.0003 | -| loss | 0.00255 | -| n_updates | 267900 | -| policy_gradient_loss | 0.0167 | -| std | 0.00588 | -| value_loss | 0.00567 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26792 | -| time_elapsed | 145636 | -| total_timesteps | 3429376 | -| train/ | | -| approx_kl | 0.17415658 | -| clip_fraction | 0.354 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00295 | -| learning_rate | 0.0003 | -| loss | 0.0833 | -| n_updates | 267910 | -| policy_gradient_loss | 0.0247 | -| std | 0.00588 | -| value_loss | 1.04e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26793 | -| time_elapsed | 145641 | -| total_timesteps | 3429504 | -| train/ | | -| approx_kl | 0.030446794 | -| clip_fraction | 0.505 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0113 | -| learning_rate | 0.0003 | -| loss | 0.0118 | -| n_updates | 267920 | -| policy_gradient_loss | 0.0379 | -| std | 0.00588 | -| value_loss | 5.13e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26794 | -| time_elapsed | 145646 | -| total_timesteps | 3429632 | -| train/ | | -| approx_kl | 0.15712473 | -| clip_fraction | 0.343 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0147 | -| learning_rate | 0.0003 | -| loss | 0.094 | -| n_updates | 267930 | -| policy_gradient_loss | 0.0443 | -| std | 0.00588 | -| value_loss | 2.85e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26795 | -| time_elapsed | 145649 | -| total_timesteps | 3429760 | -| train/ | | -| approx_kl | 0.00020742137 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0619 | -| learning_rate | 0.0003 | -| loss | -0.000602 | -| n_updates | 267940 | -| policy_gradient_loss | 0.038 | -| std | 0.00588 | -| value_loss | 2.04e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26796 | -| time_elapsed | 145654 | -| total_timesteps | 3429888 | -| train/ | | -| approx_kl | 0.21831258 | -| clip_fraction | 0.361 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0533 | -| learning_rate | 0.0003 | -| loss | 0.0569 | -| n_updates | 267950 | -| policy_gradient_loss | 0.0182 | -| std | 0.00588 | -| value_loss | 2e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26797 | -| time_elapsed | 145658 | -| total_timesteps | 3430016 | -| train/ | | -| approx_kl | 0.023912655 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | 0.0151 | -| n_updates | 267960 | -| policy_gradient_loss | 0.00654 | -| std | 0.00586 | -| value_loss | 9.32e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26798 | -| time_elapsed | 145667 | -| total_timesteps | 3430144 | -| train/ | | -| approx_kl | 0.043761224 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 267970 | -| policy_gradient_loss | -0.0071 | -| std | 0.00585 | -| value_loss | 0.000218 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26799 | -| time_elapsed | 145671 | -| total_timesteps | 3430272 | -| train/ | | -| approx_kl | 0.09837498 | -| clip_fraction | 0.404 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0619 | -| learning_rate | 0.0003 | -| loss | 0.0663 | -| n_updates | 267980 | -| policy_gradient_loss | 0.0454 | -| std | 0.00585 | -| value_loss | 2.05e-05 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26800 | -| time_elapsed | 145677 | -| total_timesteps | 3430400 | -| train/ | | -| approx_kl | 1.2577511e-06 | -| clip_fraction | 0.558 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0355 | -| learning_rate | 0.0003 | -| loss | 1.14e-05 | -| n_updates | 267990 | -| policy_gradient_loss | 0.0899 | -| std | 0.00584 | -| value_loss | 2.01e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26801 | -| time_elapsed | 145682 | -| total_timesteps | 3430528 | -| train/ | | -| approx_kl | 0.02387162 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.496 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 268000 | -| policy_gradient_loss | 0.0382 | -| std | 0.00584 | -| value_loss | 9.49e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26802 | -| time_elapsed | 145687 | -| total_timesteps | 3430656 | -| train/ | | -| approx_kl | 0.14017858 | -| clip_fraction | 0.347 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.563 | -| learning_rate | 0.0003 | -| loss | 0.0627 | -| n_updates | 268010 | -| policy_gradient_loss | 0.0291 | -| std | 0.00584 | -| value_loss | 1.42e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26803 | -| time_elapsed | 145692 | -| total_timesteps | 3430784 | -| train/ | | -| approx_kl | 0.00025923178 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.187 | -| learning_rate | 0.0003 | -| loss | -0.00139 | -| n_updates | 268020 | -| policy_gradient_loss | 0.0318 | -| std | 0.00584 | -| value_loss | 9.7e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26804 | -| time_elapsed | 145698 | -| total_timesteps | 3430912 | -| train/ | | -| approx_kl | 0.7205974 | -| clip_fraction | 0.526 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0535 | -| learning_rate | 0.0003 | -| loss | 0.227 | -| n_updates | 268030 | -| policy_gradient_loss | 0.0758 | -| std | 0.00584 | -| value_loss | 9.07e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26805 | -| time_elapsed | 145702 | -| total_timesteps | 3431040 | -| train/ | | -| approx_kl | 0.05196315 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.035 | -| learning_rate | 0.0003 | -| loss | 0.0157 | -| n_updates | 268040 | -| policy_gradient_loss | 0.00873 | -| std | 0.00584 | -| value_loss | 8.19e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26806 | -| time_elapsed | 145710 | -| total_timesteps | 3431168 | -| train/ | | -| approx_kl | 0.083577864 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.849 | -| learning_rate | 0.0003 | -| loss | 0.00532 | -| n_updates | 268050 | -| policy_gradient_loss | -0.000549 | -| std | 0.00584 | -| value_loss | 0.00105 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26807 | -| time_elapsed | 145715 | -| total_timesteps | 3431296 | -| train/ | | -| approx_kl | 0.019868385 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.3 | -| learning_rate | 0.0003 | -| loss | -0.0061 | -| n_updates | 268060 | -| policy_gradient_loss | 0.00951 | -| std | 0.00584 | -| value_loss | 4.72e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26808 | -| time_elapsed | 145719 | -| total_timesteps | 3431424 | -| train/ | | -| approx_kl | 0.003526758 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00321 | -| learning_rate | 0.0003 | -| loss | -0.000939 | -| n_updates | 268070 | -| policy_gradient_loss | 0.00901 | -| std | 0.00584 | -| value_loss | 1.38e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26809 | -| time_elapsed | 145723 | -| total_timesteps | 3431552 | -| train/ | | -| approx_kl | 0.001517266 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00451 | -| learning_rate | 0.0003 | -| loss | -0.00294 | -| n_updates | 268080 | -| policy_gradient_loss | 0.0147 | -| std | 0.00584 | -| value_loss | 7.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26810 | -| time_elapsed | 145727 | -| total_timesteps | 3431680 | -| train/ | | -| approx_kl | 0.05741878 | -| clip_fraction | 0.668 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0307 | -| learning_rate | 0.0003 | -| loss | 0.0616 | -| n_updates | 268090 | -| policy_gradient_loss | 0.167 | -| std | 0.00584 | -| value_loss | 7.33e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26811 | -| time_elapsed | 145732 | -| total_timesteps | 3431808 | -| train/ | | -| approx_kl | 0.013156913 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0235 | -| learning_rate | 0.0003 | -| loss | -0.00584 | -| n_updates | 268100 | -| policy_gradient_loss | 0.0315 | -| std | 0.00584 | -| value_loss | 6.73e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26812 | -| time_elapsed | 145735 | -| total_timesteps | 3431936 | -| train/ | | -| approx_kl | 0.8671474 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 268110 | -| policy_gradient_loss | 0.0712 | -| std | 0.00584 | -| value_loss | 5.95e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26813 | -| time_elapsed | 145739 | -| total_timesteps | 3432064 | -| train/ | | -| approx_kl | 0.07630788 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0207 | -| learning_rate | 0.0003 | -| loss | 0.0447 | -| n_updates | 268120 | -| policy_gradient_loss | 0.0221 | -| std | 0.00584 | -| value_loss | 4.62e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26814 | -| time_elapsed | 145747 | -| total_timesteps | 3432192 | -| train/ | | -| approx_kl | 0.0108638955 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.875 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 268130 | -| policy_gradient_loss | -0.0125 | -| std | 0.00584 | -| value_loss | 0.00308 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26815 | -| time_elapsed | 145753 | -| total_timesteps | 3432320 | -| train/ | | -| approx_kl | 0.2656668 | -| clip_fraction | 0.75 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.201 | -| learning_rate | 0.0003 | -| loss | 0.217 | -| n_updates | 268140 | -| policy_gradient_loss | 0.175 | -| std | 0.00584 | -| value_loss | 0.000339 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26816 | -| time_elapsed | 145758 | -| total_timesteps | 3432448 | -| train/ | | -| approx_kl | 0.18383473 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 268150 | -| policy_gradient_loss | 0.23 | -| std | 0.00584 | -| value_loss | 0.0001 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26817 | -| time_elapsed | 145763 | -| total_timesteps | 3432576 | -| train/ | | -| approx_kl | 0.2253201 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0173 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 268160 | -| policy_gradient_loss | 0.148 | -| std | 0.00584 | -| value_loss | 4.9e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26818 | -| time_elapsed | 145768 | -| total_timesteps | 3432704 | -| train/ | | -| approx_kl | 0.04169892 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.00798 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 268170 | -| policy_gradient_loss | 0.0314 | -| std | 0.00585 | -| value_loss | 3.25e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26819 | -| time_elapsed | 145773 | -| total_timesteps | 3432832 | -| train/ | | -| approx_kl | 0.8496859 | -| clip_fraction | 0.545 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0295 | -| learning_rate | 0.0003 | -| loss | 0.253 | -| n_updates | 268180 | -| policy_gradient_loss | 0.0811 | -| std | 0.00585 | -| value_loss | 2.91e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26820 | -| time_elapsed | 145777 | -| total_timesteps | 3432960 | -| train/ | | -| approx_kl | 0.04755181 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0259 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 268190 | -| policy_gradient_loss | 0.0173 | -| std | 0.00585 | -| value_loss | 1.37e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26821 | -| time_elapsed | 145780 | -| total_timesteps | 3433088 | -| train/ | | -| approx_kl | 0.0014993483 | -| clip_fraction | 0.321 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0109 | -| n_updates | 268200 | -| policy_gradient_loss | 0.00204 | -| std | 0.00585 | -| value_loss | 5.29e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26822 | -| time_elapsed | 145789 | -| total_timesteps | 3433216 | -| train/ | | -| approx_kl | 0.011879619 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.747 | -| learning_rate | 0.0003 | -| loss | -0.0174 | -| n_updates | 268210 | -| policy_gradient_loss | 0.000319 | -| std | 0.00585 | -| value_loss | 0.00358 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26823 | -| time_elapsed | 145794 | -| total_timesteps | 3433344 | -| train/ | | -| approx_kl | 0.000340207 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | 0.000629 | -| n_updates | 268220 | -| policy_gradient_loss | 0.0361 | -| std | 0.00585 | -| value_loss | 1.03e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26824 | -| time_elapsed | 145799 | -| total_timesteps | 3433472 | -| train/ | | -| approx_kl | 0.7210124 | -| clip_fraction | 0.567 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.409 | -| learning_rate | 0.0003 | -| loss | 0.159 | -| n_updates | 268230 | -| policy_gradient_loss | 0.0562 | -| std | 0.00585 | -| value_loss | 3.23e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26825 | -| time_elapsed | 145804 | -| total_timesteps | 3433600 | -| train/ | | -| approx_kl | 0.014559053 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.04 | -| learning_rate | 0.0003 | -| loss | -0.00352 | -| n_updates | 268240 | -| policy_gradient_loss | 0.0107 | -| std | 0.00585 | -| value_loss | 2.67e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26826 | -| time_elapsed | 145809 | -| total_timesteps | 3433728 | -| train/ | | -| approx_kl | 0.08501331 | -| clip_fraction | 0.328 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0332 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 268250 | -| policy_gradient_loss | 0.0151 | -| std | 0.00585 | -| value_loss | 2.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26827 | -| time_elapsed | 145815 | -| total_timesteps | 3433856 | -| train/ | | -| approx_kl | 0.015876587 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0354 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 268260 | -| policy_gradient_loss | 0.0102 | -| std | 0.00585 | -| value_loss | 1.93e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.1 | -| time/ | | -| fps | 23 | -| iterations | 26828 | -| time_elapsed | 145821 | -| total_timesteps | 3433984 | -| train/ | | -| approx_kl | 0.0038078912 | -| clip_fraction | 0.214 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.00458 | -| n_updates | 268270 | -| policy_gradient_loss | 0.00798 | -| std | 0.00585 | -| value_loss | 1.51e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26829 | -| time_elapsed | 145826 | -| total_timesteps | 3434112 | -| train/ | | -| approx_kl | 0.06061388 | -| clip_fraction | 0.659 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0431 | -| learning_rate | 0.0003 | -| loss | 0.0571 | -| n_updates | 268280 | -| policy_gradient_loss | 0.141 | -| std | 0.00585 | -| value_loss | 1.07e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26830 | -| time_elapsed | 145843 | -| total_timesteps | 3434240 | -| train/ | | -| approx_kl | 0.91860795 | -| clip_fraction | 0.698 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.47 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 268290 | -| policy_gradient_loss | 0.0701 | -| std | 0.00585 | -| value_loss | 0.00186 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26831 | -| time_elapsed | 145849 | -| total_timesteps | 3434368 | -| train/ | | -| approx_kl | 0.26511797 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.995 | -| learning_rate | 0.0003 | -| loss | 0.134 | -| n_updates | 268300 | -| policy_gradient_loss | 0.146 | -| std | 0.00585 | -| value_loss | 1.5e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26832 | -| time_elapsed | 145852 | -| total_timesteps | 3434496 | -| train/ | | -| approx_kl | 0.22925696 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.83 | -| learning_rate | 0.0003 | -| loss | 0.092 | -| n_updates | 268310 | -| policy_gradient_loss | 0.0927 | -| std | 0.00585 | -| value_loss | 1.12e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26833 | -| time_elapsed | 145856 | -| total_timesteps | 3434624 | -| train/ | | -| approx_kl | 0.04596074 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -1.07 | -| learning_rate | 0.0003 | -| loss | 0.00835 | -| n_updates | 268320 | -| policy_gradient_loss | 0.0244 | -| std | 0.00585 | -| value_loss | 6.73e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26834 | -| time_elapsed | 145861 | -| total_timesteps | 3434752 | -| train/ | | -| approx_kl | 0.2346755 | -| clip_fraction | 0.412 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.234 | -| learning_rate | 0.0003 | -| loss | 0.0874 | -| n_updates | 268330 | -| policy_gradient_loss | 0.0261 | -| std | 0.00585 | -| value_loss | 1.98e-09 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26835 | -| time_elapsed | 145865 | -| total_timesteps | 3434880 | -| train/ | | -| approx_kl | 0.032068554 | -| clip_fraction | 0.489 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0908 | -| learning_rate | 0.0003 | -| loss | -0.00327 | -| n_updates | 268340 | -| policy_gradient_loss | 0.0324 | -| std | 0.00585 | -| value_loss | 1.79e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26836 | -| time_elapsed | 145870 | -| total_timesteps | 3435008 | -| train/ | | -| approx_kl | 0.11490187 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0413 | -| learning_rate | 0.0003 | -| loss | 0.0621 | -| n_updates | 268350 | -| policy_gradient_loss | 0.038 | -| std | 0.00585 | -| value_loss | 3.93e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26837 | -| time_elapsed | 145881 | -| total_timesteps | 3435136 | -| train/ | | -| approx_kl | 0.047936767 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.956 | -| learning_rate | 0.0003 | -| loss | -0.017 | -| n_updates | 268360 | -| policy_gradient_loss | -0.0052 | -| std | 0.00585 | -| value_loss | 0.000734 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26838 | -| time_elapsed | 145885 | -| total_timesteps | 3435264 | -| train/ | | -| approx_kl | 0.6084825 | -| clip_fraction | 0.55 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.348 | -| learning_rate | 0.0003 | -| loss | 0.224 | -| n_updates | 268370 | -| policy_gradient_loss | 0.0891 | -| std | 0.00584 | -| value_loss | 0.000201 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26839 | -| time_elapsed | 145889 | -| total_timesteps | 3435392 | -| train/ | | -| approx_kl | 0.086503536 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | 0.0651 | -| n_updates | 268380 | -| policy_gradient_loss | 0.015 | -| std | 0.00584 | -| value_loss | 4.26e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26840 | -| time_elapsed | 145893 | -| total_timesteps | 3435520 | -| train/ | | -| approx_kl | 0.002868637 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.65 | -| learning_rate | 0.0003 | -| loss | 0.00204 | -| n_updates | 268390 | -| policy_gradient_loss | 0.0103 | -| std | 0.00584 | -| value_loss | 1.63e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26841 | -| time_elapsed | 145896 | -| total_timesteps | 3435648 | -| train/ | | -| approx_kl | 0.07883247 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -6.05 | -| learning_rate | 0.0003 | -| loss | 0.00613 | -| n_updates | 268400 | -| policy_gradient_loss | 0.0175 | -| std | 0.00584 | -| value_loss | 2.51e-07 | ----------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26842 | -| time_elapsed | 145900 | -| total_timesteps | 3435776 | -| train/ | | -| approx_kl | 1.131306 | -| clip_fraction | 0.773 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.0138 | -| learning_rate | 0.0003 | -| loss | 0.552 | -| n_updates | 268410 | -| policy_gradient_loss | 0.213 | -| std | 0.00584 | -| value_loss | 8.95e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26843 | -| time_elapsed | 145906 | -| total_timesteps | 3435904 | -| train/ | | -| approx_kl | 0.06464658 | -| clip_fraction | 0.231 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0287 | -| learning_rate | 0.0003 | -| loss | 0.0492 | -| n_updates | 268420 | -| policy_gradient_loss | 0.00621 | -| std | 0.00584 | -| value_loss | 6.39e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26844 | -| time_elapsed | 145911 | -| total_timesteps | 3436032 | -| train/ | | -| approx_kl | 0.0014884733 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0594 | -| learning_rate | 0.0003 | -| loss | -0.00559 | -| n_updates | 268430 | -| policy_gradient_loss | 0.0447 | -| std | 0.00584 | -| value_loss | 3.68e-08 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26845 | -| time_elapsed | 145920 | -| total_timesteps | 3436160 | -| train/ | | -| approx_kl | 0.8466516 | -| clip_fraction | 0.581 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -3.92 | -| learning_rate | 0.0003 | -| loss | 0.0684 | -| n_updates | 268440 | -| policy_gradient_loss | 0.0141 | -| std | 0.00584 | -| value_loss | 0.00501 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26846 | -| time_elapsed | 145925 | -| total_timesteps | 3436288 | -| train/ | | -| approx_kl | 0.0074949972 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.314 | -| learning_rate | 0.0003 | -| loss | -0.00448 | -| n_updates | 268450 | -| policy_gradient_loss | 0.0078 | -| std | 0.00584 | -| value_loss | 7.17e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26847 | -| time_elapsed | 145930 | -| total_timesteps | 3436416 | -| train/ | | -| approx_kl | 0.002445072 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.00784 | -| learning_rate | 0.0003 | -| loss | -0.00623 | -| n_updates | 268460 | -| policy_gradient_loss | 0.0185 | -| std | 0.00584 | -| value_loss | 7.74e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26848 | -| time_elapsed | 145935 | -| total_timesteps | 3436544 | -| train/ | | -| approx_kl | 2.1848828e-06 | -| clip_fraction | 0.415 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0637 | -| learning_rate | 0.0003 | -| loss | -6.62e-05 | -| n_updates | 268470 | -| policy_gradient_loss | 0.0359 | -| std | 0.00584 | -| value_loss | 5.29e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26849 | -| time_elapsed | 145939 | -| total_timesteps | 3436672 | -| train/ | | -| approx_kl | 0.81733465 | -| clip_fraction | 0.772 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0674 | -| learning_rate | 0.0003 | -| loss | 0.353 | -| n_updates | 268480 | -| policy_gradient_loss | 0.28 | -| std | 0.00584 | -| value_loss | 4.05e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26850 | -| time_elapsed | 145943 | -| total_timesteps | 3436800 | -| train/ | | -| approx_kl | 0.016710164 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0575 | -| learning_rate | 0.0003 | -| loss | -0.00164 | -| n_updates | 268490 | -| policy_gradient_loss | 0.0345 | -| std | 0.00584 | -| value_loss | 4.13e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 26851 | -| time_elapsed | 145948 | -| total_timesteps | 3436928 | -| train/ | | -| approx_kl | 0.7797754 | -| clip_fraction | 0.508 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.033 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 268500 | -| policy_gradient_loss | 0.0565 | -| std | 0.00585 | -| value_loss | 2.17e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26852 | -| time_elapsed | 145952 | -| total_timesteps | 3437056 | -| train/ | | -| approx_kl | 0.06353853 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.109 | -| learning_rate | 0.0003 | -| loss | 0.00684 | -| n_updates | 268510 | -| policy_gradient_loss | 0.0046 | -| std | 0.00585 | -| value_loss | 1.48e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26853 | -| time_elapsed | 145960 | -| total_timesteps | 3437184 | -| train/ | | -| approx_kl | 0.09676856 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | 0.767 | -| learning_rate | 0.0003 | -| loss | 0.0234 | -| n_updates | 268520 | -| policy_gradient_loss | 0.00161 | -| std | 0.00585 | -| value_loss | 0.00902 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26854 | -| time_elapsed | 145964 | -| total_timesteps | 3437312 | -| train/ | | -| approx_kl | 0.0035781544 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -2.66 | -| learning_rate | 0.0003 | -| loss | -0.00171 | -| n_updates | 268530 | -| policy_gradient_loss | 0.0111 | -| std | 0.00585 | -| value_loss | 3.75e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26855 | -| time_elapsed | 145967 | -| total_timesteps | 3437440 | -| train/ | | -| approx_kl | 0.101297036 | -| clip_fraction | 0.599 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0106 | -| learning_rate | 0.0003 | -| loss | 0.0613 | -| n_updates | 268540 | -| policy_gradient_loss | 0.0911 | -| std | 0.00586 | -| value_loss | 2e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26856 | -| time_elapsed | 145972 | -| total_timesteps | 3437568 | -| train/ | | -| approx_kl | 0.36996418 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.242 | -| learning_rate | 0.0003 | -| loss | 0.141 | -| n_updates | 268550 | -| policy_gradient_loss | 0.0549 | -| std | 0.00586 | -| value_loss | 1.1e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26857 | -| time_elapsed | 145977 | -| total_timesteps | 3437696 | -| train/ | | -| approx_kl | 0.0018178369 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0833 | -| learning_rate | 0.0003 | -| loss | -0.00558 | -| n_updates | 268560 | -| policy_gradient_loss | 0.00317 | -| std | 0.00586 | -| value_loss | 1.02e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26858 | -| time_elapsed | 145981 | -| total_timesteps | 3437824 | -| train/ | | -| approx_kl | 3.999565e-06 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | -0.000409 | -| n_updates | 268570 | -| policy_gradient_loss | -0.00281 | -| std | 0.00586 | -| value_loss | 8.76e-07 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26859 | -| time_elapsed | 145986 | -| total_timesteps | 3437952 | -| train/ | | -| approx_kl | 0.00017001061 | -| clip_fraction | 0.209 | -| clip_range | 0.2 | -| entropy_loss | 3.72 | -| explained_variance | -0.0398 | -| learning_rate | 0.0003 | -| loss | -0.000267 | -| n_updates | 268580 | -| policy_gradient_loss | 0.0186 | -| std | 0.00584 | -| value_loss | 1.56e-06 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26860 | -| time_elapsed | 145991 | -| total_timesteps | 3438080 | -| train/ | | -| approx_kl | 0.00033165002 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.00487 | -| learning_rate | 0.0003 | -| loss | -0.00511 | -| n_updates | 268590 | -| policy_gradient_loss | 0.00288 | -| std | 0.00583 | -| value_loss | 9.28e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26861 | -| time_elapsed | 146001 | -| total_timesteps | 3438208 | -| train/ | | -| approx_kl | 0.16714986 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.896 | -| learning_rate | 0.0003 | -| loss | 0.0221 | -| n_updates | 268600 | -| policy_gradient_loss | 0.039 | -| std | 0.00582 | -| value_loss | 0.00245 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26862 | -| time_elapsed | 146006 | -| total_timesteps | 3438336 | -| train/ | | -| approx_kl | 0.41776884 | -| clip_fraction | 0.491 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.265 | -| learning_rate | 0.0003 | -| loss | 0.145 | -| n_updates | 268610 | -| policy_gradient_loss | 0.0525 | -| std | 0.00582 | -| value_loss | 2.2e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26863 | -| time_elapsed | 146012 | -| total_timesteps | 3438464 | -| train/ | | -| approx_kl | 0.00063726027 | -| clip_fraction | 0.253 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00559 | -| learning_rate | 0.0003 | -| loss | -0.00167 | -| n_updates | 268620 | -| policy_gradient_loss | 0.0182 | -| std | 0.00582 | -| value_loss | 1.64e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26864 | -| time_elapsed | 146016 | -| total_timesteps | 3438592 | -| train/ | | -| approx_kl | 0.11028895 | -| clip_fraction | 0.632 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.232 | -| learning_rate | 0.0003 | -| loss | 0.0543 | -| n_updates | 268630 | -| policy_gradient_loss | 0.108 | -| std | 0.00582 | -| value_loss | 1.09e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26865 | -| time_elapsed | 146021 | -| total_timesteps | 3438720 | -| train/ | | -| approx_kl | 0.41208905 | -| clip_fraction | 0.502 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.056 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 268640 | -| policy_gradient_loss | 0.0668 | -| std | 0.00582 | -| value_loss | 9.62e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26866 | -| time_elapsed | 146027 | -| total_timesteps | 3438848 | -| train/ | | -| approx_kl | 0.0018539922 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0412 | -| learning_rate | 0.0003 | -| loss | -0.000353 | -| n_updates | 268650 | -| policy_gradient_loss | 0.0253 | -| std | 0.00582 | -| value_loss | 1.03e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26867 | -| time_elapsed | 146032 | -| total_timesteps | 3438976 | -| train/ | | -| approx_kl | 0.103966236 | -| clip_fraction | 0.616 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.0582 | -| n_updates | 268660 | -| policy_gradient_loss | 0.0924 | -| std | 0.00583 | -| value_loss | 1.91e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26868 | -| time_elapsed | 146037 | -| total_timesteps | 3439104 | -| train/ | | -| approx_kl | 0.29141095 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0175 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 268670 | -| policy_gradient_loss | 0.0506 | -| std | 0.00583 | -| value_loss | 8.31e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26869 | -| time_elapsed | 146049 | -| total_timesteps | 3439232 | -| train/ | | -| approx_kl | 0.12328006 | -| clip_fraction | 0.314 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.465 | -| learning_rate | 0.0003 | -| loss | 0.00292 | -| n_updates | 268680 | -| policy_gradient_loss | -0.01 | -| std | 0.00583 | -| value_loss | 0.00191 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26870 | -| time_elapsed | 146053 | -| total_timesteps | 3439360 | -| train/ | | -| approx_kl | 0.03556849 | -| clip_fraction | 0.629 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -3.9 | -| learning_rate | 0.0003 | -| loss | 0.0175 | -| n_updates | 268690 | -| policy_gradient_loss | 0.112 | -| std | 0.00583 | -| value_loss | 4.56e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26871 | -| time_elapsed | 146056 | -| total_timesteps | 3439488 | -| train/ | | -| approx_kl | 0.01914463 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | -0.0313 | -| n_updates | 268700 | -| policy_gradient_loss | -0.00685 | -| std | 0.00583 | -| value_loss | 1.04e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26872 | -| time_elapsed | 146061 | -| total_timesteps | 3439616 | -| train/ | | -| approx_kl | 0.025448183 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00824 | -| learning_rate | 0.0003 | -| loss | 0.0271 | -| n_updates | 268710 | -| policy_gradient_loss | 0.0466 | -| std | 0.00583 | -| value_loss | 1.76e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26873 | -| time_elapsed | 146066 | -| total_timesteps | 3439744 | -| train/ | | -| approx_kl | 0.11242691 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0996 | -| learning_rate | 0.0003 | -| loss | 0.0563 | -| n_updates | 268720 | -| policy_gradient_loss | 0.0302 | -| std | 0.00583 | -| value_loss | 1.63e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 26874 | -| time_elapsed | 146071 | -| total_timesteps | 3439872 | -| train/ | | -| approx_kl | 0.0014934051 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0672 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 268730 | -| policy_gradient_loss | 0.00541 | -| std | 0.00583 | -| value_loss | 1.27e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26875 | -| time_elapsed | 146076 | -| total_timesteps | 3440000 | -| train/ | | -| approx_kl | 0.017728835 | -| clip_fraction | 0.516 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.276 | -| learning_rate | 0.0003 | -| loss | -0.00446 | -| n_updates | 268740 | -| policy_gradient_loss | 0.0361 | -| std | 0.00583 | -| value_loss | 4.12e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26876 | -| time_elapsed | 146080 | -| total_timesteps | 3440128 | -| train/ | | -| approx_kl | 0.42292908 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0101 | -| learning_rate | 0.0003 | -| loss | 0.253 | -| n_updates | 268750 | -| policy_gradient_loss | 0.178 | -| std | 0.00583 | -| value_loss | 2.93e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26877 | -| time_elapsed | 146089 | -| total_timesteps | 3440256 | -| train/ | | -| approx_kl | 0.30575824 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.857 | -| learning_rate | 0.0003 | -| loss | 0.0635 | -| n_updates | 268760 | -| policy_gradient_loss | 0.102 | -| std | 0.00583 | -| value_loss | 0.00399 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26878 | -| time_elapsed | 146093 | -| total_timesteps | 3440384 | -| train/ | | -| approx_kl | 0.4053036 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -3.22 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 268770 | -| policy_gradient_loss | 0.141 | -| std | 0.00583 | -| value_loss | 2.18e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26879 | -| time_elapsed | 146097 | -| total_timesteps | 3440512 | -| train/ | | -| approx_kl | 0.05999526 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.137 | -| learning_rate | 0.0003 | -| loss | 0.0358 | -| n_updates | 268780 | -| policy_gradient_loss | 0.032 | -| std | 0.00583 | -| value_loss | 4.51e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26880 | -| time_elapsed | 146101 | -| total_timesteps | 3440640 | -| train/ | | -| approx_kl | 0.0023911148 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.00354 | -| n_updates | 268790 | -| policy_gradient_loss | 0.0409 | -| std | 0.00583 | -| value_loss | 2.36e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26881 | -| time_elapsed | 146105 | -| total_timesteps | 3440768 | -| train/ | | -| approx_kl | 0.0008655847 | -| clip_fraction | 0.393 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0185 | -| learning_rate | 0.0003 | -| loss | -0.00249 | -| n_updates | 268800 | -| policy_gradient_loss | 0.0338 | -| std | 0.00583 | -| value_loss | 1.54e-07 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26882 | -| time_elapsed | 146109 | -| total_timesteps | 3440896 | -| train/ | | -| approx_kl | 0.0024419753 | -| clip_fraction | 0.382 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | -0.00389 | -| n_updates | 268810 | -| policy_gradient_loss | 0.035 | -| std | 0.00583 | -| value_loss | 1.11e-07 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26883 | -| time_elapsed | 146114 | -| total_timesteps | 3441024 | -| train/ | | -| approx_kl | 0.6475686 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 268820 | -| policy_gradient_loss | 0.081 | -| std | 0.00583 | -| value_loss | 7.67e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26884 | -| time_elapsed | 146125 | -| total_timesteps | 3441152 | -| train/ | | -| approx_kl | 0.015066078 | -| clip_fraction | 0.29 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -7.46 | -| learning_rate | 0.0003 | -| loss | -0.0103 | -| n_updates | 268830 | -| policy_gradient_loss | -7.58e-05 | -| std | 0.00583 | -| value_loss | 0.00584 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26885 | -| time_elapsed | 146129 | -| total_timesteps | 3441280 | -| train/ | | -| approx_kl | 0.00092456536 | -| clip_fraction | 0.299 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.502 | -| learning_rate | 0.0003 | -| loss | -0.0077 | -| n_updates | 268840 | -| policy_gradient_loss | -0.00521 | -| std | 0.00583 | -| value_loss | 2.91e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26886 | -| time_elapsed | 146132 | -| total_timesteps | 3441408 | -| train/ | | -| approx_kl | 0.010694249 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0541 | -| learning_rate | 0.0003 | -| loss | -0.00529 | -| n_updates | 268850 | -| policy_gradient_loss | 0.00484 | -| std | 0.00583 | -| value_loss | 2.23e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26887 | -| time_elapsed | 146136 | -| total_timesteps | 3441536 | -| train/ | | -| approx_kl | 0.0010101371 | -| clip_fraction | 0.226 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -7.76 | -| learning_rate | 0.0003 | -| loss | 0.00252 | -| n_updates | 268860 | -| policy_gradient_loss | 0.00412 | -| std | 0.00583 | -| value_loss | 1.88e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26888 | -| time_elapsed | 146141 | -| total_timesteps | 3441664 | -| train/ | | -| approx_kl | 0.06429099 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | 0.013 | -| n_updates | 268870 | -| policy_gradient_loss | 0.00459 | -| std | 0.00583 | -| value_loss | 3.47e-09 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26889 | -| time_elapsed | 146145 | -| total_timesteps | 3441792 | -| train/ | | -| approx_kl | 0.0657915 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.23 | -| learning_rate | 0.0003 | -| loss | 0.0225 | -| n_updates | 268880 | -| policy_gradient_loss | 0.0114 | -| std | 0.00583 | -| value_loss | 1.96e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 26890 | -| time_elapsed | 146149 | -| total_timesteps | 3441920 | -| train/ | | -| approx_kl | 0.06542277 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.078 | -| learning_rate | 0.0003 | -| loss | -0.00253 | -| n_updates | 268890 | -| policy_gradient_loss | -0.00128 | -| std | 0.00583 | -| value_loss | 1.84e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26891 | -| time_elapsed | 146153 | -| total_timesteps | 3442048 | -| train/ | | -| approx_kl | 0.009381993 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.00145 | -| n_updates | 268900 | -| policy_gradient_loss | 0.00927 | -| std | 0.00583 | -| value_loss | 1.09e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26892 | -| time_elapsed | 146162 | -| total_timesteps | 3442176 | -| train/ | | -| approx_kl | 0.011317372 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.824 | -| learning_rate | 0.0003 | -| loss | -0.0261 | -| n_updates | 268910 | -| policy_gradient_loss | -0.00876 | -| std | 0.00583 | -| value_loss | 0.000947 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26893 | -| time_elapsed | 146169 | -| total_timesteps | 3442304 | -| train/ | | -| approx_kl | 0.014662288 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.257 | -| learning_rate | 0.0003 | -| loss | 0.0132 | -| n_updates | 268920 | -| policy_gradient_loss | 0.00759 | -| std | 0.00582 | -| value_loss | 1.5e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26894 | -| time_elapsed | 146174 | -| total_timesteps | 3442432 | -| train/ | | -| approx_kl | 0.046404205 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -47.4 | -| learning_rate | 0.0003 | -| loss | 0.00361 | -| n_updates | 268930 | -| policy_gradient_loss | 0.0155 | -| std | 0.00582 | -| value_loss | 2.16e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26895 | -| time_elapsed | 146179 | -| total_timesteps | 3442560 | -| train/ | | -| approx_kl | 1.0168402 | -| clip_fraction | 0.766 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.643 | -| learning_rate | 0.0003 | -| loss | 0.264 | -| n_updates | 268940 | -| policy_gradient_loss | 0.209 | -| std | 0.00582 | -| value_loss | 6.59e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26896 | -| time_elapsed | 146184 | -| total_timesteps | 3442688 | -| train/ | | -| approx_kl | 0.012363711 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0143 | -| learning_rate | 0.0003 | -| loss | -0.0264 | -| n_updates | 268950 | -| policy_gradient_loss | 0.0343 | -| std | 0.00582 | -| value_loss | 5.58e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26897 | -| time_elapsed | 146188 | -| total_timesteps | 3442816 | -| train/ | | -| approx_kl | 0.1620136 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.022 | -| learning_rate | 0.0003 | -| loss | 0.0484 | -| n_updates | 268960 | -| policy_gradient_loss | 0.0202 | -| std | 0.00581 | -| value_loss | 3.7e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26898 | -| time_elapsed | 146192 | -| total_timesteps | 3442944 | -| train/ | | -| approx_kl | 0.020914178 | -| clip_fraction | 0.172 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0427 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 268970 | -| policy_gradient_loss | 0.00889 | -| std | 0.00581 | -| value_loss | 2.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26899 | -| time_elapsed | 146196 | -| total_timesteps | 3443072 | -| train/ | | -| approx_kl | 0.03697512 | -| clip_fraction | 0.504 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.153 | -| learning_rate | 0.0003 | -| loss | 0.0131 | -| n_updates | 268980 | -| policy_gradient_loss | 0.0464 | -| std | 0.0058 | -| value_loss | 2.26e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26900 | -| time_elapsed | 146204 | -| total_timesteps | 3443200 | -| train/ | | -| approx_kl | 0.24112913 | -| clip_fraction | 0.375 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -1.7 | -| learning_rate | 0.0003 | -| loss | 0.05 | -| n_updates | 268990 | -| policy_gradient_loss | 0.00821 | -| std | 0.00579 | -| value_loss | 0.00399 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26901 | -| time_elapsed | 146208 | -| total_timesteps | 3443328 | -| train/ | | -| approx_kl | 0.030995393 | -| clip_fraction | 0.169 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.018 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 269000 | -| policy_gradient_loss | 0.00671 | -| std | 0.00579 | -| value_loss | 1.81e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26902 | -| time_elapsed | 146212 | -| total_timesteps | 3443456 | -| train/ | | -| approx_kl | 0.028042294 | -| clip_fraction | 0.427 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.0115 | -| learning_rate | 0.0003 | -| loss | 0.000682 | -| n_updates | 269010 | -| policy_gradient_loss | 0.0323 | -| std | 0.00579 | -| value_loss | 3.45e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26903 | -| time_elapsed | 146217 | -| total_timesteps | 3443584 | -| train/ | | -| approx_kl | 0.16419877 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0514 | -| learning_rate | 0.0003 | -| loss | 0.00337 | -| n_updates | 269020 | -| policy_gradient_loss | 0.0116 | -| std | 0.00579 | -| value_loss | 3.68e-07 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26904 | -| time_elapsed | 146221 | -| total_timesteps | 3443712 | -| train/ | | -| approx_kl | 0.00017498853 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0315 | -| learning_rate | 0.0003 | -| loss | -0.00131 | -| n_updates | 269030 | -| policy_gradient_loss | 0.0269 | -| std | 0.00579 | -| value_loss | 2.97e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26905 | -| time_elapsed | 146225 | -| total_timesteps | 3443840 | -| train/ | | -| approx_kl | 1.5955989 | -| clip_fraction | 0.569 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0337 | -| learning_rate | 0.0003 | -| loss | 0.541 | -| n_updates | 269040 | -| policy_gradient_loss | 0.128 | -| std | 0.00579 | -| value_loss | 2.38e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26906 | -| time_elapsed | 146229 | -| total_timesteps | 3443968 | -| train/ | | -| approx_kl | 0.014899451 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.032 | -| learning_rate | 0.0003 | -| loss | -0.0164 | -| n_updates | 269050 | -| policy_gradient_loss | 0.00446 | -| std | 0.00579 | -| value_loss | 2.12e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26907 | -| time_elapsed | 146235 | -| total_timesteps | 3444096 | -| train/ | | -| approx_kl | 0.09157352 | -| clip_fraction | 0.338 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0317 | -| learning_rate | 0.0003 | -| loss | 0.0238 | -| n_updates | 269060 | -| policy_gradient_loss | 0.00815 | -| std | 0.00579 | -| value_loss | 1.38e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26908 | -| time_elapsed | 146245 | -| total_timesteps | 3444224 | -| train/ | | -| approx_kl | 0.023556799 | -| clip_fraction | 0.186 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.701 | -| learning_rate | 0.0003 | -| loss | 0.0223 | -| n_updates | 269070 | -| policy_gradient_loss | 0.000581 | -| std | 0.0058 | -| value_loss | 0.0114 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26909 | -| time_elapsed | 146252 | -| total_timesteps | 3444352 | -| train/ | | -| approx_kl | 0.0973086 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.712 | -| learning_rate | 0.0003 | -| loss | 0.0468 | -| n_updates | 269080 | -| policy_gradient_loss | 0.0167 | -| std | 0.0058 | -| value_loss | 0.000515 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26910 | -| time_elapsed | 146256 | -| total_timesteps | 3444480 | -| train/ | | -| approx_kl | 0.018304158 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | 0.00657 | -| learning_rate | 0.0003 | -| loss | -0.00387 | -| n_updates | 269090 | -| policy_gradient_loss | 0.00855 | -| std | 0.0058 | -| value_loss | 4.96e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26911 | -| time_elapsed | 146260 | -| total_timesteps | 3444608 | -| train/ | | -| approx_kl | 0.072539434 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0711 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 269100 | -| policy_gradient_loss | 0.0115 | -| std | 0.0058 | -| value_loss | 4.48e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26912 | -| time_elapsed | 146264 | -| total_timesteps | 3444736 | -| train/ | | -| approx_kl | 0.017280884 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0655 | -| learning_rate | 0.0003 | -| loss | -0.000693 | -| n_updates | 269110 | -| policy_gradient_loss | 0.0128 | -| std | 0.0058 | -| value_loss | 3.5e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26913 | -| time_elapsed | 146268 | -| total_timesteps | 3444864 | -| train/ | | -| approx_kl | 0.028496241 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.73 | -| explained_variance | -0.0496 | -| learning_rate | 0.0003 | -| loss | 0.0228 | -| n_updates | 269120 | -| policy_gradient_loss | 0.0205 | -| std | 0.00578 | -| value_loss | 2.06e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26914 | -| time_elapsed | 146273 | -| total_timesteps | 3444992 | -| train/ | | -| approx_kl | 0.00013401499 | -| clip_fraction | 0.244 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.000256 | -| n_updates | 269130 | -| policy_gradient_loss | 0.013 | -| std | 0.00577 | -| value_loss | 0.000105 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26915 | -| time_elapsed | 146278 | -| total_timesteps | 3445120 | -| train/ | | -| approx_kl | 0.0006576977 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | -0.00345 | -| learning_rate | 0.0003 | -| loss | 0.00126 | -| n_updates | 269140 | -| policy_gradient_loss | 0.0125 | -| std | 0.00576 | -| value_loss | 1.35e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26916 | -| time_elapsed | 146290 | -| total_timesteps | 3445248 | -| train/ | | -| approx_kl | 0.24268177 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 269150 | -| policy_gradient_loss | 0.0334 | -| std | 0.00576 | -| value_loss | 0.00338 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26917 | -| time_elapsed | 146296 | -| total_timesteps | 3445376 | -| train/ | | -| approx_kl | 0.90875196 | -| clip_fraction | 0.562 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | -0.0366 | -| learning_rate | 0.0003 | -| loss | 0.371 | -| n_updates | 269160 | -| policy_gradient_loss | 0.105 | -| std | 0.00575 | -| value_loss | 0.000149 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26918 | -| time_elapsed | 146301 | -| total_timesteps | 3445504 | -| train/ | | -| approx_kl | 0.013730211 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | 0.0184 | -| learning_rate | 0.0003 | -| loss | 0.00106 | -| n_updates | 269170 | -| policy_gradient_loss | 0.00757 | -| std | 0.00575 | -| value_loss | 4.38e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26919 | -| time_elapsed | 146306 | -| total_timesteps | 3445632 | -| train/ | | -| approx_kl | 0.00020785723 | -| clip_fraction | 0.146 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.000421 | -| n_updates | 269180 | -| policy_gradient_loss | 0.0104 | -| std | 0.00573 | -| value_loss | 3.55e-05 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26920 | -| time_elapsed | 146311 | -| total_timesteps | 3445760 | -| train/ | | -| approx_kl | 0.06885413 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.74 | -| explained_variance | -0.00805 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 269190 | -| policy_gradient_loss | 0.0382 | -| std | 0.00572 | -| value_loss | 0.000127 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26921 | -| time_elapsed | 146317 | -| total_timesteps | 3445888 | -| train/ | | -| approx_kl | 0.17984012 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -1.72 | -| learning_rate | 0.0003 | -| loss | 0.0135 | -| n_updates | 269200 | -| policy_gradient_loss | 0.00995 | -| std | 0.00571 | -| value_loss | 6.35e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26922 | -| time_elapsed | 146322 | -| total_timesteps | 3446016 | -| train/ | | -| approx_kl | 0.00078163156 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.314 | -| learning_rate | 0.0003 | -| loss | -0.00884 | -| n_updates | 269210 | -| policy_gradient_loss | 0.0284 | -| std | 0.00571 | -| value_loss | 1.93e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26923 | -| time_elapsed | 146334 | -| total_timesteps | 3446144 | -| train/ | | -| approx_kl | 0.6032334 | -| clip_fraction | 0.543 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.825 | -| learning_rate | 0.0003 | -| loss | 0.104 | -| n_updates | 269220 | -| policy_gradient_loss | 0.0492 | -| std | 0.0057 | -| value_loss | 0.0045 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26924 | -| time_elapsed | 146339 | -| total_timesteps | 3446272 | -| train/ | | -| approx_kl | 0.0042091473 | -| clip_fraction | 0.203 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0437 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 269230 | -| policy_gradient_loss | 0.00564 | -| std | 0.0057 | -| value_loss | 0.000143 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26925 | -| time_elapsed | 146344 | -| total_timesteps | 3446400 | -| train/ | | -| approx_kl | 0.050280802 | -| clip_fraction | 0.643 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.016 | -| learning_rate | 0.0003 | -| loss | 0.0525 | -| n_updates | 269240 | -| policy_gradient_loss | 0.128 | -| std | 0.0057 | -| value_loss | 5.34e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26926 | -| time_elapsed | 146348 | -| total_timesteps | 3446528 | -| train/ | | -| approx_kl | 0.016827164 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.00805 | -| n_updates | 269250 | -| policy_gradient_loss | 0.0366 | -| std | 0.0057 | -| value_loss | 2.73e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26927 | -| time_elapsed | 146352 | -| total_timesteps | 3446656 | -| train/ | | -| approx_kl | 0.8825121 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0903 | -| learning_rate | 0.0003 | -| loss | 0.246 | -| n_updates | 269260 | -| policy_gradient_loss | 0.0792 | -| std | 0.0057 | -| value_loss | 2.69e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26928 | -| time_elapsed | 146357 | -| total_timesteps | 3446784 | -| train/ | | -| approx_kl | 0.050085936 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0488 | -| learning_rate | 0.0003 | -| loss | 0.0367 | -| n_updates | 269270 | -| policy_gradient_loss | 0.0179 | -| std | 0.0057 | -| value_loss | 1.4e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26929 | -| time_elapsed | 146362 | -| total_timesteps | 3446912 | -| train/ | | -| approx_kl | 0.06812838 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.0325 | -| n_updates | 269280 | -| policy_gradient_loss | 0.0155 | -| std | 0.0057 | -| value_loss | 1.14e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26930 | -| time_elapsed | 146366 | -| total_timesteps | 3447040 | -| train/ | | -| approx_kl | 0.058230657 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0666 | -| learning_rate | 0.0003 | -| loss | 0.0402 | -| n_updates | 269290 | -| policy_gradient_loss | 0.0194 | -| std | 0.0057 | -| value_loss | 6.97e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26931 | -| time_elapsed | 146376 | -| total_timesteps | 3447168 | -| train/ | | -| approx_kl | 0.011140305 | -| clip_fraction | 0.26 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.361 | -| learning_rate | 0.0003 | -| loss | 0.0116 | -| n_updates | 269300 | -| policy_gradient_loss | 0.0111 | -| std | 0.00569 | -| value_loss | 0.0338 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26932 | -| time_elapsed | 146380 | -| total_timesteps | 3447296 | -| train/ | | -| approx_kl | 0.11021803 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.483 | -| learning_rate | 0.0003 | -| loss | 0.0459 | -| n_updates | 269310 | -| policy_gradient_loss | 0.0161 | -| std | 0.00569 | -| value_loss | 0.000204 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26933 | -| time_elapsed | 146386 | -| total_timesteps | 3447424 | -| train/ | | -| approx_kl | 0.0147919655 | -| clip_fraction | 0.235 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0186 | -| learning_rate | 0.0003 | -| loss | -0.00923 | -| n_updates | 269320 | -| policy_gradient_loss | 0.00637 | -| std | 0.00569 | -| value_loss | 6.19e-05 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26934 | -| time_elapsed | 146391 | -| total_timesteps | 3447552 | -| train/ | | -| approx_kl | 0.00086418446 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.00024 | -| learning_rate | 0.0003 | -| loss | 0.00214 | -| n_updates | 269330 | -| policy_gradient_loss | 0.00901 | -| std | 0.00569 | -| value_loss | 2.9e-05 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26935 | -| time_elapsed | 146396 | -| total_timesteps | 3447680 | -| train/ | | -| approx_kl | 0.0841286 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0535 | -| learning_rate | 0.0003 | -| loss | 0.0483 | -| n_updates | 269340 | -| policy_gradient_loss | 0.0221 | -| std | 0.00569 | -| value_loss | 1.51e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26936 | -| time_elapsed | 146401 | -| total_timesteps | 3447808 | -| train/ | | -| approx_kl | 0.017131515 | -| clip_fraction | 0.348 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | 0.00613 | -| n_updates | 269350 | -| policy_gradient_loss | 0.0184 | -| std | 0.00569 | -| value_loss | 1.12e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 26937 | -| time_elapsed | 146407 | -| total_timesteps | 3447936 | -| train/ | | -| approx_kl | 0.002782343 | -| clip_fraction | 0.212 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0724 | -| learning_rate | 0.0003 | -| loss | -0.00123 | -| n_updates | 269360 | -| policy_gradient_loss | 0.00909 | -| std | 0.00569 | -| value_loss | 7.34e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26938 | -| time_elapsed | 146412 | -| total_timesteps | 3448064 | -| train/ | | -| approx_kl | 4.039146e-06 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0954 | -| learning_rate | 0.0003 | -| loss | 0.000282 | -| n_updates | 269370 | -| policy_gradient_loss | 0.0502 | -| std | 0.00569 | -| value_loss | 7e-06 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26939 | -| time_elapsed | 146420 | -| total_timesteps | 3448192 | -| train/ | | -| approx_kl | 1.660765 | -| clip_fraction | 0.762 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -1.53 | -| learning_rate | 0.0003 | -| loss | 0.838 | -| n_updates | 269380 | -| policy_gradient_loss | 0.199 | -| std | 0.00569 | -| value_loss | 0.00426 | --------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26940 | -| time_elapsed | 146426 | -| total_timesteps | 3448320 | -| train/ | | -| approx_kl | 2.6545953e-05 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.562 | -| learning_rate | 0.0003 | -| loss | 0.000685 | -| n_updates | 269390 | -| policy_gradient_loss | 0.00991 | -| std | 0.00569 | -| value_loss | 3.2e-06 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26941 | -| time_elapsed | 146430 | -| total_timesteps | 3448448 | -| train/ | | -| approx_kl | 0.051593933 | -| clip_fraction | 0.442 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.467 | -| learning_rate | 0.0003 | -| loss | 0.0295 | -| n_updates | 269400 | -| policy_gradient_loss | 0.0497 | -| std | 0.00569 | -| value_loss | 5.87e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26942 | -| time_elapsed | 146435 | -| total_timesteps | 3448576 | -| train/ | | -| approx_kl | 1.3624277 | -| clip_fraction | 0.767 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.454 | -| n_updates | 269410 | -| policy_gradient_loss | 0.222 | -| std | 0.00569 | -| value_loss | 3.51e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26943 | -| time_elapsed | 146440 | -| total_timesteps | 3448704 | -| train/ | | -| approx_kl | 0.039897464 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | 0.0357 | -| n_updates | 269420 | -| policy_gradient_loss | 0.0244 | -| std | 0.00569 | -| value_loss | 3e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26944 | -| time_elapsed | 146443 | -| total_timesteps | 3448832 | -| train/ | | -| approx_kl | 0.09319068 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0758 | -| learning_rate | 0.0003 | -| loss | 0.0122 | -| n_updates | 269430 | -| policy_gradient_loss | 0.02 | -| std | 0.00569 | -| value_loss | 2.13e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26945 | -| time_elapsed | 146446 | -| total_timesteps | 3448960 | -| train/ | | -| approx_kl | 0.0001041824 | -| clip_fraction | 0.463 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0571 | -| learning_rate | 0.0003 | -| loss | 0.000423 | -| n_updates | 269440 | -| policy_gradient_loss | 0.0439 | -| std | 0.00569 | -| value_loss | 1.67e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26946 | -| time_elapsed | 146451 | -| total_timesteps | 3449088 | -| train/ | | -| approx_kl | 0.21122071 | -| clip_fraction | 0.366 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.051 | -| learning_rate | 0.0003 | -| loss | 0.0695 | -| n_updates | 269450 | -| policy_gradient_loss | 0.0224 | -| std | 0.00569 | -| value_loss | 1.47e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26947 | -| time_elapsed | 146460 | -| total_timesteps | 3449216 | -| train/ | | -| approx_kl | 0.051629767 | -| clip_fraction | 0.216 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0751 | -| learning_rate | 0.0003 | -| loss | 0.0187 | -| n_updates | 269460 | -| policy_gradient_loss | -0.00581 | -| std | 0.00569 | -| value_loss | 0.0049 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26948 | -| time_elapsed | 146464 | -| total_timesteps | 3449344 | -| train/ | | -| approx_kl | 0.016776355 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.356 | -| learning_rate | 0.0003 | -| loss | 0.00398 | -| n_updates | 269470 | -| policy_gradient_loss | 0.0531 | -| std | 0.00569 | -| value_loss | 0.000102 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26949 | -| time_elapsed | 146469 | -| total_timesteps | 3449472 | -| train/ | | -| approx_kl | 1.1029277 | -| clip_fraction | 0.778 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0108 | -| learning_rate | 0.0003 | -| loss | 0.478 | -| n_updates | 269480 | -| policy_gradient_loss | 0.217 | -| std | 0.00569 | -| value_loss | 2.07e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26950 | -| time_elapsed | 146473 | -| total_timesteps | 3449600 | -| train/ | | -| approx_kl | 0.09422074 | -| clip_fraction | 0.247 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.00836 | -| learning_rate | 0.0003 | -| loss | 0.0826 | -| n_updates | 269490 | -| policy_gradient_loss | 0.0127 | -| std | 0.00568 | -| value_loss | 9.85e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26951 | -| time_elapsed | 146478 | -| total_timesteps | 3449728 | -| train/ | | -| approx_kl | 0.6626358 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.091 | -| learning_rate | 0.0003 | -| loss | 0.173 | -| n_updates | 269500 | -| policy_gradient_loss | 0.068 | -| std | 0.00568 | -| value_loss | 4e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26952 | -| time_elapsed | 146483 | -| total_timesteps | 3449856 | -| train/ | | -| approx_kl | 0.05989751 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | 0.0347 | -| n_updates | 269510 | -| policy_gradient_loss | 0.0161 | -| std | 0.00568 | -| value_loss | 3.18e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26953 | -| time_elapsed | 146488 | -| total_timesteps | 3449984 | -| train/ | | -| approx_kl | 0.06916605 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0768 | -| learning_rate | 0.0003 | -| loss | -0.000721 | -| n_updates | 269520 | -| policy_gradient_loss | 2.68e-05 | -| std | 0.00568 | -| value_loss | 2.77e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26954 | -| time_elapsed | 146494 | -| total_timesteps | 3450112 | -| train/ | | -| approx_kl | 0.010932223 | -| clip_fraction | 0.243 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0466 | -| learning_rate | 0.0003 | -| loss | -0.0138 | -| n_updates | 269530 | -| policy_gradient_loss | 0.00727 | -| std | 0.00568 | -| value_loss | 2.45e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26955 | -| time_elapsed | 146505 | -| total_timesteps | 3450240 | -| train/ | | -| approx_kl | 0.30294076 | -| clip_fraction | 0.425 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 269540 | -| policy_gradient_loss | 0.0123 | -| std | 0.00568 | -| value_loss | 0.00283 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26956 | -| time_elapsed | 146510 | -| total_timesteps | 3450368 | -| train/ | | -| approx_kl | 0.012993759 | -| clip_fraction | 0.458 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.661 | -| learning_rate | 0.0003 | -| loss | 0.00751 | -| n_updates | 269550 | -| policy_gradient_loss | 0.0435 | -| std | 0.00568 | -| value_loss | 4.81e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26957 | -| time_elapsed | 146516 | -| total_timesteps | 3450496 | -| train/ | | -| approx_kl | 0.35426056 | -| clip_fraction | 0.431 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -3.9 | -| learning_rate | 0.0003 | -| loss | 0.092 | -| n_updates | 269560 | -| policy_gradient_loss | 0.0261 | -| std | 0.00567 | -| value_loss | 2.61e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26958 | -| time_elapsed | 146521 | -| total_timesteps | 3450624 | -| train/ | | -| approx_kl | 0.030161075 | -| clip_fraction | 0.195 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -1.16 | -| learning_rate | 0.0003 | -| loss | 0.0124 | -| n_updates | 269570 | -| policy_gradient_loss | 0.00489 | -| std | 0.00568 | -| value_loss | 2.57e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26959 | -| time_elapsed | 146526 | -| total_timesteps | 3450752 | -| train/ | | -| approx_kl | 0.020694394 | -| clip_fraction | 0.148 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.288 | -| learning_rate | 0.0003 | -| loss | 0.00666 | -| n_updates | 269580 | -| policy_gradient_loss | 0.00288 | -| std | 0.00568 | -| value_loss | 9.65e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26960 | -| time_elapsed | 146531 | -| total_timesteps | 3450880 | -| train/ | | -| approx_kl | 0.020183459 | -| clip_fraction | 0.159 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0373 | -| learning_rate | 0.0003 | -| loss | -0.0209 | -| n_updates | 269590 | -| policy_gradient_loss | -0.0108 | -| std | 0.00568 | -| value_loss | 4.31e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26961 | -| time_elapsed | 146537 | -| total_timesteps | 3451008 | -| train/ | | -| approx_kl | 0.015991226 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | -0.00659 | -| n_updates | 269600 | -| policy_gradient_loss | -0.00337 | -| std | 0.00568 | -| value_loss | 3.46e-09 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26962 | -| time_elapsed | 146548 | -| total_timesteps | 3451136 | -| train/ | | -| approx_kl | 0.0026737233 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.979 | -| learning_rate | 0.0003 | -| loss | 0.000803 | -| n_updates | 269610 | -| policy_gradient_loss | 0.00874 | -| std | 0.00568 | -| value_loss | 0.00028 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26963 | -| time_elapsed | 146552 | -| total_timesteps | 3451264 | -| train/ | | -| approx_kl | 0.71959305 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.468 | -| learning_rate | 0.0003 | -| loss | 0.23 | -| n_updates | 269620 | -| policy_gradient_loss | 0.17 | -| std | 0.00569 | -| value_loss | 0.000101 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26964 | -| time_elapsed | 146558 | -| total_timesteps | 3451392 | -| train/ | | -| approx_kl | 0.124570765 | -| clip_fraction | 0.38 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.255 | -| learning_rate | 0.0003 | -| loss | 0.0722 | -| n_updates | 269630 | -| policy_gradient_loss | 0.043 | -| std | 0.00569 | -| value_loss | 1.17e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26965 | -| time_elapsed | 146564 | -| total_timesteps | 3451520 | -| train/ | | -| approx_kl | 0.18422118 | -| clip_fraction | 0.357 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0179 | -| learning_rate | 0.0003 | -| loss | 0.0751 | -| n_updates | 269640 | -| policy_gradient_loss | 0.0265 | -| std | 0.00569 | -| value_loss | 3.44e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26966 | -| time_elapsed | 146569 | -| total_timesteps | 3451648 | -| train/ | | -| approx_kl | 0.015707014 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0304 | -| learning_rate | 0.0003 | -| loss | 0.00323 | -| n_updates | 269650 | -| policy_gradient_loss | 0.00157 | -| std | 0.00569 | -| value_loss | 1.63e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26967 | -| time_elapsed | 146573 | -| total_timesteps | 3451776 | -| train/ | | -| approx_kl | 0.03433777 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.0158 | -| n_updates | 269660 | -| policy_gradient_loss | 0.0396 | -| std | 0.00569 | -| value_loss | 9.3e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26968 | -| time_elapsed | 146577 | -| total_timesteps | 3451904 | -| train/ | | -| approx_kl | 0.42097974 | -| clip_fraction | 0.738 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0932 | -| learning_rate | 0.0003 | -| loss | 0.174 | -| n_updates | 269670 | -| policy_gradient_loss | 0.16 | -| std | 0.00569 | -| value_loss | 6.08e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26969 | -| time_elapsed | 146581 | -| total_timesteps | 3452032 | -| train/ | | -| approx_kl | 0.24817224 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | 0.175 | -| n_updates | 269680 | -| policy_gradient_loss | 0.165 | -| std | 0.00569 | -| value_loss | 6.2e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26970 | -| time_elapsed | 146593 | -| total_timesteps | 3452160 | -| train/ | | -| approx_kl | 0.009979617 | -| clip_fraction | 0.25 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.751 | -| learning_rate | 0.0003 | -| loss | 0.00183 | -| n_updates | 269690 | -| policy_gradient_loss | -0.00245 | -| std | 0.00569 | -| value_loss | 0.00969 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26971 | -| time_elapsed | 146598 | -| total_timesteps | 3452288 | -| train/ | | -| approx_kl | 0.2946175 | -| clip_fraction | 0.419 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -1.56 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 269700 | -| policy_gradient_loss | 0.0325 | -| std | 0.00569 | -| value_loss | 6.64e-05 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26972 | -| time_elapsed | 146603 | -| total_timesteps | 3452416 | -| train/ | | -| approx_kl | 0.69355226 | -| clip_fraction | 0.525 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0166 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 269710 | -| policy_gradient_loss | 0.0542 | -| std | 0.00569 | -| value_loss | 4.93e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26973 | -| time_elapsed | 146607 | -| total_timesteps | 3452544 | -| train/ | | -| approx_kl | 0.06421109 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.134 | -| learning_rate | 0.0003 | -| loss | 0.0548 | -| n_updates | 269720 | -| policy_gradient_loss | 0.0279 | -| std | 0.00569 | -| value_loss | 2.91e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26974 | -| time_elapsed | 146613 | -| total_timesteps | 3452672 | -| train/ | | -| approx_kl | 0.011962911 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0313 | -| learning_rate | 0.0003 | -| loss | -0.00488 | -| n_updates | 269730 | -| policy_gradient_loss | 0.0133 | -| std | 0.0057 | -| value_loss | 1.78e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26975 | -| time_elapsed | 146618 | -| total_timesteps | 3452800 | -| train/ | | -| approx_kl | 0.003400776 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0172 | -| learning_rate | 0.0003 | -| loss | -0.00398 | -| n_updates | 269740 | -| policy_gradient_loss | 0.0138 | -| std | 0.0057 | -| value_loss | 6.67e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26976 | -| time_elapsed | 146623 | -| total_timesteps | 3452928 | -| train/ | | -| approx_kl | 8.8848174e-07 | -| clip_fraction | 0.414 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0482 | -| learning_rate | 0.0003 | -| loss | -7.21e-06 | -| n_updates | 269750 | -| policy_gradient_loss | 0.0478 | -| std | 0.0057 | -| value_loss | 3.04e-06 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26977 | -| time_elapsed | 146628 | -| total_timesteps | 3453056 | -| train/ | | -| approx_kl | 1.2982621 | -| clip_fraction | 0.788 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.205 | -| learning_rate | 0.0003 | -| loss | 0.354 | -| n_updates | 269760 | -| policy_gradient_loss | 0.242 | -| std | 0.0057 | -| value_loss | 3.77e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26978 | -| time_elapsed | 146636 | -| total_timesteps | 3453184 | -| train/ | | -| approx_kl | 0.030330757 | -| clip_fraction | 0.333 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.912 | -| learning_rate | 0.0003 | -| loss | -0.013 | -| n_updates | 269770 | -| policy_gradient_loss | 0.0085 | -| std | 0.0057 | -| value_loss | 0.00185 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26979 | -| time_elapsed | 146641 | -| total_timesteps | 3453312 | -| train/ | | -| approx_kl | 0.033341173 | -| clip_fraction | 0.421 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0102 | -| learning_rate | 0.0003 | -| loss | 0.000262 | -| n_updates | 269780 | -| policy_gradient_loss | 0.0195 | -| std | 0.0057 | -| value_loss | 5.89e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26980 | -| time_elapsed | 146646 | -| total_timesteps | 3453440 | -| train/ | | -| approx_kl | 0.34592745 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.00428 | -| learning_rate | 0.0003 | -| loss | 0.186 | -| n_updates | 269790 | -| policy_gradient_loss | 0.159 | -| std | 0.0057 | -| value_loss | 2.8e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26981 | -| time_elapsed | 146650 | -| total_timesteps | 3453568 | -| train/ | | -| approx_kl | 0.19280332 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0284 | -| learning_rate | 0.0003 | -| loss | 0.16 | -| n_updates | 269800 | -| policy_gradient_loss | 0.129 | -| std | 0.0057 | -| value_loss | 2.22e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26982 | -| time_elapsed | 146654 | -| total_timesteps | 3453696 | -| train/ | | -| approx_kl | 0.20439135 | -| clip_fraction | 0.732 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 269810 | -| policy_gradient_loss | 0.123 | -| std | 0.0057 | -| value_loss | 1.69e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26983 | -| time_elapsed | 146658 | -| total_timesteps | 3453824 | -| train/ | | -| approx_kl | 0.041714024 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0429 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 269820 | -| policy_gradient_loss | 0.0343 | -| std | 0.0057 | -| value_loss | 1.11e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 26984 | -| time_elapsed | 146663 | -| total_timesteps | 3453952 | -| train/ | | -| approx_kl | 0.0027812822 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0596 | -| learning_rate | 0.0003 | -| loss | 0.000477 | -| n_updates | 269830 | -| policy_gradient_loss | 0.0443 | -| std | 0.0057 | -| value_loss | 1.09e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26985 | -| time_elapsed | 146668 | -| total_timesteps | 3454080 | -| train/ | | -| approx_kl | 6.400328e-05 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | 0.000889 | -| n_updates | 269840 | -| policy_gradient_loss | 0.0381 | -| std | 0.0057 | -| value_loss | 2.93e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26986 | -| time_elapsed | 146678 | -| total_timesteps | 3454208 | -| train/ | | -| approx_kl | 0.017313391 | -| clip_fraction | 0.315 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.531 | -| learning_rate | 0.0003 | -| loss | -0.0248 | -| n_updates | 269850 | -| policy_gradient_loss | -0.00791 | -| std | 0.0057 | -| value_loss | 0.00204 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26987 | -| time_elapsed | 146683 | -| total_timesteps | 3454336 | -| train/ | | -| approx_kl | 0.0065542697 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0202 | -| learning_rate | 0.0003 | -| loss | -0.00166 | -| n_updates | 269860 | -| policy_gradient_loss | 0.0139 | -| std | 0.0057 | -| value_loss | 8.04e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26988 | -| time_elapsed | 146688 | -| total_timesteps | 3454464 | -| train/ | | -| approx_kl | 0.12377132 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0199 | -| learning_rate | 0.0003 | -| loss | 0.0465 | -| n_updates | 269870 | -| policy_gradient_loss | 0.0161 | -| std | 0.0057 | -| value_loss | 2.76e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26989 | -| time_elapsed | 146693 | -| total_timesteps | 3454592 | -| train/ | | -| approx_kl | 0.061870717 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0245 | -| learning_rate | 0.0003 | -| loss | 0.0322 | -| n_updates | 269880 | -| policy_gradient_loss | 0.017 | -| std | 0.0057 | -| value_loss | 1.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26990 | -| time_elapsed | 146699 | -| total_timesteps | 3454720 | -| train/ | | -| approx_kl | 0.080750346 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0781 | -| learning_rate | 0.0003 | -| loss | 0.0344 | -| n_updates | 269890 | -| policy_gradient_loss | 0.0159 | -| std | 0.0057 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26991 | -| time_elapsed | 146704 | -| total_timesteps | 3454848 | -| train/ | | -| approx_kl | 0.012066416 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.0021 | -| n_updates | 269900 | -| policy_gradient_loss | 0.0123 | -| std | 0.0057 | -| value_loss | 7.39e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26992 | -| time_elapsed | 146708 | -| total_timesteps | 3454976 | -| train/ | | -| approx_kl | 0.0931971 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0679 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 269910 | -| policy_gradient_loss | 0.0113 | -| std | 0.0057 | -| value_loss | 6.54e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26993 | -| time_elapsed | 146712 | -| total_timesteps | 3455104 | -| train/ | | -| approx_kl | 0.01861172 | -| clip_fraction | 0.307 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0509 | -| learning_rate | 0.0003 | -| loss | -0.0109 | -| n_updates | 269920 | -| policy_gradient_loss | 0.00939 | -| std | 0.0057 | -| value_loss | 5.45e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26994 | -| time_elapsed | 146721 | -| total_timesteps | 3455232 | -| train/ | | -| approx_kl | 0.012801716 | -| clip_fraction | 0.21 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.842 | -| learning_rate | 0.0003 | -| loss | -0.00615 | -| n_updates | 269930 | -| policy_gradient_loss | -0.00358 | -| std | 0.0057 | -| value_loss | 0.00478 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26995 | -| time_elapsed | 146726 | -| total_timesteps | 3455360 | -| train/ | | -| approx_kl | 0.09794023 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.457 | -| learning_rate | 0.0003 | -| loss | 0.0649 | -| n_updates | 269940 | -| policy_gradient_loss | 0.109 | -| std | 0.00569 | -| value_loss | 7.05e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26996 | -| time_elapsed | 146731 | -| total_timesteps | 3455488 | -| train/ | | -| approx_kl | 0.2639346 | -| clip_fraction | 0.454 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0141 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 269950 | -| policy_gradient_loss | 0.056 | -| std | 0.00569 | -| value_loss | 4.06e-05 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26997 | -| time_elapsed | 146735 | -| total_timesteps | 3455616 | -| train/ | | -| approx_kl | 0.003056663 | -| clip_fraction | 0.227 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.527 | -| learning_rate | 0.0003 | -| loss | -0.0149 | -| n_updates | 269960 | -| policy_gradient_loss | -0.00244 | -| std | 0.00569 | -| value_loss | 3.05e-05 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26998 | -| time_elapsed | 146739 | -| total_timesteps | 3455744 | -| train/ | | -| approx_kl | 1.0245014e-05 | -| clip_fraction | 0.204 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.0169 | -| learning_rate | 0.0003 | -| loss | 0.000969 | -| n_updates | 269970 | -| policy_gradient_loss | -0.00275 | -| std | 0.00569 | -| value_loss | 1.14e-05 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 26999 | -| time_elapsed | 146743 | -| total_timesteps | 3455872 | -| train/ | | -| approx_kl | 0.00036624726 | -| clip_fraction | 0.218 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0251 | -| learning_rate | 0.0003 | -| loss | -0.00187 | -| n_updates | 269980 | -| policy_gradient_loss | 0.0172 | -| std | 0.00569 | -| value_loss | 6.82e-06 | -------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27000 | -| time_elapsed | 146747 | -| total_timesteps | 3456000 | -| train/ | | -| approx_kl | 0.0001355973 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0611 | -| learning_rate | 0.0003 | -| loss | -0.00112 | -| n_updates | 269990 | -| policy_gradient_loss | 0.0122 | -| std | 0.00569 | -| value_loss | 4.59e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27001 | -| time_elapsed | 146753 | -| total_timesteps | 3456128 | -| train/ | | -| approx_kl | 0.00019376678 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.00792 | -| learning_rate | 0.0003 | -| loss | -0.00047 | -| n_updates | 270000 | -| policy_gradient_loss | 0.0268 | -| std | 0.00569 | -| value_loss | 2.01e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27002 | -| time_elapsed | 146765 | -| total_timesteps | 3456256 | -| train/ | | -| approx_kl | 0.015853584 | -| clip_fraction | 0.615 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.874 | -| learning_rate | 0.0003 | -| loss | -0.018 | -| n_updates | 270010 | -| policy_gradient_loss | 0.0306 | -| std | 0.00568 | -| value_loss | 0.00383 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27003 | -| time_elapsed | 146770 | -| total_timesteps | 3456384 | -| train/ | | -| approx_kl | 0.047677975 | -| clip_fraction | 0.371 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.01 | -| learning_rate | 0.0003 | -| loss | 0.0467 | -| n_updates | 270020 | -| policy_gradient_loss | 0.0411 | -| std | 0.00568 | -| value_loss | 1.31e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27004 | -| time_elapsed | 146775 | -| total_timesteps | 3456512 | -| train/ | | -| approx_kl | 0.09246664 | -| clip_fraction | 0.258 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.017 | -| learning_rate | 0.0003 | -| loss | 0.0612 | -| n_updates | 270030 | -| policy_gradient_loss | 0.0171 | -| std | 0.00568 | -| value_loss | 2.62e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27005 | -| time_elapsed | 146779 | -| total_timesteps | 3456640 | -| train/ | | -| approx_kl | 0.011012685 | -| clip_fraction | 0.117 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0964 | -| learning_rate | 0.0003 | -| loss | -0.0119 | -| n_updates | 270040 | -| policy_gradient_loss | -0.00392 | -| std | 0.00567 | -| value_loss | 1.7e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27006 | -| time_elapsed | 146783 | -| total_timesteps | 3456768 | -| train/ | | -| approx_kl | 0.016719185 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0886 | -| learning_rate | 0.0003 | -| loss | 0.00504 | -| n_updates | 270050 | -| policy_gradient_loss | 0.0024 | -| std | 0.00565 | -| value_loss | 2.4e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27007 | -| time_elapsed | 146788 | -| total_timesteps | 3456896 | -| train/ | | -| approx_kl | 0.015425648 | -| clip_fraction | 0.121 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0298 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 270060 | -| policy_gradient_loss | -0.004 | -| std | 0.00565 | -| value_loss | 9.8e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27008 | -| time_elapsed | 146793 | -| total_timesteps | 3457024 | -| train/ | | -| approx_kl | 0.019606177 | -| clip_fraction | 0.145 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.083 | -| learning_rate | 0.0003 | -| loss | 0.00512 | -| n_updates | 270070 | -| policy_gradient_loss | 0.00254 | -| std | 0.00565 | -| value_loss | 6.25e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27009 | -| time_elapsed | 146804 | -| total_timesteps | 3457152 | -| train/ | | -| approx_kl | 0.005809688 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | 0.96 | -| learning_rate | 0.0003 | -| loss | -0.0107 | -| n_updates | 270080 | -| policy_gradient_loss | 0.021 | -| std | 0.00565 | -| value_loss | 0.000802 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27010 | -| time_elapsed | 146810 | -| total_timesteps | 3457280 | -| train/ | | -| approx_kl | 0.435785 | -| clip_fraction | 0.741 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.00247 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 270090 | -| policy_gradient_loss | 0.118 | -| std | 0.00565 | -| value_loss | 1.63e-05 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27011 | -| time_elapsed | 146815 | -| total_timesteps | 3457408 | -| train/ | | -| approx_kl | 0.17273524 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | 0.0172 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 270100 | -| policy_gradient_loss | 0.127 | -| std | 0.00565 | -| value_loss | 2.6e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27012 | -| time_elapsed | 146819 | -| total_timesteps | 3457536 | -| train/ | | -| approx_kl | 0.16810314 | -| clip_fraction | 0.703 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0129 | -| learning_rate | 0.0003 | -| loss | 0.084 | -| n_updates | 270110 | -| policy_gradient_loss | 0.109 | -| std | 0.00566 | -| value_loss | 1.6e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27013 | -| time_elapsed | 146824 | -| total_timesteps | 3457664 | -| train/ | | -| approx_kl | 0.17094602 | -| clip_fraction | 0.742 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -10.5 | -| learning_rate | 0.0003 | -| loss | 0.0419 | -| n_updates | 270120 | -| policy_gradient_loss | 0.0325 | -| std | 0.00566 | -| value_loss | 4.74e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27014 | -| time_elapsed | 146831 | -| total_timesteps | 3457792 | -| train/ | | -| approx_kl | 0.25654784 | -| clip_fraction | 0.743 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -1.66 | -| learning_rate | 0.0003 | -| loss | 0.164 | -| n_updates | 270130 | -| policy_gradient_loss | 0.186 | -| std | 0.00566 | -| value_loss | 1.43e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27015 | -| time_elapsed | 146835 | -| total_timesteps | 3457920 | -| train/ | | -| approx_kl | 0.19615287 | -| clip_fraction | 0.728 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.123 | -| learning_rate | 0.0003 | -| loss | 0.153 | -| n_updates | 270140 | -| policy_gradient_loss | 0.209 | -| std | 0.00566 | -| value_loss | 9.35e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27016 | -| time_elapsed | 146841 | -| total_timesteps | 3458048 | -| train/ | | -| approx_kl | 0.18695952 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0548 | -| learning_rate | 0.0003 | -| loss | 0.093 | -| n_updates | 270150 | -| policy_gradient_loss | 0.127 | -| std | 0.00567 | -| value_loss | 7.61e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27017 | -| time_elapsed | 146850 | -| total_timesteps | 3458176 | -| train/ | | -| approx_kl | 0.03874685 | -| clip_fraction | 0.612 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.969 | -| learning_rate | 0.0003 | -| loss | 0.0498 | -| n_updates | 270160 | -| policy_gradient_loss | 0.0534 | -| std | 0.00567 | -| value_loss | 0.000607 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27018 | -| time_elapsed | 146855 | -| total_timesteps | 3458304 | -| train/ | | -| approx_kl | 0.23551948 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.573 | -| learning_rate | 0.0003 | -| loss | 0.191 | -| n_updates | 270170 | -| policy_gradient_loss | 0.123 | -| std | 0.00567 | -| value_loss | 7.79e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27019 | -| time_elapsed | 146859 | -| total_timesteps | 3458432 | -| train/ | | -| approx_kl | 0.21543282 | -| clip_fraction | 0.736 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | 0.00675 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 270180 | -| policy_gradient_loss | 0.208 | -| std | 0.00567 | -| value_loss | 2.9e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27020 | -| time_elapsed | 146864 | -| total_timesteps | 3458560 | -| train/ | | -| approx_kl | 0.033927355 | -| clip_fraction | 0.39 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.000893 | -| learning_rate | 0.0003 | -| loss | 0.0177 | -| n_updates | 270190 | -| policy_gradient_loss | 0.0309 | -| std | 0.00567 | -| value_loss | 1.16e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27021 | -| time_elapsed | 146869 | -| total_timesteps | 3458688 | -| train/ | | -| approx_kl | 0.806334 | -| clip_fraction | 0.566 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0783 | -| learning_rate | 0.0003 | -| loss | 0.291 | -| n_updates | 270200 | -| policy_gradient_loss | 0.0881 | -| std | 0.00566 | -| value_loss | 7.41e-08 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27022 | -| time_elapsed | 146874 | -| total_timesteps | 3458816 | -| train/ | | -| approx_kl | 0.04007942 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.0978 | -| learning_rate | 0.0003 | -| loss | 0.0156 | -| n_updates | 270210 | -| policy_gradient_loss | 0.00811 | -| std | 0.00566 | -| value_loss | 5.02e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27023 | -| time_elapsed | 146879 | -| total_timesteps | 3458944 | -| train/ | | -| approx_kl | 0.07590356 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.75 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.0287 | -| n_updates | 270220 | -| policy_gradient_loss | 0.0134 | -| std | 0.00566 | -| value_loss | 3.8e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27024 | -| time_elapsed | 146883 | -| total_timesteps | 3459072 | -| train/ | | -| approx_kl | 0.011773137 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0819 | -| learning_rate | 0.0003 | -| loss | 0.000612 | -| n_updates | 270230 | -| policy_gradient_loss | 0.0102 | -| std | 0.00566 | -| value_loss | 2.4e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27025 | -| time_elapsed | 146892 | -| total_timesteps | 3459200 | -| train/ | | -| approx_kl | 0.10284126 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | 0.0171 | -| n_updates | 270240 | -| policy_gradient_loss | 0.00541 | -| std | 0.00566 | -| value_loss | 0.000166 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27026 | -| time_elapsed | 146897 | -| total_timesteps | 3459328 | -| train/ | | -| approx_kl | 0.01612898 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.445 | -| learning_rate | 0.0003 | -| loss | -0.00457 | -| n_updates | 270250 | -| policy_gradient_loss | 0.0062 | -| std | 0.00566 | -| value_loss | 9.1e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27027 | -| time_elapsed | 146902 | -| total_timesteps | 3459456 | -| train/ | | -| approx_kl | 0.0039639496 | -| clip_fraction | 0.251 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | 0.0159 | -| learning_rate | 0.0003 | -| loss | -0.00891 | -| n_updates | 270260 | -| policy_gradient_loss | 0.0102 | -| std | 0.00566 | -| value_loss | 1.81e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27028 | -| time_elapsed | 146907 | -| total_timesteps | 3459584 | -| train/ | | -| approx_kl | 0.107793495 | -| clip_fraction | 0.275 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0433 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 270270 | -| policy_gradient_loss | 0.00482 | -| std | 0.00566 | -| value_loss | 1.09e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27029 | -| time_elapsed | 146913 | -| total_timesteps | 3459712 | -| train/ | | -| approx_kl | 0.34462216 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0705 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 270280 | -| policy_gradient_loss | 0.0783 | -| std | 0.00564 | -| value_loss | 7.59e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27030 | -| time_elapsed | 146918 | -| total_timesteps | 3459840 | -| train/ | | -| approx_kl | 0.022637263 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -21.1 | -| learning_rate | 0.0003 | -| loss | 0.00662 | -| n_updates | 270290 | -| policy_gradient_loss | 0.0113 | -| std | 0.00563 | -| value_loss | 3.07e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27031 | -| time_elapsed | 146923 | -| total_timesteps | 3459968 | -| train/ | | -| approx_kl | 0.057114024 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.194 | -| learning_rate | 0.0003 | -| loss | 0.0206 | -| n_updates | 270300 | -| policy_gradient_loss | 0.071 | -| std | 0.00563 | -| value_loss | 5.33e-08 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27032 | -| time_elapsed | 146928 | -| total_timesteps | 3460096 | -| train/ | | -| approx_kl | 0.93126 | -| clip_fraction | 0.776 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -72.8 | -| learning_rate | 0.0003 | -| loss | 0.198 | -| n_updates | 270310 | -| policy_gradient_loss | 0.127 | -| std | 0.00563 | -| value_loss | 4.45e-09 | --------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27033 | -| time_elapsed | 146938 | -| total_timesteps | 3460224 | -| train/ | | -| approx_kl | 0.06718867 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | 0.99 | -| learning_rate | 0.0003 | -| loss | -0.00259 | -| n_updates | 270320 | -| policy_gradient_loss | 0.0157 | -| std | 0.00563 | -| value_loss | 0.0002 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27034 | -| time_elapsed | 146943 | -| total_timesteps | 3460352 | -| train/ | | -| approx_kl | 0.19121563 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.763 | -| learning_rate | 0.0003 | -| loss | 0.0414 | -| n_updates | 270330 | -| policy_gradient_loss | 0.0569 | -| std | 0.00563 | -| value_loss | 0.000732 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27035 | -| time_elapsed | 146947 | -| total_timesteps | 3460480 | -| train/ | | -| approx_kl | 0.24378604 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.198 | -| learning_rate | 0.0003 | -| loss | 0.124 | -| n_updates | 270340 | -| policy_gradient_loss | 0.0521 | -| std | 0.00563 | -| value_loss | 3.26e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27036 | -| time_elapsed | 146951 | -| total_timesteps | 3460608 | -| train/ | | -| approx_kl | 0.06891258 | -| clip_fraction | 0.621 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0441 | -| n_updates | 270350 | -| policy_gradient_loss | 0.0833 | -| std | 0.00562 | -| value_loss | 1.95e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27037 | -| time_elapsed | 146956 | -| total_timesteps | 3460736 | -| train/ | | -| approx_kl | 0.06888079 | -| clip_fraction | 0.41 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.226 | -| learning_rate | 0.0003 | -| loss | 0.0576 | -| n_updates | 270360 | -| policy_gradient_loss | 0.0423 | -| std | 0.00562 | -| value_loss | 1.3e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27038 | -| time_elapsed | 146961 | -| total_timesteps | 3460864 | -| train/ | | -| approx_kl | 0.26911116 | -| clip_fraction | 0.456 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.221 | -| learning_rate | 0.0003 | -| loss | 0.125 | -| n_updates | 270370 | -| policy_gradient_loss | 0.0513 | -| std | 0.00562 | -| value_loss | 9.72e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27039 | -| time_elapsed | 146964 | -| total_timesteps | 3460992 | -| train/ | | -| approx_kl | 0.10238086 | -| clip_fraction | 0.683 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.319 | -| learning_rate | 0.0003 | -| loss | 0.0405 | -| n_updates | 270380 | -| policy_gradient_loss | 0.122 | -| std | 0.00562 | -| value_loss | 5.95e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27040 | -| time_elapsed | 146970 | -| total_timesteps | 3461120 | -| train/ | | -| approx_kl | 0.0014290228 | -| clip_fraction | 0.547 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0327 | -| learning_rate | 0.0003 | -| loss | -3.54e-05 | -| n_updates | 270390 | -| policy_gradient_loss | 0.158 | -| std | 0.0056 | -| value_loss | 0.000208 | ------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27041 | -| time_elapsed | 146982 | -| total_timesteps | 3461248 | -| train/ | | -| approx_kl | 1.4958184 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.587 | -| learning_rate | 0.0003 | -| loss | 0.247 | -| n_updates | 270400 | -| policy_gradient_loss | 0.16 | -| std | 0.0056 | -| value_loss | 0.00443 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27042 | -| time_elapsed | 146987 | -| total_timesteps | 3461376 | -| train/ | | -| approx_kl | 0.02808912 | -| clip_fraction | 0.611 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.498 | -| learning_rate | 0.0003 | -| loss | 0.00587 | -| n_updates | 270410 | -| policy_gradient_loss | 0.0939 | -| std | 0.00561 | -| value_loss | 0.000145 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27043 | -| time_elapsed | 146990 | -| total_timesteps | 3461504 | -| train/ | | -| approx_kl | 0.111636594 | -| clip_fraction | 0.4 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.00897 | -| learning_rate | 0.0003 | -| loss | 0.0621 | -| n_updates | 270420 | -| policy_gradient_loss | 0.0323 | -| std | 0.00561 | -| value_loss | 2.03e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27044 | -| time_elapsed | 146995 | -| total_timesteps | 3461632 | -| train/ | | -| approx_kl | 0.13455069 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.76 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 270430 | -| policy_gradient_loss | 0.0267 | -| std | 0.0056 | -| value_loss | 2.11e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27045 | -| time_elapsed | 146998 | -| total_timesteps | 3461760 | -| train/ | | -| approx_kl | 0.004181468 | -| clip_fraction | 0.0508 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.417 | -| learning_rate | 0.0003 | -| loss | -0.00812 | -| n_updates | 270440 | -| policy_gradient_loss | -0.00197 | -| std | 0.0056 | -| value_loss | 4.25e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27046 | -| time_elapsed | 147003 | -| total_timesteps | 3461888 | -| train/ | | -| approx_kl | 0.11503218 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0904 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 270450 | -| policy_gradient_loss | 0.0222 | -| std | 0.0056 | -| value_loss | 1.68e-05 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27047 | -| time_elapsed | 147009 | -| total_timesteps | 3462016 | -| train/ | | -| approx_kl | 0.0088834055 | -| clip_fraction | 0.0898 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0147 | -| learning_rate | 0.0003 | -| loss | -0.000962 | -| n_updates | 270460 | -| policy_gradient_loss | 0.00149 | -| std | 0.0056 | -| value_loss | 4.45e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27048 | -| time_elapsed | 147021 | -| total_timesteps | 3462144 | -| train/ | | -| approx_kl | 0.049337838 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | -0.0079 | -| n_updates | 270470 | -| policy_gradient_loss | -0.00636 | -| std | 0.0056 | -| value_loss | 0.00124 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27049 | -| time_elapsed | 147026 | -| total_timesteps | 3462272 | -| train/ | | -| approx_kl | 0.075738184 | -| clip_fraction | 0.499 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.000463 | -| learning_rate | 0.0003 | -| loss | 0.0244 | -| n_updates | 270480 | -| policy_gradient_loss | 0.0313 | -| std | 0.0056 | -| value_loss | 6.39e-05 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27050 | -| time_elapsed | 147031 | -| total_timesteps | 3462400 | -| train/ | | -| approx_kl | 0.2018574 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -57.5 | -| learning_rate | 0.0003 | -| loss | 0.0363 | -| n_updates | 270490 | -| policy_gradient_loss | 0.0183 | -| std | 0.0056 | -| value_loss | 5.94e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27051 | -| time_elapsed | 147036 | -| total_timesteps | 3462528 | -| train/ | | -| approx_kl | 0.01587622 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.83 | -| learning_rate | 0.0003 | -| loss | 0.00404 | -| n_updates | 270500 | -| policy_gradient_loss | 0.0077 | -| std | 0.00558 | -| value_loss | 8.02e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27052 | -| time_elapsed | 147041 | -| total_timesteps | 3462656 | -| train/ | | -| approx_kl | 0.0031879013 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.08 | -| learning_rate | 0.0003 | -| loss | -0.00681 | -| n_updates | 270510 | -| policy_gradient_loss | 0.0039 | -| std | 0.00557 | -| value_loss | 2.06e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27053 | -| time_elapsed | 147047 | -| total_timesteps | 3462784 | -| train/ | | -| approx_kl | 3.7150458e-06 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.017 | -| learning_rate | 0.0003 | -| loss | 0.00023 | -| n_updates | 270520 | -| policy_gradient_loss | 0.00599 | -| std | 0.00557 | -| value_loss | 3.1e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27054 | -| time_elapsed | 147052 | -| total_timesteps | 3462912 | -| train/ | | -| approx_kl | 0.00033582374 | -| clip_fraction | 0.234 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0651 | -| learning_rate | 0.0003 | -| loss | -0.00274 | -| n_updates | 270530 | -| policy_gradient_loss | 0.00784 | -| std | 0.00557 | -| value_loss | 2.36e-09 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27055 | -| time_elapsed | 147056 | -| total_timesteps | 3463040 | -| train/ | | -| approx_kl | 9.8391436e-05 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0609 | -| learning_rate | 0.0003 | -| loss | -0.000504 | -| n_updates | 270540 | -| policy_gradient_loss | 0.0172 | -| std | 0.00557 | -| value_loss | 1.33e-09 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27056 | -| time_elapsed | 147064 | -| total_timesteps | 3463168 | -| train/ | | -| approx_kl | 0.12963581 | -| clip_fraction | 0.605 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.733 | -| learning_rate | 0.0003 | -| loss | 0.0595 | -| n_updates | 270550 | -| policy_gradient_loss | 0.0787 | -| std | 0.00557 | -| value_loss | 0.0133 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27057 | -| time_elapsed | 147069 | -| total_timesteps | 3463296 | -| train/ | | -| approx_kl | 0.14291526 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.608 | -| learning_rate | 0.0003 | -| loss | 0.116 | -| n_updates | 270560 | -| policy_gradient_loss | 0.0526 | -| std | 0.00557 | -| value_loss | 1.77e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27058 | -| time_elapsed | 147073 | -| total_timesteps | 3463424 | -| train/ | | -| approx_kl | 0.8951859 | -| clip_fraction | 0.697 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0122 | -| learning_rate | 0.0003 | -| loss | 0.392 | -| n_updates | 270570 | -| policy_gradient_loss | 0.216 | -| std | 0.00557 | -| value_loss | 5.55e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27059 | -| time_elapsed | 147078 | -| total_timesteps | 3463552 | -| train/ | | -| approx_kl | 0.12739135 | -| clip_fraction | 0.341 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0155 | -| learning_rate | 0.0003 | -| loss | 0.061 | -| n_updates | 270580 | -| policy_gradient_loss | 0.0362 | -| std | 0.00557 | -| value_loss | 3.51e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27060 | -| time_elapsed | 147082 | -| total_timesteps | 3463680 | -| train/ | | -| approx_kl | 0.0062857145 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0417 | -| learning_rate | 0.0003 | -| loss | 0.00284 | -| n_updates | 270590 | -| policy_gradient_loss | 0.0397 | -| std | 0.00557 | -| value_loss | 1.83e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27061 | -| time_elapsed | 147087 | -| total_timesteps | 3463808 | -| train/ | | -| approx_kl | 0.32589126 | -| clip_fraction | 0.448 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.12 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 270600 | -| policy_gradient_loss | 0.0283 | -| std | 0.00557 | -| value_loss | 1.38e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27062 | -| time_elapsed | 147093 | -| total_timesteps | 3463936 | -| train/ | | -| approx_kl | 0.024903066 | -| clip_fraction | 0.156 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0741 | -| learning_rate | 0.0003 | -| loss | 0.000856 | -| n_updates | 270610 | -| policy_gradient_loss | -0.00248 | -| std | 0.00557 | -| value_loss | 1.15e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27063 | -| time_elapsed | 147097 | -| total_timesteps | 3464064 | -| train/ | | -| approx_kl | 0.018969996 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0577 | -| learning_rate | 0.0003 | -| loss | 0.00074 | -| n_updates | 270620 | -| policy_gradient_loss | -0.000287 | -| std | 0.00557 | -| value_loss | 7.45e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27064 | -| time_elapsed | 147108 | -| total_timesteps | 3464192 | -| train/ | | -| approx_kl | 0.036312465 | -| clip_fraction | 0.492 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.536 | -| learning_rate | 0.0003 | -| loss | -0.0264 | -| n_updates | 270630 | -| policy_gradient_loss | -0.00314 | -| std | 0.00557 | -| value_loss | 0.00406 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27065 | -| time_elapsed | 147112 | -| total_timesteps | 3464320 | -| train/ | | -| approx_kl | 0.3801985 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -53.8 | -| learning_rate | 0.0003 | -| loss | 0.103 | -| n_updates | 270640 | -| policy_gradient_loss | 0.0614 | -| std | 0.00557 | -| value_loss | 5.73e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27066 | -| time_elapsed | 147117 | -| total_timesteps | 3464448 | -| train/ | | -| approx_kl | 0.06748068 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.57 | -| learning_rate | 0.0003 | -| loss | -0.00685 | -| n_updates | 270650 | -| policy_gradient_loss | 0.0133 | -| std | 0.00557 | -| value_loss | 9.53e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27067 | -| time_elapsed | 147121 | -| total_timesteps | 3464576 | -| train/ | | -| approx_kl | 0.27887994 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0725 | -| learning_rate | 0.0003 | -| loss | 0.0776 | -| n_updates | 270660 | -| policy_gradient_loss | 0.0268 | -| std | 0.00557 | -| value_loss | 7.74e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27068 | -| time_elapsed | 147124 | -| total_timesteps | 3464704 | -| train/ | | -| approx_kl | 0.019851414 | -| clip_fraction | 0.131 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0779 | -| learning_rate | 0.0003 | -| loss | -0.0106 | -| n_updates | 270670 | -| policy_gradient_loss | -0.00585 | -| std | 0.00557 | -| value_loss | 5.06e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27069 | -| time_elapsed | 147128 | -| total_timesteps | 3464832 | -| train/ | | -| approx_kl | 0.037367463 | -| clip_fraction | 0.498 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.0246 | -| n_updates | 270680 | -| policy_gradient_loss | 0.0467 | -| std | 0.00557 | -| value_loss | 3.19e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27070 | -| time_elapsed | 147132 | -| total_timesteps | 3464960 | -| train/ | | -| approx_kl | 0.18282907 | -| clip_fraction | 0.355 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.083 | -| learning_rate | 0.0003 | -| loss | 0.0861 | -| n_updates | 270690 | -| policy_gradient_loss | 0.0438 | -| std | 0.00557 | -| value_loss | 2.81e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27071 | -| time_elapsed | 147137 | -| total_timesteps | 3465088 | -| train/ | | -| approx_kl | 0.010827863 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.00447 | -| n_updates | 270700 | -| policy_gradient_loss | 0.0347 | -| std | 0.00557 | -| value_loss | 6.78e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27072 | -| time_elapsed | 147146 | -| total_timesteps | 3465216 | -| train/ | | -| approx_kl | 0.0302488 | -| clip_fraction | 0.452 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | 0.011 | -| n_updates | 270710 | -| policy_gradient_loss | 0.0399 | -| std | 0.00557 | -| value_loss | 0.00718 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27073 | -| time_elapsed | 147150 | -| total_timesteps | 3465344 | -| train/ | | -| approx_kl | 1.1212518 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.17 | -| learning_rate | 0.0003 | -| loss | 0.412 | -| n_updates | 270720 | -| policy_gradient_loss | 0.11 | -| std | 0.00557 | -| value_loss | 0.00075 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27074 | -| time_elapsed | 147153 | -| total_timesteps | 3465472 | -| train/ | | -| approx_kl | 0.022298986 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.011 | -| learning_rate | 0.0003 | -| loss | 0.00599 | -| n_updates | 270730 | -| policy_gradient_loss | 0.0152 | -| std | 0.00557 | -| value_loss | 0.000133 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27075 | -| time_elapsed | 147158 | -| total_timesteps | 3465600 | -| train/ | | -| approx_kl | 0.08833505 | -| clip_fraction | 0.308 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | -0.00209 | -| n_updates | 270740 | -| policy_gradient_loss | -0.00561 | -| std | 0.00557 | -| value_loss | 0.000136 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27076 | -| time_elapsed | 147162 | -| total_timesteps | 3465728 | -| train/ | | -| approx_kl | 0.076746404 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0598 | -| learning_rate | 0.0003 | -| loss | 0.0485 | -| n_updates | 270750 | -| policy_gradient_loss | 0.0246 | -| std | 0.00557 | -| value_loss | 8.64e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27077 | -| time_elapsed | 147167 | -| total_timesteps | 3465856 | -| train/ | | -| approx_kl | 0.010660021 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0988 | -| learning_rate | 0.0003 | -| loss | -0.00725 | -| n_updates | 270760 | -| policy_gradient_loss | 0.0105 | -| std | 0.00557 | -| value_loss | 6.34e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27078 | -| time_elapsed | 147173 | -| total_timesteps | 3465984 | -| train/ | | -| approx_kl | 0.0021484196 | -| clip_fraction | 0.273 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.074 | -| learning_rate | 0.0003 | -| loss | -0.00103 | -| n_updates | 270770 | -| policy_gradient_loss | 0.0136 | -| std | 0.00557 | -| value_loss | 3.82e-05 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27079 | -| time_elapsed | 147178 | -| total_timesteps | 3466112 | -| train/ | | -| approx_kl | 0.05600677 | -| clip_fraction | 0.678 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.104 | -| learning_rate | 0.0003 | -| loss | 0.0412 | -| n_updates | 270780 | -| policy_gradient_loss | 0.149 | -| std | 0.00557 | -| value_loss | 2.75e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27080 | -| time_elapsed | 147188 | -| total_timesteps | 3466240 | -| train/ | | -| approx_kl | 0.15075614 | -| clip_fraction | 0.714 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.54 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 270790 | -| policy_gradient_loss | 0.154 | -| std | 0.00557 | -| value_loss | 0.014 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27081 | -| time_elapsed | 147194 | -| total_timesteps | 3466368 | -| train/ | | -| approx_kl | 0.15741664 | -| clip_fraction | 0.712 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0192 | -| learning_rate | 0.0003 | -| loss | 0.12 | -| n_updates | 270800 | -| policy_gradient_loss | 0.137 | -| std | 0.00557 | -| value_loss | 0.000101 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27082 | -| time_elapsed | 147199 | -| total_timesteps | 3466496 | -| train/ | | -| approx_kl | 0.21601877 | -| clip_fraction | 0.729 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.00872 | -| learning_rate | 0.0003 | -| loss | 0.155 | -| n_updates | 270810 | -| policy_gradient_loss | 0.175 | -| std | 0.00557 | -| value_loss | 5.63e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27083 | -| time_elapsed | 147204 | -| total_timesteps | 3466624 | -| train/ | | -| approx_kl | 0.028739996 | -| clip_fraction | 0.362 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.02 | -| learning_rate | 0.0003 | -| loss | -0.0142 | -| n_updates | 270820 | -| policy_gradient_loss | 0.0245 | -| std | 0.00557 | -| value_loss | 4.37e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27084 | -| time_elapsed | 147209 | -| total_timesteps | 3466752 | -| train/ | | -| approx_kl | 0.57376164 | -| clip_fraction | 0.51 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0328 | -| learning_rate | 0.0003 | -| loss | 0.208 | -| n_updates | 270830 | -| policy_gradient_loss | 0.0698 | -| std | 0.00557 | -| value_loss | 1.67e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27085 | -| time_elapsed | 147214 | -| total_timesteps | 3466880 | -| train/ | | -| approx_kl | 0.013612805 | -| clip_fraction | 0.261 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 270840 | -| policy_gradient_loss | 0.0105 | -| std | 0.00557 | -| value_loss | 2.49e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27086 | -| time_elapsed | 147219 | -| total_timesteps | 3467008 | -| train/ | | -| approx_kl | 0.104163125 | -| clip_fraction | 0.316 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0279 | -| learning_rate | 0.0003 | -| loss | 0.0184 | -| n_updates | 270850 | -| policy_gradient_loss | 0.00272 | -| std | 0.00557 | -| value_loss | 1.82e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27087 | -| time_elapsed | 147231 | -| total_timesteps | 3467136 | -| train/ | | -| approx_kl | 0.015769366 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.583 | -| learning_rate | 0.0003 | -| loss | -0.0255 | -| n_updates | 270860 | -| policy_gradient_loss | -0.0145 | -| std | 0.00557 | -| value_loss | 0.0021 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27088 | -| time_elapsed | 147236 | -| total_timesteps | 3467264 | -| train/ | | -| approx_kl | 0.26412886 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.806 | -| learning_rate | 0.0003 | -| loss | 0.0939 | -| n_updates | 270870 | -| policy_gradient_loss | 0.0816 | -| std | 0.00557 | -| value_loss | 2.27e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27089 | -| time_elapsed | 147242 | -| total_timesteps | 3467392 | -| train/ | | -| approx_kl | 0.17226702 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.24 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 270880 | -| policy_gradient_loss | 0.0184 | -| std | 0.00557 | -| value_loss | 1.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27090 | -| time_elapsed | 147246 | -| total_timesteps | 3467520 | -| train/ | | -| approx_kl | 0.13364919 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.223 | -| learning_rate | 0.0003 | -| loss | 0.0817 | -| n_updates | 270890 | -| policy_gradient_loss | 0.0462 | -| std | 0.00557 | -| value_loss | 4.85e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27091 | -| time_elapsed | 147253 | -| total_timesteps | 3467648 | -| train/ | | -| approx_kl | 0.0046081045 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.164 | -| learning_rate | 0.0003 | -| loss | -0.00239 | -| n_updates | 270900 | -| policy_gradient_loss | 0.0118 | -| std | 0.00557 | -| value_loss | 3.55e-07 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27092 | -| time_elapsed | 147258 | -| total_timesteps | 3467776 | -| train/ | | -| approx_kl | 0.23000054 | -| clip_fraction | 0.749 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.207 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 270910 | -| policy_gradient_loss | 0.145 | -| std | 0.00557 | -| value_loss | 3.07e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27093 | -| time_elapsed | 147263 | -| total_timesteps | 3467904 | -| train/ | | -| approx_kl | 0.20159648 | -| clip_fraction | 0.727 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0234 | -| learning_rate | 0.0003 | -| loss | 0.113 | -| n_updates | 270920 | -| policy_gradient_loss | 0.139 | -| std | 0.00557 | -| value_loss | 1.76e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27094 | -| time_elapsed | 147267 | -| total_timesteps | 3468032 | -| train/ | | -| approx_kl | 0.18151963 | -| clip_fraction | 0.739 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0518 | -| learning_rate | 0.0003 | -| loss | 0.131 | -| n_updates | 270930 | -| policy_gradient_loss | 0.136 | -| std | 0.00557 | -| value_loss | 1.45e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27095 | -| time_elapsed | 147278 | -| total_timesteps | 3468160 | -| train/ | | -| approx_kl | 0.10481066 | -| clip_fraction | 0.699 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.881 | -| learning_rate | 0.0003 | -| loss | 0.0682 | -| n_updates | 270940 | -| policy_gradient_loss | 0.0997 | -| std | 0.00557 | -| value_loss | 0.00095 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27096 | -| time_elapsed | 147283 | -| total_timesteps | 3468288 | -| train/ | | -| approx_kl | 0.066561766 | -| clip_fraction | 0.397 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0698 | -| learning_rate | 0.0003 | -| loss | 0.0477 | -| n_updates | 270950 | -| policy_gradient_loss | 0.0394 | -| std | 0.00557 | -| value_loss | 7.86e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27097 | -| time_elapsed | 147287 | -| total_timesteps | 3468416 | -| train/ | | -| approx_kl | 0.80939806 | -| clip_fraction | 0.528 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0174 | -| learning_rate | 0.0003 | -| loss | 0.305 | -| n_updates | 270960 | -| policy_gradient_loss | 0.0829 | -| std | 0.00557 | -| value_loss | 3.51e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27098 | -| time_elapsed | 147292 | -| total_timesteps | 3468544 | -| train/ | | -| approx_kl | 0.053174768 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0331 | -| learning_rate | 0.0003 | -| loss | 0.0337 | -| n_updates | 270970 | -| policy_gradient_loss | 0.0186 | -| std | 0.00557 | -| value_loss | 1.57e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27099 | -| time_elapsed | 147296 | -| total_timesteps | 3468672 | -| train/ | | -| approx_kl | 0.067225285 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.111 | -| learning_rate | 0.0003 | -| loss | 0.0198 | -| n_updates | 270980 | -| policy_gradient_loss | 0.00749 | -| std | 0.00557 | -| value_loss | 1.18e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27100 | -| time_elapsed | 147300 | -| total_timesteps | 3468800 | -| train/ | | -| approx_kl | 0.06559835 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0736 | -| learning_rate | 0.0003 | -| loss | 0.017 | -| n_updates | 270990 | -| policy_gradient_loss | 0.00924 | -| std | 0.00557 | -| value_loss | 9.57e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.09 | -| time/ | | -| fps | 23 | -| iterations | 27101 | -| time_elapsed | 147304 | -| total_timesteps | 3468928 | -| train/ | | -| approx_kl | 0.00873491 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0604 | -| learning_rate | 0.0003 | -| loss | -0.000345 | -| n_updates | 271000 | -| policy_gradient_loss | 0.0112 | -| std | 0.00557 | -| value_loss | 6.38e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27102 | -| time_elapsed | 147309 | -| total_timesteps | 3469056 | -| train/ | | -| approx_kl | 0.09184435 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0714 | -| learning_rate | 0.0003 | -| loss | 0.0368 | -| n_updates | 271010 | -| policy_gradient_loss | 0.0142 | -| std | 0.00557 | -| value_loss | 5.04e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27103 | -| time_elapsed | 147316 | -| total_timesteps | 3469184 | -| train/ | | -| approx_kl | 0.032020345 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -3.84 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 271020 | -| policy_gradient_loss | -0.00156 | -| std | 0.00557 | -| value_loss | 0.00588 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27104 | -| time_elapsed | 147322 | -| total_timesteps | 3469312 | -| train/ | | -| approx_kl | 0.08007808 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.1 | -| learning_rate | 0.0003 | -| loss | 0.00637 | -| n_updates | 271030 | -| policy_gradient_loss | -0.000857 | -| std | 0.00557 | -| value_loss | 1.57e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27105 | -| time_elapsed | 147327 | -| total_timesteps | 3469440 | -| train/ | | -| approx_kl | 0.05757884 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0273 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 271040 | -| policy_gradient_loss | 0.0116 | -| std | 0.00557 | -| value_loss | 2.34e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27106 | -| time_elapsed | 147332 | -| total_timesteps | 3469568 | -| train/ | | -| approx_kl | 0.0112302285 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0209 | -| learning_rate | 0.0003 | -| loss | -0.0136 | -| n_updates | 271050 | -| policy_gradient_loss | 0.0118 | -| std | 0.00557 | -| value_loss | 1.54e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27107 | -| time_elapsed | 147338 | -| total_timesteps | 3469696 | -| train/ | | -| approx_kl | 0.0017079972 | -| clip_fraction | 0.334 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.0104 | -| n_updates | 271060 | -| policy_gradient_loss | 0.00208 | -| std | 0.00557 | -| value_loss | 1.2e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27108 | -| time_elapsed | 147342 | -| total_timesteps | 3469824 | -| train/ | | -| approx_kl | 0.06639002 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0475 | -| learning_rate | 0.0003 | -| loss | 0.0424 | -| n_updates | 271070 | -| policy_gradient_loss | 0.0196 | -| std | 0.00557 | -| value_loss | 6.17e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27109 | -| time_elapsed | 147348 | -| total_timesteps | 3469952 | -| train/ | | -| approx_kl | 0.012552442 | -| clip_fraction | 0.287 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.145 | -| learning_rate | 0.0003 | -| loss | -0.00757 | -| n_updates | 271080 | -| policy_gradient_loss | 0.00774 | -| std | 0.00557 | -| value_loss | 5.64e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27110 | -| time_elapsed | 147353 | -| total_timesteps | 3470080 | -| train/ | | -| approx_kl | 0.108055055 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0439 | -| learning_rate | 0.0003 | -| loss | 0.0794 | -| n_updates | 271090 | -| policy_gradient_loss | 0.0311 | -| std | 0.00557 | -| value_loss | 4.39e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27111 | -| time_elapsed | 147362 | -| total_timesteps | 3470208 | -| train/ | | -| approx_kl | 0.00705754 | -| clip_fraction | 0.271 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.869 | -| learning_rate | 0.0003 | -| loss | -0.0224 | -| n_updates | 271100 | -| policy_gradient_loss | -0.00439 | -| std | 0.00557 | -| value_loss | 0.000847 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27112 | -| time_elapsed | 147366 | -| total_timesteps | 3470336 | -| train/ | | -| approx_kl | 0.06588769 | -| clip_fraction | 0.449 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0267 | -| learning_rate | 0.0003 | -| loss | 0.019 | -| n_updates | 271110 | -| policy_gradient_loss | 0.0334 | -| std | 0.00557 | -| value_loss | 4.82e-06 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27113 | -| time_elapsed | 147370 | -| total_timesteps | 3470464 | -| train/ | | -| approx_kl | 0.00029884744 | -| clip_fraction | 0.473 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.00648 | -| learning_rate | 0.0003 | -| loss | 9.53e-05 | -| n_updates | 271120 | -| policy_gradient_loss | 0.0475 | -| std | 0.00557 | -| value_loss | 7.45e-07 | -------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27114 | -| time_elapsed | 147375 | -| total_timesteps | 3470592 | -| train/ | | -| approx_kl | 0.00039311312 | -| clip_fraction | 0.363 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0504 | -| learning_rate | 0.0003 | -| loss | 0.00113 | -| n_updates | 271130 | -| policy_gradient_loss | 0.0405 | -| std | 0.00557 | -| value_loss | 5.81e-07 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27115 | -| time_elapsed | 147379 | -| total_timesteps | 3470720 | -| train/ | | -| approx_kl | 0.48557624 | -| clip_fraction | 0.52 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0612 | -| learning_rate | 0.0003 | -| loss | 0.065 | -| n_updates | 271140 | -| policy_gradient_loss | 0.0509 | -| std | 0.00558 | -| value_loss | 1.07e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27116 | -| time_elapsed | 147384 | -| total_timesteps | 3470848 | -| train/ | | -| approx_kl | 0.12285222 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -25.6 | -| learning_rate | 0.0003 | -| loss | 0.00417 | -| n_updates | 271150 | -| policy_gradient_loss | 0.0202 | -| std | 0.00558 | -| value_loss | 3.28e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27117 | -| time_elapsed | 147389 | -| total_timesteps | 3470976 | -| train/ | | -| approx_kl | 0.17809948 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.168 | -| learning_rate | 0.0003 | -| loss | 0.127 | -| n_updates | 271160 | -| policy_gradient_loss | 0.0876 | -| std | 0.00558 | -| value_loss | 8.55e-08 | ----------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27118 | -| time_elapsed | 147393 | -| total_timesteps | 3471104 | -| train/ | | -| approx_kl | 6.5664295e-05 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0687 | -| learning_rate | 0.0003 | -| loss | 0.000972 | -| n_updates | 271170 | -| policy_gradient_loss | 0.0102 | -| std | 0.00558 | -| value_loss | 7.87e-08 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27119 | -| time_elapsed | 147406 | -| total_timesteps | 3471232 | -| train/ | | -| approx_kl | 0.09364529 | -| clip_fraction | 0.305 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.231 | -| learning_rate | 0.0003 | -| loss | -0.0143 | -| n_updates | 271180 | -| policy_gradient_loss | -0.0109 | -| std | 0.00559 | -| value_loss | 0.0025 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27120 | -| time_elapsed | 147411 | -| total_timesteps | 3471360 | -| train/ | | -| approx_kl | 0.005574313 | -| clip_fraction | 0.281 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -2.15 | -| learning_rate | 0.0003 | -| loss | -0.0131 | -| n_updates | 271190 | -| policy_gradient_loss | 0.0185 | -| std | 0.00559 | -| value_loss | 5.24e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27121 | -| time_elapsed | 147416 | -| total_timesteps | 3471488 | -| train/ | | -| approx_kl | 0.09792739 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0616 | -| learning_rate | 0.0003 | -| loss | 0.0413 | -| n_updates | 271200 | -| policy_gradient_loss | 0.0155 | -| std | 0.00559 | -| value_loss | 1.4e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27122 | -| time_elapsed | 147420 | -| total_timesteps | 3471616 | -| train/ | | -| approx_kl | 0.042527325 | -| clip_fraction | 0.245 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.844 | -| learning_rate | 0.0003 | -| loss | 0.0313 | -| n_updates | 271210 | -| policy_gradient_loss | 0.0165 | -| std | 0.00558 | -| value_loss | 7.83e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27123 | -| time_elapsed | 147425 | -| total_timesteps | 3471744 | -| train/ | | -| approx_kl | 0.074517384 | -| clip_fraction | 0.285 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0955 | -| learning_rate | 0.0003 | -| loss | 0.042 | -| n_updates | 271220 | -| policy_gradient_loss | 0.0194 | -| std | 0.00558 | -| value_loss | 4.22e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27124 | -| time_elapsed | 147430 | -| total_timesteps | 3471872 | -| train/ | | -| approx_kl | 0.06647553 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0676 | -| learning_rate | 0.0003 | -| loss | 0.024 | -| n_updates | 271230 | -| policy_gradient_loss | 0.0119 | -| std | 0.00558 | -| value_loss | 3.49e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27125 | -| time_elapsed | 147434 | -| total_timesteps | 3472000 | -| train/ | | -| approx_kl | 0.070425615 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0551 | -| learning_rate | 0.0003 | -| loss | 0.0174 | -| n_updates | 271240 | -| policy_gradient_loss | 0.00838 | -| std | 0.00558 | -| value_loss | 2.8e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27126 | -| time_elapsed | 147439 | -| total_timesteps | 3472128 | -| train/ | | -| approx_kl | 0.07849149 | -| clip_fraction | 0.298 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.00573 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 271250 | -| policy_gradient_loss | 0.0106 | -| std | 0.00558 | -| value_loss | 1.63e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27127 | -| time_elapsed | 147449 | -| total_timesteps | 3472256 | -| train/ | | -| approx_kl | 0.048866414 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.707 | -| learning_rate | 0.0003 | -| loss | 0.000504 | -| n_updates | 271260 | -| policy_gradient_loss | -0.00094 | -| std | 0.00558 | -| value_loss | 0.0138 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27128 | -| time_elapsed | 147454 | -| total_timesteps | 3472384 | -| train/ | | -| approx_kl | 0.007499268 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.623 | -| learning_rate | 0.0003 | -| loss | -0.00688 | -| n_updates | 271270 | -| policy_gradient_loss | 0.0106 | -| std | 0.00558 | -| value_loss | 0.00014 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27129 | -| time_elapsed | 147458 | -| total_timesteps | 3472512 | -| train/ | | -| approx_kl | 0.0021431432 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0322 | -| learning_rate | 0.0003 | -| loss | -0.00336 | -| n_updates | 271280 | -| policy_gradient_loss | 0.0148 | -| std | 0.00558 | -| value_loss | 1.03e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27130 | -| time_elapsed | 147463 | -| total_timesteps | 3472640 | -| train/ | | -| approx_kl | 8.543953e-06 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0622 | -| learning_rate | 0.0003 | -| loss | -0.000523 | -| n_updates | 271290 | -| policy_gradient_loss | 0.0538 | -| std | 0.00558 | -| value_loss | 7.97e-06 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27131 | -| time_elapsed | 147467 | -| total_timesteps | 3472768 | -| train/ | | -| approx_kl | 1.166817 | -| clip_fraction | 0.79 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.052 | -| learning_rate | 0.0003 | -| loss | 0.337 | -| n_updates | 271300 | -| policy_gradient_loss | 0.238 | -| std | 0.00558 | -| value_loss | 4.17e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27132 | -| time_elapsed | 147470 | -| total_timesteps | 3472896 | -| train/ | | -| approx_kl | 0.033885166 | -| clip_fraction | 0.17 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.0168 | -| n_updates | 271310 | -| policy_gradient_loss | 0.00463 | -| std | 0.00558 | -| value_loss | 3.04e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27133 | -| time_elapsed | 147475 | -| total_timesteps | 3473024 | -| train/ | | -| approx_kl | 0.01962783 | -| clip_fraction | 0.151 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0851 | -| learning_rate | 0.0003 | -| loss | 0.000894 | -| n_updates | 271320 | -| policy_gradient_loss | -0.000586 | -| std | 0.00558 | -| value_loss | 2.09e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27134 | -| time_elapsed | 147485 | -| total_timesteps | 3473152 | -| train/ | | -| approx_kl | 0.049281728 | -| clip_fraction | 0.445 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.892 | -| learning_rate | 0.0003 | -| loss | -0.000767 | -| n_updates | 271330 | -| policy_gradient_loss | 0.00247 | -| std | 0.00558 | -| value_loss | 0.00264 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27135 | -| time_elapsed | 147489 | -| total_timesteps | 3473280 | -| train/ | | -| approx_kl | 0.100849904 | -| clip_fraction | 0.501 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.142 | -| learning_rate | 0.0003 | -| loss | 0.0211 | -| n_updates | 271340 | -| policy_gradient_loss | 0.0704 | -| std | 0.00558 | -| value_loss | 9.97e-06 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27136 | -| time_elapsed | 147493 | -| total_timesteps | 3473408 | -| train/ | | -| approx_kl | 0.282627 | -| clip_fraction | 0.479 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | 0.123 | -| n_updates | 271350 | -| policy_gradient_loss | 0.0593 | -| std | 0.00558 | -| value_loss | 3.88e-06 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27137 | -| time_elapsed | 147497 | -| total_timesteps | 3473536 | -| train/ | | -| approx_kl | 0.004317252 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0323 | -| learning_rate | 0.0003 | -| loss | -0.0104 | -| n_updates | 271360 | -| policy_gradient_loss | 0.0119 | -| std | 0.00558 | -| value_loss | 2.9e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27138 | -| time_elapsed | 147502 | -| total_timesteps | 3473664 | -| train/ | | -| approx_kl | 0.090408295 | -| clip_fraction | 0.606 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0414 | -| learning_rate | 0.0003 | -| loss | 0.0482 | -| n_updates | 271370 | -| policy_gradient_loss | 0.0739 | -| std | 0.00558 | -| value_loss | 2.01e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27139 | -| time_elapsed | 147506 | -| total_timesteps | 3473792 | -| train/ | | -| approx_kl | 2.7634203e-05 | -| clip_fraction | 0.553 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0505 | -| learning_rate | 0.0003 | -| loss | -0.000766 | -| n_updates | 271380 | -| policy_gradient_loss | 0.0967 | -| std | 0.00558 | -| value_loss | 1.69e-06 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27140 | -| time_elapsed | 147511 | -| total_timesteps | 3473920 | -| train/ | | -| approx_kl | 0.22266929 | -| clip_fraction | 0.716 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0492 | -| learning_rate | 0.0003 | -| loss | 0.152 | -| n_updates | 271390 | -| policy_gradient_loss | 0.319 | -| std | 0.00558 | -| value_loss | 1.36e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27141 | -| time_elapsed | 147516 | -| total_timesteps | 3474048 | -| train/ | | -| approx_kl | 0.12422921 | -| clip_fraction | 0.418 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0601 | -| learning_rate | 0.0003 | -| loss | 0.0863 | -| n_updates | 271400 | -| policy_gradient_loss | 0.0454 | -| std | 0.00557 | -| value_loss | 5.25e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27142 | -| time_elapsed | 147526 | -| total_timesteps | 3474176 | -| train/ | | -| approx_kl | 0.30632383 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.986 | -| learning_rate | 0.0003 | -| loss | 0.0215 | -| n_updates | 271410 | -| policy_gradient_loss | 0.0404 | -| std | 0.00555 | -| value_loss | 0.000261 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27143 | -| time_elapsed | 147531 | -| total_timesteps | 3474304 | -| train/ | | -| approx_kl | 0.06212185 | -| clip_fraction | 0.302 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0231 | -| learning_rate | 0.0003 | -| loss | 0.021 | -| n_updates | 271420 | -| policy_gradient_loss | 0.0114 | -| std | 0.00555 | -| value_loss | 2.98e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27144 | -| time_elapsed | 147536 | -| total_timesteps | 3474432 | -| train/ | | -| approx_kl | 0.009598339 | -| clip_fraction | 0.257 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.695 | -| learning_rate | 0.0003 | -| loss | -0.00627 | -| n_updates | 271430 | -| policy_gradient_loss | 0.00662 | -| std | 0.00555 | -| value_loss | 2.91e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27145 | -| time_elapsed | 147542 | -| total_timesteps | 3474560 | -| train/ | | -| approx_kl | 0.002763831 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.108 | -| learning_rate | 0.0003 | -| loss | -0.00279 | -| n_updates | 271440 | -| policy_gradient_loss | 0.0094 | -| std | 0.00555 | -| value_loss | 1.82e-07 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27146 | -| time_elapsed | 147547 | -| total_timesteps | 3474688 | -| train/ | | -| approx_kl | 8.3399937e-07 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0936 | -| learning_rate | 0.0003 | -| loss | -0.000249 | -| n_updates | 271450 | -| policy_gradient_loss | 0.0652 | -| std | 0.00555 | -| value_loss | 1.42e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27147 | -| time_elapsed | 147552 | -| total_timesteps | 3474816 | -| train/ | | -| approx_kl | 1.7435739 | -| clip_fraction | 0.78 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.159 | -| learning_rate | 0.0003 | -| loss | 0.211 | -| n_updates | 271460 | -| policy_gradient_loss | 0.142 | -| std | 0.00555 | -| value_loss | 1.54e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27148 | -| time_elapsed | 147557 | -| total_timesteps | 3474944 | -| train/ | | -| approx_kl | 0.037807986 | -| clip_fraction | 0.191 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.418 | -| learning_rate | 0.0003 | -| loss | 0.0316 | -| n_updates | 271470 | -| policy_gradient_loss | 0.0119 | -| std | 0.00556 | -| value_loss | 4.23e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27149 | -| time_elapsed | 147561 | -| total_timesteps | 3475072 | -| train/ | | -| approx_kl | 0.025879372 | -| clip_fraction | 0.494 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0289 | -| learning_rate | 0.0003 | -| loss | -0.0117 | -| n_updates | 271480 | -| policy_gradient_loss | 0.0103 | -| std | 0.00556 | -| value_loss | 5.02e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27150 | -| time_elapsed | 147571 | -| total_timesteps | 3475200 | -| train/ | | -| approx_kl | 0.07658441 | -| clip_fraction | 0.367 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.774 | -| learning_rate | 0.0003 | -| loss | 0.0218 | -| n_updates | 271490 | -| policy_gradient_loss | 0.0188 | -| std | 0.00556 | -| value_loss | 0.0025 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27151 | -| time_elapsed | 147576 | -| total_timesteps | 3475328 | -| train/ | | -| approx_kl | 0.92253494 | -| clip_fraction | 0.57 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.19 | -| learning_rate | 0.0003 | -| loss | 0.176 | -| n_updates | 271500 | -| policy_gradient_loss | 0.0654 | -| std | 0.00557 | -| value_loss | 1.62e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27152 | -| time_elapsed | 147581 | -| total_timesteps | 3475456 | -| train/ | | -| approx_kl | 0.010968782 | -| clip_fraction | 0.199 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.00242 | -| n_updates | 271510 | -| policy_gradient_loss | 0.00642 | -| std | 0.00557 | -| value_loss | 1.35e-06 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27153 | -| time_elapsed | 147585 | -| total_timesteps | 3475584 | -| train/ | | -| approx_kl | 0.0038572946 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.116 | -| learning_rate | 0.0003 | -| loss | -0.000119 | -| n_updates | 271520 | -| policy_gradient_loss | 0.0145 | -| std | 0.00557 | -| value_loss | 2.66e-06 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27154 | -| time_elapsed | 147588 | -| total_timesteps | 3475712 | -| train/ | | -| approx_kl | 0.025996724 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.594 | -| learning_rate | 0.0003 | -| loss | 0.0169 | -| n_updates | 271530 | -| policy_gradient_loss | 0.0159 | -| std | 0.00557 | -| value_loss | 4.61e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27155 | -| time_elapsed | 147592 | -| total_timesteps | 3475840 | -| train/ | | -| approx_kl | 0.33673552 | -| clip_fraction | 0.515 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.133 | -| learning_rate | 0.0003 | -| loss | 0.161 | -| n_updates | 271540 | -| policy_gradient_loss | 0.0739 | -| std | 0.00556 | -| value_loss | 2.35e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27156 | -| time_elapsed | 147595 | -| total_timesteps | 3475968 | -| train/ | | -| approx_kl | 0.11490015 | -| clip_fraction | 0.327 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | 0.0475 | -| n_updates | 271550 | -| policy_gradient_loss | 0.0177 | -| std | 0.00556 | -| value_loss | 5.11e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27157 | -| time_elapsed | 147599 | -| total_timesteps | 3476096 | -| train/ | | -| approx_kl | 0.048294958 | -| clip_fraction | 0.279 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.127 | -| learning_rate | 0.0003 | -| loss | 0.0209 | -| n_updates | 271560 | -| policy_gradient_loss | 0.0118 | -| std | 0.00556 | -| value_loss | 3.48e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27158 | -| time_elapsed | 147607 | -| total_timesteps | 3476224 | -| train/ | | -| approx_kl | 0.014654671 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.978 | -| learning_rate | 0.0003 | -| loss | -0.0139 | -| n_updates | 271570 | -| policy_gradient_loss | -0.00678 | -| std | 0.00556 | -| value_loss | 0.00396 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27159 | -| time_elapsed | 147611 | -| total_timesteps | 3476352 | -| train/ | | -| approx_kl | 0.004887215 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.943 | -| learning_rate | 0.0003 | -| loss | 0.000386 | -| n_updates | 271580 | -| policy_gradient_loss | 0.0116 | -| std | 0.00556 | -| value_loss | 5.66e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27160 | -| time_elapsed | 147616 | -| total_timesteps | 3476480 | -| train/ | | -| approx_kl | 0.102360144 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | 0.0533 | -| n_updates | 271590 | -| policy_gradient_loss | 0.0197 | -| std | 0.00556 | -| value_loss | 1.05e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27161 | -| time_elapsed | 147622 | -| total_timesteps | 3476608 | -| train/ | | -| approx_kl | 0.022407735 | -| clip_fraction | 0.323 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0442 | -| learning_rate | 0.0003 | -| loss | -0.00178 | -| n_updates | 271600 | -| policy_gradient_loss | 0.0152 | -| std | 0.00556 | -| value_loss | 8.27e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27162 | -| time_elapsed | 147627 | -| total_timesteps | 3476736 | -| train/ | | -| approx_kl | 0.004994603 | -| clip_fraction | 0.293 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | -0.00169 | -| n_updates | 271610 | -| policy_gradient_loss | 0.0131 | -| std | 0.00556 | -| value_loss | 5.06e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27163 | -| time_elapsed | 147633 | -| total_timesteps | 3476864 | -| train/ | | -| approx_kl | 0.10111031 | -| clip_fraction | 0.267 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0674 | -| learning_rate | 0.0003 | -| loss | 0.0346 | -| n_updates | 271620 | -| policy_gradient_loss | 0.00922 | -| std | 0.00556 | -| value_loss | 3.75e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27164 | -| time_elapsed | 147638 | -| total_timesteps | 3476992 | -| train/ | | -| approx_kl | 0.23946679 | -| clip_fraction | 0.405 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.122 | -| learning_rate | 0.0003 | -| loss | 0.137 | -| n_updates | 271630 | -| policy_gradient_loss | 0.0352 | -| std | 0.00556 | -| value_loss | 1.93e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27165 | -| time_elapsed | 147642 | -| total_timesteps | 3477120 | -| train/ | | -| approx_kl | 0.7116665 | -| clip_fraction | 0.538 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.114 | -| learning_rate | 0.0003 | -| loss | 0.142 | -| n_updates | 271640 | -| policy_gradient_loss | 0.0521 | -| std | 0.00556 | -| value_loss | 1.5e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27166 | -| time_elapsed | 147654 | -| total_timesteps | 3477248 | -| train/ | | -| approx_kl | 0.012905357 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.997 | -| learning_rate | 0.0003 | -| loss | 0.00675 | -| n_updates | 271650 | -| policy_gradient_loss | 0.00367 | -| std | 0.00556 | -| value_loss | 4e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27167 | -| time_elapsed | 147658 | -| total_timesteps | 3477376 | -| train/ | | -| approx_kl | 0.006259503 | -| clip_fraction | 0.297 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.4 | -| learning_rate | 0.0003 | -| loss | -0.00585 | -| n_updates | 271660 | -| policy_gradient_loss | 0.00727 | -| std | 0.00556 | -| value_loss | 2.23e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27168 | -| time_elapsed | 147663 | -| total_timesteps | 3477504 | -| train/ | | -| approx_kl | 0.11127933 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.6 | -| learning_rate | 0.0003 | -| loss | 0.0311 | -| n_updates | 271670 | -| policy_gradient_loss | 0.00948 | -| std | 0.00556 | -| value_loss | 6.47e-08 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27169 | -| time_elapsed | 147667 | -| total_timesteps | 3477632 | -| train/ | | -| approx_kl | 0.1349357 | -| clip_fraction | 0.364 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0195 | -| learning_rate | 0.0003 | -| loss | 0.0207 | -| n_updates | 271680 | -| policy_gradient_loss | -0.000137 | -| std | 0.00556 | -| value_loss | 4.42e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27170 | -| time_elapsed | 147671 | -| total_timesteps | 3477760 | -| train/ | | -| approx_kl | 0.39325497 | -| clip_fraction | 0.513 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0877 | -| learning_rate | 0.0003 | -| loss | 0.128 | -| n_updates | 271690 | -| policy_gradient_loss | 0.052 | -| std | 0.00558 | -| value_loss | 1.67e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27171 | -| time_elapsed | 147675 | -| total_timesteps | 3477888 | -| train/ | | -| approx_kl | 0.31436437 | -| clip_fraction | 0.383 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.327 | -| learning_rate | 0.0003 | -| loss | 0.169 | -| n_updates | 271700 | -| policy_gradient_loss | 0.0606 | -| std | 0.00559 | -| value_loss | 4.58e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27172 | -| time_elapsed | 147680 | -| total_timesteps | 3478016 | -| train/ | | -| approx_kl | 0.16983235 | -| clip_fraction | 0.264 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.000774 | -| learning_rate | 0.0003 | -| loss | 0.0383 | -| n_updates | 271710 | -| policy_gradient_loss | 0.0085 | -| std | 0.00559 | -| value_loss | 1.25e-09 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27173 | -| time_elapsed | 147693 | -| total_timesteps | 3478144 | -| train/ | | -| approx_kl | 0.011429462 | -| clip_fraction | 0.475 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.975 | -| learning_rate | 0.0003 | -| loss | -0.0173 | -| n_updates | 271720 | -| policy_gradient_loss | -0.00346 | -| std | 0.00559 | -| value_loss | 0.0004 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27174 | -| time_elapsed | 147698 | -| total_timesteps | 3478272 | -| train/ | | -| approx_kl | 0.3105195 | -| clip_fraction | 0.701 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.51 | -| learning_rate | 0.0003 | -| loss | 0.162 | -| n_updates | 271730 | -| policy_gradient_loss | 0.0923 | -| std | 0.0056 | -| value_loss | 7.43e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27175 | -| time_elapsed | 147703 | -| total_timesteps | 3478400 | -| train/ | | -| approx_kl | 0.06704937 | -| clip_fraction | 0.423 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0583 | -| learning_rate | 0.0003 | -| loss | 0.0323 | -| n_updates | 271740 | -| policy_gradient_loss | 0.035 | -| std | 0.0056 | -| value_loss | 1.01e-07 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27176 | -| time_elapsed | 147708 | -| total_timesteps | 3478528 | -| train/ | | -| approx_kl | 0.0007842998 | -| clip_fraction | 0.391 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.000601 | -| learning_rate | 0.0003 | -| loss | 0.000388 | -| n_updates | 271750 | -| policy_gradient_loss | 0.0335 | -| std | 0.00559 | -| value_loss | 3.07e-08 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27177 | -| time_elapsed | 147713 | -| total_timesteps | 3478656 | -| train/ | | -| approx_kl | 0.00017386116 | -| clip_fraction | 0.372 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.147 | -| learning_rate | 0.0003 | -| loss | 0.00124 | -| n_updates | 271760 | -| policy_gradient_loss | 0.0303 | -| std | 0.00559 | -| value_loss | 4.44e-08 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27178 | -| time_elapsed | 147718 | -| total_timesteps | 3478784 | -| train/ | | -| approx_kl | 0.4828989 | -| clip_fraction | 0.527 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.421 | -| learning_rate | 0.0003 | -| loss | 0.11 | -| n_updates | 271770 | -| policy_gradient_loss | 0.0503 | -| std | 0.00559 | -| value_loss | 7.79e-09 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27179 | -| time_elapsed | 147722 | -| total_timesteps | 3478912 | -| train/ | | -| approx_kl | 0.01313534 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.181 | -| learning_rate | 0.0003 | -| loss | 0.0079 | -| n_updates | 271780 | -| policy_gradient_loss | 0.0174 | -| std | 0.00557 | -| value_loss | 8.78e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27180 | -| time_elapsed | 147727 | -| total_timesteps | 3479040 | -| train/ | | -| approx_kl | 0.07260618 | -| clip_fraction | 0.474 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.62 | -| learning_rate | 0.0003 | -| loss | 0.0383 | -| n_updates | 271790 | -| policy_gradient_loss | 0.0452 | -| std | 0.00555 | -| value_loss | 0.000101 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27181 | -| time_elapsed | 147738 | -| total_timesteps | 3479168 | -| train/ | | -| approx_kl | 0.015572317 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.78 | -| explained_variance | 0.752 | -| learning_rate | 0.0003 | -| loss | -0.0234 | -| n_updates | 271800 | -| policy_gradient_loss | -0.00614 | -| std | 0.00554 | -| value_loss | 0.00125 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27182 | -| time_elapsed | 147743 | -| total_timesteps | 3479296 | -| train/ | | -| approx_kl | 0.16197698 | -| clip_fraction | 0.708 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.00676 | -| learning_rate | 0.0003 | -| loss | 0.0526 | -| n_updates | 271810 | -| policy_gradient_loss | 0.087 | -| std | 0.00556 | -| value_loss | 0.000606 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27183 | -| time_elapsed | 147747 | -| total_timesteps | 3479424 | -| train/ | | -| approx_kl | 0.030577436 | -| clip_fraction | 0.411 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.81 | -| learning_rate | 0.0003 | -| loss | -0.0154 | -| n_updates | 271820 | -| policy_gradient_loss | 0.0294 | -| std | 0.00557 | -| value_loss | 3.25e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27184 | -| time_elapsed | 147751 | -| total_timesteps | 3479552 | -| train/ | | -| approx_kl | 0.28336525 | -| clip_fraction | 0.387 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0188 | -| learning_rate | 0.0003 | -| loss | 0.0971 | -| n_updates | 271830 | -| policy_gradient_loss | 0.0281 | -| std | 0.00557 | -| value_loss | 1.01e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27185 | -| time_elapsed | 147755 | -| total_timesteps | 3479680 | -| train/ | | -| approx_kl | 0.020008259 | -| clip_fraction | 0.138 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0265 | -| learning_rate | 0.0003 | -| loss | 0.0103 | -| n_updates | 271840 | -| policy_gradient_loss | 0.00414 | -| std | 0.00557 | -| value_loss | 4.67e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27186 | -| time_elapsed | 147760 | -| total_timesteps | 3479808 | -| train/ | | -| approx_kl | 0.030401662 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.097 | -| learning_rate | 0.0003 | -| loss | 0.0164 | -| n_updates | 271850 | -| policy_gradient_loss | 0.0426 | -| std | 0.00557 | -| value_loss | 2.8e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27187 | -| time_elapsed | 147765 | -| total_timesteps | 3479936 | -| train/ | | -| approx_kl | 0.39809453 | -| clip_fraction | 0.734 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0802 | -| learning_rate | 0.0003 | -| loss | 0.206 | -| n_updates | 271860 | -| policy_gradient_loss | 0.18 | -| std | 0.00557 | -| value_loss | 1.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27188 | -| time_elapsed | 147769 | -| total_timesteps | 3480064 | -| train/ | | -| approx_kl | 0.26613522 | -| clip_fraction | 0.71 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0787 | -| learning_rate | 0.0003 | -| loss | 0.168 | -| n_updates | 271870 | -| policy_gradient_loss | 0.187 | -| std | 0.00557 | -| value_loss | 1.61e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27189 | -| time_elapsed | 147776 | -| total_timesteps | 3480192 | -| train/ | | -| approx_kl | 0.2014052 | -| clip_fraction | 0.726 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.856 | -| learning_rate | 0.0003 | -| loss | 0.14 | -| n_updates | 271880 | -| policy_gradient_loss | 0.15 | -| std | 0.00557 | -| value_loss | 0.00401 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27190 | -| time_elapsed | 147780 | -| total_timesteps | 3480320 | -| train/ | | -| approx_kl | 0.044913523 | -| clip_fraction | 0.402 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0854 | -| learning_rate | 0.0003 | -| loss | 0.0251 | -| n_updates | 271890 | -| policy_gradient_loss | 0.0332 | -| std | 0.00557 | -| value_loss | 1.8e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27191 | -| time_elapsed | 147785 | -| total_timesteps | 3480448 | -| train/ | | -| approx_kl | 0.0021650204 | -| clip_fraction | 0.416 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.015 | -| learning_rate | 0.0003 | -| loss | 0.00297 | -| n_updates | 271900 | -| policy_gradient_loss | 0.0445 | -| std | 0.00557 | -| value_loss | 6.77e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27192 | -| time_elapsed | 147790 | -| total_timesteps | 3480576 | -| train/ | | -| approx_kl | 5.734712e-05 | -| clip_fraction | 0.358 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0299 | -| learning_rate | 0.0003 | -| loss | 0.000159 | -| n_updates | 271910 | -| policy_gradient_loss | 0.0321 | -| std | 0.00557 | -| value_loss | 3.28e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27193 | -| time_elapsed | 147794 | -| total_timesteps | 3480704 | -| train/ | | -| approx_kl | 0.0019400241 | -| clip_fraction | 0.339 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.172 | -| learning_rate | 0.0003 | -| loss | -0.00621 | -| n_updates | 271920 | -| policy_gradient_loss | 0.0444 | -| std | 0.00557 | -| value_loss | 2.68e-06 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27194 | -| time_elapsed | 147799 | -| total_timesteps | 3480832 | -| train/ | | -| approx_kl | 0.32645223 | -| clip_fraction | 0.413 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0387 | -| learning_rate | 0.0003 | -| loss | 0.0539 | -| n_updates | 271930 | -| policy_gradient_loss | 0.0114 | -| std | 0.00557 | -| value_loss | 1.81e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27195 | -| time_elapsed | 147803 | -| total_timesteps | 3480960 | -| train/ | | -| approx_kl | 0.029667959 | -| clip_fraction | 0.194 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0484 | -| learning_rate | 0.0003 | -| loss | 0.0147 | -| n_updates | 271940 | -| policy_gradient_loss | 0.00502 | -| std | 0.00557 | -| value_loss | 9.99e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27196 | -| time_elapsed | 147808 | -| total_timesteps | 3481088 | -| train/ | | -| approx_kl | 0.018431386 | -| clip_fraction | 0.129 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.115 | -| learning_rate | 0.0003 | -| loss | -0.0151 | -| n_updates | 271950 | -| policy_gradient_loss | -0.00852 | -| std | 0.00557 | -| value_loss | 6.79e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27197 | -| time_elapsed | 147818 | -| total_timesteps | 3481216 | -| train/ | | -| approx_kl | 0.19313401 | -| clip_fraction | 0.435 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.725 | -| learning_rate | 0.0003 | -| loss | 0.00764 | -| n_updates | 271960 | -| policy_gradient_loss | 0.00436 | -| std | 0.00557 | -| value_loss | 0.00176 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27198 | -| time_elapsed | 147821 | -| total_timesteps | 3481344 | -| train/ | | -| approx_kl | 0.18214962 | -| clip_fraction | 0.469 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0353 | -| learning_rate | 0.0003 | -| loss | 0.0806 | -| n_updates | 271970 | -| policy_gradient_loss | 0.0559 | -| std | 0.00557 | -| value_loss | 1.04e-05 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27199 | -| time_elapsed | 147826 | -| total_timesteps | 3481472 | -| train/ | | -| approx_kl | 0.5291617 | -| clip_fraction | 0.755 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0134 | -| learning_rate | 0.0003 | -| loss | 0.281 | -| n_updates | 271980 | -| policy_gradient_loss | 0.161 | -| std | 0.00557 | -| value_loss | 1.51e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27200 | -| time_elapsed | 147830 | -| total_timesteps | 3481600 | -| train/ | | -| approx_kl | 0.07154984 | -| clip_fraction | 0.384 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0669 | -| learning_rate | 0.0003 | -| loss | 0.039 | -| n_updates | 271990 | -| policy_gradient_loss | 0.0333 | -| std | 0.00557 | -| value_loss | 1.36e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27201 | -| time_elapsed | 147834 | -| total_timesteps | 3481728 | -| train/ | | -| approx_kl | 0.24227178 | -| clip_fraction | 0.408 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0487 | -| learning_rate | 0.0003 | -| loss | 0.0987 | -| n_updates | 272000 | -| policy_gradient_loss | 0.0321 | -| std | 0.00557 | -| value_loss | 1.06e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27202 | -| time_elapsed | 147838 | -| total_timesteps | 3481856 | -| train/ | | -| approx_kl | 0.24616018 | -| clip_fraction | 0.444 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0504 | -| learning_rate | 0.0003 | -| loss | 0.0615 | -| n_updates | 272010 | -| policy_gradient_loss | 0.0285 | -| std | 0.00557 | -| value_loss | 9.95e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27203 | -| time_elapsed | 147842 | -| total_timesteps | 3481984 | -| train/ | | -| approx_kl | 0.028456982 | -| clip_fraction | 0.35 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.292 | -| learning_rate | 0.0003 | -| loss | 0.0603 | -| n_updates | 272020 | -| policy_gradient_loss | 0.0377 | -| std | 0.00557 | -| value_loss | 3.69e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27204 | -| time_elapsed | 147847 | -| total_timesteps | 3482112 | -| train/ | | -| approx_kl | 0.5543758 | -| clip_fraction | 0.705 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.241 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 272030 | -| policy_gradient_loss | 0.118 | -| std | 0.00557 | -| value_loss | 1.21e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27205 | -| time_elapsed | 147858 | -| total_timesteps | 3482240 | -| train/ | | -| approx_kl | 0.04656551 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.889 | -| learning_rate | 0.0003 | -| loss | -0.00334 | -| n_updates | 272040 | -| policy_gradient_loss | 0.0321 | -| std | 0.00557 | -| value_loss | 0.000807 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27206 | -| time_elapsed | 147863 | -| total_timesteps | 3482368 | -| train/ | | -| approx_kl | 1.7415771 | -| clip_fraction | 0.784 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.171 | -| learning_rate | 0.0003 | -| loss | 0.715 | -| n_updates | 272050 | -| policy_gradient_loss | 0.226 | -| std | 0.00557 | -| value_loss | 8.93e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27207 | -| time_elapsed | 147868 | -| total_timesteps | 3482496 | -| train/ | | -| approx_kl | 0.038106155 | -| clip_fraction | 0.326 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0192 | -| learning_rate | 0.0003 | -| loss | 0.0348 | -| n_updates | 272060 | -| policy_gradient_loss | 0.0276 | -| std | 0.00557 | -| value_loss | 1.8e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27208 | -| time_elapsed | 147875 | -| total_timesteps | 3482624 | -| train/ | | -| approx_kl | 0.2822576 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.048 | -| learning_rate | 0.0003 | -| loss | 0.148 | -| n_updates | 272070 | -| policy_gradient_loss | 0.128 | -| std | 0.00557 | -| value_loss | 8.91e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27209 | -| time_elapsed | 147880 | -| total_timesteps | 3482752 | -| train/ | | -| approx_kl | 0.04152325 | -| clip_fraction | 0.37 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0718 | -| learning_rate | 0.0003 | -| loss | 0.0173 | -| n_updates | 272080 | -| policy_gradient_loss | 0.0243 | -| std | 0.00557 | -| value_loss | 7.1e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27210 | -| time_elapsed | 147885 | -| total_timesteps | 3482880 | -| train/ | | -| approx_kl | 0.16525672 | -| clip_fraction | 0.32 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0568 | -| learning_rate | 0.0003 | -| loss | 0.0666 | -| n_updates | 272090 | -| policy_gradient_loss | 0.0184 | -| std | 0.00557 | -| value_loss | 4.68e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27211 | -| time_elapsed | 147890 | -| total_timesteps | 3483008 | -| train/ | | -| approx_kl | 0.021249276 | -| clip_fraction | 0.155 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.082 | -| learning_rate | 0.0003 | -| loss | 0.01 | -| n_updates | 272100 | -| policy_gradient_loss | 0.00432 | -| std | 0.00557 | -| value_loss | 2.91e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27212 | -| time_elapsed | 147900 | -| total_timesteps | 3483136 | -| train/ | | -| approx_kl | 0.0541914 | -| clip_fraction | 0.438 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.83 | -| learning_rate | 0.0003 | -| loss | -0.023 | -| n_updates | 272110 | -| policy_gradient_loss | -0.0101 | -| std | 0.00557 | -| value_loss | 0.000935 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27213 | -| time_elapsed | 147905 | -| total_timesteps | 3483264 | -| train/ | | -| approx_kl | 0.018426385 | -| clip_fraction | 0.351 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.974 | -| learning_rate | 0.0003 | -| loss | -0.00382 | -| n_updates | 272120 | -| policy_gradient_loss | 0.0242 | -| std | 0.00557 | -| value_loss | 2.68e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27214 | -| time_elapsed | 147909 | -| total_timesteps | 3483392 | -| train/ | | -| approx_kl | 0.05870497 | -| clip_fraction | 0.497 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.278 | -| learning_rate | 0.0003 | -| loss | 0.0105 | -| n_updates | 272130 | -| policy_gradient_loss | 0.0736 | -| std | 0.00557 | -| value_loss | 4.22e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27215 | -| time_elapsed | 147913 | -| total_timesteps | 3483520 | -| train/ | | -| approx_kl | 0.24581914 | -| clip_fraction | 0.472 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.146 | -| learning_rate | 0.0003 | -| loss | 0.0739 | -| n_updates | 272140 | -| policy_gradient_loss | 0.052 | -| std | 0.00557 | -| value_loss | 1.75e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27216 | -| time_elapsed | 147917 | -| total_timesteps | 3483648 | -| train/ | | -| approx_kl | 0.0049045035 | -| clip_fraction | 0.252 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0683 | -| learning_rate | 0.0003 | -| loss | -0.00578 | -| n_updates | 272150 | -| policy_gradient_loss | 0.0161 | -| std | 0.00557 | -| value_loss | 1.36e-08 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27217 | -| time_elapsed | 147922 | -| total_timesteps | 3483776 | -| train/ | | -| approx_kl | 0.024736822 | -| clip_fraction | 0.626 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0566 | -| learning_rate | 0.0003 | -| loss | 0.0077 | -| n_updates | 272160 | -| policy_gradient_loss | 0.143 | -| std | 0.00557 | -| value_loss | 1.11e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27218 | -| time_elapsed | 147927 | -| total_timesteps | 3483904 | -| train/ | | -| approx_kl | 0.35803688 | -| clip_fraction | 0.482 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0394 | -| learning_rate | 0.0003 | -| loss | 0.0845 | -| n_updates | 272170 | -| policy_gradient_loss | 0.0372 | -| std | 0.00557 | -| value_loss | 9.19e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27219 | -| time_elapsed | 147931 | -| total_timesteps | 3484032 | -| train/ | | -| approx_kl | 0.09061738 | -| clip_fraction | 0.663 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0411 | -| learning_rate | 0.0003 | -| loss | 0.0304 | -| n_updates | 272180 | -| policy_gradient_loss | 0.0855 | -| std | 0.00557 | -| value_loss | 7.26e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27220 | -| time_elapsed | 147941 | -| total_timesteps | 3484160 | -| train/ | | -| approx_kl | 0.14333847 | -| clip_fraction | 0.462 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.946 | -| learning_rate | 0.0003 | -| loss | 0.0735 | -| n_updates | 272190 | -| policy_gradient_loss | 0.0525 | -| std | 0.00557 | -| value_loss | 0.000874 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27221 | -| time_elapsed | 147947 | -| total_timesteps | 3484288 | -| train/ | | -| approx_kl | 0.050024312 | -| clip_fraction | 0.628 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0942 | -| learning_rate | 0.0003 | -| loss | 0.0342 | -| n_updates | 272200 | -| policy_gradient_loss | 0.112 | -| std | 0.00556 | -| value_loss | 2.62e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27222 | -| time_elapsed | 147951 | -| total_timesteps | 3484416 | -| train/ | | -| approx_kl | 0.09707488 | -| clip_fraction | 0.359 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0811 | -| n_updates | 272210 | -| policy_gradient_loss | 0.0364 | -| std | 0.00556 | -| value_loss | 3.03e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27223 | -| time_elapsed | 147954 | -| total_timesteps | 3484544 | -| train/ | | -| approx_kl | 0.70200515 | -| clip_fraction | 0.704 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.213 | -| learning_rate | 0.0003 | -| loss | 0.254 | -| n_updates | 272220 | -| policy_gradient_loss | 0.198 | -| std | 0.00556 | -| value_loss | 2.04e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27224 | -| time_elapsed | 147960 | -| total_timesteps | 3484672 | -| train/ | | -| approx_kl | 0.39329907 | -| clip_fraction | 0.745 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.279 | -| learning_rate | 0.0003 | -| loss | 0.232 | -| n_updates | 272230 | -| policy_gradient_loss | 0.242 | -| std | 0.00556 | -| value_loss | 5.54e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27225 | -| time_elapsed | 147964 | -| total_timesteps | 3484800 | -| train/ | | -| approx_kl | 0.06744594 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0663 | -| learning_rate | 0.0003 | -| loss | 0.0309 | -| n_updates | 272240 | -| policy_gradient_loss | 0.0371 | -| std | 0.00556 | -| value_loss | 5.15e-07 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27226 | -| time_elapsed | 147969 | -| total_timesteps | 3484928 | -| train/ | | -| approx_kl | 0.75282377 | -| clip_fraction | 0.56 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0401 | -| learning_rate | 0.0003 | -| loss | 0.18 | -| n_updates | 272250 | -| policy_gradient_loss | 0.0652 | -| std | 0.00556 | -| value_loss | 4.27e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27227 | -| time_elapsed | 147973 | -| total_timesteps | 3485056 | -| train/ | | -| approx_kl | 0.015278364 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0395 | -| learning_rate | 0.0003 | -| loss | 0.00198 | -| n_updates | 272260 | -| policy_gradient_loss | 0.00875 | -| std | 0.00556 | -| value_loss | 2.3e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27228 | -| time_elapsed | 147982 | -| total_timesteps | 3485184 | -| train/ | | -| approx_kl | 0.0065082214 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.67 | -| learning_rate | 0.0003 | -| loss | -0.00484 | -| n_updates | 272270 | -| policy_gradient_loss | 0.00669 | -| std | 0.00556 | -| value_loss | 0.0135 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27229 | -| time_elapsed | 147987 | -| total_timesteps | 3485312 | -| train/ | | -| approx_kl | 0.012238264 | -| clip_fraction | 0.434 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.394 | -| learning_rate | 0.0003 | -| loss | -0.0192 | -| n_updates | 272280 | -| policy_gradient_loss | 0.0506 | -| std | 0.00556 | -| value_loss | 0.00049 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27230 | -| time_elapsed | 147994 | -| total_timesteps | 3485440 | -| train/ | | -| approx_kl | 0.6982827 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.00341 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 272290 | -| policy_gradient_loss | 0.0734 | -| std | 0.00556 | -| value_loss | 0.000121 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27231 | -| time_elapsed | 147998 | -| total_timesteps | 3485568 | -| train/ | | -| approx_kl | 0.07331952 | -| clip_fraction | 0.286 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.00643 | -| learning_rate | 0.0003 | -| loss | 0.0371 | -| n_updates | 272300 | -| policy_gradient_loss | 0.0179 | -| std | 0.00556 | -| value_loss | 6.37e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27232 | -| time_elapsed | 148004 | -| total_timesteps | 3485696 | -| train/ | | -| approx_kl | 0.06410524 | -| clip_fraction | 0.288 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0465 | -| learning_rate | 0.0003 | -| loss | 0.0439 | -| n_updates | 272310 | -| policy_gradient_loss | 0.0212 | -| std | 0.00556 | -| value_loss | 3.25e-05 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27233 | -| time_elapsed | 148008 | -| total_timesteps | 3485824 | -| train/ | | -| approx_kl | 0.010308707 | -| clip_fraction | 0.238 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.101 | -| learning_rate | 0.0003 | -| loss | -0.0075 | -| n_updates | 272320 | -| policy_gradient_loss | 0.00523 | -| std | 0.00556 | -| value_loss | 2.31e-05 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27234 | -| time_elapsed | 148012 | -| total_timesteps | 3485952 | -| train/ | | -| approx_kl | 0.076579265 | -| clip_fraction | 0.27 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.076 | -| learning_rate | 0.0003 | -| loss | 0.000205 | -| n_updates | 272330 | -| policy_gradient_loss | -0.00514 | -| std | 0.00556 | -| value_loss | 1.85e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27235 | -| time_elapsed | 148016 | -| total_timesteps | 3486080 | -| train/ | | -| approx_kl | 0.06931259 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0535 | -| learning_rate | 0.0003 | -| loss | 0.0419 | -| n_updates | 272340 | -| policy_gradient_loss | 0.0216 | -| std | 0.00556 | -| value_loss | 1.06e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27236 | -| time_elapsed | 148024 | -| total_timesteps | 3486208 | -| train/ | | -| approx_kl | 0.10624408 | -| clip_fraction | 0.259 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.982 | -| learning_rate | 0.0003 | -| loss | 0.0306 | -| n_updates | 272350 | -| policy_gradient_loss | -0.00106 | -| std | 0.00556 | -| value_loss | 0.000172 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27237 | -| time_elapsed | 148029 | -| total_timesteps | 3486336 | -| train/ | | -| approx_kl | 0.046061244 | -| clip_fraction | 0.453 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.149 | -| learning_rate | 0.0003 | -| loss | -0.0105 | -| n_updates | 272360 | -| policy_gradient_loss | 0.0195 | -| std | 0.00556 | -| value_loss | 4.41e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27238 | -| time_elapsed | 148032 | -| total_timesteps | 3486464 | -| train/ | | -| approx_kl | 0.19429813 | -| clip_fraction | 0.555 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.05 | -| learning_rate | 0.0003 | -| loss | 0.133 | -| n_updates | 272370 | -| policy_gradient_loss | 0.07 | -| std | 0.00556 | -| value_loss | 3.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27239 | -| time_elapsed | 148036 | -| total_timesteps | 3486592 | -| train/ | | -| approx_kl | 0.057470925 | -| clip_fraction | 0.471 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0519 | -| learning_rate | 0.0003 | -| loss | 0.000929 | -| n_updates | 272380 | -| policy_gradient_loss | 0.038 | -| std | 0.00556 | -| value_loss | 2.76e-06 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27240 | -| time_elapsed | 148041 | -| total_timesteps | 3486720 | -| train/ | | -| approx_kl | 1.0396255 | -| clip_fraction | 0.787 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0418 | -| learning_rate | 0.0003 | -| loss | 0.356 | -| n_updates | 272390 | -| policy_gradient_loss | 0.312 | -| std | 0.00556 | -| value_loss | 2.29e-06 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27241 | -| time_elapsed | 148047 | -| total_timesteps | 3486848 | -| train/ | | -| approx_kl | 0.07473517 | -| clip_fraction | 0.237 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0342 | -| learning_rate | 0.0003 | -| loss | 0.0814 | -| n_updates | 272400 | -| policy_gradient_loss | 0.00725 | -| std | 0.00556 | -| value_loss | 1.65e-06 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27242 | -| time_elapsed | 148052 | -| total_timesteps | 3486976 | -| train/ | | -| approx_kl | 0.0015738704 | -| clip_fraction | 0.422 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0763 | -| learning_rate | 0.0003 | -| loss | -0.0048 | -| n_updates | 272410 | -| policy_gradient_loss | 0.0418 | -| std | 0.00556 | -| value_loss | 7.7e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27243 | -| time_elapsed | 148056 | -| total_timesteps | 3487104 | -| train/ | | -| approx_kl | 0.003229998 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.118 | -| learning_rate | 0.0003 | -| loss | -0.00318 | -| n_updates | 272420 | -| policy_gradient_loss | 0.0356 | -| std | 0.00556 | -| value_loss | 7.1e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27244 | -| time_elapsed | 148066 | -| total_timesteps | 3487232 | -| train/ | | -| approx_kl | 0.016218157 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.01 | -| learning_rate | 0.0003 | -| loss | -0.0208 | -| n_updates | 272430 | -| policy_gradient_loss | -0.00179 | -| std | 0.00556 | -| value_loss | 0.0037 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27245 | -| time_elapsed | 148070 | -| total_timesteps | 3487360 | -| train/ | | -| approx_kl | 0.8001778 | -| clip_fraction | 0.541 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.87 | -| learning_rate | 0.0003 | -| loss | 0.188 | -| n_updates | 272440 | -| policy_gradient_loss | 0.0651 | -| std | 0.00556 | -| value_loss | 2.33e-06 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27246 | -| time_elapsed | 148074 | -| total_timesteps | 3487488 | -| train/ | | -| approx_kl | 0.011278815 | -| clip_fraction | 0.304 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0123 | -| learning_rate | 0.0003 | -| loss | -0.00312 | -| n_updates | 272450 | -| policy_gradient_loss | 0.0116 | -| std | 0.00556 | -| value_loss | 7.08e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27247 | -| time_elapsed | 148078 | -| total_timesteps | 3487616 | -| train/ | | -| approx_kl | 0.09791093 | -| clip_fraction | 0.276 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0201 | -| learning_rate | 0.0003 | -| loss | 0.0355 | -| n_updates | 272460 | -| policy_gradient_loss | 0.0128 | -| std | 0.00556 | -| value_loss | 5.12e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27248 | -| time_elapsed | 148082 | -| total_timesteps | 3487744 | -| train/ | | -| approx_kl | 0.060217433 | -| clip_fraction | 0.301 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.042 | -| learning_rate | 0.0003 | -| loss | 0.00839 | -| n_updates | 272470 | -| policy_gradient_loss | 0.0062 | -| std | 0.00556 | -| value_loss | 3.88e-07 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27249 | -| time_elapsed | 148087 | -| total_timesteps | 3487872 | -| train/ | | -| approx_kl | 0.07634279 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0405 | -| learning_rate | 0.0003 | -| loss | 0.0463 | -| n_updates | 272480 | -| policy_gradient_loss | 0.0216 | -| std | 0.00556 | -| value_loss | 3.04e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27250 | -| time_elapsed | 148091 | -| total_timesteps | 3488000 | -| train/ | | -| approx_kl | 0.012766983 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0434 | -| learning_rate | 0.0003 | -| loss | -0.0267 | -| n_updates | 272490 | -| policy_gradient_loss | 0.00594 | -| std | 0.00556 | -| value_loss | 2.37e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27251 | -| time_elapsed | 148097 | -| total_timesteps | 3488128 | -| train/ | | -| approx_kl | 0.051938925 | -| clip_fraction | 0.644 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.00523 | -| learning_rate | 0.0003 | -| loss | 0.0445 | -| n_updates | 272500 | -| policy_gradient_loss | 0.162 | -| std | 0.00556 | -| value_loss | 1.06e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27252 | -| time_elapsed | 148106 | -| total_timesteps | 3488256 | -| train/ | | -| approx_kl | 0.004072884 | -| clip_fraction | 0.379 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.736 | -| learning_rate | 0.0003 | -| loss | -0.0161 | -| n_updates | 272510 | -| policy_gradient_loss | 0.0194 | -| std | 0.00556 | -| value_loss | 0.00191 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27253 | -| time_elapsed | 148112 | -| total_timesteps | 3488384 | -| train/ | | -| approx_kl | 0.9833985 | -| clip_fraction | 0.769 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -2.09 | -| learning_rate | 0.0003 | -| loss | 0.3 | -| n_updates | 272520 | -| policy_gradient_loss | 0.165 | -| std | 0.00556 | -| value_loss | 6.66e-06 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27254 | -| time_elapsed | 148116 | -| total_timesteps | 3488512 | -| train/ | | -| approx_kl | 0.0378512 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0613 | -| learning_rate | 0.0003 | -| loss | 0.0293 | -| n_updates | 272530 | -| policy_gradient_loss | 0.0252 | -| std | 0.00555 | -| value_loss | 4.21e-07 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27255 | -| time_elapsed | 148121 | -| total_timesteps | 3488640 | -| train/ | | -| approx_kl | 0.32172817 | -| clip_fraction | 0.74 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.22 | -| learning_rate | 0.0003 | -| loss | 0.193 | -| n_updates | 272540 | -| policy_gradient_loss | 0.146 | -| std | 0.00555 | -| value_loss | 1.29e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27256 | -| time_elapsed | 148126 | -| total_timesteps | 3488768 | -| train/ | | -| approx_kl | 0.2537772 | -| clip_fraction | 0.731 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.138 | -| learning_rate | 0.0003 | -| loss | 0.157 | -| n_updates | 272550 | -| policy_gradient_loss | 0.224 | -| std | 0.00555 | -| value_loss | 8.35e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.08 | -| time/ | | -| fps | 23 | -| iterations | 27257 | -| time_elapsed | 148131 | -| total_timesteps | 3488896 | -| train/ | | -| approx_kl | 0.042285558 | -| clip_fraction | 0.395 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0502 | -| learning_rate | 0.0003 | -| loss | 0.0163 | -| n_updates | 272560 | -| policy_gradient_loss | 0.0341 | -| std | 0.00555 | -| value_loss | 7.67e-08 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27258 | -| time_elapsed | 148137 | -| total_timesteps | 3489024 | -| train/ | | -| approx_kl | 0.6237047 | -| clip_fraction | 0.537 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0367 | -| learning_rate | 0.0003 | -| loss | 0.126 | -| n_updates | 272570 | -| policy_gradient_loss | 0.0545 | -| std | 0.00555 | -| value_loss | 6.07e-08 | ---------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27259 | -| time_elapsed | 148149 | -| total_timesteps | 3489152 | -| train/ | | -| approx_kl | 0.0065654297 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -1.27 | -| learning_rate | 0.0003 | -| loss | -0.022 | -| n_updates | 272580 | -| policy_gradient_loss | -0.00903 | -| std | 0.00555 | -| value_loss | 0.00365 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27260 | -| time_elapsed | 148155 | -| total_timesteps | 3489280 | -| train/ | | -| approx_kl | 0.061860647 | -| clip_fraction | 0.461 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.399 | -| learning_rate | 0.0003 | -| loss | 0.0384 | -| n_updates | 272590 | -| policy_gradient_loss | 0.0574 | -| std | 0.00555 | -| value_loss | 3.22e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27261 | -| time_elapsed | 148159 | -| total_timesteps | 3489408 | -| train/ | | -| approx_kl | 0.17502724 | -| clip_fraction | 0.542 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0271 | -| learning_rate | 0.0003 | -| loss | 0.077 | -| n_updates | 272600 | -| policy_gradient_loss | 0.0504 | -| std | 0.00556 | -| value_loss | 3.25e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27262 | -| time_elapsed | 148164 | -| total_timesteps | 3489536 | -| train/ | | -| approx_kl | 0.020232815 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -5.97 | -| learning_rate | 0.0003 | -| loss | 0.00848 | -| n_updates | 272610 | -| policy_gradient_loss | 0.013 | -| std | 0.00556 | -| value_loss | 7.79e-08 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27263 | -| time_elapsed | 148170 | -| total_timesteps | 3489664 | -| train/ | | -| approx_kl | 0.0013347878 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0444 | -| learning_rate | 0.0003 | -| loss | 0.00319 | -| n_updates | 272620 | -| policy_gradient_loss | 0.0092 | -| std | 0.00556 | -| value_loss | 4.4e-09 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27264 | -| time_elapsed | 148174 | -| total_timesteps | 3489792 | -| train/ | | -| approx_kl | 3.977958e-05 | -| clip_fraction | 0.289 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.188 | -| learning_rate | 0.0003 | -| loss | 0.00104 | -| n_updates | 272630 | -| policy_gradient_loss | 0.00238 | -| std | 0.00556 | -| value_loss | 3.8e-09 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.07 | -| time/ | | -| fps | 23 | -| iterations | 27265 | -| time_elapsed | 148181 | -| total_timesteps | 3489920 | -| train/ | | -| approx_kl | 0.058385137 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.154 | -| learning_rate | 0.0003 | -| loss | 0.0253 | -| n_updates | 272640 | -| policy_gradient_loss | 0.0113 | -| std | 0.00556 | -| value_loss | 1.68e-09 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27266 | -| time_elapsed | 148187 | -| total_timesteps | 3490048 | -| train/ | | -| approx_kl | 0.054801434 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.136 | -| learning_rate | 0.0003 | -| loss | 0.00777 | -| n_updates | 272650 | -| policy_gradient_loss | 0.00434 | -| std | 0.00556 | -| value_loss | 1.24e-09 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27267 | -| time_elapsed | 148196 | -| total_timesteps | 3490176 | -| train/ | | -| approx_kl | 0.03979277 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0196 | -| learning_rate | 0.0003 | -| loss | -0.0291 | -| n_updates | 272660 | -| policy_gradient_loss | -0.0199 | -| std | 0.00556 | -| value_loss | 0.00233 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27268 | -| time_elapsed | 148200 | -| total_timesteps | 3490304 | -| train/ | | -| approx_kl | 0.0030227099 | -| clip_fraction | 0.239 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.301 | -| learning_rate | 0.0003 | -| loss | -0.00287 | -| n_updates | 272670 | -| policy_gradient_loss | 0.00833 | -| std | 0.00556 | -| value_loss | 2.31e-06 | ------------------------------------------- -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27269 | -| time_elapsed | 148204 | -| total_timesteps | 3490432 | -| train/ | | -| approx_kl | 1.9446015e-06 | -| clip_fraction | 0.385 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0117 | -| learning_rate | 0.0003 | -| loss | 0.000166 | -| n_updates | 272680 | -| policy_gradient_loss | 0.0508 | -| std | 0.00556 | -| value_loss | 1.46e-07 | -------------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27270 | -| time_elapsed | 148209 | -| total_timesteps | 3490560 | -| train/ | | -| approx_kl | 1.0251702 | -| clip_fraction | 0.784 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.119 | -| learning_rate | 0.0003 | -| loss | 0.807 | -| n_updates | 272690 | -| policy_gradient_loss | 0.215 | -| std | 0.00556 | -| value_loss | 6.92e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27271 | -| time_elapsed | 148213 | -| total_timesteps | 3490688 | -| train/ | | -| approx_kl | 0.013485316 | -| clip_fraction | 0.43 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0421 | -| learning_rate | 0.0003 | -| loss | -0.00991 | -| n_updates | 272700 | -| policy_gradient_loss | 0.02 | -| std | 0.00556 | -| value_loss | 5.39e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27272 | -| time_elapsed | 148218 | -| total_timesteps | 3490816 | -| train/ | | -| approx_kl | 0.12804833 | -| clip_fraction | 0.335 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0374 | -| learning_rate | 0.0003 | -| loss | 0.084 | -| n_updates | 272710 | -| policy_gradient_loss | 0.043 | -| std | 0.00556 | -| value_loss | 3.66e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.06 | -| time/ | | -| fps | 23 | -| iterations | 27273 | -| time_elapsed | 148223 | -| total_timesteps | 3490944 | -| train/ | | -| approx_kl | 0.16252752 | -| clip_fraction | 0.394 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | 0.0899 | -| n_updates | 272720 | -| policy_gradient_loss | 0.0346 | -| std | 0.00556 | -| value_loss | 2.61e-08 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27274 | -| time_elapsed | 148229 | -| total_timesteps | 3491072 | -| train/ | | -| approx_kl | 0.013611402 | -| clip_fraction | 0.124 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0497 | -| learning_rate | 0.0003 | -| loss | -0.00935 | -| n_updates | 272730 | -| policy_gradient_loss | -0.00454 | -| std | 0.00556 | -| value_loss | 1.9e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27275 | -| time_elapsed | 148237 | -| total_timesteps | 3491200 | -| train/ | | -| approx_kl | 0.04985476 | -| clip_fraction | 0.23 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.848 | -| learning_rate | 0.0003 | -| loss | -0.0147 | -| n_updates | 272740 | -| policy_gradient_loss | -0.00859 | -| std | 0.00556 | -| value_loss | 0.000907 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27276 | -| time_elapsed | 148244 | -| total_timesteps | 3491328 | -| train/ | | -| approx_kl | 0.19036083 | -| clip_fraction | 0.718 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.352 | -| learning_rate | 0.0003 | -| loss | 0.121 | -| n_updates | 272750 | -| policy_gradient_loss | 0.202 | -| std | 0.00556 | -| value_loss | 2.06e-05 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27277 | -| time_elapsed | 148248 | -| total_timesteps | 3491456 | -| train/ | | -| approx_kl | 0.03406636 | -| clip_fraction | 0.396 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0163 | -| learning_rate | 0.0003 | -| loss | 0.00359 | -| n_updates | 272760 | -| policy_gradient_loss | 0.0361 | -| std | 0.00556 | -| value_loss | 6.54e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27278 | -| time_elapsed | 148254 | -| total_timesteps | 3491584 | -| train/ | | -| approx_kl | 0.29445538 | -| clip_fraction | 0.398 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.000915 | -| learning_rate | 0.0003 | -| loss | 0.0858 | -| n_updates | 272770 | -| policy_gradient_loss | 0.0247 | -| std | 0.00556 | -| value_loss | 2.68e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27279 | -| time_elapsed | 148257 | -| total_timesteps | 3491712 | -| train/ | | -| approx_kl | 0.021953594 | -| clip_fraction | 0.141 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0495 | -| learning_rate | 0.0003 | -| loss | 0.00452 | -| n_updates | 272780 | -| policy_gradient_loss | 0.00129 | -| std | 0.00556 | -| value_loss | 1.59e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27280 | -| time_elapsed | 148262 | -| total_timesteps | 3491840 | -| train/ | | -| approx_kl | 0.034194835 | -| clip_fraction | 0.495 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0615 | -| learning_rate | 0.0003 | -| loss | 0.00213 | -| n_updates | 272790 | -| policy_gradient_loss | 0.0354 | -| std | 0.00556 | -| value_loss | 1.28e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27281 | -| time_elapsed | 148265 | -| total_timesteps | 3491968 | -| train/ | | -| approx_kl | 0.41892043 | -| clip_fraction | 0.73 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0382 | -| learning_rate | 0.0003 | -| loss | 0.199 | -| n_updates | 272800 | -| policy_gradient_loss | 0.159 | -| std | 0.00556 | -| value_loss | 3.96e-06 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27282 | -| time_elapsed | 148271 | -| total_timesteps | 3492096 | -| train/ | | -| approx_kl | 0.2764718 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.654 | -| learning_rate | 0.0003 | -| loss | 0.132 | -| n_updates | 272810 | -| policy_gradient_loss | 0.131 | -| std | 0.00556 | -| value_loss | 2.7e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27283 | -| time_elapsed | 148280 | -| total_timesteps | 3492224 | -| train/ | | -| approx_kl | 0.029874122 | -| clip_fraction | 0.309 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.991 | -| learning_rate | 0.0003 | -| loss | -0.0272 | -| n_updates | 272820 | -| policy_gradient_loss | -0.0099 | -| std | 0.00556 | -| value_loss | 6.79e-05 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27284 | -| time_elapsed | 148285 | -| total_timesteps | 3492352 | -| train/ | | -| approx_kl | 0.09316399 | -| clip_fraction | 0.268 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.132 | -| learning_rate | 0.0003 | -| loss | 0.0516 | -| n_updates | 272830 | -| policy_gradient_loss | 0.0142 | -| std | 0.00556 | -| value_loss | 1.73e-07 | ----------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27285 | -| time_elapsed | 148288 | -| total_timesteps | 3492480 | -| train/ | | -| approx_kl | 0.3123008 | -| clip_fraction | 0.417 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0626 | -| learning_rate | 0.0003 | -| loss | 0.181 | -| n_updates | 272840 | -| policy_gradient_loss | 0.0497 | -| std | 0.00556 | -| value_loss | 3.99e-08 | ---------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27286 | -| time_elapsed | 148292 | -| total_timesteps | 3492608 | -| train/ | | -| approx_kl | 0.76263976 | -| clip_fraction | 0.561 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.107 | -| learning_rate | 0.0003 | -| loss | 0.219 | -| n_updates | 272850 | -| policy_gradient_loss | 0.0751 | -| std | 0.00556 | -| value_loss | 3.21e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27287 | -| time_elapsed | 148296 | -| total_timesteps | 3492736 | -| train/ | | -| approx_kl | 0.05952725 | -| clip_fraction | 0.265 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.054 | -| learning_rate | 0.0003 | -| loss | 0.00516 | -| n_updates | 272860 | -| policy_gradient_loss | 0.00429 | -| std | 0.00556 | -| value_loss | 2.73e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27288 | -| time_elapsed | 148301 | -| total_timesteps | 3492864 | -| train/ | | -| approx_kl | 0.06763866 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.037 | -| learning_rate | 0.0003 | -| loss | 0.032 | -| n_updates | 272870 | -| policy_gradient_loss | 0.015 | -| std | 0.00557 | -| value_loss | 2.22e-08 | ----------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27289 | -| time_elapsed | 148307 | -| total_timesteps | 3492992 | -| train/ | | -| approx_kl | 0.0121424105 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0324 | -| learning_rate | 0.0003 | -| loss | -0.016 | -| n_updates | 272880 | -| policy_gradient_loss | 0.00679 | -| std | 0.00557 | -| value_loss | 1.69e-08 | ------------------------------------------- --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27290 | -| time_elapsed | 148312 | -| total_timesteps | 3493120 | -| train/ | | -| approx_kl | 0.084353 | -| clip_fraction | 0.31 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0361 | -| learning_rate | 0.0003 | -| loss | 0.044 | -| n_updates | 272890 | -| policy_gradient_loss | 0.0169 | -| std | 0.00557 | -| value_loss | 1.08e-08 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27291 | -| time_elapsed | 148324 | -| total_timesteps | 3493248 | -| train/ | | -| approx_kl | 0.015693018 | -| clip_fraction | 0.262 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.782 | -| learning_rate | 0.0003 | -| loss | -0.00402 | -| n_updates | 272900 | -| policy_gradient_loss | 0.00967 | -| std | 0.00557 | -| value_loss | 0.00513 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27292 | -| time_elapsed | 148327 | -| total_timesteps | 3493376 | -| train/ | | -| approx_kl | 0.00075646024 | -| clip_fraction | 0.278 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.254 | -| learning_rate | 0.0003 | -| loss | 0.00597 | -| n_updates | 272910 | -| policy_gradient_loss | 0.00607 | -| std | 0.00557 | -| value_loss | 3.82e-05 | -------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27293 | -| time_elapsed | 148333 | -| total_timesteps | 3493504 | -| train/ | | -| approx_kl | 0.008136084 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.151 | -| learning_rate | 0.0003 | -| loss | -0.00247 | -| n_updates | 272920 | -| policy_gradient_loss | 0.0104 | -| std | 0.00556 | -| value_loss | 5.93e-05 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27294 | -| time_elapsed | 148337 | -| total_timesteps | 3493632 | -| train/ | | -| approx_kl | 0.0017076698 | -| clip_fraction | 0.272 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -41.3 | -| learning_rate | 0.0003 | -| loss | 0.0051 | -| n_updates | 272930 | -| policy_gradient_loss | 0.00229 | -| std | 0.00556 | -| value_loss | 3.13e-06 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27295 | -| time_elapsed | 148342 | -| total_timesteps | 3493760 | -| train/ | | -| approx_kl | 0.0064799553 | -| clip_fraction | 0.241 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.935 | -| learning_rate | 0.0003 | -| loss | -0.00944 | -| n_updates | 272940 | -| policy_gradient_loss | 0.00671 | -| std | 0.00556 | -| value_loss | 3.53e-08 | ------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27296 | -| time_elapsed | 148346 | -| total_timesteps | 3493888 | -| train/ | | -| approx_kl | 0.03922241 | -| clip_fraction | 0.627 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.2 | -| learning_rate | 0.0003 | -| loss | 0.0537 | -| n_updates | 272950 | -| policy_gradient_loss | 0.112 | -| std | 0.00556 | -| value_loss | 1.32e-08 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27297 | -| time_elapsed | 148349 | -| total_timesteps | 3494016 | -| train/ | | -| approx_kl | 0.11902636 | -| clip_fraction | 0.724 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0157 | -| learning_rate | 0.0003 | -| loss | 0.0796 | -| n_updates | 272960 | -| policy_gradient_loss | 0.137 | -| std | 0.00556 | -| value_loss | 4.67e-09 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27298 | -| time_elapsed | 148359 | -| total_timesteps | 3494144 | -| train/ | | -| approx_kl | 0.19464488 | -| clip_fraction | 0.728 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.929 | -| learning_rate | 0.0003 | -| loss | 0.0823 | -| n_updates | 272970 | -| policy_gradient_loss | 0.0861 | -| std | 0.00556 | -| value_loss | 0.00118 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27299 | -| time_elapsed | 148364 | -| total_timesteps | 3494272 | -| train/ | | -| approx_kl | 0.22682017 | -| clip_fraction | 0.72 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.173 | -| learning_rate | 0.0003 | -| loss | 0.0991 | -| n_updates | 272980 | -| policy_gradient_loss | 0.113 | -| std | 0.00556 | -| value_loss | 3.27e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27300 | -| time_elapsed | 148368 | -| total_timesteps | 3494400 | -| train/ | | -| approx_kl | 0.043191146 | -| clip_fraction | 0.433 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0152 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 272990 | -| policy_gradient_loss | 0.0356 | -| std | 0.00556 | -| value_loss | 6.3e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27301 | -| time_elapsed | 148373 | -| total_timesteps | 3494528 | -| train/ | | -| approx_kl | 0.7354362 | -| clip_fraction | 0.559 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0152 | -| learning_rate | 0.0003 | -| loss | 0.221 | -| n_updates | 273000 | -| policy_gradient_loss | 0.0742 | -| std | 0.00556 | -| value_loss | 3.12e-07 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27302 | -| time_elapsed | 148377 | -| total_timesteps | 3494656 | -| train/ | | -| approx_kl | 0.016447753 | -| clip_fraction | 0.284 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.049 | -| learning_rate | 0.0003 | -| loss | -0.0284 | -| n_updates | 273010 | -| policy_gradient_loss | 0.00414 | -| std | 0.00556 | -| value_loss | 2.61e-07 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27303 | -| time_elapsed | 148382 | -| total_timesteps | 3494784 | -| train/ | | -| approx_kl | 0.0011482518 | -| clip_fraction | 0.312 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.046 | -| learning_rate | 0.0003 | -| loss | 0.00819 | -| n_updates | 273020 | -| policy_gradient_loss | 0.00457 | -| std | 0.00556 | -| value_loss | 1.31e-07 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.05 | -| time/ | | -| fps | 23 | -| iterations | 27304 | -| time_elapsed | 148387 | -| total_timesteps | 3494912 | -| train/ | | -| approx_kl | 0.074691616 | -| clip_fraction | 0.303 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0733 | -| learning_rate | 0.0003 | -| loss | 0.0181 | -| n_updates | 273030 | -| policy_gradient_loss | 0.00692 | -| std | 0.00556 | -| value_loss | 1.15e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27305 | -| time_elapsed | 148392 | -| total_timesteps | 3495040 | -| train/ | | -| approx_kl | 0.013863256 | -| clip_fraction | 0.274 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0422 | -| learning_rate | 0.0003 | -| loss | -0.00423 | -| n_updates | 273040 | -| policy_gradient_loss | 0.0116 | -| std | 0.00556 | -| value_loss | 9.24e-08 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27306 | -| time_elapsed | 148402 | -| total_timesteps | 3495168 | -| train/ | | -| approx_kl | 0.11914645 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.837 | -| learning_rate | 0.0003 | -| loss | 0.0183 | -| n_updates | 273050 | -| policy_gradient_loss | 0.00574 | -| std | 0.00556 | -| value_loss | 0.00109 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27307 | -| time_elapsed | 148406 | -| total_timesteps | 3495296 | -| train/ | | -| approx_kl | 0.016686257 | -| clip_fraction | 0.225 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.304 | -| learning_rate | 0.0003 | -| loss | 0.00129 | -| n_updates | 273060 | -| policy_gradient_loss | 0.0106 | -| std | 0.00556 | -| value_loss | 4.82e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27308 | -| time_elapsed | 148411 | -| total_timesteps | 3495424 | -| train/ | | -| approx_kl | 0.076508895 | -| clip_fraction | 0.337 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0178 | -| learning_rate | 0.0003 | -| loss | 0.0442 | -| n_updates | 273070 | -| policy_gradient_loss | 0.0174 | -| std | 0.00556 | -| value_loss | 1.02e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27309 | -| time_elapsed | 148416 | -| total_timesteps | 3495552 | -| train/ | | -| approx_kl | 0.054024767 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0237 | -| learning_rate | 0.0003 | -| loss | 0.0349 | -| n_updates | 273080 | -| policy_gradient_loss | 0.0173 | -| std | 0.00556 | -| value_loss | 5.71e-07 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27310 | -| time_elapsed | 148421 | -| total_timesteps | 3495680 | -| train/ | | -| approx_kl | 0.058233414 | -| clip_fraction | 0.28 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.064 | -| learning_rate | 0.0003 | -| loss | 0.0447 | -| n_updates | 273090 | -| policy_gradient_loss | 0.0216 | -| std | 0.00556 | -| value_loss | 1.5e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27311 | -| time_elapsed | 148426 | -| total_timesteps | 3495808 | -| train/ | | -| approx_kl | 0.06322235 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0553 | -| learning_rate | 0.0003 | -| loss | 0.0229 | -| n_updates | 273100 | -| policy_gradient_loss | 0.0109 | -| std | 0.00556 | -| value_loss | 4.9e-06 | ----------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27312 | -| time_elapsed | 148430 | -| total_timesteps | 3495936 | -| train/ | | -| approx_kl | 0.07079836 | -| clip_fraction | 0.311 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -3.07 | -| learning_rate | 0.0003 | -| loss | -0.0102 | -| n_updates | 273110 | -| policy_gradient_loss | -0.00451 | -| std | 0.00556 | -| value_loss | 4.4e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27313 | -| time_elapsed | 148435 | -| total_timesteps | 3496064 | -| train/ | | -| approx_kl | 0.010602955 | -| clip_fraction | 0.266 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0131 | -| learning_rate | 0.0003 | -| loss | -0.00588 | -| n_updates | 273120 | -| policy_gradient_loss | 0.00987 | -| std | 0.00556 | -| value_loss | 4.84e-08 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27314 | -| time_elapsed | 148442 | -| total_timesteps | 3496192 | -| train/ | | -| approx_kl | 0.046485562 | -| clip_fraction | 0.306 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.817 | -| learning_rate | 0.0003 | -| loss | 0.0299 | -| n_updates | 273130 | -| policy_gradient_loss | 0.0178 | -| std | 0.00556 | -| value_loss | 0.00254 | ------------------------------------------ ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27315 | -| time_elapsed | 148447 | -| total_timesteps | 3496320 | -| train/ | | -| approx_kl | 0.0063006794 | -| clip_fraction | 0.222 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.305 | -| learning_rate | 0.0003 | -| loss | -0.00525 | -| n_updates | 273140 | -| policy_gradient_loss | 0.0105 | -| std | 0.00556 | -| value_loss | 6.68e-05 | ------------------------------------------- ------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27316 | -| time_elapsed | 148451 | -| total_timesteps | 3496448 | -| train/ | | -| approx_kl | 0.0014512218 | -| clip_fraction | 0.236 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.0151 | -| learning_rate | 0.0003 | -| loss | 0.00874 | -| n_updates | 273150 | -| policy_gradient_loss | 0.00267 | -| std | 0.00556 | -| value_loss | 1.67e-05 | ------------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27317 | -| time_elapsed | 148456 | -| total_timesteps | 3496576 | -| train/ | | -| approx_kl | 0.007561687 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0449 | -| learning_rate | 0.0003 | -| loss | -0.00175 | -| n_updates | 273160 | -| policy_gradient_loss | 0.0115 | -| std | 0.00556 | -| value_loss | 9.63e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27318 | -| time_elapsed | 148460 | -| total_timesteps | 3496704 | -| train/ | | -| approx_kl | 0.109222695 | -| clip_fraction | 0.277 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0627 | -| learning_rate | 0.0003 | -| loss | 0.0642 | -| n_updates | 273170 | -| policy_gradient_loss | 0.0252 | -| std | 0.00556 | -| value_loss | 7.54e-06 | ------------------------------------------ ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27319 | -| time_elapsed | 148465 | -| total_timesteps | 3496832 | -| train/ | | -| approx_kl | 0.014571058 | -| clip_fraction | 0.233 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0507 | -| learning_rate | 0.0003 | -| loss | -0.00384 | -| n_updates | 273180 | -| policy_gradient_loss | 0.00933 | -| std | 0.00556 | -| value_loss | 5.74e-06 | ------------------------------------------ ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27320 | -| time_elapsed | 148470 | -| total_timesteps | 3496960 | -| train/ | | -| approx_kl | 0.10005542 | -| clip_fraction | 0.291 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0425 | -| learning_rate | 0.0003 | -| loss | 0.0647 | -| n_updates | 273190 | -| policy_gradient_loss | 0.027 | -| std | 0.00556 | -| value_loss | 3.37e-06 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27321 | -| time_elapsed | 148476 | -| total_timesteps | 3497088 | -| train/ | | -| approx_kl | 0.015709039 | -| clip_fraction | 0.248 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0932 | -| learning_rate | 0.0003 | -| loss | -0.00464 | -| n_updates | 273200 | -| policy_gradient_loss | 0.00888 | -| std | 0.00555 | -| value_loss | 2.91e-06 | ------------------------------------------ -------------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27322 | -| time_elapsed | 148485 | -| total_timesteps | 3497216 | -| train/ | | -| approx_kl | 0.00073336344 | -| clip_fraction | 0.295 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | 0.77 | -| learning_rate | 0.0003 | -| loss | -0.0135 | -| n_updates | 273210 | -| policy_gradient_loss | 0.00455 | -| std | 0.00555 | -| value_loss | 0.000972 | -------------------------------------------- ----------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27323 | -| time_elapsed | 148489 | -| total_timesteps | 3497344 | -| train/ | | -| approx_kl | 0.07646367 | -| clip_fraction | 0.693 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.175 | -| learning_rate | 0.0003 | -| loss | 0.07 | -| n_updates | 273220 | -| policy_gradient_loss | 0.113 | -| std | 0.00555 | -| value_loss | 9.73e-07 | ----------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27324 | -| time_elapsed | 148494 | -| total_timesteps | 3497472 | -| train/ | | -| approx_kl | 0.019050444 | -| clip_fraction | 0.42 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.197 | -| learning_rate | 0.0003 | -| loss | -0.011 | -| n_updates | 273230 | -| policy_gradient_loss | 0.0334 | -| std | 0.00555 | -| value_loss | 4.38e-07 | ------------------------------------------ --------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27325 | -| time_elapsed | 148498 | -| total_timesteps | 3497600 | -| train/ | | -| approx_kl | 0.917867 | -| clip_fraction | 0.591 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0667 | -| learning_rate | 0.0003 | -| loss | 0.296 | -| n_updates | 273240 | -| policy_gradient_loss | 0.087 | -| std | 0.00555 | -| value_loss | 2.55e-07 | --------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27326 | -| time_elapsed | 148503 | -| total_timesteps | 3497728 | -| train/ | | -| approx_kl | 0.012375573 | -| clip_fraction | 0.255 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0776 | -| learning_rate | 0.0003 | -| loss | -0.0153 | -| n_updates | 273250 | -| policy_gradient_loss | 0.00578 | -| std | 0.00555 | -| value_loss | 2.4e-07 | ------------------------------------------ ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27327 | -| time_elapsed | 148507 | -| total_timesteps | 3497856 | -| train/ | | -| approx_kl | 0.1006373 | -| clip_fraction | 0.477 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0448 | -| learning_rate | 0.0003 | -| loss | 0.00924 | -| n_updates | 273260 | -| policy_gradient_loss | 0.0256 | -| std | 0.00555 | -| value_loss | 1.61e-07 | ---------------------------------------- ---------------------------------------- -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27328 | -| time_elapsed | 148511 | -| total_timesteps | 3497984 | -| train/ | | -| approx_kl | 1.0652919 | -| clip_fraction | 0.762 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0614 | -| learning_rate | 0.0003 | -| loss | 0.252 | -| n_updates | 273270 | -| policy_gradient_loss | 0.22 | -| std | 0.00555 | -| value_loss | 8.87e-08 | ---------------------------------------- ------------------------------------------ -| rollout/ | | -| ep_len_mean | 1e+03 | -| ep_rew_mean | 1.04 | -| time/ | | -| fps | 23 | -| iterations | 27329 | -| time_elapsed | 148516 | -| total_timesteps | 3498112 | -| train/ | | -| approx_kl | 0.030854853 | -| clip_fraction | 0.319 | -| clip_range | 0.2 | -| entropy_loss | 3.77 | -| explained_variance | -0.0608 | -| learning_rate | 0.0003 | -| loss | 0.0329 | -| n_updates | 273280 | -| policy_gradient_loss | 0.0223 | -| std | 0.00555 | -| value_loss | 7.4e-08 | ------------------------------------------